2016-04-04 12:27:51 +02:00
/*
   Copyright 2016 GitHub Inc.
	 See https://github.com/github/gh-ost/blob/master/LICENSE
*/
package logic
import (
gosql "database/sql"
"fmt"
2016-10-20 11:29:30 +02:00
"reflect"
2016-04-04 12:27:51 +02:00
"strings"
2016-07-29 10:40:23 +02:00
"sync/atomic"
2016-11-02 12:48:35 +01:00
"time"
2016-04-04 12:27:51 +02:00
2016-05-16 11:09:17 +02:00
"github.com/github/gh-ost/go/base"
"github.com/github/gh-ost/go/mysql"
"github.com/github/gh-ost/go/sql"
2016-04-04 12:27:51 +02:00
"github.com/outbrain/golib/log"
"github.com/outbrain/golib/sqlutils"
)
2016-12-13 12:27:20 +01:00
// startSlavePostWaitMilliseconds is the pause restartReplication takes after issuing `start slave`.
// Despite its name, the value is a time.Duration (500ms), not a bare number of milliseconds.
const startSlavePostWaitMilliseconds = 500 * time . Millisecond
2016-04-04 12:27:51 +02:00
// Inspector reads data from the read-MySQL-server (typically a replica, but can be the master)
// It is used for gaining initial status and structure, and later also follow up on progress and changelog
type Inspector struct {
2017-09-22 16:06:06 -07:00
connectionConfig * mysql . ConnectionConfig
db * gosql . DB
informationSchemaDb * gosql . DB
migrationContext * base . MigrationContext
2016-04-04 12:27:51 +02:00
}
2017-08-08 13:36:54 -07:00
func NewInspector ( migrationContext * base . MigrationContext ) * Inspector {
2016-04-04 12:27:51 +02:00
return & Inspector {
2017-08-08 13:36:54 -07:00
connectionConfig : migrationContext . InspectorConnectionConfig ,
migrationContext : migrationContext ,
2016-04-04 12:27:51 +02:00
}
}
func ( this * Inspector ) InitDBConnections ( ) ( err error ) {
2018-03-07 16:30:02 +02:00
inspectorUri := this . connectionConfig . GetDBUri ( this . migrationContext . DatabaseName , this . migrationContext . IncludeRiskyCharsets )
2017-12-14 15:53:29 -08:00
if this . db , _ , err = mysql . GetDB ( this . migrationContext . Uuid , inspectorUri ) ; err != nil {
2016-04-04 12:27:51 +02:00
return err
}
2017-09-22 16:06:06 -07:00
2018-01-15 23:39:02 +08:00
informationSchemaUri := this . connectionConfig . GetDBUri ( "information_schema" , false )
2017-12-14 15:53:29 -08:00
if this . informationSchemaDb , _ , err = mysql . GetDB ( this . migrationContext . Uuid , informationSchemaUri ) ; err != nil {
2017-09-22 16:06:06 -07:00
return err
}
2016-04-04 12:27:51 +02:00
if err := this . validateConnection ( ) ; err != nil {
return err
}
2016-06-19 17:55:37 +02:00
if impliedKey , err := mysql . GetInstanceKey ( this . db ) ; err != nil {
return err
} else {
this . connectionConfig . ImpliedKey = impliedKey
}
2016-04-04 12:27:51 +02:00
if err := this . validateGrants ( ) ; err != nil {
return err
}
2016-04-18 10:57:18 -07:00
if err := this . validateBinlogs ( ) ; err != nil {
2016-04-11 17:27:16 +02:00
return err
}
2016-04-18 10:57:18 -07:00
if err := this . applyBinlogFormat ( ) ; err != nil {
2016-04-04 12:27:51 +02:00
return err
}
2017-02-07 09:41:33 +02:00
log . Infof ( "Inspector initiated on %+v, version %+v" , this . connectionConfig . ImpliedKey , this . migrationContext . InspectorMySQLVersion )
2016-04-07 15:57:12 +02:00
return nil
}
func ( this * Inspector ) ValidateOriginalTable ( ) ( err error ) {
2016-04-04 12:27:51 +02:00
if err := this . validateTable ( ) ; err != nil {
return err
}
2016-10-10 12:28:56 +02:00
if err := this . validateTableForeignKeys ( this . migrationContext . DiscardForeignKeys ) ; err != nil {
2016-04-04 18:19:46 +02:00
return err
}
2016-08-11 14:10:35 +02:00
if err := this . validateTableTriggers ( ) ; err != nil {
return err
}
2016-06-06 12:33:05 +02:00
if err := this . estimateTableRowsViaExplain ( ) ; err != nil {
return err
2016-04-04 12:27:51 +02:00
}
return nil
}
2016-04-11 17:27:16 +02:00
func ( this * Inspector ) InspectTableColumnsAndUniqueKeys ( tableName string ) ( columns * sql . ColumnList , uniqueKeys [ ] ( * sql . UniqueKey ) , err error ) {
2016-04-08 14:35:06 +02:00
uniqueKeys , err = this . getCandidateUniqueKeys ( tableName )
2016-04-04 12:27:51 +02:00
if err != nil {
2016-04-08 14:35:06 +02:00
return columns , uniqueKeys , err
2016-04-04 12:27:51 +02:00
}
if len ( uniqueKeys ) == 0 {
2016-04-08 14:35:06 +02:00
return columns , uniqueKeys , fmt . Errorf ( "No PRIMARY nor UNIQUE key found in table! Bailing out" )
}
2016-10-20 11:29:30 +02:00
columns , err = mysql . GetTableColumns ( this . db , this . migrationContext . DatabaseName , tableName )
2016-04-08 14:35:06 +02:00
if err != nil {
return columns , uniqueKeys , err
}
return columns , uniqueKeys , nil
}
func ( this * Inspector ) InspectOriginalTable ( ) ( err error ) {
this . migrationContext . OriginalTableColumns , this . migrationContext . OriginalTableUniqueKeys , err = this . InspectTableColumnsAndUniqueKeys ( this . migrationContext . OriginalTableName )
2016-12-11 02:19:19 +01:00
if err != nil {
2016-04-08 14:35:06 +02:00
return err
}
return nil
}
2016-10-20 11:29:30 +02:00
// inspectOriginalAndGhostTables compares original and ghost tables to see whether the migration
2016-06-06 12:33:05 +02:00
// makes sense and is valid. It extracts the list of shared columns and the chosen migration unique key
2016-10-20 11:29:30 +02:00
func ( this * Inspector ) inspectOriginalAndGhostTables ( ) ( err error ) {
originalNamesOnApplier := this . migrationContext . OriginalTableColumnsOnApplier . Names ( )
originalNames := this . migrationContext . OriginalTableColumns . Names ( )
if ! reflect . DeepEqual ( originalNames , originalNamesOnApplier ) {
return fmt . Errorf ( "It seems like table structure is not identical between master and replica. This scenario is not supported." )
}
2016-04-08 14:35:06 +02:00
this . migrationContext . GhostTableColumns , this . migrationContext . GhostTableUniqueKeys , err = this . InspectTableColumnsAndUniqueKeys ( this . migrationContext . GetGhostTableName ( ) )
if err != nil {
return err
}
sharedUniqueKeys , err := this . getSharedUniqueKeys ( this . migrationContext . OriginalTableUniqueKeys , this . migrationContext . GhostTableUniqueKeys )
if err != nil {
return err
}
2017-09-03 09:57:26 +03:00
for i , sharedUniqueKey := range sharedUniqueKeys {
this . applyColumnTypes ( this . migrationContext . DatabaseName , this . migrationContext . OriginalTableName , & sharedUniqueKey . Columns )
uniqueKeyIsValid := true
for _ , column := range sharedUniqueKey . Columns . Columns ( ) {
switch column . Type {
case sql . FloatColumnType :
{
log . Warning ( "Will not use %+v as shared key due to FLOAT data type" , sharedUniqueKey . Name )
uniqueKeyIsValid = false
}
case sql . JSONColumnType :
{
// Noteworthy that at this time MySQL does not allow JSON indexing anyhow, but this code
// will remain in place to potentially handle the future case where JSON is supported in indexes.
log . Warning ( "Will not use %+v as shared key due to JSON data type" , sharedUniqueKey . Name )
uniqueKeyIsValid = false
}
}
}
if uniqueKeyIsValid {
this . migrationContext . UniqueKey = sharedUniqueKeys [ i ]
break
}
}
if this . migrationContext . UniqueKey == nil {
2016-04-08 14:35:06 +02:00
return fmt . Errorf ( "No shared unique key can be found after ALTER! Bailing out" )
2016-04-04 12:27:51 +02:00
}
2016-04-08 14:35:06 +02:00
log . Infof ( "Chosen shared unique key is %s" , this . migrationContext . UniqueKey . Name )
2016-05-20 12:52:14 +02:00
if this . migrationContext . UniqueKey . HasNullable {
if this . migrationContext . NullableUniqueKeyAllowed {
log . Warningf ( "Chosen key (%s) has nullable columns. You have supplied with --allow-nullable-unique-key and so this migration proceeds. As long as there aren't NULL values in this key's column, migration should be fine. NULL values will corrupt migration's data" , this . migrationContext . UniqueKey )
} else {
return fmt . Errorf ( "Chosen key (%s) has nullable columns. Bailing out. To force this operation to continue, supply --allow-nullable-unique-key flag. Only do so if you are certain there are no actual NULL values in this key. As long as there aren't, migration should be fine. NULL values in columns of this key will corrupt migration's data" , this . migrationContext . UniqueKey )
}
}
2016-04-11 17:27:16 +02:00
if ! this . migrationContext . UniqueKey . IsPrimary ( ) {
2016-05-20 12:52:14 +02:00
if this . migrationContext . OriginalBinlogRowImage != "FULL" {
return fmt . Errorf ( "binlog_row_image is '%s' and chosen key is %s, which is not the primary key. This operation cannot proceed. You may `set global binlog_row_image='full'` and try again" , this . migrationContext . OriginalBinlogRowImage , this . migrationContext . UniqueKey )
2016-04-11 17:27:16 +02:00
}
}
2016-04-08 14:35:06 +02:00
2016-06-17 08:03:18 +02:00
this . migrationContext . SharedColumns , this . migrationContext . MappedSharedColumns = this . getSharedColumns ( this . migrationContext . OriginalTableColumns , this . migrationContext . GhostTableColumns , this . migrationContext . ColumnRenameMap )
2016-04-08 14:35:06 +02:00
log . Infof ( "Shared columns are %s" , this . migrationContext . SharedColumns )
// By fact that a non-empty unique key exists we also know the shared columns are non-empty
2016-08-17 06:51:58 +02:00
// This additional step looks at which columns are unsigned. We could have merged this within
// the `getTableColumns()` function, but it's a later patch and introduces some complexity; I feel
// comfortable in doing this as a separate step.
2016-10-20 15:05:47 +02:00
this . applyColumnTypes ( this . migrationContext . DatabaseName , this . migrationContext . OriginalTableName , this . migrationContext . OriginalTableColumns , this . migrationContext . SharedColumns )
this . applyColumnTypes ( this . migrationContext . DatabaseName , this . migrationContext . OriginalTableName , & this . migrationContext . UniqueKey . Columns )
2016-09-07 14:24:11 +02:00
this . applyColumnTypes ( this . migrationContext . DatabaseName , this . migrationContext . GetGhostTableName ( ) , this . migrationContext . GhostTableColumns , this . migrationContext . MappedSharedColumns )
2016-08-17 06:51:58 +02:00
2016-10-13 13:09:58 +02:00
for i := range this . migrationContext . SharedColumns . Columns ( ) {
column := this . migrationContext . SharedColumns . Columns ( ) [ i ]
mappedColumn := this . migrationContext . MappedSharedColumns . Columns ( ) [ i ]
if column . Name == mappedColumn . Name && column . Type == sql . DateTimeColumnType && mappedColumn . Type == sql . TimestampColumnType {
this . migrationContext . MappedSharedColumns . SetConvertDatetimeToTimestamp ( column . Name , this . migrationContext . ApplierTimeZone )
}
}
2016-10-14 09:33:53 +02:00
for _ , column := range this . migrationContext . UniqueKey . Columns . Columns ( ) {
if this . migrationContext . MappedSharedColumns . HasTimezoneConversion ( column . Name ) {
return fmt . Errorf ( "No support at this time for converting a column from DATETIME to TIMESTAMP that is also part of the chosen unique key. Column: %s, key: %s" , column . Name , this . migrationContext . UniqueKey . Name )
}
}
2016-04-08 14:35:06 +02:00
return nil
2016-04-04 12:27:51 +02:00
}
// validateConnection issues a simple can-connect to MySQL
func ( this * Inspector ) validateConnection ( ) error {
2017-09-03 10:27:04 +03:00
if len ( this . connectionConfig . Password ) > mysql . MaxReplicationPasswordLength {
return fmt . Errorf ( "MySQL replication length limited to 32 characters. See https://dev.mysql.com/doc/refman/5.7/en/assigning-passwords.html" )
}
2017-09-06 14:25:35 -04:00
version , err := base . ValidateConnection ( this . db , this . connectionConfig )
this . migrationContext . InspectorMySQLVersion = version
return err
2016-04-04 12:27:51 +02:00
}
// validateGrants verifies the user by which we're executing has necessary grants
2017-11-08 01:02:32 +00:00
// to do its thing.
2016-04-04 12:27:51 +02:00
func ( this * Inspector ) validateGrants ( ) error {
2016-05-16 11:09:17 +02:00
query := ` show /* gh-ost */ grants for current_user() `
2016-04-04 12:27:51 +02:00
foundAll := false
foundSuper := false
2016-08-12 14:26:58 +02:00
foundReplicationClient := false
2016-04-04 12:27:51 +02:00
foundReplicationSlave := false
foundDBAll := false
err := sqlutils . QueryRowsMap ( this . db , query , func ( rowMap sqlutils . RowMap ) error {
for _ , grantData := range rowMap {
grant := grantData . String
if strings . Contains ( grant , ` GRANT ALL PRIVILEGES ON *.* ` ) {
foundAll = true
}
if strings . Contains ( grant , ` SUPER ` ) && strings . Contains ( grant , ` ON *.* ` ) {
foundSuper = true
}
2016-08-12 14:26:58 +02:00
if strings . Contains ( grant , ` REPLICATION CLIENT ` ) && strings . Contains ( grant , ` ON *.* ` ) {
foundReplicationClient = true
}
2016-04-04 12:27:51 +02:00
if strings . Contains ( grant , ` REPLICATION SLAVE ` ) && strings . Contains ( grant , ` ON *.* ` ) {
foundReplicationSlave = true
}
if strings . Contains ( grant , fmt . Sprintf ( "GRANT ALL PRIVILEGES ON `%s`.*" , this . migrationContext . DatabaseName ) ) {
foundDBAll = true
}
2016-06-17 08:03:18 +02:00
if base . StringContainsAll ( grant , ` ALTER ` , ` CREATE ` , ` DELETE ` , ` DROP ` , ` INDEX ` , ` INSERT ` , ` LOCK TABLES ` , ` SELECT ` , ` TRIGGER ` , ` UPDATE ` , ` ON *.* ` ) {
2016-06-16 16:06:26 +02:00
foundDBAll = true
}
2016-06-17 08:03:18 +02:00
if base . StringContainsAll ( grant , ` ALTER ` , ` CREATE ` , ` DELETE ` , ` DROP ` , ` INDEX ` , ` INSERT ` , ` LOCK TABLES ` , ` SELECT ` , ` TRIGGER ` , ` UPDATE ` , fmt . Sprintf ( " ON `%s`.*" , this . migrationContext . DatabaseName ) ) {
2016-06-16 16:06:26 +02:00
foundDBAll = true
}
2016-04-04 12:27:51 +02:00
}
return nil
} )
if err != nil {
2016-04-04 15:29:02 +02:00
return err
2016-04-04 12:27:51 +02:00
}
2016-08-12 14:26:58 +02:00
this . migrationContext . HasSuperPrivilege = foundSuper
2016-04-04 12:27:51 +02:00
if foundAll {
log . Infof ( "User has ALL privileges" )
return nil
}
if foundSuper && foundReplicationSlave && foundDBAll {
2016-08-05 11:41:36 +02:00
log . Infof ( "User has SUPER, REPLICATION SLAVE privileges, and has ALL privileges on %s.*" , sql . EscapeName ( this . migrationContext . DatabaseName ) )
2016-04-04 12:27:51 +02:00
return nil
}
2016-08-12 14:26:58 +02:00
if foundReplicationClient && foundReplicationSlave && foundDBAll {
log . Infof ( "User has REPLICATION CLIENT, REPLICATION SLAVE privileges, and has ALL privileges on %s.*" , sql . EscapeName ( this . migrationContext . DatabaseName ) )
return nil
}
log . Debugf ( "Privileges: Super: %t, REPLICATION CLIENT: %t, REPLICATION SLAVE: %t, ALL on *.*: %t, ALL on %s.*: %t" , foundSuper , foundReplicationClient , foundReplicationSlave , foundAll , sql . EscapeName ( this . migrationContext . DatabaseName ) , foundDBAll )
2016-08-29 12:39:31 +02:00
return log . Errorf ( "User has insufficient privileges for migration. Needed: SUPER|REPLICATION CLIENT, REPLICATION SLAVE and ALL on %s.*" , sql . EscapeName ( this . migrationContext . DatabaseName ) )
2016-04-04 12:27:51 +02:00
}
2016-04-11 17:27:16 +02:00
// restartReplication is required so that we are _certain_ the binlog format and
// row image settings have actually been applied to the replication thread.
2017-11-08 00:47:36 +00:00
// It is entirely possible, for example, that the replication is using 'STATEMENT'
2016-04-11 17:27:16 +02:00
// binlog format even as the variable says 'ROW'
func ( this * Inspector ) restartReplication ( ) error {
log . Infof ( "Restarting replication on %s:%d to make sure binlog settings apply to replication thread" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
2016-05-01 21:36:36 +03:00
masterKey , _ := mysql . GetMasterKeyFromSlaveStatus ( this . connectionConfig )
2016-04-14 13:37:56 +02:00
if masterKey == nil {
// This is not a replica
return nil
}
2016-04-11 17:27:16 +02:00
var stopError , startError error
_ , stopError = sqlutils . ExecNoPrepare ( this . db , ` stop slave ` )
_ , startError = sqlutils . ExecNoPrepare ( this . db , ` start slave ` )
if stopError != nil {
return stopError
}
if startError != nil {
return startError
}
2016-12-13 12:27:20 +01:00
time . Sleep ( startSlavePostWaitMilliseconds )
2016-04-11 17:27:16 +02:00
log . Debugf ( "Replication restarted" )
return nil
}
2016-04-18 10:57:18 -07:00
// applyBinlogFormat sets ROW binlog format and restarts replication to make
// the replication thread apply it.
func ( this * Inspector ) applyBinlogFormat ( ) error {
if this . migrationContext . RequiresBinlogFormatChange ( ) {
2016-08-12 14:26:58 +02:00
if ! this . migrationContext . SwitchToRowBinlogFormat {
return fmt . Errorf ( "Existing binlog_format is %s. Am not switching it to ROW unless you specify --switch-to-rbr" , this . migrationContext . OriginalBinlogFormat )
}
2016-04-18 10:57:18 -07:00
if _ , err := sqlutils . ExecNoPrepare ( this . db , ` set global binlog_format='ROW' ` ) ; err != nil {
return err
}
if _ , err := sqlutils . ExecNoPrepare ( this . db , ` set session binlog_format='ROW' ` ) ; err != nil {
return err
}
2016-08-12 14:26:58 +02:00
if err := this . restartReplication ( ) ; err != nil {
return err
}
2016-04-18 10:57:18 -07:00
log . Debugf ( "'ROW' binlog format applied" )
2016-08-12 14:26:58 +02:00
return nil
2016-04-18 10:57:18 -07:00
}
2016-08-12 14:26:58 +02:00
// We already have RBR, no explicit switch
2016-08-15 11:05:51 +02:00
if ! this . migrationContext . AssumeRBR {
2016-08-12 14:26:58 +02:00
if err := this . restartReplication ( ) ; err != nil {
return err
}
2016-04-18 10:57:18 -07:00
}
return nil
}
2016-04-06 13:05:58 +02:00
// validateBinlogs checks that binary log configuration is good to go
2016-04-04 12:27:51 +02:00
func ( this * Inspector ) validateBinlogs ( ) error {
2016-08-11 14:49:14 +02:00
query := ` select @@global.log_bin, @@global.binlog_format `
var hasBinaryLogs bool
if err := this . db . QueryRow ( query ) . Scan ( & hasBinaryLogs , & this . migrationContext . OriginalBinlogFormat ) ; err != nil {
2016-04-04 12:27:51 +02:00
return err
}
if ! hasBinaryLogs {
2016-04-04 15:29:02 +02:00
return fmt . Errorf ( "%s:%d must have binary logs enabled" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
2016-04-04 12:27:51 +02:00
}
if this . migrationContext . RequiresBinlogFormatChange ( ) {
2016-04-18 10:57:18 -07:00
if ! this . migrationContext . SwitchToRowBinlogFormat {
return fmt . Errorf ( "You must be using ROW binlog format. I can switch it for you, provided --switch-to-rbr and that %s:%d doesn't have replicas" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
}
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` show /* gh-ost */ slave hosts ` )
2016-04-04 12:27:51 +02:00
countReplicas := 0
err := sqlutils . QueryRowsMap ( this . db , query , func ( rowMap sqlutils . RowMap ) error {
countReplicas ++
return nil
} )
if err != nil {
2016-04-04 15:29:02 +02:00
return err
2016-04-04 12:27:51 +02:00
}
if countReplicas > 0 {
2016-04-04 15:29:02 +02:00
return fmt . Errorf ( "%s:%d has %s binlog_format, but I'm too scared to change it to ROW because it has replicas. Bailing out" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port , this . migrationContext . OriginalBinlogFormat )
2016-04-04 12:27:51 +02:00
}
2016-04-18 10:57:18 -07:00
log . Infof ( "%s:%d has %s binlog_format. I will change it to ROW, and will NOT change it back, even in the event of failure." , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port , this . migrationContext . OriginalBinlogFormat )
2016-04-04 12:27:51 +02:00
}
query = ` select @@global.binlog_row_image `
if err := this . db . QueryRow ( query ) . Scan ( & this . migrationContext . OriginalBinlogRowImage ) ; err != nil {
// Only as of 5.6. We wish to support 5.5 as well
2016-08-25 16:49:25 +02:00
this . migrationContext . OriginalBinlogRowImage = "FULL"
2016-04-04 12:27:51 +02:00
}
2016-05-20 12:52:14 +02:00
this . migrationContext . OriginalBinlogRowImage = strings . ToUpper ( this . migrationContext . OriginalBinlogRowImage )
2016-04-04 12:27:51 +02:00
2016-04-04 15:29:02 +02:00
log . Infof ( "binary logs validated on %s:%d" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
2016-04-04 12:27:51 +02:00
return nil
}
2016-08-11 17:37:50 +02:00
// validateLogSlaveUpdates checks that binary log log_slave_updates is set. This test is not required when migrating on replica or when migrating directly on master
func ( this * Inspector ) validateLogSlaveUpdates ( ) error {
2016-08-11 14:49:14 +02:00
query := ` select @@global.log_slave_updates `
var logSlaveUpdates bool
if err := this . db . QueryRow ( query ) . Scan ( & logSlaveUpdates ) ; err != nil {
return err
}
2016-10-31 10:25:34 +01:00
if logSlaveUpdates {
log . Infof ( "log_slave_updates validated on %s:%d" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
return nil
2016-08-11 14:49:14 +02:00
}
2016-10-31 10:25:34 +01:00
if this . migrationContext . IsTungsten {
2017-02-24 14:48:10 -07:00
log . Warningf ( "log_slave_updates not found on %s:%d, but --tungsten provided, so I'm proceeding" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
2016-10-31 10:25:34 +01:00
return nil
}
if this . migrationContext . TestOnReplica || this . migrationContext . MigrateOnReplica {
return fmt . Errorf ( "%s:%d must have log_slave_updates enabled for testing/migrating on replica" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
}
if this . migrationContext . InspectorIsAlsoApplier ( ) {
2017-11-08 00:50:56 +00:00
log . Warningf ( "log_slave_updates not found on %s:%d, but executing directly on master, so I'm proceeding" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
2016-10-31 10:25:34 +01:00
return nil
}
return fmt . Errorf ( "%s:%d must have log_slave_updates enabled for executing migration" , this . connectionConfig . Key . Hostname , this . connectionConfig . Key . Port )
2016-04-04 12:27:51 +02:00
}
// validateTable makes sure the table we need to operate on actually exists
func ( this * Inspector ) validateTable ( ) error {
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` show /* gh-ost */ table status from %s like '%s' ` , sql . EscapeName ( this . migrationContext . DatabaseName ) , this . migrationContext . OriginalTableName )
2016-04-04 12:27:51 +02:00
tableFound := false
err := sqlutils . QueryRowsMap ( this . db , query , func ( rowMap sqlutils . RowMap ) error {
this . migrationContext . TableEngine = rowMap . GetString ( "Engine" )
this . migrationContext . RowsEstimate = rowMap . GetInt64 ( "Rows" )
this . migrationContext . UsedRowsEstimateMethod = base . TableStatusRowsEstimate
if rowMap . GetString ( "Comment" ) == "VIEW" {
return fmt . Errorf ( "%s.%s is a VIEW, not a real table. Bailing out" , sql . EscapeName ( this . migrationContext . DatabaseName ) , sql . EscapeName ( this . migrationContext . OriginalTableName ) )
}
tableFound = true
return nil
} )
if err != nil {
2016-04-04 15:29:02 +02:00
return err
2016-04-04 12:27:51 +02:00
}
if ! tableFound {
return log . Errorf ( "Cannot find table %s.%s!" , sql . EscapeName ( this . migrationContext . DatabaseName ) , sql . EscapeName ( this . migrationContext . OriginalTableName ) )
}
log . Infof ( "Table found. Engine=%s" , this . migrationContext . TableEngine )
log . Debugf ( "Estimated number of rows via STATUS: %d" , this . migrationContext . RowsEstimate )
return nil
}
2016-06-19 17:55:37 +02:00
// validateTableForeignKeys makes sure no foreign keys exist on the migrated table
2016-10-10 12:28:56 +02:00
func ( this * Inspector ) validateTableForeignKeys ( allowChildForeignKeys bool ) error {
2016-11-21 09:18:40 +01:00
if this . migrationContext . SkipForeignKeyChecks {
log . Warning ( "--skip-foreign-key-checks provided: will not check for foreign keys" )
return nil
}
2016-04-04 18:19:46 +02:00
query := `
2016-10-10 12:28:56 +02:00
SELECT
SUM ( REFERENCED_TABLE_NAME IS NOT NULL AND TABLE_SCHEMA = ? AND TABLE_NAME = ? ) as num_child_side_fk ,
SUM ( REFERENCED_TABLE_NAME IS NOT NULL AND REFERENCED_TABLE_SCHEMA = ? AND REFERENCED_TABLE_NAME = ? ) as num_parent_side_fk
2016-04-04 18:19:46 +02:00
FROM INFORMATION_SCHEMA . KEY_COLUMN_USAGE
WHERE
REFERENCED_TABLE_NAME IS NOT NULL
AND ( ( TABLE_SCHEMA = ? AND TABLE_NAME = ? )
OR ( REFERENCED_TABLE_SCHEMA = ? AND REFERENCED_TABLE_NAME = ? )
)
`
2016-10-10 12:28:56 +02:00
numParentForeignKeys := 0
numChildForeignKeys := 0
err := sqlutils . QueryRowsMap ( this . db , query , func ( m sqlutils . RowMap ) error {
numChildForeignKeys = m . GetInt ( "num_child_side_fk" )
numParentForeignKeys = m . GetInt ( "num_parent_side_fk" )
2016-04-04 18:19:46 +02:00
return nil
} ,
this . migrationContext . DatabaseName ,
this . migrationContext . OriginalTableName ,
this . migrationContext . DatabaseName ,
this . migrationContext . OriginalTableName ,
2016-10-10 12:28:56 +02:00
this . migrationContext . DatabaseName ,
this . migrationContext . OriginalTableName ,
this . migrationContext . DatabaseName ,
this . migrationContext . OriginalTableName ,
2016-04-04 18:19:46 +02:00
)
if err != nil {
return err
}
2016-10-10 12:28:56 +02:00
if numParentForeignKeys > 0 {
return log . Errorf ( "Found %d parent-side foreign keys on %s.%s. Parent-side foreign keys are not supported. Bailing out" , numParentForeignKeys , sql . EscapeName ( this . migrationContext . DatabaseName ) , sql . EscapeName ( this . migrationContext . OriginalTableName ) )
2016-04-04 18:19:46 +02:00
}
2016-10-10 12:28:56 +02:00
if numChildForeignKeys > 0 {
if allowChildForeignKeys {
log . Debugf ( "Foreign keys found and will be dropped, as per given --discard-foreign-keys flag" )
return nil
}
return log . Errorf ( "Found %d child-side foreign keys on %s.%s. Child-side foreign keys are not supported. Bailing out" , numChildForeignKeys , sql . EscapeName ( this . migrationContext . DatabaseName ) , sql . EscapeName ( this . migrationContext . OriginalTableName ) )
2016-04-04 18:19:46 +02:00
}
log . Debugf ( "Validated no foreign keys exist on table" )
return nil
}
2016-08-11 14:10:35 +02:00
// validateTableTriggers makes sure no triggers exist on the migrated table.
// It counts the rows in INFORMATION_SCHEMA.TRIGGERS for the original table and
// returns an error when there is at least one.
func (this *Inspector) validateTableTriggers() error {
	// No whitespace between COUNT and its parenthesis: MySQL requires that for
	// built-in aggregate functions unless the IGNORE_SPACE SQL mode is enabled.
	query := `
		SELECT COUNT(*) AS num_triggers
			FROM INFORMATION_SCHEMA.TRIGGERS
			WHERE
				TRIGGER_SCHEMA = ?
				AND EVENT_OBJECT_TABLE = ?
	`
	numTriggers := 0
	err := sqlutils.QueryRowsMap(this.db, query, func(rowMap sqlutils.RowMap) error {
		numTriggers = rowMap.GetInt("num_triggers")
		return nil
	},
		this.migrationContext.DatabaseName,
		this.migrationContext.OriginalTableName,
	)
	if err != nil {
		return err
	}
	if numTriggers > 0 {
		return log.Errorf("Found triggers on %s.%s. Triggers are not supported at this time. Bailing out", sql.EscapeName(this.migrationContext.DatabaseName), sql.EscapeName(this.migrationContext.OriginalTableName))
	}
	log.Debugf("Validated no triggers exist on table")
	return nil
}
2016-06-19 17:55:37 +02:00
// estimateTableRowsViaExplain estimates number of rows on original table
2016-04-04 12:27:51 +02:00
func ( this * Inspector ) estimateTableRowsViaExplain ( ) error {
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` explain select /* gh-ost */ * from %s.%s where 1=1 ` , sql . EscapeName ( this . migrationContext . DatabaseName ) , sql . EscapeName ( this . migrationContext . OriginalTableName ) )
2016-04-04 12:27:51 +02:00
outputFound := false
err := sqlutils . QueryRowsMap ( this . db , query , func ( rowMap sqlutils . RowMap ) error {
this . migrationContext . RowsEstimate = rowMap . GetInt64 ( "rows" )
this . migrationContext . UsedRowsEstimateMethod = base . ExplainRowsEstimate
outputFound = true
return nil
} )
if err != nil {
2016-04-04 15:29:02 +02:00
return err
2016-04-04 12:27:51 +02:00
}
if ! outputFound {
return log . Errorf ( "Cannot run EXPLAIN on %s.%s!" , sql . EscapeName ( this . migrationContext . DatabaseName ) , sql . EscapeName ( this . migrationContext . OriginalTableName ) )
}
log . Infof ( "Estimated number of rows via EXPLAIN: %d" , this . migrationContext . RowsEstimate )
return nil
}
2016-06-19 17:55:37 +02:00
// CountTableRows counts exact number of rows on the original table
2016-06-06 12:33:05 +02:00
func ( this * Inspector ) CountTableRows ( ) error {
2016-07-29 10:40:23 +02:00
atomic . StoreInt64 ( & this . migrationContext . CountingRowsFlag , 1 )
defer atomic . StoreInt64 ( & this . migrationContext . CountingRowsFlag , 0 )
2016-04-04 12:27:51 +02:00
log . Infof ( "As instructed, I'm issuing a SELECT COUNT(*) on the table. This may take a while" )
2016-07-29 10:40:23 +02:00
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` select /* gh-ost */ count(*) as rows from %s.%s ` , sql . EscapeName ( this . migrationContext . DatabaseName ) , sql . EscapeName ( this . migrationContext . OriginalTableName ) )
2016-08-24 11:39:44 +02:00
var rowsEstimate int64
if err := this . db . QueryRow ( query ) . Scan ( & rowsEstimate ) ; err != nil {
2016-04-04 12:27:51 +02:00
return err
}
2016-08-24 11:39:44 +02:00
atomic . StoreInt64 ( & this . migrationContext . RowsEstimate , rowsEstimate )
2016-04-04 12:27:51 +02:00
this . migrationContext . UsedRowsEstimateMethod = base . CountRowsEstimate
2016-07-29 10:40:23 +02:00
2016-08-24 11:39:44 +02:00
log . Infof ( "Exact number of rows via COUNT: %d" , rowsEstimate )
2016-07-29 10:40:23 +02:00
2016-04-04 12:27:51 +02:00
return nil
}
2016-09-07 14:24:11 +02:00
// applyColumnTypes
func ( this * Inspector ) applyColumnTypes ( databaseName , tableName string , columnsLists ... * sql . ColumnList ) error {
query := `
select
*
from
information_schema . columns
where
table_schema = ?
and table_name = ?
`
err := sqlutils . QueryRowsMap ( this . db , query , func ( m sqlutils . RowMap ) error {
columnName := m . GetString ( "COLUMN_NAME" )
2016-10-13 13:09:58 +02:00
columnType := m . GetString ( "COLUMN_TYPE" )
if strings . Contains ( columnType , "unsigned" ) {
2016-08-17 06:51:58 +02:00
for _ , columnsList := range columnsLists {
columnsList . SetUnsigned ( columnName )
}
}
2017-01-10 09:57:42 +02:00
if strings . Contains ( columnType , "mediumint" ) {
for _ , columnsList := range columnsLists {
columnsList . GetColumn ( columnName ) . Type = sql . MediumIntColumnType
}
}
2016-10-13 13:09:58 +02:00
if strings . Contains ( columnType , "timestamp" ) {
for _ , columnsList := range columnsLists {
columnsList . GetColumn ( columnName ) . Type = sql . TimestampColumnType
}
}
if strings . Contains ( columnType , "datetime" ) {
for _ , columnsList := range columnsLists {
columnsList . GetColumn ( columnName ) . Type = sql . DateTimeColumnType
}
}
2017-08-22 11:51:20 +03:00
if strings . Contains ( columnType , "json" ) {
for _ , columnsList := range columnsLists {
columnsList . GetColumn ( columnName ) . Type = sql . JSONColumnType
}
}
2017-09-03 09:57:26 +03:00
if strings . Contains ( columnType , "float" ) {
for _ , columnsList := range columnsLists {
columnsList . GetColumn ( columnName ) . Type = sql . FloatColumnType
}
}
2016-10-19 15:22:29 +02:00
if strings . HasPrefix ( columnType , "enum" ) {
for _ , columnsList := range columnsLists {
2017-01-10 09:57:42 +02:00
columnsList . GetColumn ( columnName ) . Type = sql . EnumColumnType
2016-10-19 15:22:29 +02:00
}
}
2016-09-07 14:24:11 +02:00
if charset := m . GetString ( "CHARACTER_SET_NAME" ) ; charset != "" {
for _ , columnsList := range columnsLists {
columnsList . SetCharset ( columnName , charset )
}
}
2016-08-17 06:51:58 +02:00
return nil
2016-09-07 14:24:11 +02:00
} , databaseName , tableName )
2016-08-17 06:51:58 +02:00
return err
}
2016-04-04 12:27:51 +02:00
// getCandidateUniqueKeys investigates a table and returns the list of unique keys
// candidate for chunking
func ( this * Inspector ) getCandidateUniqueKeys ( tableName string ) ( uniqueKeys [ ] ( * sql . UniqueKey ) , err error ) {
query := `
SELECT
COLUMNS . TABLE_SCHEMA ,
COLUMNS . TABLE_NAME ,
COLUMNS . COLUMN_NAME ,
UNIQUES . INDEX_NAME ,
UNIQUES . COLUMN_NAMES ,
UNIQUES . COUNT_COLUMN_IN_INDEX ,
COLUMNS . DATA_TYPE ,
COLUMNS . CHARACTER_SET_NAME ,
2016-04-18 10:57:18 -07:00
LOCATE ( ' auto_increment ' , EXTRA ) > 0 as is_auto_increment ,
2016-04-04 12:27:51 +02:00
has_nullable
FROM INFORMATION_SCHEMA . COLUMNS INNER JOIN (
SELECT
TABLE_SCHEMA ,
TABLE_NAME ,
INDEX_NAME ,
COUNT ( * ) AS COUNT_COLUMN_IN_INDEX ,
GROUP_CONCAT ( COLUMN_NAME ORDER BY SEQ_IN_INDEX ASC ) AS COLUMN_NAMES ,
SUBSTRING_INDEX ( GROUP_CONCAT ( COLUMN_NAME ORDER BY SEQ_IN_INDEX ASC ) , ',' , 1 ) AS FIRST_COLUMN_NAME ,
SUM ( NULLABLE = ' YES ' ) > 0 AS has_nullable
FROM INFORMATION_SCHEMA . STATISTICS
2016-05-04 09:50:00 +03:00
WHERE
NON_UNIQUE = 0
AND TABLE_SCHEMA = ?
AND TABLE_NAME = ?
2016-04-04 12:27:51 +02:00
GROUP BY TABLE_SCHEMA , TABLE_NAME , INDEX_NAME
) AS UNIQUES
ON (
COLUMNS . TABLE_SCHEMA = UNIQUES . TABLE_SCHEMA AND
COLUMNS . TABLE_NAME = UNIQUES . TABLE_NAME AND
COLUMNS . COLUMN_NAME = UNIQUES . FIRST_COLUMN_NAME
)
WHERE
COLUMNS . TABLE_SCHEMA = ?
AND COLUMNS . TABLE_NAME = ?
ORDER BY
COLUMNS . TABLE_SCHEMA , COLUMNS . TABLE_NAME ,
CASE UNIQUES . INDEX_NAME
WHEN ' PRIMARY ' THEN 0
ELSE 1
END ,
CASE has_nullable
WHEN 0 THEN 0
ELSE 1
END ,
CASE IFNULL ( CHARACTER_SET_NAME , ' ' )
WHEN ' ' THEN 0
ELSE 1
END ,
CASE DATA_TYPE
WHEN ' tinyint ' THEN 0
WHEN ' smallint ' THEN 1
WHEN ' int ' THEN 2
WHEN ' bigint ' THEN 3
ELSE 100
END ,
COUNT_COLUMN_IN_INDEX
`
2016-04-18 10:57:18 -07:00
err = sqlutils . QueryRowsMap ( this . db , query , func ( m sqlutils . RowMap ) error {
2016-04-04 12:27:51 +02:00
uniqueKey := & sql . UniqueKey {
2016-04-18 10:57:18 -07:00
Name : m . GetString ( "INDEX_NAME" ) ,
Columns : * sql . ParseColumnList ( m . GetString ( "COLUMN_NAMES" ) ) ,
HasNullable : m . GetBool ( "has_nullable" ) ,
IsAutoIncrement : m . GetBool ( "is_auto_increment" ) ,
2016-04-04 12:27:51 +02:00
}
uniqueKeys = append ( uniqueKeys , uniqueKey )
return nil
2016-05-04 09:50:00 +03:00
} , this . migrationContext . DatabaseName , tableName , this . migrationContext . DatabaseName , tableName )
2016-04-04 12:27:51 +02:00
if err != nil {
return uniqueKeys , err
}
2016-04-18 10:57:18 -07:00
log . Debugf ( "Potential unique keys in %+v: %+v" , tableName , uniqueKeys )
2016-04-04 12:27:51 +02:00
return uniqueKeys , nil
}
2016-04-08 14:35:06 +02:00
// getSharedUniqueKeys returns the intersection of two given unique keys,
// testing by list of columns
func ( this * Inspector ) getSharedUniqueKeys ( originalUniqueKeys , ghostUniqueKeys [ ] ( * sql . UniqueKey ) ) ( uniqueKeys [ ] ( * sql . UniqueKey ) , err error ) {
2016-04-04 12:27:51 +02:00
// We actually do NOT rely on key name, just on the set of columns. This is because maybe
// the ALTER is on the name itself...
for _ , originalUniqueKey := range originalUniqueKeys {
for _ , ghostUniqueKey := range ghostUniqueKeys {
2016-09-07 14:24:11 +02:00
if originalUniqueKey . Columns . EqualsByNames ( & ghostUniqueKey . Columns ) {
2016-04-04 12:27:51 +02:00
uniqueKeys = append ( uniqueKeys , originalUniqueKey )
}
}
}
return uniqueKeys , nil
}
2016-04-04 15:29:02 +02:00
2016-04-08 14:35:06 +02:00
// getSharedColumns returns the intersection of two lists of columns in same order as the first list
2016-06-17 08:03:18 +02:00
func ( this * Inspector ) getSharedColumns ( originalColumns , ghostColumns * sql . ColumnList , columnRenameMap map [ string ] string ) ( * sql . ColumnList , * sql . ColumnList ) {
2016-04-11 17:27:16 +02:00
sharedColumnNames := [ ] string { }
2016-09-07 14:24:11 +02:00
for _ , originalColumn := range originalColumns . Names ( ) {
2017-04-23 08:38:35 +03:00
isSharedColumn := false
2017-07-12 12:33:32 +03:00
for _ , ghostColumn := range ghostColumns . Names ( ) {
if strings . EqualFold ( originalColumn , ghostColumn ) {
isSharedColumn = true
}
if strings . EqualFold ( columnRenameMap [ originalColumn ] , ghostColumn ) {
isSharedColumn = true
}
2017-04-23 08:38:35 +03:00
}
2017-07-12 12:33:32 +03:00
for droppedColumn := range this . migrationContext . DroppedColumnsMap {
if strings . EqualFold ( originalColumn , droppedColumn ) {
isSharedColumn = false
}
2017-04-23 08:38:35 +03:00
}
if isSharedColumn {
2016-04-11 17:27:16 +02:00
sharedColumnNames = append ( sharedColumnNames , originalColumn )
2016-04-08 14:35:06 +02:00
}
}
2016-06-17 08:03:18 +02:00
mappedSharedColumnNames := [ ] string { }
for _ , columnName := range sharedColumnNames {
if mapped , ok := columnRenameMap [ columnName ] ; ok {
mappedSharedColumnNames = append ( mappedSharedColumnNames , mapped )
} else {
mappedSharedColumnNames = append ( mappedSharedColumnNames , columnName )
}
}
return sql . NewColumnList ( sharedColumnNames ) , sql . NewColumnList ( mappedSharedColumnNames )
2016-04-08 14:35:06 +02:00
}
2016-06-22 12:39:13 +02:00
// showCreateTable returns the `show create table` statement for given table.
// The table is looked up in the migration's database; both identifiers are
// passed through sql.EscapeName before being placed into the statement.
func (this *Inspector) showCreateTable(tableName string) (createTableStatement string, err error) {
	databaseIdent := sql.EscapeName(this.migrationContext.DatabaseName)
	tableIdent := sql.EscapeName(tableName)
	statement := fmt.Sprintf(` show /* gh-ost */ create table %s.%s `, databaseIdent, tableIdent)

	// Two columns are scanned; the first is discarded and only the second is returned.
	var discarded string
	err = this.db.QueryRow(statement).Scan(&discarded, &createTableStatement)
	return createTableStatement, err
}
2016-06-19 17:55:37 +02:00
// readChangelogState reads changelog hints
2016-12-26 21:31:35 +02:00
func ( this * Inspector ) readChangelogState ( hint string ) ( string , error ) {
2016-04-14 13:37:56 +02:00
query := fmt . Sprintf ( `
2016-12-26 21:31:35 +02:00
select hint , value from % s . % s where hint = ? and id <= 255
2016-04-14 13:37:56 +02:00
` ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetChangelogTableName ( ) ) ,
)
2016-12-26 21:31:35 +02:00
result := ""
2016-04-14 13:37:56 +02:00
err := sqlutils . QueryRowsMap ( this . db , query , func ( m sqlutils . RowMap ) error {
2016-12-26 21:31:35 +02:00
result = m . GetString ( "value" )
2016-04-14 13:37:56 +02:00
return nil
2016-12-26 21:31:35 +02:00
} , hint )
2016-04-14 13:37:56 +02:00
return result , err
2016-04-04 15:29:02 +02:00
}
2016-04-14 13:37:56 +02:00
func ( this * Inspector ) getMasterConnectionConfig ( ) ( applierConfig * mysql . ConnectionConfig , err error ) {
2016-12-05 13:41:49 +01:00
log . Infof ( "Recursively searching for replication master" )
2016-04-14 13:37:56 +02:00
visitedKeys := mysql . NewInstanceKeyMap ( )
2016-06-22 10:38:13 +02:00
return mysql . GetMasterConnectionConfigSafe ( this . connectionConfig , visitedKeys , this . migrationContext . AllowedMasterMaster )
2016-04-04 15:29:02 +02:00
}
2016-11-02 12:48:35 +01:00
func ( this * Inspector ) getReplicationLag ( ) ( replicationLag time . Duration , err error ) {
2016-11-03 12:14:53 +01:00
replicationLag , err = mysql . GetReplicationLag (
2017-09-22 16:06:06 -07:00
this . informationSchemaDb ,
2016-11-02 12:48:35 +01:00
this . migrationContext . InspectorConnectionConfig ,
)
2016-11-03 12:14:53 +01:00
return replicationLag , err
2016-11-02 12:48:35 +01:00
}
2017-08-28 15:53:47 -07:00
func ( this * Inspector ) Teardown ( ) {
this . db . Close ( )
2017-09-22 16:06:06 -07:00
this . informationSchemaDb . Close ( )
2017-08-28 15:53:47 -07:00
return
}