2016-04-04 15:30:49 +02:00
/ *
Copyright 2016 GitHub Inc .
2016-05-16 11:09:17 +02:00
See https : //github.com/github/gh-ost/blob/master/LICENSE
2016-04-04 15:30:49 +02:00
* /
package logic
import (
gosql "database/sql"
"fmt"
2016-04-08 10:34:44 +02:00
"sync/atomic"
2016-04-07 15:57:12 +02:00
"time"
2016-05-16 11:09:17 +02:00
"github.com/github/gh-ost/go/base"
"github.com/github/gh-ost/go/binlog"
"github.com/github/gh-ost/go/mysql"
"github.com/github/gh-ost/go/sql"
2016-04-04 15:30:49 +02:00
"github.com/outbrain/golib/log"
"github.com/outbrain/golib/sqlutils"
)
2016-06-27 11:08:06 +02:00
const (
atomicCutOverMagicHint = "ghost-cut-over-sentry"
)
2016-06-19 17:55:37 +02:00
// Applier connects and writes the the applier-server, which is the server where migration
// happens. This is typically the master, but could be a replica when `--test-on-replica` or
// `--execute-on-replica` are given.
// Applier is the one to actually write row data and apply binlog events onto the ghost table.
// It is where the ghost & changelog tables get created. It is where the cut-over phase happens.
2016-04-04 15:30:49 +02:00
type Applier struct {
connectionConfig * mysql . ConnectionConfig
db * gosql . DB
2016-04-18 10:57:18 -07:00
singletonDB * gosql . DB
2016-04-04 15:30:49 +02:00
migrationContext * base . MigrationContext
}
func NewApplier ( ) * Applier {
return & Applier {
2016-04-14 13:37:56 +02:00
connectionConfig : base . GetMigrationContext ( ) . ApplierConnectionConfig ,
2016-04-04 15:30:49 +02:00
migrationContext : base . GetMigrationContext ( ) ,
}
}
func ( this * Applier ) InitDBConnections ( ) ( err error ) {
2016-04-18 10:57:18 -07:00
applierUri := this . connectionConfig . GetDBUri ( this . migrationContext . DatabaseName )
if this . db , _ , err = sqlutils . GetDB ( applierUri ) ; err != nil {
2016-04-04 15:30:49 +02:00
return err
}
2016-04-18 10:57:18 -07:00
singletonApplierUri := fmt . Sprintf ( "%s?timeout=0" , applierUri )
if this . singletonDB , _ , err = sqlutils . GetDB ( singletonApplierUri ) ; err != nil {
return err
}
this . singletonDB . SetMaxOpenConns ( 1 )
if err := this . validateConnection ( this . db ) ; err != nil {
return err
}
if err := this . validateConnection ( this . singletonDB ) ; err != nil {
2016-04-04 15:30:49 +02:00
return err
}
2016-06-19 17:55:37 +02:00
if impliedKey , err := mysql . GetInstanceKey ( this . db ) ; err != nil {
return err
} else {
this . connectionConfig . ImpliedKey = impliedKey
}
2016-04-04 15:30:49 +02:00
return nil
}
// validateConnection issues a simple can-connect to MySQL
2016-04-18 10:57:18 -07:00
func ( this * Applier ) validateConnection ( db * gosql . DB ) error {
2016-04-04 15:30:49 +02:00
query := ` select @@global.port `
var port int
2016-04-18 10:57:18 -07:00
if err := db . QueryRow ( query ) . Scan ( & port ) ; err != nil {
2016-04-04 15:30:49 +02:00
return err
}
if port != this . connectionConfig . Key . Port {
return fmt . Errorf ( "Unexpected database port reported: %+v" , port )
}
log . Infof ( "connection validated on %+v" , this . connectionConfig . Key )
return nil
}
2016-06-27 11:08:06 +02:00
// showTableStatus returns the output of `show table status like '...'` command
func ( this * Applier ) showTableStatus ( tableName string ) ( rowMap sqlutils . RowMap ) {
rowMap = nil
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` show /* gh-ost */ table status from %s like '%s' ` , sql . EscapeName ( this . migrationContext . DatabaseName ) , tableName )
2016-05-03 12:55:17 +03:00
sqlutils . QueryRowsMap ( this . db , query , func ( m sqlutils . RowMap ) error {
2016-06-27 11:08:06 +02:00
rowMap = m
2016-05-03 12:55:17 +03:00
return nil
} )
2016-06-27 11:08:06 +02:00
return rowMap
}
// tableExists checks if a given table exists in database
func ( this * Applier ) tableExists ( tableName string ) ( tableFound bool ) {
m := this . showTableStatus ( tableName )
return ( m != nil )
2016-05-03 12:55:17 +03:00
}
2016-06-19 17:55:37 +02:00
// ValidateOrDropExistingTables verifies ghost and changelog tables do not exist,
// or attempts to drop them if instructed to.
2016-05-03 12:55:17 +03:00
func ( this * Applier ) ValidateOrDropExistingTables ( ) error {
if this . migrationContext . InitiallyDropGhostTable {
if err := this . DropGhostTable ( ) ; err != nil {
return err
}
}
if this . tableExists ( this . migrationContext . GetGhostTableName ( ) ) {
return fmt . Errorf ( "Table %s already exists. Panicking. Use --initially-drop-ghost-table to force dropping it" , sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) )
}
if this . migrationContext . InitiallyDropOldTable {
if err := this . DropOldTable ( ) ; err != nil {
return err
}
}
if this . tableExists ( this . migrationContext . GetOldTableName ( ) ) {
return fmt . Errorf ( "Table %s already exists. Panicking. Use --initially-drop-old-table to force dropping it" , sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) )
}
return nil
}
2016-04-11 17:27:16 +02:00
// CreateGhostTable creates the ghost table on the applier host
2016-04-04 15:30:49 +02:00
func ( this * Applier ) CreateGhostTable ( ) error {
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` create /* gh-ost */ table %s.%s like %s.%s ` ,
2016-04-04 15:30:49 +02:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
)
log . Infof ( "Creating ghost table %s.%s" ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) ,
)
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
2016-04-07 15:57:12 +02:00
log . Infof ( "Ghost table created" )
2016-04-04 15:30:49 +02:00
return nil
}
2016-04-11 17:27:16 +02:00
// AlterGhost applies `alter` statement on ghost table
2016-04-04 15:30:49 +02:00
func ( this * Applier ) AlterGhost ( ) error {
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` alter /* gh-ost */ table %s.%s %s ` ,
2016-04-04 15:30:49 +02:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) ,
this . migrationContext . AlterStatement ,
)
log . Infof ( "Altering ghost table %s.%s" ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) ,
)
log . Debugf ( "ALTER statement: %s" , query )
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
2016-04-07 15:57:12 +02:00
log . Infof ( "Ghost table altered" )
return nil
}
2016-04-11 17:27:16 +02:00
// CreateChangelogTable creates the changelog table on the applier host
2016-04-07 15:57:12 +02:00
func ( this * Applier ) CreateChangelogTable ( ) error {
2016-05-03 12:55:17 +03:00
if err := this . DropChangelogTable ( ) ; err != nil {
return err
}
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` create /* gh-ost */ table % s . % s (
2016-04-08 14:35:06 +02:00
id bigint auto_increment ,
2016-04-07 15:57:12 +02:00
last_update timestamp not null DEFAULT CURRENT_TIMESTAMP ON UPDATE CURRENT_TIMESTAMP ,
hint varchar ( 64 ) charset ascii not null ,
2016-04-08 14:35:06 +02:00
value varchar ( 255 ) charset ascii not null ,
2016-04-07 15:57:12 +02:00
primary key ( id ) ,
unique key hint_uidx ( hint )
2016-04-11 17:27:16 +02:00
) auto_increment = 256
2016-04-07 15:57:12 +02:00
` ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetChangelogTableName ( ) ) ,
)
log . Infof ( "Creating changelog table %s.%s" ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetChangelogTableName ( ) ) ,
)
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
log . Infof ( "Changelog table created" )
return nil
}
2016-04-11 17:27:16 +02:00
// dropTable drops a given table on the applied host
func ( this * Applier ) dropTable ( tableName string ) error {
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` drop /* gh-ost */ table if exists %s.%s ` ,
2016-04-07 15:57:12 +02:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
2016-04-11 17:27:16 +02:00
sql . EscapeName ( tableName ) ,
2016-04-07 15:57:12 +02:00
)
2016-04-11 17:27:16 +02:00
log . Infof ( "Droppping table %s.%s" ,
2016-04-07 15:57:12 +02:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
2016-04-11 17:27:16 +02:00
sql . EscapeName ( tableName ) ,
2016-04-07 15:57:12 +02:00
)
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
2016-04-11 17:27:16 +02:00
log . Infof ( "Table dropped" )
2016-04-04 15:30:49 +02:00
return nil
}
2016-04-04 18:19:46 +02:00
2016-04-11 17:27:16 +02:00
// DropChangelogTable drops the changelog table on the applier host
func ( this * Applier ) DropChangelogTable ( ) error {
return this . dropTable ( this . migrationContext . GetChangelogTableName ( ) )
}
2016-05-03 12:55:17 +03:00
// DropOldTable drops the _Old table on the applier host
func ( this * Applier ) DropOldTable ( ) error {
return this . dropTable ( this . migrationContext . GetOldTableName ( ) )
}
2016-04-11 17:27:16 +02:00
// DropGhostTable drops the ghost table on the applier host
func ( this * Applier ) DropGhostTable ( ) error {
return this . dropTable ( this . migrationContext . GetGhostTableName ( ) )
}
2016-04-07 15:57:12 +02:00
// WriteChangelog writes a value to the changelog table.
// It returns the hint as given, for convenience
func ( this * Applier ) WriteChangelog ( hint , value string ) ( string , error ) {
2016-04-14 13:37:56 +02:00
explicitId := 0
switch hint {
case "heartbeat" :
explicitId = 1
case "state" :
explicitId = 2
case "throttle" :
explicitId = 3
}
2016-04-07 15:57:12 +02:00
query := fmt . Sprintf ( `
2016-05-16 11:09:17 +02:00
insert /* gh-ost */ into % s . % s
2016-04-07 15:57:12 +02:00
( id , hint , value )
values
2016-04-14 13:37:56 +02:00
( NULLIF ( ? , 0 ) , ? , ? )
2016-04-07 15:57:12 +02:00
on duplicate key update
last_update = NOW ( ) ,
value = VALUES ( value )
` ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetChangelogTableName ( ) ) ,
)
2016-04-14 13:37:56 +02:00
_ , err := sqlutils . Exec ( this . db , query , explicitId , hint , value )
2016-04-07 15:57:12 +02:00
return hint , err
}
2016-04-11 17:27:16 +02:00
func ( this * Applier ) WriteAndLogChangelog ( hint , value string ) ( string , error ) {
2016-04-08 14:35:06 +02:00
this . WriteChangelog ( hint , value )
return this . WriteChangelog ( fmt . Sprintf ( "%s at %d" , hint , time . Now ( ) . UnixNano ( ) ) , value )
}
2016-04-11 17:27:16 +02:00
func ( this * Applier ) WriteChangelogState ( value string ) ( string , error ) {
return this . WriteAndLogChangelog ( "state" , value )
}
2016-04-07 15:57:12 +02:00
// InitiateHeartbeat creates a heartbeat cycle, writing to the changelog table.
// This is done asynchronously
2016-04-14 13:37:56 +02:00
func ( this * Applier ) InitiateHeartbeat ( heartbeatIntervalMilliseconds int64 ) {
2016-06-19 17:55:37 +02:00
var numSuccessiveFailures int64
2016-04-14 13:37:56 +02:00
injectHeartbeat := func ( ) error {
2016-04-18 10:57:18 -07:00
if _ , err := this . WriteChangelog ( "heartbeat" , time . Now ( ) . Format ( time . RFC3339Nano ) ) ; err != nil {
2016-04-14 13:37:56 +02:00
numSuccessiveFailures ++
if numSuccessiveFailures > this . migrationContext . MaxRetries ( ) {
return log . Errore ( err )
2016-04-07 15:57:12 +02:00
}
2016-04-14 13:37:56 +02:00
} else {
numSuccessiveFailures = 0
2016-04-07 15:57:12 +02:00
}
2016-04-14 13:37:56 +02:00
return nil
}
injectHeartbeat ( )
heartbeatTick := time . Tick ( time . Duration ( heartbeatIntervalMilliseconds ) * time . Millisecond )
for range heartbeatTick {
// Generally speaking, we would issue a goroutine, but I'd actually rather
// have this blocked rather than spam the master in the event something
// goes wrong
if err := injectHeartbeat ( ) ; err != nil {
return
2016-04-07 15:57:12 +02:00
}
2016-04-14 13:37:56 +02:00
}
2016-04-07 15:57:12 +02:00
}
2016-06-19 17:55:37 +02:00
// ExecuteThrottleQuery executes the `--throttle-query` and returns its results.
2016-06-18 21:12:07 +02:00
func ( this * Applier ) ExecuteThrottleQuery ( ) ( int64 , error ) {
throttleQuery := this . migrationContext . GetThrottleQuery ( )
if throttleQuery == "" {
return 0 , nil
}
var result int64
if err := this . db . QueryRow ( throttleQuery ) . Scan ( & result ) ; err != nil {
return 0 , log . Errore ( err )
}
return result , nil
}
2016-06-19 17:55:37 +02:00
// ReadMigrationMinValues returns the minimum values to be iterated on rowcopy
2016-04-04 18:19:46 +02:00
func ( this * Applier ) ReadMigrationMinValues ( uniqueKey * sql . UniqueKey ) error {
log . Debugf ( "Reading migration range according to key: %s" , uniqueKey . Name )
2016-04-11 17:27:16 +02:00
query , err := sql . BuildUniqueKeyMinValuesPreparedQuery ( this . migrationContext . DatabaseName , this . migrationContext . OriginalTableName , uniqueKey . Columns . Names )
2016-04-04 18:19:46 +02:00
if err != nil {
return err
}
rows , err := this . db . Query ( query )
if err != nil {
return err
}
for rows . Next ( ) {
2016-04-11 17:27:16 +02:00
this . migrationContext . MigrationRangeMinValues = sql . NewColumnValues ( uniqueKey . Len ( ) )
2016-04-04 18:19:46 +02:00
if err = rows . Scan ( this . migrationContext . MigrationRangeMinValues . ValuesPointers ... ) ; err != nil {
return err
}
}
log . Infof ( "Migration min values: [%s]" , this . migrationContext . MigrationRangeMinValues )
return err
}
2016-06-19 17:55:37 +02:00
// ReadMigrationMaxValues returns the maximum values to be iterated on rowcopy
2016-04-04 18:19:46 +02:00
func ( this * Applier ) ReadMigrationMaxValues ( uniqueKey * sql . UniqueKey ) error {
log . Debugf ( "Reading migration range according to key: %s" , uniqueKey . Name )
2016-04-11 17:27:16 +02:00
query , err := sql . BuildUniqueKeyMaxValuesPreparedQuery ( this . migrationContext . DatabaseName , this . migrationContext . OriginalTableName , uniqueKey . Columns . Names )
2016-04-04 18:19:46 +02:00
if err != nil {
return err
}
rows , err := this . db . Query ( query )
if err != nil {
return err
}
for rows . Next ( ) {
2016-04-11 17:27:16 +02:00
this . migrationContext . MigrationRangeMaxValues = sql . NewColumnValues ( uniqueKey . Len ( ) )
2016-04-04 18:19:46 +02:00
if err = rows . Scan ( this . migrationContext . MigrationRangeMaxValues . ValuesPointers ... ) ; err != nil {
return err
}
}
log . Infof ( "Migration max values: [%s]" , this . migrationContext . MigrationRangeMaxValues )
return err
}
2016-06-19 17:55:37 +02:00
// ReadMigrationRangeValues reads min/max values that will be used for rowcopy
2016-04-05 09:14:22 +02:00
func ( this * Applier ) ReadMigrationRangeValues ( ) error {
if err := this . ReadMigrationMinValues ( this . migrationContext . UniqueKey ) ; err != nil {
2016-04-04 18:19:46 +02:00
return err
}
2016-04-05 09:14:22 +02:00
if err := this . ReadMigrationMaxValues ( this . migrationContext . UniqueKey ) ; err != nil {
2016-04-04 18:19:46 +02:00
return err
}
return nil
}
2016-04-08 10:34:44 +02:00
// CalculateNextIterationRangeEndValues reads the next-iteration-range-end unique key values,
// which will be used for copying the next chunk of rows. Ir returns "false" if there is
// no further chunk to work through, i.e. we're past the last chunk and are done with
// itrating the range (and this done with copying row chunks)
func ( this * Applier ) CalculateNextIterationRangeEndValues ( ) ( hasFurtherRange bool , err error ) {
2016-04-05 09:14:22 +02:00
this . migrationContext . MigrationIterationRangeMinValues = this . migrationContext . MigrationIterationRangeMaxValues
2016-04-06 13:05:58 +02:00
if this . migrationContext . MigrationIterationRangeMinValues == nil {
this . migrationContext . MigrationIterationRangeMinValues = this . migrationContext . MigrationRangeMinValues
2016-04-05 09:14:22 +02:00
}
2016-04-05 19:50:49 +02:00
query , explodedArgs , err := sql . BuildUniqueKeyRangeEndPreparedQuery (
this . migrationContext . DatabaseName ,
this . migrationContext . OriginalTableName ,
2016-04-11 17:27:16 +02:00
this . migrationContext . UniqueKey . Columns . Names ,
2016-04-06 13:05:58 +02:00
this . migrationContext . MigrationIterationRangeMinValues . AbstractValues ( ) ,
2016-04-05 19:50:49 +02:00
this . migrationContext . MigrationRangeMaxValues . AbstractValues ( ) ,
2016-06-07 11:59:17 +02:00
atomic . LoadInt64 ( & this . migrationContext . ChunkSize ) ,
2016-05-18 14:53:09 +02:00
this . migrationContext . GetIteration ( ) == 0 ,
2016-04-08 14:35:06 +02:00
fmt . Sprintf ( "iteration:%d" , this . migrationContext . GetIteration ( ) ) ,
2016-04-05 19:50:49 +02:00
)
if err != nil {
2016-04-08 10:34:44 +02:00
return hasFurtherRange , err
2016-04-05 19:50:49 +02:00
}
rows , err := this . db . Query ( query , explodedArgs ... )
2016-04-05 09:14:22 +02:00
if err != nil {
2016-04-08 10:34:44 +02:00
return hasFurtherRange , err
2016-04-05 09:14:22 +02:00
}
2016-04-11 17:27:16 +02:00
iterationRangeMaxValues := sql . NewColumnValues ( this . migrationContext . UniqueKey . Len ( ) )
2016-04-05 09:14:22 +02:00
for rows . Next ( ) {
if err = rows . Scan ( iterationRangeMaxValues . ValuesPointers ... ) ; err != nil {
2016-04-08 10:34:44 +02:00
return hasFurtherRange , err
2016-04-05 09:14:22 +02:00
}
2016-04-08 10:34:44 +02:00
hasFurtherRange = true
2016-04-05 09:14:22 +02:00
}
2016-04-08 10:34:44 +02:00
if ! hasFurtherRange {
2016-04-14 13:37:56 +02:00
log . Debugf ( "Iteration complete: no further range to iterate" )
2016-04-08 10:34:44 +02:00
return hasFurtherRange , nil
2016-04-05 09:14:22 +02:00
}
this . migrationContext . MigrationIterationRangeMaxValues = iterationRangeMaxValues
2016-04-08 10:34:44 +02:00
return hasFurtherRange , nil
2016-04-06 13:05:58 +02:00
}
2016-06-19 17:55:37 +02:00
// ApplyIterationInsertQuery issues a chunk-INSERT query on the ghost table. It is where
// data actually gets copied from original table.
2016-04-08 10:34:44 +02:00
func ( this * Applier ) ApplyIterationInsertQuery ( ) ( chunkSize int64 , rowsAffected int64 , duration time . Duration , err error ) {
startTime := time . Now ( )
chunkSize = atomic . LoadInt64 ( & this . migrationContext . ChunkSize )
2016-04-06 13:05:58 +02:00
query , explodedArgs , err := sql . BuildRangeInsertPreparedQuery (
this . migrationContext . DatabaseName ,
this . migrationContext . OriginalTableName ,
this . migrationContext . GetGhostTableName ( ) ,
2016-04-11 17:27:16 +02:00
this . migrationContext . SharedColumns . Names ,
2016-06-17 08:03:18 +02:00
this . migrationContext . MappedSharedColumns . Names ,
2016-04-06 13:05:58 +02:00
this . migrationContext . UniqueKey . Name ,
2016-04-11 17:27:16 +02:00
this . migrationContext . UniqueKey . Columns . Names ,
2016-04-06 13:05:58 +02:00
this . migrationContext . MigrationIterationRangeMinValues . AbstractValues ( ) ,
this . migrationContext . MigrationIterationRangeMaxValues . AbstractValues ( ) ,
2016-04-08 14:35:06 +02:00
this . migrationContext . GetIteration ( ) == 0 ,
2016-04-08 10:34:44 +02:00
this . migrationContext . IsTransactionalTable ( ) ,
2016-04-06 13:05:58 +02:00
)
if err != nil {
2016-04-08 10:34:44 +02:00
return chunkSize , rowsAffected , duration , err
2016-04-06 13:05:58 +02:00
}
2016-04-08 10:34:44 +02:00
sqlResult , err := sqlutils . Exec ( this . db , query , explodedArgs ... )
if err != nil {
return chunkSize , rowsAffected , duration , err
2016-04-06 13:05:58 +02:00
}
2016-04-08 10:34:44 +02:00
rowsAffected , _ = sqlResult . RowsAffected ( )
duration = time . Now ( ) . Sub ( startTime )
2016-04-06 13:05:58 +02:00
log . Debugf (
"Issued INSERT on range: [%s]..[%s]; iteration: %d; chunk-size: %d" ,
this . migrationContext . MigrationIterationRangeMinValues ,
this . migrationContext . MigrationIterationRangeMaxValues ,
2016-04-08 14:35:06 +02:00
this . migrationContext . GetIteration ( ) ,
2016-04-08 10:34:44 +02:00
chunkSize )
return chunkSize , rowsAffected , duration , nil
2016-04-05 09:14:22 +02:00
}
2016-06-14 08:35:07 +02:00
// LockOriginalTable places a write lock on the original table
func ( this * Applier ) LockOriginalTable ( ) error {
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` lock /* gh-ost */ tables %s.%s write ` ,
2016-04-08 10:34:44 +02:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
)
2016-06-14 08:35:07 +02:00
log . Infof ( "Locking %s.%s" ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
)
2016-04-18 10:57:18 -07:00
this . migrationContext . LockTablesStartTime = time . Now ( )
if _ , err := sqlutils . ExecNoPrepare ( this . singletonDB , query ) ; err != nil {
2016-04-04 18:19:46 +02:00
return err
}
2016-06-14 08:35:07 +02:00
log . Infof ( "Table locked" )
2016-04-08 10:34:44 +02:00
return nil
}
2016-04-04 18:19:46 +02:00
2016-06-19 17:55:37 +02:00
// UnlockTables makes tea. No wait, it unlocks tables.
2016-04-08 10:34:44 +02:00
func ( this * Applier ) UnlockTables ( ) error {
2016-05-16 11:09:17 +02:00
query := ` unlock /* gh-ost */ tables `
2016-04-08 10:34:44 +02:00
log . Infof ( "Unlocking tables" )
2016-04-18 10:57:18 -07:00
if _ , err := sqlutils . ExecNoPrepare ( this . singletonDB , query ) ; err != nil {
2016-04-04 18:19:46 +02:00
return err
}
2016-04-08 10:34:44 +02:00
log . Infof ( "Tables unlocked" )
2016-04-04 18:19:46 +02:00
return nil
}
2016-04-08 14:35:06 +02:00
2016-06-19 17:55:37 +02:00
// SwapTablesQuickAndBumpy issues a two-step swap table operation:
// - rename original table to _old
// - rename ghost table to original
// There is a point in time in between where the table does not exist.
2016-04-22 13:41:20 -07:00
func ( this * Applier ) SwapTablesQuickAndBumpy ( ) error {
2016-05-16 11:09:17 +02:00
query := fmt . Sprintf ( ` alter /* gh-ost */ table %s.%s rename %s ` ,
2016-04-18 10:57:18 -07:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) ,
)
log . Infof ( "Renaming original table" )
this . migrationContext . RenameTablesStartTime = time . Now ( )
if _ , err := sqlutils . ExecNoPrepare ( this . singletonDB , query ) ; err != nil {
return err
}
2016-05-16 11:09:17 +02:00
query = fmt . Sprintf ( ` alter /* gh-ost */ table %s.%s rename %s ` ,
2016-04-18 10:57:18 -07:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
)
log . Infof ( "Renaming ghost table" )
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
this . migrationContext . RenameTablesEndTime = time . Now ( )
log . Infof ( "Tables renamed" )
return nil
}
2016-06-19 17:55:37 +02:00
// RenameTablesRollback renames back both table: original back to ghost,
// _old back to original. This is used by `--test-on-replica`
2016-06-14 09:01:06 +02:00
func ( this * Applier ) RenameTablesRollback ( ) ( renameError error ) {
// Restoring tables to original names.
// We prefer the single, atomic operation:
query := fmt . Sprintf ( ` rename /* gh-ost */ table %s.%s to %s.%s, %s.%s to %s.%s ` ,
2016-04-22 13:41:20 -07:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
2016-06-14 09:01:06 +02:00
sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
2016-04-22 13:41:20 -07:00
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
)
2016-06-14 09:01:06 +02:00
log . Infof ( "Renaming back both tables" )
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err == nil {
return nil
2016-04-22 13:41:20 -07:00
}
2016-06-14 09:01:06 +02:00
// But, if for some reason the above was impossible to do, we rename one by one.
query = fmt . Sprintf ( ` rename /* gh-ost */ table %s.%s to %s.%s ` ,
2016-06-10 11:15:11 +02:00
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) ,
)
log . Infof ( "Renaming back to ghost table" )
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
renameError = err
}
query = fmt . Sprintf ( ` rename /* gh-ost */ table %s.%s to %s.%s ` ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
)
log . Infof ( "Renaming back to original table" )
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
renameError = err
}
return log . Errore ( renameError )
}
2016-04-22 19:46:34 -07:00
// StopSlaveIOThread is applicable with --test-on-replica; it stops the IO thread, duh.
// We need to keep the SQL thread active so as to complete processing received events,
2016-06-14 09:01:06 +02:00
// and have them written to the binary log, so that we can then read them via streamer.
2016-04-18 10:57:18 -07:00
func ( this * Applier ) StopSlaveIOThread ( ) error {
2016-05-16 11:09:17 +02:00
query := ` stop /* gh-ost */ slave io_thread `
2016-04-18 10:57:18 -07:00
log . Infof ( "Stopping replication" )
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
log . Infof ( "Replication stopped" )
return nil
}
2016-06-14 12:50:07 +02:00
// StartSlaveSQLThread is applicable with --test-on-replica
func ( this * Applier ) StopSlaveSQLThread ( ) error {
query := ` stop /* gh-ost */ slave sql_thread `
log . Infof ( "Verifying SQL thread is stopped" )
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
log . Infof ( "SQL thread stopped" )
return nil
}
2016-05-20 12:52:14 +02:00
// StartSlaveSQLThread is applicable with --test-on-replica
func ( this * Applier ) StartSlaveSQLThread ( ) error {
query := ` start /* gh-ost */ slave sql_thread `
log . Infof ( "Verifying SQL thread is running" )
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
log . Infof ( "SQL thread started" )
return nil
}
2016-06-19 17:55:37 +02:00
// StopReplication is used by `--test-on-replica` and stops replication.
func ( this * Applier ) StopReplication ( ) error {
2016-05-16 11:03:15 +02:00
if err := this . StopSlaveIOThread ( ) ; err != nil {
return err
}
2016-06-14 12:50:07 +02:00
if err := this . StopSlaveSQLThread ( ) ; err != nil {
2016-05-20 12:52:14 +02:00
return err
}
2016-05-19 15:11:36 +02:00
readBinlogCoordinates , executeBinlogCoordinates , err := mysql . GetReplicationBinlogCoordinates ( this . db )
2016-05-16 11:03:15 +02:00
if err != nil {
return err
}
2016-05-19 15:11:36 +02:00
log . Infof ( "Replication IO thread at %+v. SQL thread is at %+v" , * readBinlogCoordinates , * executeBinlogCoordinates )
2016-05-16 11:03:15 +02:00
return nil
}
2016-06-19 17:55:37 +02:00
// GetSessionLockName returns a name for the special hint session voluntary lock
2016-06-14 08:35:07 +02:00
func ( this * Applier ) GetSessionLockName ( sessionId int64 ) string {
return fmt . Sprintf ( "gh-ost.%d.lock" , sessionId )
}
2016-06-19 17:55:37 +02:00
// ExpectUsedLock expects the special hint voluntary lock to exist on given session
2016-06-14 08:35:07 +02:00
func ( this * Applier ) ExpectUsedLock ( sessionId int64 ) error {
var result int64
query := ` select is_used_lock(?) `
lockName := this . GetSessionLockName ( sessionId )
log . Infof ( "Checking session lock: %s" , lockName )
if err := this . db . QueryRow ( query , lockName ) . Scan ( & result ) ; err != nil || result != sessionId {
return fmt . Errorf ( "Session lock %s expected to be found but wasn't" , lockName )
}
return nil
}
2016-06-19 17:55:37 +02:00
// ExpectProcess expects a process to show up in `SHOW PROCESSLIST` that has given characteristics
2016-04-22 19:46:34 -07:00
func ( this * Applier ) ExpectProcess ( sessionId int64 , stateHint , infoHint string ) error {
found := false
query := `
select id
from information_schema . processlist
where
id != connection_id ( )
and ? in ( 0 , id )
and state like concat ( '%' , ? , '%' )
and info like concat ( '%' , ? , '%' )
`
err := sqlutils . QueryRowsMap ( this . db , query , func ( m sqlutils . RowMap ) error {
found = true
return nil
} , sessionId , stateHint , infoHint )
if err != nil {
return err
}
if ! found {
return fmt . Errorf ( "Cannot find process. Hints: %s, %s" , stateHint , infoHint )
}
return nil
}
2016-06-27 11:08:06 +02:00
// DropAtomicCutOverSentryTableIfExists checks if the "old" table name
// happens to be a cut-over magic table; if so, it drops it.
func ( this * Applier ) DropAtomicCutOverSentryTableIfExists ( ) error {
log . Infof ( "Looking for magic cut-over table" )
tableName := this . migrationContext . GetOldTableName ( )
rowMap := this . showTableStatus ( tableName )
if rowMap == nil {
// Table does not exist
return nil
}
if rowMap [ "Comment" ] . String != atomicCutOverMagicHint {
return fmt . Errorf ( "Expected magic comment on %s, did not find it" , tableName )
}
log . Infof ( "Dropping magic cut-over table" )
return this . dropTable ( tableName )
}
// DropAtomicCutOverSentryTableIfExists checks if the "old" table name
// happens to be a cut-over magic table; if so, it drops it.
func ( this * Applier ) CreateAtomicCutOverSentryTable ( ) error {
if err := this . DropAtomicCutOverSentryTableIfExists ( ) ; err != nil {
return err
}
tableName := this . migrationContext . GetOldTableName ( )
query := fmt . Sprintf ( ` create /* gh-ost */ table % s . % s (
id int auto_increment primary key
) comment = ' % s '
` ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( tableName ) ,
atomicCutOverMagicHint ,
)
log . Infof ( "Creating magic cut-over table %s.%s" ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( tableName ) ,
)
if _ , err := sqlutils . ExecNoPrepare ( this . db , query ) ; err != nil {
return err
}
log . Infof ( "Magic cut-over table created" )
return nil
}
// AtomicCutOverMagicLock
func ( this * Applier ) AtomicCutOverMagicLock ( sessionIdChan chan int64 , tableLocked chan <- error , okToUnlockTable <- chan bool , tableUnlocked chan <- error ) error {
tx , err := this . db . Begin ( )
if err != nil {
tableLocked <- err
return err
}
defer func ( ) {
sessionIdChan <- - 1
tableLocked <- fmt . Errorf ( "Unexpected error in AtomicCutOverMagicLock(), injected to release blocking channel reads" )
tableUnlocked <- fmt . Errorf ( "Unexpected error in AtomicCutOverMagicLock(), injected to release blocking channel reads" )
tx . Rollback ( )
} ( )
var sessionId int64
if err := tx . QueryRow ( ` select connection_id() ` ) . Scan ( & sessionId ) ; err != nil {
tableLocked <- err
return err
}
sessionIdChan <- sessionId
lockResult := 0
query := ` select get_lock(?, 0) `
lockName := this . GetSessionLockName ( sessionId )
log . Infof ( "Grabbing voluntary lock: %s" , lockName )
if err := tx . QueryRow ( query , lockName ) . Scan ( & lockResult ) ; err != nil || lockResult != 1 {
err := fmt . Errorf ( "Unable to acquire lock %s" , lockName )
tableLocked <- err
return err
}
2016-07-08 10:14:58 +02:00
tableLockTimeoutSeconds := this . migrationContext . CutOverLockTimeoutSeconds * 2
2016-06-27 11:08:06 +02:00
log . Infof ( "Setting LOCK timeout as %d seconds" , tableLockTimeoutSeconds )
query = fmt . Sprintf ( ` set session lock_wait_timeout:=%d ` , tableLockTimeoutSeconds )
if _ , err := tx . Exec ( query ) ; err != nil {
tableLocked <- err
return err
}
if err := this . CreateAtomicCutOverSentryTable ( ) ; err != nil {
tableLocked <- err
return err
}
query = fmt . Sprintf ( ` lock /* gh-ost */ tables %s.%s write, %s.%s write ` ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) ,
)
log . Infof ( "Locking %s.%s, %s.%s" ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) ,
)
this . migrationContext . LockTablesStartTime = time . Now ( )
if _ , err := tx . Exec ( query ) ; err != nil {
tableLocked <- err
return err
}
log . Infof ( "Tables locked" )
tableLocked <- nil // No error.
// From this point on, we are committed to UNLOCK TABLES. No matter what happens,
// the UNLOCK must execute (or, alternatively, this connection dies, which gets the same impact)
// The cut-over phase will proceed to apply remaining backlog onto ghost table,
// and issue RENAME. We wait here until told to proceed.
<- okToUnlockTable
log . Infof ( "Will now proceed to drop magic table and unlock tables" )
// The magic table is here because we locked it. And we are the only ones allowed to drop it.
// And in fact, we will:
log . Infof ( "Dropping magic cut-over table" )
query = fmt . Sprintf ( ` drop /* gh-ost */ table if exists %s.%s ` ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) ,
)
if _ , err := tx . Exec ( query ) ; err != nil {
log . Errore ( err )
// We DO NOT return here because we must `UNLOCK TABLES`!
}
// Tables still locked
log . Infof ( "Releasing lock from %s.%s, %s.%s" ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) ,
)
query = ` unlock tables `
if _ , err := tx . Exec ( query ) ; err != nil {
tableUnlocked <- err
return log . Errore ( err )
}
log . Infof ( "Tables unlocked" )
tableUnlocked <- nil
return nil
}
2016-07-16 08:12:19 -06:00
// AtomicCutoverRename
2016-06-27 11:08:06 +02:00
func ( this * Applier ) AtomicCutoverRename ( sessionIdChan chan int64 , tablesRenamed chan <- error ) error {
tx , err := this . db . Begin ( )
if err != nil {
return err
}
defer func ( ) {
tx . Rollback ( )
sessionIdChan <- - 1
tablesRenamed <- fmt . Errorf ( "Unexpected error in AtomicCutoverRename(), injected to release blocking channel reads" )
} ( )
var sessionId int64
if err := tx . QueryRow ( ` select connection_id() ` ) . Scan ( & sessionId ) ; err != nil {
return err
}
sessionIdChan <- sessionId
2016-07-08 10:14:58 +02:00
log . Infof ( "Setting RENAME timeout as %d seconds" , this . migrationContext . CutOverLockTimeoutSeconds )
query := fmt . Sprintf ( ` set session lock_wait_timeout:=%d ` , this . migrationContext . CutOverLockTimeoutSeconds )
2016-06-27 11:08:06 +02:00
if _ , err := tx . Exec ( query ) ; err != nil {
return err
}
query = fmt . Sprintf ( ` rename /* gh-ost */ table %s.%s to %s.%s, %s.%s to %s.%s ` ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetOldTableName ( ) ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . GetGhostTableName ( ) ) ,
sql . EscapeName ( this . migrationContext . DatabaseName ) ,
sql . EscapeName ( this . migrationContext . OriginalTableName ) ,
)
log . Infof ( "Issuing and expecting this to block: %s" , query )
if _ , err := tx . Exec ( query ) ; err != nil {
tablesRenamed <- err
return log . Errore ( err )
}
tablesRenamed <- nil
log . Infof ( "Tables renamed" )
return nil
}
2016-04-08 14:35:06 +02:00
func ( this * Applier ) ShowStatusVariable ( variableName string ) ( result int64 , err error ) {
query := fmt . Sprintf ( ` show global status like '%s' ` , variableName )
if err := this . db . QueryRow ( query ) . Scan ( & variableName , & result ) ; err != nil {
return 0 , err
}
return result , nil
}
2016-04-11 17:27:16 +02:00
2016-06-19 17:55:37 +02:00
// buildDMLEventQuery creates a query to operate on the ghost table, based on an intercepted binlog
// event entry on the original table.
2016-05-04 08:23:34 +03:00
func ( this * Applier ) buildDMLEventQuery ( dmlEvent * binlog . BinlogDMLEvent ) ( query string , args [ ] interface { } , rowsDelta int64 , err error ) {
2016-04-11 17:27:16 +02:00
switch dmlEvent . DML {
case binlog . DeleteDML :
{
2016-04-14 13:37:56 +02:00
query , uniqueKeyArgs , err := sql . BuildDMLDeleteQuery ( dmlEvent . DatabaseName , this . migrationContext . GetGhostTableName ( ) , this . migrationContext . OriginalTableColumns , & this . migrationContext . UniqueKey . Columns , dmlEvent . WhereColumnValues . AbstractValues ( ) )
2016-05-04 08:23:34 +03:00
return query , uniqueKeyArgs , - 1 , err
2016-04-14 13:37:56 +02:00
}
case binlog . InsertDML :
{
2016-06-17 08:03:18 +02:00
query , sharedArgs , err := sql . BuildDMLInsertQuery ( dmlEvent . DatabaseName , this . migrationContext . GetGhostTableName ( ) , this . migrationContext . OriginalTableColumns , this . migrationContext . MappedSharedColumns , dmlEvent . NewColumnValues . AbstractValues ( ) )
2016-05-04 08:23:34 +03:00
return query , sharedArgs , 1 , err
2016-04-14 13:37:56 +02:00
}
case binlog . UpdateDML :
{
2016-06-17 08:03:18 +02:00
query , sharedArgs , uniqueKeyArgs , err := sql . BuildDMLUpdateQuery ( dmlEvent . DatabaseName , this . migrationContext . GetGhostTableName ( ) , this . migrationContext . OriginalTableColumns , this . migrationContext . MappedSharedColumns , & this . migrationContext . UniqueKey . Columns , dmlEvent . NewColumnValues . AbstractValues ( ) , dmlEvent . WhereColumnValues . AbstractValues ( ) )
2016-04-14 13:37:56 +02:00
args = append ( args , sharedArgs ... )
args = append ( args , uniqueKeyArgs ... )
2016-05-04 08:23:34 +03:00
return query , args , 0 , err
2016-04-11 17:27:16 +02:00
}
}
2016-05-04 08:23:34 +03:00
return "" , args , 0 , fmt . Errorf ( "Unknown dml event type: %+v" , dmlEvent . DML )
2016-04-14 13:37:56 +02:00
}
2016-06-19 17:55:37 +02:00
// ApplyDMLEventQuery writes an entry to the ghost table, in response to an intercepted
// original-table binlog event
2016-04-14 13:37:56 +02:00
func ( this * Applier ) ApplyDMLEventQuery ( dmlEvent * binlog . BinlogDMLEvent ) error {
2016-05-04 08:23:34 +03:00
query , args , rowDelta , err := this . buildDMLEventQuery ( dmlEvent )
2016-04-14 13:37:56 +02:00
if err != nil {
return err
}
_ , err = sqlutils . Exec ( this . db , query , args ... )
2016-04-19 04:25:32 -07:00
if err == nil {
atomic . AddInt64 ( & this . migrationContext . TotalDMLEventsApplied , 1 )
}
2016-05-04 08:23:34 +03:00
if this . migrationContext . CountTableRows {
atomic . AddInt64 ( & this . migrationContext . RowsEstimate , rowDelta )
}
2016-04-14 13:37:56 +02:00
return err
2016-04-11 17:27:16 +02:00
}