2016-06-07 09:59:17 +00:00
|
|
|
/*
|
|
|
|
Copyright 2016 GitHub Inc.
|
|
|
|
See https://github.com/github/gh-ost/blob/master/LICENSE
|
|
|
|
*/
|
|
|
|
|
|
|
|
package logic
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bufio"
|
|
|
|
"fmt"
|
2016-09-12 10:38:14 +00:00
|
|
|
"io"
|
2016-06-07 09:59:17 +00:00
|
|
|
"net"
|
|
|
|
"os"
|
2016-09-12 10:38:14 +00:00
|
|
|
"strconv"
|
|
|
|
"strings"
|
|
|
|
"sync/atomic"
|
2016-06-07 09:59:17 +00:00
|
|
|
|
|
|
|
"github.com/github/gh-ost/go/base"
|
|
|
|
"github.com/outbrain/golib/log"
|
|
|
|
)
|
|
|
|
|
2016-09-12 10:38:14 +00:00
|
|
|
// printStatusFunc is the callback the server invokes to write a status report:
// it receives the rule selected by the interactive command and the writer
// wrapping the client connection.
type printStatusFunc func(PrintStatusRule, io.Writer)
|
2016-06-07 09:59:17 +00:00
|
|
|
|
|
|
|
// Server listens for requests on a socket file or via TCP
|
|
|
|
type Server struct {
|
|
|
|
migrationContext *base.MigrationContext
|
|
|
|
unixListener net.Listener
|
|
|
|
tcpListener net.Listener
|
2016-09-12 10:38:14 +00:00
|
|
|
hooksExecutor *HooksExecutor
|
|
|
|
printStatus printStatusFunc
|
2016-12-18 07:23:51 +00:00
|
|
|
panicAbort chan error
|
2016-06-07 09:59:17 +00:00
|
|
|
}
|
|
|
|
|
2016-12-18 07:23:51 +00:00
|
|
|
func NewServer(hooksExecutor *HooksExecutor, printStatus printStatusFunc, panicAbort chan error) *Server {
|
2016-06-07 09:59:17 +00:00
|
|
|
return &Server{
|
|
|
|
migrationContext: base.GetMigrationContext(),
|
2016-09-12 10:38:14 +00:00
|
|
|
hooksExecutor: hooksExecutor,
|
|
|
|
printStatus: printStatus,
|
2016-12-18 07:23:51 +00:00
|
|
|
panicAbort: panicAbort,
|
2016-06-07 09:59:17 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (this *Server) BindSocketFile() (err error) {
|
|
|
|
if this.migrationContext.ServeSocketFile == "" {
|
|
|
|
return nil
|
|
|
|
}
|
2016-07-22 15:34:18 +00:00
|
|
|
if this.migrationContext.DropServeSocket && base.FileExists(this.migrationContext.ServeSocketFile) {
|
2016-06-07 09:59:17 +00:00
|
|
|
os.Remove(this.migrationContext.ServeSocketFile)
|
|
|
|
}
|
|
|
|
this.unixListener, err = net.Listen("unix", this.migrationContext.ServeSocketFile)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
log.Infof("Listening on unix socket file: %s", this.migrationContext.ServeSocketFile)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-08-11 07:01:14 +00:00
|
|
|
func (this *Server) RemoveSocketFile() (err error) {
|
2016-08-11 07:03:39 +00:00
|
|
|
log.Infof("Removing socket file: %s", this.migrationContext.ServeSocketFile)
|
2016-08-11 07:01:14 +00:00
|
|
|
return os.Remove(this.migrationContext.ServeSocketFile)
|
|
|
|
}
|
|
|
|
|
2016-06-07 09:59:17 +00:00
|
|
|
func (this *Server) BindTCPPort() (err error) {
|
|
|
|
if this.migrationContext.ServeTCPPort == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
this.tcpListener, err = net.Listen("tcp", fmt.Sprintf(":%d", this.migrationContext.ServeTCPPort))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
log.Infof("Listening on tcp port: %d", this.migrationContext.ServeTCPPort)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-06-19 15:55:37 +00:00
|
|
|
// Serve begins listening & serving on whichever device was configured
|
2016-06-07 09:59:17 +00:00
|
|
|
func (this *Server) Serve() (err error) {
|
|
|
|
go func() {
|
|
|
|
for {
|
|
|
|
conn, err := this.unixListener.Accept()
|
|
|
|
if err != nil {
|
|
|
|
log.Errore(err)
|
|
|
|
}
|
|
|
|
go this.handleConnection(conn)
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
go func() {
|
2016-06-07 12:24:30 +00:00
|
|
|
if this.tcpListener == nil {
|
|
|
|
return
|
|
|
|
}
|
2016-06-07 09:59:17 +00:00
|
|
|
for {
|
|
|
|
conn, err := this.tcpListener.Accept()
|
|
|
|
if err != nil {
|
|
|
|
log.Errore(err)
|
|
|
|
}
|
|
|
|
go this.handleConnection(conn)
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (this *Server) handleConnection(conn net.Conn) (err error) {
|
|
|
|
defer conn.Close()
|
|
|
|
command, _, err := bufio.NewReader(conn).ReadLine()
|
2016-09-12 10:38:14 +00:00
|
|
|
return this.onServerCommand(string(command), bufio.NewWriter(conn))
|
|
|
|
}
|
|
|
|
|
|
|
|
// onServerCommand responds to a user's interactive command
|
|
|
|
func (this *Server) onServerCommand(command string, writer *bufio.Writer) (err error) {
|
|
|
|
defer writer.Flush()
|
|
|
|
|
|
|
|
printStatusRule, err := this.applyServerCommand(command, writer)
|
|
|
|
if err == nil {
|
|
|
|
this.printStatus(printStatusRule, writer)
|
|
|
|
} else {
|
|
|
|
fmt.Fprintf(writer, "%s\n", err.Error())
|
|
|
|
}
|
|
|
|
return log.Errore(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// applyServerCommand parses and executes commands by user
|
|
|
|
func (this *Server) applyServerCommand(command string, writer *bufio.Writer) (printStatusRule PrintStatusRule, err error) {
|
|
|
|
printStatusRule = NoPrintStatusRule
|
|
|
|
|
|
|
|
tokens := strings.SplitN(command, "=", 2)
|
|
|
|
command = strings.TrimSpace(tokens[0])
|
|
|
|
arg := ""
|
|
|
|
if len(tokens) > 1 {
|
|
|
|
arg = strings.TrimSpace(tokens[1])
|
|
|
|
}
|
|
|
|
|
|
|
|
throttleHint := "# Note: you may only throttle for as long as your binary logs are not purged\n"
|
|
|
|
|
|
|
|
if err := this.hooksExecutor.onInteractiveCommand(command); err != nil {
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
}
|
|
|
|
|
|
|
|
switch command {
|
|
|
|
case "help":
|
|
|
|
{
|
|
|
|
fmt.Fprintln(writer, `available commands:
|
|
|
|
status # Print a detailed status message
|
|
|
|
sup # Print a short status message
|
|
|
|
chunk-size=<newsize> # Set a new chunk-size
|
|
|
|
nice-ratio=<ratio> # Set a new nice-ratio, immediate sleep after each row-copy operation, float (examples: 0 is agrressive, 0.7 adds 70% runtime, 1.0 doubles runtime, 2.0 triples runtime, ...)
|
|
|
|
critical-load=<load> # Set a new set of max-load thresholds
|
|
|
|
max-lag-millis=<max-lag> # Set a new replication lag threshold
|
|
|
|
replication-lag-query=<query> # Set a new query that determines replication lag (no quotes)
|
|
|
|
max-load=<load> # Set a new set of max-load thresholds
|
|
|
|
throttle-query=<query> # Set a new throttle-query (no quotes)
|
|
|
|
throttle-control-replicas=<replicas> # Set a new comma delimited list of throttle control replicas
|
|
|
|
throttle # Force throttling
|
|
|
|
no-throttle # End forced throttling (other throttling may still apply)
|
|
|
|
unpostpone # Bail out a cut-over postpone; proceed to cut-over
|
|
|
|
panic # panic and quit without cleanup
|
|
|
|
help # This message
|
|
|
|
`)
|
|
|
|
}
|
|
|
|
case "sup":
|
|
|
|
return ForcePrintStatusOnlyRule, nil
|
|
|
|
case "info", "status":
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
case "chunk-size":
|
|
|
|
{
|
|
|
|
if chunkSize, err := strconv.Atoi(arg); err != nil {
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
} else {
|
|
|
|
this.migrationContext.SetChunkSize(int64(chunkSize))
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
case "max-lag-millis":
|
|
|
|
{
|
|
|
|
if maxLagMillis, err := strconv.Atoi(arg); err != nil {
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
} else {
|
|
|
|
this.migrationContext.SetMaxLagMillisecondsThrottleThreshold(int64(maxLagMillis))
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
case "replication-lag-query":
|
|
|
|
{
|
|
|
|
this.migrationContext.SetReplicationLagQuery(arg)
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
case "nice-ratio":
|
|
|
|
{
|
|
|
|
if niceRatio, err := strconv.ParseFloat(arg, 64); err != nil {
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
} else {
|
|
|
|
this.migrationContext.SetNiceRatio(niceRatio)
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
case "max-load":
|
|
|
|
{
|
|
|
|
if err := this.migrationContext.ReadMaxLoad(arg); err != nil {
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
}
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
case "critical-load":
|
|
|
|
{
|
|
|
|
if err := this.migrationContext.ReadCriticalLoad(arg); err != nil {
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
}
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
case "throttle-query":
|
|
|
|
{
|
|
|
|
this.migrationContext.SetThrottleQuery(arg)
|
|
|
|
fmt.Fprintf(writer, throttleHint)
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
case "throttle-control-replicas":
|
|
|
|
{
|
|
|
|
if err := this.migrationContext.ReadThrottleControlReplicaKeys(arg); err != nil {
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
}
|
|
|
|
fmt.Fprintf(writer, "%s\n", this.migrationContext.GetThrottleControlReplicaKeys().ToCommaDelimitedList())
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
case "throttle", "pause", "suspend":
|
|
|
|
{
|
|
|
|
atomic.StoreInt64(&this.migrationContext.ThrottleCommandedByUser, 1)
|
|
|
|
fmt.Fprintf(writer, throttleHint)
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
case "no-throttle", "unthrottle", "resume", "continue":
|
|
|
|
{
|
|
|
|
atomic.StoreInt64(&this.migrationContext.ThrottleCommandedByUser, 0)
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
case "unpostpone", "no-postpone", "cut-over":
|
|
|
|
{
|
2016-09-12 17:17:36 +00:00
|
|
|
if arg == "" && this.migrationContext.ForceNamedCutOverCommand {
|
|
|
|
err := fmt.Errorf("User commanded 'unpostpone' without specifying table name, but --force-named-cut-over is set")
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
}
|
|
|
|
if arg != "" && arg != this.migrationContext.OriginalTableName {
|
|
|
|
// User exlpicitly provided table name. This is a courtesy protection mechanism
|
|
|
|
err := fmt.Errorf("User commanded 'unpostpone' on %s, but migrated table is %s; ingoring request.", arg, this.migrationContext.OriginalTableName)
|
|
|
|
return NoPrintStatusRule, err
|
2016-09-12 10:38:14 +00:00
|
|
|
}
|
|
|
|
if atomic.LoadInt64(&this.migrationContext.IsPostponingCutOver) > 0 {
|
|
|
|
atomic.StoreInt64(&this.migrationContext.UserCommandedUnpostponeFlag, 1)
|
|
|
|
fmt.Fprintf(writer, "Unpostponed\n")
|
|
|
|
return ForcePrintStatusAndHintRule, nil
|
|
|
|
}
|
|
|
|
fmt.Fprintf(writer, "You may only invoke this when gh-ost is actively postponing migration. At this time it is not.\n")
|
|
|
|
return NoPrintStatusRule, nil
|
|
|
|
}
|
|
|
|
case "panic":
|
|
|
|
{
|
|
|
|
err := fmt.Errorf("User commanded 'panic'. I will now panic, without cleanup. PANIC!")
|
2016-12-18 07:23:51 +00:00
|
|
|
this.panicAbort <- err
|
2016-09-12 10:38:14 +00:00
|
|
|
return NoPrintStatusRule, err
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
err = fmt.Errorf("Unknown command: %s", command)
|
|
|
|
return NoPrintStatusRule, err
|
|
|
|
}
|
|
|
|
return NoPrintStatusRule, nil
|
2016-06-07 09:59:17 +00:00
|
|
|
}
|