tile38/internal/server/follow.go

360 lines
7.9 KiB
Go
Raw Normal View History

package server
2016-03-05 02:08:16 +03:00
import (
"errors"
"fmt"
"io"
"strconv"
"strings"
"time"
2016-04-01 02:26:36 +03:00
"github.com/tidwall/resp"
"github.com/tidwall/tile38/internal/log"
2016-03-05 02:08:16 +03:00
)
// errNoLongerFollowing is the sentinel returned by followStep and
// followHandleCommand when the server's follow counter no longer matches the
// counter the follow goroutine was started with. The follow loop exits when it
// sees this error.
var errNoLongerFollowing = errors.New("no longer following")
// checksumsz is 512 KiB (524288).
// NOTE(review): not referenced in this part of the file; presumably the size
// in bytes of the AOF region that is checksummed when comparing against the
// leader — confirm against the checksum code.
const checksumsz = 512 * 1024
func (s *Server) cmdFollow(msg *Message) (res resp.Value, err error) {
2016-04-01 02:26:36 +03:00
start := time.Now()
vs := msg.Args[1:]
2016-04-01 02:26:36 +03:00
var ok bool
2016-03-05 02:08:16 +03:00
var host, sport string
2017-10-05 18:20:40 +03:00
2016-04-01 02:26:36 +03:00
if vs, host, ok = tokenval(vs); !ok || host == "" {
return NOMessage, errInvalidNumberOfArguments
2016-03-05 02:08:16 +03:00
}
2016-04-01 02:26:36 +03:00
if vs, sport, ok = tokenval(vs); !ok || sport == "" {
return NOMessage, errInvalidNumberOfArguments
2016-03-05 02:08:16 +03:00
}
2016-04-01 02:26:36 +03:00
if len(vs) != 0 {
return NOMessage, errInvalidNumberOfArguments
2016-03-05 02:08:16 +03:00
}
host = strings.ToLower(host)
sport = strings.ToLower(sport)
var update bool
if host == "no" && sport == "one" {
update = s.config.followHost() != "" || s.config.followPort() != 0
s.config.setFollowHost("")
s.config.setFollowPort(0)
2016-03-05 02:08:16 +03:00
} else {
n, err := strconv.ParseUint(sport, 10, 64)
if err != nil {
return NOMessage, errInvalidArgument(sport)
2016-03-05 02:08:16 +03:00
}
port := int(n)
update = s.config.followHost() != host || s.config.followPort() != port
auth := s.config.leaderAuth()
2016-03-05 02:08:16 +03:00
if update {
s.mu.Unlock()
2016-04-01 02:26:36 +03:00
conn, err := DialTimeout(fmt.Sprintf("%s:%d", host, port), time.Second*2)
2016-03-05 02:08:16 +03:00
if err != nil {
s.mu.Lock()
return NOMessage, fmt.Errorf("cannot follow: %v", err)
2016-03-05 02:08:16 +03:00
}
defer conn.Close()
2016-03-08 18:35:43 +03:00
if auth != "" {
if err := s.followDoLeaderAuth(conn, auth); err != nil {
return NOMessage, fmt.Errorf("cannot follow: %v", err)
2016-03-08 18:35:43 +03:00
}
}
2016-04-01 02:26:36 +03:00
m, err := doServer(conn)
2016-03-05 02:08:16 +03:00
if err != nil {
s.mu.Lock()
return NOMessage, fmt.Errorf("cannot follow: %v", err)
2016-03-05 02:08:16 +03:00
}
2016-04-01 02:26:36 +03:00
if m["id"] == "" {
s.mu.Lock()
return NOMessage, fmt.Errorf("cannot follow: invalid id")
2016-03-05 02:08:16 +03:00
}
if m["id"] == s.config.serverID() {
s.mu.Lock()
return NOMessage, fmt.Errorf("cannot follow self")
2016-04-01 02:26:36 +03:00
}
if m["following"] != "" {
s.mu.Lock()
return NOMessage, fmt.Errorf("cannot follow a follower")
2016-03-05 02:08:16 +03:00
}
s.mu.Lock()
2016-03-05 02:08:16 +03:00
}
s.config.setFollowHost(host)
s.config.setFollowPort(port)
2016-03-05 02:08:16 +03:00
}
s.config.write(false)
2016-03-05 02:08:16 +03:00
if update {
s.followc.Add(1)
if s.config.followHost() != "" {
2016-03-05 02:08:16 +03:00
log.Infof("following new host '%s' '%s'.", host, sport)
go s.follow(s.config.followHost(), s.config.followPort(),
int(s.followc.Load()))
2016-03-05 02:08:16 +03:00
} else {
log.Infof("following no one")
}
}
return OKMessage(msg, start), nil
2016-04-01 02:26:36 +03:00
}
// cmdReplConf handles the REPLCONF command, which a follower uses to announce
// its replication settings. Two sub-commands are recognised:
//
//	listening-port <int>  stores the value in the matching client's replPort
//	ip-address <string>   stores the value in the matching client's replAddr
//
// The target is the entry in s.conns whose remoteAddr equals that of the
// calling client. If no entry matches, or the sub-command is not recognised,
// the error "cannot find follower" is returned.
func (s *Server) cmdReplConf(msg *Message, client *Client) (res resp.Value, err error) {
	start := time.Now()
	args := msg.Args[1:]

	var (
		ok          bool
		name, value string
	)
	if args, name, ok = tokenval(args); !ok || name == "" {
		return NOMessage, errInvalidNumberOfArguments
	}
	if _, value, ok = tokenval(args); !ok || value == "" {
		return NOMessage, errInvalidNumberOfArguments
	}

	// Validate the sub-command and its value before touching any connection.
	var port int
	setPort := false
	switch name {
	case "listening-port":
		n, convErr := strconv.Atoi(value)
		if convErr != nil {
			return NOMessage, errInvalidArgument(value)
		}
		port, setPort = n, true
	case "ip-address":
		// The value is stored verbatim.
	default:
		return NOMessage, fmt.Errorf("cannot find follower")
	}

	// Find the connection that belongs to the caller and record the setting.
	s.connsmu.RLock()
	defer s.connsmu.RUnlock()
	for _, c := range s.conns {
		if c.remoteAddr != client.remoteAddr {
			continue
		}
		c.mu.Lock()
		if setPort {
			c.replPort = port
		} else {
			c.replAddr = value
		}
		c.mu.Unlock()
		return OKMessage(msg, start), nil
	}
	return NOMessage, fmt.Errorf("cannot find follower")
}
func doServer(conn *RESPConn) (map[string]string, error) {
2016-04-01 02:26:36 +03:00
v, err := conn.Do("server")
if err != nil {
return nil, err
}
if v.Error() != nil {
return nil, v.Error()
}
arr := v.Array()
m := make(map[string]string)
for i := 0; i < len(arr)/2; i++ {
m[arr[i*2+0].String()] = arr[i*2+1].String()
}
return m, err
2016-03-05 02:08:16 +03:00
}
func (s *Server) followHandleCommand(args []string, followc int, w io.Writer) (int, error) {
s.mu.Lock()
defer s.mu.Unlock()
if int(s.followc.Load()) != followc {
return s.aofsz, errNoLongerFollowing
2016-04-01 02:26:36 +03:00
}
msg := &Message{Args: args}
_, d, err := s.command(msg, nil)
2016-04-01 02:26:36 +03:00
if err != nil {
if commandErrIsFatal(err) {
return s.aofsz, err
2016-04-01 02:26:36 +03:00
}
}
if err := s.writeAOF(args, &d); err != nil {
return s.aofsz, err
2016-04-01 02:26:36 +03:00
}
if len(s.aofbuf) > 10240 {
s.flushAOF(false)
2018-11-13 22:04:16 +03:00
}
return s.aofsz, nil
2016-03-05 02:08:16 +03:00
}
func (s *Server) followDoLeaderAuth(conn *RESPConn, auth string) error {
2016-04-01 02:26:36 +03:00
v, err := conn.Do("auth", auth)
2016-03-08 18:35:43 +03:00
if err != nil {
return err
}
2016-04-01 02:26:36 +03:00
if v.Error() != nil {
return v.Error()
2016-03-08 18:35:43 +03:00
}
2016-04-01 02:26:36 +03:00
if v.String() != "OK" {
return errors.New("cannot follow: auth no ok")
2016-03-08 18:35:43 +03:00
}
return nil
}
func (s *Server) followStep(host string, port int, followc int) error {
if int(s.followc.Load()) != followc {
2016-03-05 02:08:16 +03:00
return errNoLongerFollowing
}
s.mu.Lock()
2023-05-21 18:22:27 +03:00
s.faofsz = 0
s.fcup = false
auth := s.config.leaderAuth()
s.mu.Unlock()
2016-03-05 02:08:16 +03:00
addr := fmt.Sprintf("%s:%d", host, port)
2016-04-01 02:26:36 +03:00
2016-03-05 02:08:16 +03:00
// check if we are following self
2016-04-01 02:26:36 +03:00
conn, err := DialTimeout(addr, time.Second*2)
2016-03-05 02:08:16 +03:00
if err != nil {
return fmt.Errorf("cannot follow: %v", err)
}
defer conn.Close()
2016-03-08 18:35:43 +03:00
if auth != "" {
if err := s.followDoLeaderAuth(conn, auth); err != nil {
2016-03-08 18:35:43 +03:00
return fmt.Errorf("cannot follow: %v", err)
}
}
2016-04-01 02:26:36 +03:00
m, err := doServer(conn)
2016-03-05 02:08:16 +03:00
if err != nil {
return fmt.Errorf("cannot follow: %v", err)
}
2016-04-01 02:26:36 +03:00
if m["id"] == "" {
return fmt.Errorf("cannot follow: invalid id")
}
if m["id"] == s.config.serverID() {
2016-03-05 02:08:16 +03:00
return fmt.Errorf("cannot follow self")
}
2016-04-01 02:26:36 +03:00
if m["following"] != "" {
2016-03-05 02:08:16 +03:00
return fmt.Errorf("cannot follow a follower")
}
2016-04-01 02:26:36 +03:00
2016-03-05 02:08:16 +03:00
// verify checksum
pos, err := s.followCheckSome(addr, followc, auth)
2016-03-05 02:08:16 +03:00
if err != nil {
return err
}
// Send the replication port to the leader
p := s.config.announcePort()
if p == 0 {
p = s.port
}
v, err := conn.Do("replconf", "listening-port", p)
if err != nil {
return err
}
if v.Error() != nil {
return v.Error()
}
if v.String() != "OK" {
return errors.New("invalid response to replconf request")
}
// Send the replication ip to the leader
ip := s.config.announceIP()
if ip != "" {
v, err := conn.Do("replconf", "ip-address", ip)
if err != nil {
return err
}
if v.Error() != nil {
return v.Error()
}
if v.String() != "OK" {
return errors.New("invalid response to replconf request")
}
}
if s.opts.ShowDebugMessages {
log.Debug("follow:", addr, ":replconf")
}
v, err = conn.Do("aof", pos)
2016-03-05 02:08:16 +03:00
if err != nil {
return err
}
2016-04-01 02:26:36 +03:00
if v.Error() != nil {
return v.Error()
}
if v.String() != "OK" {
2016-03-05 02:08:16 +03:00
return errors.New("invalid response to aof live request")
}
if s.opts.ShowDebugMessages {
2016-03-05 02:08:16 +03:00
log.Debug("follow:", addr, ":read aof")
}
2016-04-01 02:26:36 +03:00
aofSize, err := strconv.ParseInt(m["aof_size"], 10, 64)
if err != nil {
return err
}
2023-05-21 18:22:27 +03:00
s.mu.Lock()
s.faofsz = int(aofSize)
s.mu.Unlock()
2016-04-01 02:26:36 +03:00
caughtUp := pos >= aofSize
2016-03-05 02:08:16 +03:00
if caughtUp {
s.mu.Lock()
s.fcup = true
s.fcuponce = true
s.mu.Unlock()
2016-03-05 02:08:16 +03:00
log.Info("caught up")
}
2023-05-21 18:22:27 +03:00
2022-09-13 03:06:27 +03:00
nullw := io.Discard
2016-03-05 02:08:16 +03:00
for {
2016-04-01 02:26:36 +03:00
v, telnet, _, err := conn.rd.ReadMultiBulk()
2016-03-05 02:08:16 +03:00
if err != nil {
return err
}
2016-04-01 02:26:36 +03:00
vals := v.Array()
if telnet || v.Type() != resp.Array {
return errors.New("invalid multibulk")
}
svals := make([]string, len(vals))
for i := 0; i < len(vals); i++ {
svals[i] = vals[i].String()
}
2016-04-01 03:58:02 +03:00
aofsz, err := s.followHandleCommand(svals, followc, nullw)
2016-03-05 02:08:16 +03:00
if err != nil {
return err
}
2023-05-21 18:22:27 +03:00
s.mu.Lock()
s.faofsz = aofsz
s.mu.Unlock()
2016-03-05 02:08:16 +03:00
if !caughtUp {
2016-04-01 02:26:36 +03:00
if aofsz >= int(aofSize) {
2016-03-05 02:08:16 +03:00
caughtUp = true
2023-05-21 18:29:30 +03:00
s.mu.Lock()
s.flushAOF(false)
s.fcup = true
s.fcuponce = true
s.mu.Unlock()
2016-03-05 02:08:16 +03:00
log.Info("caught up")
}
}
}
}
func (s *Server) follow(host string, port int, followc int) {
2016-03-05 02:08:16 +03:00
for {
err := s.followStep(host, port, followc)
2016-03-05 02:08:16 +03:00
if err == errNoLongerFollowing {
return
}
if err != nil && err != io.EOF {
2016-03-08 18:35:43 +03:00
log.Error("follow: " + err.Error())
2016-03-05 02:08:16 +03:00
}
time.Sleep(time.Second)
}
}