2014-06-06 10:57:18 +04:00
|
|
|
package server
|
|
|
|
|
2014-06-08 12:43:59 +04:00
|
|
|
import (
|
2014-06-09 13:23:32 +04:00
|
|
|
"bufio"
|
|
|
|
"bytes"
|
|
|
|
"encoding/binary"
|
2014-06-08 12:43:59 +04:00
|
|
|
"encoding/json"
|
2014-06-09 13:23:32 +04:00
|
|
|
"errors"
|
|
|
|
"fmt"
|
2014-07-04 09:27:57 +04:00
|
|
|
"github.com/siddontang/go-log/log"
|
2014-07-04 13:55:47 +04:00
|
|
|
"github.com/siddontang/go-snappy/snappy"
|
2014-06-09 13:23:32 +04:00
|
|
|
"github.com/siddontang/ledisdb/ledis"
|
2014-06-08 12:43:59 +04:00
|
|
|
"io/ioutil"
|
2014-06-09 13:23:32 +04:00
|
|
|
"net"
|
2014-06-08 12:43:59 +04:00
|
|
|
"os"
|
|
|
|
"path"
|
2014-06-09 13:23:32 +04:00
|
|
|
"strconv"
|
|
|
|
"sync"
|
|
|
|
"time"
|
2014-06-08 12:43:59 +04:00
|
|
|
)
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
// errConnectMaster is a sentinel error whose message is
// "connect master error".
var errConnectMaster = errors.New("connect master error")
|
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
// MasterInfo describes the master this node replicates from and the binlog
// position reached so far. It is persisted on disk as JSON.
type MasterInfo struct {
	// Addr is the address of the master.
	Addr string `json:"addr"`
	// LogFileIndex is the index of the master binlog file to sync from.
	LogFileIndex int64 `json:"log_file_index"`
	// LogPos is the position inside that binlog file.
	LogPos int64 `json:"log_pos"`
}

// Save serializes m as JSON and stores it at filePath.
//
// The data is first written to "<filePath>.bak" and then renamed over
// filePath, so filePath itself is never left half-written.
func (m *MasterInfo) Save(filePath string) error {
	data, err := json.Marshal(m)
	if err != nil {
		return err
	}

	filePathBak := fmt.Sprintf("%s.bak", filePath)

	// O_TRUNC is required: a backup file left over from an earlier failed
	// Save may be longer than the new data, and without truncation its tail
	// would survive after the new JSON and corrupt the saved file.
	fd, err := os.OpenFile(filePathBak, os.O_CREATE|os.O_WRONLY|os.O_TRUNC, os.ModePerm)
	if err != nil {
		return err
	}

	if _, err = fd.Write(data); err != nil {
		fd.Close()
		return err
	}

	// Do not rename a file whose close failed.
	if err = fd.Close(); err != nil {
		return err
	}

	return os.Rename(filePathBak, filePath)
}

// Load reads the JSON stored at filePath into m.
//
// A missing file is not an error: m is left untouched and nil is returned.
// Any other read error, or a JSON decoding error, is returned as is.
func (m *MasterInfo) Load(filePath string) error {
	data, err := ioutil.ReadFile(filePath)
	if err != nil {
		if os.IsNotExist(err) {
			return nil
		}
		return err
	}

	return json.Unmarshal(data, m)
}
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
type master struct {
|
|
|
|
sync.Mutex
|
|
|
|
|
2014-07-31 10:38:20 +04:00
|
|
|
conn net.Conn
|
|
|
|
rb *bufio.Reader
|
2014-06-09 13:23:32 +04:00
|
|
|
|
|
|
|
app *App
|
|
|
|
|
|
|
|
quit chan struct{}
|
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
infoName string
|
|
|
|
|
|
|
|
info *MasterInfo
|
2014-06-09 13:23:32 +04:00
|
|
|
|
|
|
|
wg sync.WaitGroup
|
|
|
|
|
|
|
|
syncBuf bytes.Buffer
|
2014-07-04 13:55:47 +04:00
|
|
|
|
|
|
|
compressBuf []byte
|
2014-06-09 13:23:32 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
func newMaster(app *App) *master {
|
|
|
|
m := new(master)
|
|
|
|
m.app = app
|
|
|
|
|
|
|
|
m.infoName = path.Join(m.app.cfg.DataDir, "master.info")
|
|
|
|
|
2014-06-10 06:41:50 +04:00
|
|
|
m.quit = make(chan struct{}, 1)
|
2014-06-09 13:23:32 +04:00
|
|
|
|
2014-07-04 13:55:47 +04:00
|
|
|
m.compressBuf = make([]byte, 256)
|
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
m.info = new(MasterInfo)
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
//if load error, we will start a fullsync later
|
|
|
|
m.loadInfo()
|
|
|
|
|
|
|
|
return m
|
2014-06-08 12:43:59 +04:00
|
|
|
}
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
func (m *master) Close() {
|
2014-06-10 06:41:50 +04:00
|
|
|
select {
|
|
|
|
case m.quit <- struct{}{}:
|
|
|
|
default:
|
|
|
|
}
|
2014-06-09 13:23:32 +04:00
|
|
|
|
2014-07-31 10:38:20 +04:00
|
|
|
if m.conn != nil {
|
|
|
|
m.conn.Close()
|
|
|
|
m.conn = nil
|
2014-06-09 13:23:32 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
m.wg.Wait()
|
2014-06-08 12:43:59 +04:00
|
|
|
}
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
func (m *master) loadInfo() error {
|
2014-07-11 12:57:19 +04:00
|
|
|
return m.info.Load(m.infoName)
|
2014-06-08 12:43:59 +04:00
|
|
|
}
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
func (m *master) saveInfo() error {
|
2014-07-11 12:57:19 +04:00
|
|
|
return m.info.Save(m.infoName)
|
2014-06-08 12:43:59 +04:00
|
|
|
}
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
func (m *master) connect() error {
|
2014-07-11 12:57:19 +04:00
|
|
|
if len(m.info.Addr) == 0 {
|
2014-06-09 13:23:32 +04:00
|
|
|
return fmt.Errorf("no assign master addr")
|
|
|
|
}
|
|
|
|
|
2014-07-31 10:38:20 +04:00
|
|
|
if m.conn != nil {
|
|
|
|
m.conn.Close()
|
|
|
|
m.conn = nil
|
2014-06-08 12:43:59 +04:00
|
|
|
}
|
|
|
|
|
2014-07-31 10:38:20 +04:00
|
|
|
if conn, err := net.Dial("tcp", m.info.Addr); err != nil {
|
2014-06-09 13:23:32 +04:00
|
|
|
return err
|
|
|
|
} else {
|
2014-07-31 10:38:20 +04:00
|
|
|
m.conn = conn
|
2014-06-09 13:23:32 +04:00
|
|
|
|
2014-07-31 10:38:20 +04:00
|
|
|
m.rb = bufio.NewReaderSize(m.conn, 4096)
|
2014-06-09 13:23:32 +04:00
|
|
|
}
|
2014-06-06 10:57:18 +04:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
func (m *master) resetInfo(addr string) {
|
2014-07-11 12:57:19 +04:00
|
|
|
m.info.Addr = addr
|
|
|
|
m.info.LogFileIndex = 0
|
|
|
|
m.info.LogPos = 0
|
2014-06-08 12:43:59 +04:00
|
|
|
}
|
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
func (m *master) stopReplication() error {
|
|
|
|
m.Close()
|
|
|
|
|
|
|
|
if err := m.saveInfo(); err != nil {
|
|
|
|
log.Error("save master info error %s", err.Error())
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *master) startReplication(masterAddr string) error {
|
|
|
|
//stop last replcation, if avaliable
|
|
|
|
m.Close()
|
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
if masterAddr != m.info.Addr {
|
2014-06-09 13:23:32 +04:00
|
|
|
m.resetInfo(masterAddr)
|
|
|
|
if err := m.saveInfo(); err != nil {
|
|
|
|
log.Error("save master info error %s", err.Error())
|
2014-06-08 12:43:59 +04:00
|
|
|
return err
|
|
|
|
}
|
2014-06-09 13:23:32 +04:00
|
|
|
}
|
|
|
|
|
2014-06-10 06:41:50 +04:00
|
|
|
m.quit = make(chan struct{}, 1)
|
2014-06-09 13:23:32 +04:00
|
|
|
|
|
|
|
go m.runReplication()
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *master) runReplication() {
|
|
|
|
m.wg.Add(1)
|
|
|
|
defer m.wg.Done()
|
|
|
|
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-m.quit:
|
|
|
|
return
|
|
|
|
default:
|
|
|
|
if err := m.connect(); err != nil {
|
2014-07-11 12:57:19 +04:00
|
|
|
log.Error("connect master %s error %s, try 2s later", m.info.Addr, err.Error())
|
2014-06-09 13:23:32 +04:00
|
|
|
time.Sleep(2 * time.Second)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
if m.info.LogFileIndex == 0 {
|
2014-06-09 13:23:32 +04:00
|
|
|
//try a fullsync
|
|
|
|
if err := m.fullSync(); err != nil {
|
2014-09-05 06:01:38 +04:00
|
|
|
if m.conn != nil {
|
|
|
|
//if conn == nil, other close the replication, not error
|
|
|
|
log.Warn("full sync error %s", err.Error())
|
|
|
|
}
|
2014-06-09 13:23:32 +04:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
if m.info.LogFileIndex == 0 {
|
2014-06-09 13:23:32 +04:00
|
|
|
//master not support binlog, we cannot sync, so stop replication
|
|
|
|
m.stopReplication()
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
for {
|
2014-09-05 06:01:38 +04:00
|
|
|
if err := m.sync(); err != nil {
|
|
|
|
if m.conn != nil {
|
|
|
|
//if conn == nil, other close the replication, not error
|
2014-06-09 13:23:32 +04:00
|
|
|
log.Warn("sync error %s", err.Error())
|
2014-06-10 06:41:50 +04:00
|
|
|
}
|
2014-09-05 06:01:38 +04:00
|
|
|
return
|
2014-06-10 06:41:50 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
select {
|
2014-06-09 13:23:32 +04:00
|
|
|
case <-m.quit:
|
|
|
|
return
|
2014-09-05 06:01:38 +04:00
|
|
|
default:
|
2014-06-10 06:41:50 +04:00
|
|
|
break
|
2014-06-09 13:23:32 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// fullSyncCmd is the wire form of the "fullsync" command: an array of one
// bulk string.
var fullSyncCmd = []byte("*1\r\n$8\r\nfullsync\r\n")

// syncCmdFormat is the format string for the "sync <index> <pos>" command.
// Its verbs are, in order: length of the index string, the index string,
// length of the position string, the position string.
var syncCmdFormat = "*3\r\n$4\r\nsync\r\n$%d\r\n%s\r\n$%d\r\n%s\r\n"
|
2014-06-06 10:57:18 +04:00
|
|
|
|
2014-06-09 13:23:32 +04:00
|
|
|
func (m *master) fullSync() error {
|
2014-07-31 10:38:20 +04:00
|
|
|
if _, err := m.conn.Write(fullSyncCmd); err != nil {
|
2014-06-09 13:23:32 +04:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
dumpPath := path.Join(m.app.cfg.DataDir, "master.dump")
|
|
|
|
f, err := os.OpenFile(dumpPath, os.O_CREATE|os.O_WRONLY, os.ModePerm)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
defer os.Remove(dumpPath)
|
|
|
|
|
2014-07-11 06:43:39 +04:00
|
|
|
err = ReadBulkTo(m.rb, f)
|
2014-06-09 13:23:32 +04:00
|
|
|
f.Close()
|
|
|
|
if err != nil {
|
|
|
|
log.Error("read dump data error %s", err.Error())
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if err = m.app.ldb.FlushAll(); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2014-09-04 18:43:56 +04:00
|
|
|
var head *ledis.BinLogAnchor
|
2014-06-09 13:23:32 +04:00
|
|
|
head, err = m.app.ldb.LoadDumpFile(dumpPath)
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
log.Error("load dump file error %s", err.Error())
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
m.info.LogFileIndex = head.LogFileIndex
|
|
|
|
m.info.LogPos = head.LogPos
|
2014-06-09 13:23:32 +04:00
|
|
|
|
2014-06-12 17:29:41 +04:00
|
|
|
return m.saveInfo()
|
2014-06-09 13:23:32 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
func (m *master) sync() error {
|
2014-07-11 12:57:19 +04:00
|
|
|
logIndexStr := strconv.FormatInt(m.info.LogFileIndex, 10)
|
|
|
|
logPosStr := strconv.FormatInt(m.info.LogPos, 10)
|
2014-06-09 13:23:32 +04:00
|
|
|
|
2014-06-10 06:41:50 +04:00
|
|
|
cmd := ledis.Slice(fmt.Sprintf(syncCmdFormat, len(logIndexStr),
|
|
|
|
logIndexStr, len(logPosStr), logPosStr))
|
2014-09-05 06:01:38 +04:00
|
|
|
|
2014-07-31 10:38:20 +04:00
|
|
|
if _, err := m.conn.Write(cmd); err != nil {
|
2014-06-09 13:23:32 +04:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
m.syncBuf.Reset()
|
|
|
|
|
2014-07-11 06:43:39 +04:00
|
|
|
err := ReadBulkTo(m.rb, &m.syncBuf)
|
2014-06-09 13:23:32 +04:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2014-07-04 13:55:47 +04:00
|
|
|
var buf []byte
|
|
|
|
buf, err = snappy.Decode(m.compressBuf, m.syncBuf.Bytes())
|
2014-06-09 13:23:32 +04:00
|
|
|
if err != nil {
|
|
|
|
return err
|
2014-07-04 13:55:47 +04:00
|
|
|
} else if len(buf) > len(m.compressBuf) {
|
|
|
|
m.compressBuf = buf
|
2014-06-09 13:23:32 +04:00
|
|
|
}
|
|
|
|
|
2014-07-04 13:55:47 +04:00
|
|
|
if len(buf) < 16 {
|
|
|
|
return fmt.Errorf("invalid sync data len %d", len(buf))
|
2014-06-09 13:23:32 +04:00
|
|
|
}
|
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
m.info.LogFileIndex = int64(binary.BigEndian.Uint64(buf[0:8]))
|
|
|
|
m.info.LogPos = int64(binary.BigEndian.Uint64(buf[8:16]))
|
2014-07-04 13:55:47 +04:00
|
|
|
|
2014-07-11 12:57:19 +04:00
|
|
|
if m.info.LogFileIndex == 0 {
|
2014-06-09 13:23:32 +04:00
|
|
|
//master now not support binlog, stop replication
|
|
|
|
m.stopReplication()
|
|
|
|
return nil
|
2014-07-11 12:57:19 +04:00
|
|
|
} else if m.info.LogFileIndex == -1 {
|
2014-06-09 13:23:32 +04:00
|
|
|
//-1 means than binlog index and pos are lost, we must start a full sync instead
|
|
|
|
return m.fullSync()
|
|
|
|
}
|
|
|
|
|
2014-07-04 13:55:47 +04:00
|
|
|
err = m.app.ldb.ReplicateFromData(buf[16:])
|
2014-06-09 13:23:32 +04:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2014-06-12 17:29:41 +04:00
|
|
|
return m.saveInfo()
|
2014-06-09 13:23:32 +04:00
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
func (app *App) slaveof(masterAddr string) error {
|
|
|
|
app.m.Lock()
|
|
|
|
defer app.m.Unlock()
|
|
|
|
|
|
|
|
if len(masterAddr) == 0 {
|
|
|
|
return app.m.stopReplication()
|
|
|
|
} else {
|
|
|
|
return app.m.startReplication(masterAddr)
|
2014-06-08 12:43:59 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
2014-06-06 10:57:18 +04:00
|
|
|
}
|