redis/sentinel.go

348 lines
7.3 KiB
Go
Raw Normal View History

2014-05-11 18:11:55 +04:00
package redis
import (
"crypto/tls"
2014-05-11 18:11:55 +04:00
"errors"
"net"
"strings"
"sync"
"time"
2017-02-18 17:42:34 +03:00
"github.com/go-redis/redis/internal"
"github.com/go-redis/redis/internal/pool"
2014-05-11 18:11:55 +04:00
)
//------------------------------------------------------------------------------
// FailoverOptions are used to configure a failover client and should
// be passed to NewFailoverClient.
2014-05-11 18:11:55 +04:00
type FailoverOptions struct {
2015-01-31 17:54:37 +03:00
// The master name.
MasterName string
// A seed list of host:port addresses of sentinel nodes.
2014-05-11 18:11:55 +04:00
SentinelAddrs []string
// Following options are copied from Options struct.
2017-05-25 14:16:39 +03:00
OnConnect func(*Conn) error
2014-05-11 18:11:55 +04:00
Password string
DB int
MaxRetries int
MinRetryBackoff time.Duration
MaxRetryBackoff time.Duration
2016-03-17 19:00:47 +03:00
DialTimeout time.Duration
ReadTimeout time.Duration
2015-01-31 17:54:37 +03:00
WriteTimeout time.Duration
2014-05-11 18:11:55 +04:00
2016-03-17 19:00:47 +03:00
PoolSize int
MinIdleConns int
MaxConnAge time.Duration
2016-03-17 19:00:47 +03:00
PoolTimeout time.Duration
IdleTimeout time.Duration
IdleCheckFrequency time.Duration
TLSConfig *tls.Config
2014-05-11 18:11:55 +04:00
}
func (opt *FailoverOptions) options() *Options {
return &Options{
Addr: "FailoverClient",
2014-05-11 18:11:55 +04:00
2017-05-25 14:16:39 +03:00
OnConnect: opt.OnConnect,
2014-05-11 18:11:55 +04:00
DB: opt.DB,
Password: opt.Password,
2016-03-17 19:00:47 +03:00
MaxRetries: opt.MaxRetries,
DialTimeout: opt.DialTimeout,
2014-05-11 18:11:55 +04:00
ReadTimeout: opt.ReadTimeout,
WriteTimeout: opt.WriteTimeout,
2016-03-17 19:00:47 +03:00
PoolSize: opt.PoolSize,
PoolTimeout: opt.PoolTimeout,
IdleTimeout: opt.IdleTimeout,
IdleCheckFrequency: opt.IdleCheckFrequency,
TLSConfig: opt.TLSConfig,
2014-05-11 18:11:55 +04:00
}
}
2015-09-12 09:36:03 +03:00
// NewFailoverClient returns a Redis client that uses Redis Sentinel
// for automatic failover. It's safe for concurrent use by multiple
// goroutines.
2014-05-11 18:11:55 +04:00
func NewFailoverClient(failoverOpt *FailoverOptions) *Client {
opt := failoverOpt.options()
2016-06-05 14:10:30 +03:00
opt.init()
2014-05-11 18:11:55 +04:00
failover := &sentinelFailover{
masterName: failoverOpt.MasterName,
sentinelAddrs: failoverOpt.SentinelAddrs,
opt: opt,
}
2016-06-05 14:10:30 +03:00
2018-01-20 13:26:33 +03:00
c := Client{
baseClient: baseClient{
opt: opt,
connPool: failover.Pool(),
onClose: func() error {
return failover.Close()
},
},
}
2018-01-20 13:26:33 +03:00
c.baseClient.init()
2018-08-12 11:11:01 +03:00
c.cmdable.setProcessor(c.Process)
2016-06-05 14:10:30 +03:00
2018-01-20 13:26:33 +03:00
return &c
2014-05-11 18:11:55 +04:00
}
//------------------------------------------------------------------------------
2018-05-31 13:15:52 +03:00
type SentinelClient struct {
baseClient
2014-05-11 18:11:55 +04:00
}
2018-05-31 13:15:52 +03:00
func NewSentinelClient(opt *Options) *SentinelClient {
2016-06-05 14:10:30 +03:00
opt.init()
2018-05-31 13:15:52 +03:00
c := &SentinelClient{
baseClient: baseClient{
opt: opt,
connPool: newConnPool(opt),
},
2014-05-11 18:11:55 +04:00
}
2018-01-20 13:26:33 +03:00
c.baseClient.init()
2018-05-31 13:15:52 +03:00
return c
2014-05-11 18:11:55 +04:00
}
2018-05-31 13:15:52 +03:00
func (c *SentinelClient) PubSub() *PubSub {
2018-07-23 15:55:13 +03:00
pubsub := &PubSub{
2017-07-09 10:07:20 +03:00
opt: c.opt,
newConn: func(channels []string) (*pool.Conn, error) {
return c.newConn()
2014-05-11 18:11:55 +04:00
},
2017-07-09 10:07:20 +03:00
closeConn: c.connPool.CloseConn,
2014-05-11 18:11:55 +04:00
}
2018-07-23 15:55:13 +03:00
pubsub.init()
return pubsub
2014-05-11 18:11:55 +04:00
}
2018-05-31 13:15:52 +03:00
func (c *SentinelClient) GetMasterAddrByName(name string) *StringSliceCmd {
2014-05-11 18:11:55 +04:00
cmd := NewStringSliceCmd("SENTINEL", "get-master-addr-by-name", name)
c.Process(cmd)
return cmd
}
2018-05-31 13:15:52 +03:00
func (c *SentinelClient) Sentinels(name string) *SliceCmd {
2014-05-11 18:11:55 +04:00
cmd := NewSliceCmd("SENTINEL", "sentinels", name)
c.Process(cmd)
return cmd
}
type sentinelFailover struct {
sentinelAddrs []string
opt *Options
2014-05-11 18:11:55 +04:00
pool *pool.ConnPool
2014-05-11 18:11:55 +04:00
poolOnce sync.Once
mu sync.RWMutex
masterName string
_masterAddr string
2018-05-31 13:15:52 +03:00
sentinel *SentinelClient
}
func (d *sentinelFailover) Close() error {
return d.resetSentinel()
2014-05-11 18:11:55 +04:00
}
func (d *sentinelFailover) Pool() *pool.ConnPool {
2014-05-11 18:11:55 +04:00
d.poolOnce.Do(func() {
d.opt.Dialer = d.dial
d.pool = newConnPool(d.opt)
2014-05-11 18:11:55 +04:00
})
return d.pool
}
2017-07-09 10:07:20 +03:00
// dial opens a connection to the current master, as reported by Sentinel.
//
// This function replaces the dialer in d.opt (see Pool), so it has to apply
// d.opt.TLSConfig itself: when a TLS configuration is set the connection is
// established with TLS, otherwise a plain TCP connection is returned. Both
// paths are bounded by d.opt.DialTimeout.
func (d *sentinelFailover) dial() (net.Conn, error) {
	addr, err := d.MasterAddr()
	if err != nil {
		return nil, err
	}

	if d.opt.TLSConfig == nil {
		return net.DialTimeout("tcp", addr, d.opt.DialTimeout)
	}

	dialer := &net.Dialer{Timeout: d.opt.DialTimeout}
	conn, err := tls.DialWithDialer(dialer, "tcp", addr, d.opt.TLSConfig)
	if err != nil {
		// Return an untyped nil so callers never see a non-nil net.Conn
		// wrapping a nil *tls.Conn.
		return nil, err
	}
	return conn, nil
}
2014-05-11 18:11:55 +04:00
func (d *sentinelFailover) MasterAddr() (string, error) {
d.mu.Lock()
2017-01-28 11:53:10 +03:00
defer d.mu.Unlock()
2014-05-11 18:11:55 +04:00
addr, err := d.masterAddr()
if err != nil {
return "", err
}
2018-07-23 15:55:13 +03:00
d._switchMaster(addr)
return addr, nil
}
func (d *sentinelFailover) masterAddr() (string, error) {
2014-05-11 18:11:55 +04:00
// Try last working sentinel.
if d.sentinel != nil {
addr, err := d.sentinel.GetMasterAddrByName(d.masterName).Result()
if err == nil {
2014-05-11 18:11:55 +04:00
addr := net.JoinHostPort(addr[0], addr[1])
return addr, nil
}
2018-07-23 15:55:13 +03:00
internal.Logf("sentinel: GetMasterAddrByName name=%q failed: %s",
d.masterName, err)
d._resetSentinel()
2014-05-11 18:11:55 +04:00
}
for i, sentinelAddr := range d.sentinelAddrs {
2018-05-31 13:15:52 +03:00
sentinel := NewSentinelClient(&Options{
Addr: sentinelAddr,
2014-05-11 18:11:55 +04:00
DialTimeout: d.opt.DialTimeout,
ReadTimeout: d.opt.ReadTimeout,
WriteTimeout: d.opt.WriteTimeout,
PoolSize: d.opt.PoolSize,
2015-01-31 16:20:37 +03:00
PoolTimeout: d.opt.PoolTimeout,
2014-05-11 18:11:55 +04:00
IdleTimeout: d.opt.IdleTimeout,
})
masterAddr, err := sentinel.GetMasterAddrByName(d.masterName).Result()
2014-05-11 18:11:55 +04:00
if err != nil {
2018-05-31 13:15:52 +03:00
internal.Logf("sentinel: GetMasterAddrByName master=%q failed: %s",
d.masterName, err)
sentinel.Close()
continue
2014-05-11 18:11:55 +04:00
}
// Push working sentinel to the top.
d.sentinelAddrs[0], d.sentinelAddrs[i] = d.sentinelAddrs[i], d.sentinelAddrs[0]
d.setSentinel(sentinel)
addr := net.JoinHostPort(masterAddr[0], masterAddr[1])
return addr, nil
2014-05-11 18:11:55 +04:00
}
return "", errors.New("redis: all sentinels are unreachable")
}
2018-07-23 15:55:13 +03:00
// switchMaster records addr as the current master address while holding
// d.mu. The unlock is deferred so the mutex is released even if
// _switchMaster panics.
func (d *sentinelFailover) switchMaster(addr string) {
	d.mu.Lock()
	defer d.mu.Unlock()

	d._switchMaster(addr)
}
func (c *sentinelFailover) _switchMaster(addr string) {
if c._masterAddr == addr {
return
}
internal.Logf("sentinel: new master=%q addr=%q",
c.masterName, addr)
_ = c.Pool().Filter(func(cn *pool.Conn) bool {
return cn.RemoteAddr().String() != addr
})
2018-07-23 15:55:13 +03:00
c._masterAddr = addr
}
2018-05-31 13:15:52 +03:00
func (d *sentinelFailover) setSentinel(sentinel *SentinelClient) {
2014-05-11 18:11:55 +04:00
d.discoverSentinels(sentinel)
d.sentinel = sentinel
go d.listen(sentinel)
2014-05-11 18:11:55 +04:00
}
// resetSentinel closes and forgets the tracked sentinel client while
// holding d.mu. It returns nil when no sentinel is tracked, otherwise the
// error from closing it.
func (d *sentinelFailover) resetSentinel() error {
	d.mu.Lock()
	defer d.mu.Unlock()

	if d.sentinel == nil {
		return nil
	}
	return d._resetSentinel()
}
// _resetSentinel closes the tracked sentinel client and clears d.sentinel,
// returning the error from Close. d.sentinel must be non-nil.
func (d *sentinelFailover) _resetSentinel() error {
	closeErr := d.sentinel.Close()
	d.sentinel = nil

	return closeErr
}
2018-05-31 13:15:52 +03:00
func (d *sentinelFailover) discoverSentinels(sentinel *SentinelClient) {
2014-05-11 18:11:55 +04:00
sentinels, err := sentinel.Sentinels(d.masterName).Result()
if err != nil {
internal.Logf("sentinel: Sentinels master=%q failed: %s", d.masterName, err)
2014-05-11 18:11:55 +04:00
return
}
for _, sentinel := range sentinels {
vals := sentinel.([]interface{})
for i := 0; i < len(vals); i += 2 {
key := vals[i].(string)
if key == "name" {
sentinelAddr := vals[i+1].(string)
if !contains(d.sentinelAddrs, sentinelAddr) {
2016-04-09 14:52:01 +03:00
internal.Logf(
"sentinel: discovered new sentinel=%q for master=%q",
sentinelAddr, d.masterName,
2014-05-11 18:11:55 +04:00
)
d.sentinelAddrs = append(d.sentinelAddrs, sentinelAddr)
}
}
}
}
}
2018-05-31 13:15:52 +03:00
func (d *sentinelFailover) listen(sentinel *SentinelClient) {
2018-07-23 15:55:13 +03:00
pubsub := sentinel.PubSub()
defer pubsub.Close()
2018-07-23 15:55:13 +03:00
err := pubsub.Subscribe("+switch-master")
if err != nil {
internal.Logf("sentinel: Subscribe failed: %s", err)
d.resetSentinel()
return
}
2014-05-11 18:11:55 +04:00
2018-07-23 15:55:13 +03:00
for {
msg, err := pubsub.ReceiveMessage()
2014-05-11 18:11:55 +04:00
if err != nil {
2018-07-23 15:55:13 +03:00
if err == pool.ErrClosed {
d.resetSentinel()
return
}
2018-07-23 15:55:13 +03:00
internal.Logf("sentinel: ReceiveMessage failed: %s", err)
continue
2014-05-11 18:11:55 +04:00
}
switch msg.Channel {
case "+switch-master":
parts := strings.Split(msg.Payload, " ")
if parts[0] != d.masterName {
internal.Logf("sentinel: ignore addr for master=%q", parts[0])
continue
2014-05-11 18:11:55 +04:00
}
addr := net.JoinHostPort(parts[3], parts[4])
2018-07-23 15:55:13 +03:00
d.switchMaster(addr)
2014-05-11 18:11:55 +04:00
}
}
}
// contains reports whether str is an element of slice. A nil or empty slice
// contains nothing.
func contains(slice []string, str string) bool {
	for i := range slice {
		if slice[i] == str {
			return true
		}
	}
	return false
}