mirror of https://github.com/go-redis/redis.git
461 lines
9.9 KiB
Go
461 lines
9.9 KiB
Go
package redis
|
|
|
|
import (
|
|
"math/rand"
|
|
"sync"
|
|
"sync/atomic"
|
|
"time"
|
|
|
|
"gopkg.in/redis.v4/internal/hashtag"
|
|
"gopkg.in/redis.v4/internal/pool"
|
|
)
|
|
|
|
// ClusterClient is a Redis Cluster client representing a pool of zero
|
|
// or more underlying connections. It's safe for concurrent use by
|
|
// multiple goroutines.
|
|
type ClusterClient struct {
|
|
commandable
|
|
|
|
opt *ClusterOptions
|
|
|
|
slotsMx sync.RWMutex // protects slots and addrs
|
|
addrs []string
|
|
slots [][]string
|
|
|
|
clientsMx sync.RWMutex // protects clients and closed
|
|
clients map[string]*Client
|
|
|
|
_closed int32 // atomic
|
|
|
|
// Reports where slots reloading is in progress.
|
|
reloading uint32
|
|
}
|
|
|
|
// NewClusterClient returns a Redis Cluster client as described in
|
|
// http://redis.io/topics/cluster-spec.
|
|
func NewClusterClient(opt *ClusterOptions) *ClusterClient {
|
|
client := &ClusterClient{
|
|
opt: opt,
|
|
addrs: opt.Addrs,
|
|
slots: make([][]string, hashtag.SlotNumber),
|
|
clients: make(map[string]*Client),
|
|
}
|
|
client.commandable.process = client.process
|
|
client.reloadSlots()
|
|
return client
|
|
}
|
|
|
|
// getClients returns a snapshot of clients for cluster nodes
|
|
// this ClusterClient has been working with recently.
|
|
// Note that snapshot can contain closed clients.
|
|
func (c *ClusterClient) getClients() map[string]*Client {
|
|
c.clientsMx.RLock()
|
|
clients := make(map[string]*Client, len(c.clients))
|
|
for addr, client := range c.clients {
|
|
clients[addr] = client
|
|
}
|
|
c.clientsMx.RUnlock()
|
|
return clients
|
|
}
|
|
|
|
// Watch creates new transaction and marks the keys to be watched
|
|
// for conditional execution of a transaction.
|
|
func (c *ClusterClient) Watch(keys ...string) (*Tx, error) {
|
|
addr := c.slotMasterAddr(hashtag.Slot(keys[0]))
|
|
client, err := c.getClient(addr)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return client.Watch(keys...)
|
|
}
|
|
|
|
// PoolStats returns accumulated connection pool stats.
|
|
func (c *ClusterClient) PoolStats() *PoolStats {
|
|
acc := PoolStats{}
|
|
for _, client := range c.getClients() {
|
|
s := client.connPool.Stats()
|
|
acc.Requests += s.Requests
|
|
acc.Hits += s.Hits
|
|
acc.Timeouts += s.Timeouts
|
|
acc.TotalConns += s.TotalConns
|
|
acc.FreeConns += s.FreeConns
|
|
}
|
|
return &acc
|
|
}
|
|
|
|
func (c *ClusterClient) closed() bool {
|
|
return atomic.LoadInt32(&c._closed) == 1
|
|
}
|
|
|
|
// Close closes the cluster client, releasing any open resources.
|
|
//
|
|
// It is rare to Close a ClusterClient, as the ClusterClient is meant
|
|
// to be long-lived and shared between many goroutines.
|
|
func (c *ClusterClient) Close() error {
|
|
if !atomic.CompareAndSwapInt32(&c._closed, 0, 1) {
|
|
return pool.ErrClosed
|
|
}
|
|
|
|
c.clientsMx.Lock()
|
|
c.resetClients()
|
|
c.clientsMx.Unlock()
|
|
c.setSlots(nil)
|
|
return nil
|
|
}
|
|
|
|
// getClient returns a Client for a given address.
|
|
func (c *ClusterClient) getClient(addr string) (*Client, error) {
|
|
if c.closed() {
|
|
return nil, pool.ErrClosed
|
|
}
|
|
|
|
if addr == "" {
|
|
return c.randomClient()
|
|
}
|
|
|
|
c.clientsMx.RLock()
|
|
client, ok := c.clients[addr]
|
|
c.clientsMx.RUnlock()
|
|
if ok {
|
|
return client, nil
|
|
}
|
|
|
|
c.clientsMx.Lock()
|
|
client, ok = c.clients[addr]
|
|
if !ok {
|
|
opt := c.opt.clientOptions()
|
|
opt.Addr = addr
|
|
client = NewClient(opt)
|
|
c.clients[addr] = client
|
|
}
|
|
c.clientsMx.Unlock()
|
|
|
|
return client, nil
|
|
}
|
|
|
|
func (c *ClusterClient) slotAddrs(slot int) []string {
|
|
c.slotsMx.RLock()
|
|
addrs := c.slots[slot]
|
|
c.slotsMx.RUnlock()
|
|
return addrs
|
|
}
|
|
|
|
func (c *ClusterClient) slotMasterAddr(slot int) string {
|
|
addrs := c.slotAddrs(slot)
|
|
if len(addrs) > 0 {
|
|
return addrs[0]
|
|
}
|
|
return ""
|
|
}
|
|
|
|
// randomClient returns a Client for the first live node.
|
|
func (c *ClusterClient) randomClient() (client *Client, err error) {
|
|
for i := 0; i < 10; i++ {
|
|
n := rand.Intn(len(c.addrs))
|
|
client, err = c.getClient(c.addrs[n])
|
|
if err != nil {
|
|
continue
|
|
}
|
|
err = client.ClusterInfo().Err()
|
|
if err == nil {
|
|
return client, nil
|
|
}
|
|
}
|
|
return nil, err
|
|
}
|
|
|
|
func (c *ClusterClient) process(cmd Cmder) {
|
|
var ask bool
|
|
|
|
slot := hashtag.Slot(cmd.clusterKey())
|
|
|
|
addr := c.slotMasterAddr(slot)
|
|
client, err := c.getClient(addr)
|
|
if err != nil {
|
|
cmd.setErr(err)
|
|
return
|
|
}
|
|
|
|
for attempt := 0; attempt <= c.opt.getMaxRedirects(); attempt++ {
|
|
if attempt > 0 {
|
|
cmd.reset()
|
|
}
|
|
|
|
if ask {
|
|
pipe := client.Pipeline()
|
|
pipe.Process(NewCmd("ASKING"))
|
|
pipe.Process(cmd)
|
|
_, _ = pipe.Exec()
|
|
pipe.Close()
|
|
ask = false
|
|
} else {
|
|
client.Process(cmd)
|
|
}
|
|
|
|
// If there is no (real) error, we are done!
|
|
err := cmd.Err()
|
|
if err == nil {
|
|
return
|
|
}
|
|
|
|
// On network errors try random node.
|
|
if shouldRetry(err) {
|
|
client, err = c.randomClient()
|
|
if err != nil {
|
|
return
|
|
}
|
|
continue
|
|
}
|
|
|
|
var moved bool
|
|
var addr string
|
|
moved, ask, addr = isMovedError(err)
|
|
if moved || ask {
|
|
if moved && c.slotMasterAddr(slot) != addr {
|
|
c.lazyReloadSlots()
|
|
}
|
|
client, err = c.getClient(addr)
|
|
if err != nil {
|
|
return
|
|
}
|
|
continue
|
|
}
|
|
|
|
break
|
|
}
|
|
}
|
|
|
|
// Closes all clients and returns last error if there are any.
|
|
func (c *ClusterClient) resetClients() (retErr error) {
|
|
for addr, client := range c.clients {
|
|
if err := client.Close(); err != nil && retErr == nil {
|
|
retErr = err
|
|
}
|
|
delete(c.clients, addr)
|
|
}
|
|
return retErr
|
|
}
|
|
|
|
func (c *ClusterClient) setSlots(slots []ClusterSlot) {
|
|
c.slotsMx.Lock()
|
|
|
|
seen := make(map[string]struct{})
|
|
for _, addr := range c.addrs {
|
|
seen[addr] = struct{}{}
|
|
}
|
|
|
|
for i := 0; i < hashtag.SlotNumber; i++ {
|
|
c.slots[i] = c.slots[i][:0]
|
|
}
|
|
for _, slot := range slots {
|
|
var addrs []string
|
|
for _, node := range slot.Nodes {
|
|
addrs = append(addrs, node.Addr)
|
|
}
|
|
|
|
for i := slot.Start; i <= slot.End; i++ {
|
|
c.slots[i] = addrs
|
|
}
|
|
|
|
for _, node := range slot.Nodes {
|
|
if _, ok := seen[node.Addr]; !ok {
|
|
c.addrs = append(c.addrs, node.Addr)
|
|
seen[node.Addr] = struct{}{}
|
|
}
|
|
}
|
|
}
|
|
|
|
c.slotsMx.Unlock()
|
|
}
|
|
|
|
func (c *ClusterClient) reloadSlots() {
|
|
defer atomic.StoreUint32(&c.reloading, 0)
|
|
|
|
client, err := c.randomClient()
|
|
if err != nil {
|
|
Logger.Printf("randomClient failed: %s", err)
|
|
return
|
|
}
|
|
|
|
slots, err := client.ClusterSlots().Result()
|
|
if err != nil {
|
|
Logger.Printf("ClusterSlots failed: %s", err)
|
|
return
|
|
}
|
|
c.setSlots(slots)
|
|
}
|
|
|
|
func (c *ClusterClient) lazyReloadSlots() {
|
|
if !atomic.CompareAndSwapUint32(&c.reloading, 0, 1) {
|
|
return
|
|
}
|
|
go c.reloadSlots()
|
|
}
|
|
|
|
// reaper closes idle connections to the cluster.
|
|
func (c *ClusterClient) reaper(frequency time.Duration) {
|
|
ticker := time.NewTicker(frequency)
|
|
defer ticker.Stop()
|
|
|
|
for _ = range ticker.C {
|
|
if c.closed() {
|
|
break
|
|
}
|
|
|
|
var n int
|
|
for _, client := range c.getClients() {
|
|
nn, err := client.connPool.(*pool.ConnPool).ReapStaleConns()
|
|
if err != nil {
|
|
Logger.Printf("ReapStaleConns failed: %s", err)
|
|
} else {
|
|
n += nn
|
|
}
|
|
}
|
|
|
|
s := c.PoolStats()
|
|
Logger.Printf(
|
|
"reaper: removed %d stale conns (TotalConns=%d FreeConns=%d Requests=%d Hits=%d Timeouts=%d)",
|
|
n, s.TotalConns, s.FreeConns, s.Requests, s.Hits, s.Timeouts,
|
|
)
|
|
}
|
|
}
|
|
|
|
func (c *ClusterClient) Pipeline() *Pipeline {
|
|
pipe := &Pipeline{
|
|
exec: c.pipelineExec,
|
|
}
|
|
pipe.commandable.process = pipe.process
|
|
return pipe
|
|
}
|
|
|
|
func (c *ClusterClient) Pipelined(fn func(*Pipeline) error) ([]Cmder, error) {
|
|
return c.Pipeline().pipelined(fn)
|
|
}
|
|
|
|
func (c *ClusterClient) pipelineExec(cmds []Cmder) error {
|
|
var retErr error
|
|
|
|
cmdsMap := make(map[string][]Cmder)
|
|
for _, cmd := range cmds {
|
|
slot := hashtag.Slot(cmd.clusterKey())
|
|
addr := c.slotMasterAddr(slot)
|
|
cmdsMap[addr] = append(cmdsMap[addr], cmd)
|
|
}
|
|
|
|
for attempt := 0; attempt <= c.opt.getMaxRedirects(); attempt++ {
|
|
failedCmds := make(map[string][]Cmder)
|
|
|
|
for addr, cmds := range cmdsMap {
|
|
client, err := c.getClient(addr)
|
|
if err != nil {
|
|
setCmdsErr(cmds, err)
|
|
retErr = err
|
|
continue
|
|
}
|
|
|
|
cn, err := client.conn()
|
|
if err != nil {
|
|
setCmdsErr(cmds, err)
|
|
retErr = err
|
|
continue
|
|
}
|
|
|
|
failedCmds, err = c.execClusterCmds(cn, cmds, failedCmds)
|
|
if err != nil {
|
|
retErr = err
|
|
}
|
|
client.putConn(cn, err, false)
|
|
}
|
|
|
|
cmdsMap = failedCmds
|
|
}
|
|
|
|
return retErr
|
|
}
|
|
|
|
func (c *ClusterClient) execClusterCmds(
|
|
cn *pool.Conn, cmds []Cmder, failedCmds map[string][]Cmder,
|
|
) (map[string][]Cmder, error) {
|
|
if err := writeCmd(cn, cmds...); err != nil {
|
|
setCmdsErr(cmds, err)
|
|
return failedCmds, err
|
|
}
|
|
|
|
var firstCmdErr error
|
|
for i, cmd := range cmds {
|
|
err := cmd.readReply(cn)
|
|
if err == nil {
|
|
continue
|
|
}
|
|
if isNetworkError(err) {
|
|
cmd.reset()
|
|
failedCmds[""] = append(failedCmds[""], cmds[i:]...)
|
|
break
|
|
} else if moved, ask, addr := isMovedError(err); moved {
|
|
c.lazyReloadSlots()
|
|
cmd.reset()
|
|
failedCmds[addr] = append(failedCmds[addr], cmd)
|
|
} else if ask {
|
|
cmd.reset()
|
|
failedCmds[addr] = append(failedCmds[addr], NewCmd("ASKING"), cmd)
|
|
} else if firstCmdErr == nil {
|
|
firstCmdErr = err
|
|
}
|
|
}
|
|
|
|
return failedCmds, firstCmdErr
|
|
}
|
|
|
|
//------------------------------------------------------------------------------
|
|
|
|
// ClusterOptions are used to configure a cluster client and should be
|
|
// passed to NewClusterClient.
|
|
type ClusterOptions struct {
|
|
// A seed list of host:port addresses of cluster nodes.
|
|
Addrs []string
|
|
|
|
// The maximum number of retries before giving up. Command is retried
|
|
// on network errors and MOVED/ASK redirects.
|
|
// Default is 16.
|
|
MaxRedirects int
|
|
|
|
// Following options are copied from Options struct.
|
|
|
|
Password string
|
|
|
|
DialTimeout time.Duration
|
|
ReadTimeout time.Duration
|
|
WriteTimeout time.Duration
|
|
|
|
// PoolSize applies per cluster node and not for the whole cluster.
|
|
PoolSize int
|
|
PoolTimeout time.Duration
|
|
IdleTimeout time.Duration
|
|
IdleCheckFrequency time.Duration
|
|
}
|
|
|
|
func (opt *ClusterOptions) getMaxRedirects() int {
|
|
if opt.MaxRedirects == -1 {
|
|
return 0
|
|
}
|
|
if opt.MaxRedirects == 0 {
|
|
return 16
|
|
}
|
|
return opt.MaxRedirects
|
|
}
|
|
|
|
func (opt *ClusterOptions) clientOptions() *Options {
|
|
return &Options{
|
|
Password: opt.Password,
|
|
|
|
DialTimeout: opt.DialTimeout,
|
|
ReadTimeout: opt.ReadTimeout,
|
|
WriteTimeout: opt.WriteTimeout,
|
|
|
|
PoolSize: opt.PoolSize,
|
|
PoolTimeout: opt.PoolTimeout,
|
|
IdleTimeout: opt.IdleTimeout,
|
|
// IdleCheckFrequency is not copied to disable reaper
|
|
}
|
|
}
|