redis/ring.go

421 lines
8.6 KiB
Go
Raw Normal View History

2015-05-25 16:22:27 +03:00
package redis
import (
"errors"
"fmt"
"math/rand"
"strconv"
2015-05-25 16:22:27 +03:00
"sync"
"sync/atomic"
2015-05-25 16:22:27 +03:00
"time"
2016-10-09 13:49:28 +03:00
"gopkg.in/redis.v5/internal"
"gopkg.in/redis.v5/internal/consistenthash"
"gopkg.in/redis.v5/internal/hashtag"
"gopkg.in/redis.v5/internal/pool"
2015-05-25 16:22:27 +03:00
)
2016-08-09 16:32:08 +03:00
// errRingShardsDown is returned by shardByKey when the consistent hash
// yields no shard name for a key.
var errRingShardsDown = errors.New("redis: all ring shards are down")
2015-05-25 16:22:27 +03:00
// RingOptions are used to configure a ring client and should be
// passed to NewRing.
type RingOptions struct {
	// Addrs maps a shard name to the host:port address of that shard.
	Addrs map[string]string

	// HeartbeatFrequency is how often PING commands are sent to check
	// shard availability. A shard is considered down after 3 subsequent
	// failed checks. A zero value is replaced by a default in init.
	HeartbeatFrequency time.Duration

	// The following options are copied from the Options struct.

	// DB is the database number passed to every shard client.
	DB int
	// Password is the password passed to every shard client.
	Password string

	// MaxRetries is the number of additional attempts pipelineExec makes
	// for commands that failed with a retryable error.
	MaxRetries int

	DialTimeout  time.Duration
	ReadTimeout  time.Duration
	WriteTimeout time.Duration

	PoolSize           int
	PoolTimeout        time.Duration
	IdleTimeout        time.Duration
	IdleCheckFrequency time.Duration
}
2016-08-09 16:32:08 +03:00
// init fills in defaults for options that were left at their zero value.
// Currently only HeartbeatFrequency has a default (500ms).
func (opt *RingOptions) init() {
	const defaultHeartbeat = 500 * time.Millisecond

	if opt.HeartbeatFrequency != 0 {
		return
	}
	opt.HeartbeatFrequency = defaultHeartbeat
}
2016-06-05 14:10:30 +03:00
2015-05-25 16:22:27 +03:00
func (opt *RingOptions) clientOptions() *Options {
return &Options{
DB: opt.DB,
Password: opt.Password,
DialTimeout: opt.DialTimeout,
ReadTimeout: opt.ReadTimeout,
WriteTimeout: opt.WriteTimeout,
2016-03-17 19:00:47 +03:00
PoolSize: opt.PoolSize,
PoolTimeout: opt.PoolTimeout,
IdleTimeout: opt.IdleTimeout,
IdleCheckFrequency: opt.IdleCheckFrequency,
2015-05-25 16:22:27 +03:00
}
}
type ringShard struct {
Client *Client
down int32
2015-05-25 16:22:27 +03:00
}
// String describes the shard as "<client> is up" or "<client> is down".
func (shard *ringShard) String() string {
	state := "down"
	if shard.IsUp() {
		state = "up"
	}
	return fmt.Sprintf("%s is %s", shard.Client, state)
}
func (shard *ringShard) IsDown() bool {
2016-08-09 16:32:08 +03:00
const threshold = 3
return atomic.LoadInt32(&shard.down) >= threshold
2015-05-25 16:22:27 +03:00
}
// IsUp reports whether the shard is not considered down.
func (shard *ringShard) IsUp() bool {
	down := shard.IsDown()
	return !down
}
// Vote votes to set shard state and returns true if state was changed.
func (shard *ringShard) Vote(up bool) bool {
if up {
changed := shard.IsDown()
atomic.StoreInt32(&shard.down, 0)
2015-05-25 16:22:27 +03:00
return changed
}
if shard.IsDown() {
return false
}
atomic.AddInt32(&shard.down, 1)
2015-05-25 16:22:27 +03:00
return shard.IsDown()
}
// Ring is a Redis client that uses constistent hashing to distribute
2015-09-12 09:36:03 +03:00
// keys across multiple Redis servers (shards). It's safe for
// concurrent use by multiple goroutines.
2015-05-25 16:22:27 +03:00
//
2015-11-21 11:20:01 +03:00
// Ring monitors the state of each shard and removes dead shards from
2016-07-02 11:07:27 +03:00
// the ring. When shard comes online it is added back to the ring. This
2015-05-25 16:22:27 +03:00
// gives you maximum availability and partition tolerance, but no
// consistency between different shards or even clients. Each client
// uses shards that are available to the client and does not do any
// coordination when shard state is changed.
//
2016-08-09 16:32:08 +03:00
// Ring should be used when you need multiple Redis servers for caching
2015-05-25 16:22:27 +03:00
// and can tolerate losing data when one of the servers dies.
// Otherwise you should use Redis Cluster.
type Ring struct {
cmdable
2015-05-25 16:22:27 +03:00
2015-06-04 11:50:24 +03:00
opt *RingOptions
2015-05-25 16:22:27 +03:00
nreplicas int
mu sync.RWMutex
2015-05-25 16:22:27 +03:00
hash *consistenthash.Map
shards map[string]*ringShard
cmdsInfoOnce *sync.Once
cmdsInfo map[string]*CommandInfo
2015-05-25 16:22:27 +03:00
closed bool
}
func NewRing(opt *RingOptions) *Ring {
const nreplicas = 100
2016-06-05 14:10:30 +03:00
opt.init()
2015-05-25 16:22:27 +03:00
ring := &Ring{
2015-06-04 11:50:24 +03:00
opt: opt,
2015-05-25 16:22:27 +03:00
nreplicas: nreplicas,
2015-06-04 11:50:24 +03:00
hash: consistenthash.New(nreplicas, nil),
shards: make(map[string]*ringShard),
cmdsInfoOnce: new(sync.Once),
2015-05-25 16:22:27 +03:00
}
ring.cmdable.process = ring.Process
2015-05-25 16:22:27 +03:00
for name, addr := range opt.Addrs {
clopt := opt.clientOptions()
clopt.Addr = addr
ring.addClient(name, NewClient(clopt))
}
go ring.heartbeat()
return ring
}
// PoolStats returns accumulated connection pool stats.
//
// The shard map is read under c.mu so that the call does not race with
// addClient or Close, which modify it under the same lock.
func (c *Ring) PoolStats() *PoolStats {
	c.mu.RLock()
	defer c.mu.RUnlock()

	var acc PoolStats
	for _, shard := range c.shards {
		s := shard.Client.connPool.Stats()
		acc.Requests += s.Requests
		acc.Hits += s.Hits
		acc.Timeouts += s.Timeouts
		acc.TotalConns += s.TotalConns
		acc.FreeConns += s.FreeConns
	}
	return &acc
}
// ForEachShard concurrently calls the fn on each live shard in the ring.
// It waits for all calls to finish and returns one of the errors, if any
// (the first one to be reported; the rest are dropped).
//
// The set of live shards is snapshotted under c.mu so the shard map is not
// read while addClient or Close modify it. fn runs outside the lock, so it
// may itself call methods on the ring.
func (c *Ring) ForEachShard(fn func(client *Client) error) error {
	c.mu.RLock()
	live := make([]*ringShard, 0, len(c.shards))
	for _, shard := range c.shards {
		if shard.IsUp() {
			live = append(live, shard)
		}
	}
	c.mu.RUnlock()

	var wg sync.WaitGroup
	// Buffer of one: keep a single error without blocking the senders.
	errCh := make(chan error, 1)
	for _, shard := range live {
		wg.Add(1)
		go func(shard *ringShard) {
			defer wg.Done()
			if err := fn(shard.Client); err != nil {
				select {
				case errCh <- err:
				default:
				}
			}
		}(shard)
	}
	wg.Wait()

	select {
	case err := <-errCh:
		return err
	default:
		return nil
	}
}
// cmdInfo returns the cached CommandInfo for the named command, or nil if
// the command table is not available or has no such entry.
//
// On first use the table is fetched from the first shard that answers the
// COMMAND request. If no shard answers, a fresh sync.Once is installed so
// that a later call tries again.
func (c *Ring) cmdInfo(name string) *CommandInfo {
	c.cmdsInfoOnce.Do(func() {
		for _, shard := range c.shards {
			if infos, err := shard.Client.Command().Result(); err == nil {
				c.cmdsInfo = infos
				return
			}
		}
		// Nothing was loaded: re-arm so the next call retries.
		c.cmdsInfoOnce = &sync.Once{}
	})

	if infos := c.cmdsInfo; infos != nil {
		return infos[name]
	}
	return nil
}
func (c *Ring) addClient(name string, cl *Client) {
c.mu.Lock()
c.hash.Add(name)
c.shards[name] = &ringShard{Client: cl}
c.mu.Unlock()
2015-05-25 16:22:27 +03:00
}
func (c *Ring) shardByKey(key string) (*ringShard, error) {
key = hashtag.Key(key)
c.mu.RLock()
2015-05-25 16:22:27 +03:00
if c.closed {
c.mu.RUnlock()
return nil, pool.ErrClosed
2015-05-25 16:22:27 +03:00
}
name := c.hash.Get(key)
2015-05-25 16:22:27 +03:00
if name == "" {
c.mu.RUnlock()
2015-05-25 16:22:27 +03:00
return nil, errRingShardsDown
}
shard := c.shards[name]
c.mu.RUnlock()
return shard, nil
2015-05-25 16:22:27 +03:00
}
// randomShard picks a shard by hashing a random integer rendered as a
// decimal string; errors are those of shardByKey.
func (c *Ring) randomShard() (*ringShard, error) {
	key := strconv.Itoa(rand.Int())
	return c.shardByKey(key)
}
// shardByName returns the shard registered under name. An empty name
// selects a random shard.
//
// It returns pool.ErrClosed if the ring is closed and an error if no shard
// is registered under name, so that callers never receive a nil shard
// together with a nil error.
func (c *Ring) shardByName(name string) (*ringShard, error) {
	if name == "" {
		return c.randomShard()
	}

	c.mu.RLock()
	closed := c.closed
	shard := c.shards[name]
	c.mu.RUnlock()

	if closed {
		return nil, pool.ErrClosed
	}
	if shard == nil {
		return nil, fmt.Errorf("redis: ring shard %q is not registered", name)
	}
	return shard, nil
}
func (c *Ring) cmdShard(cmd Cmder) (*ringShard, error) {
2017-01-13 14:39:59 +03:00
cmdInfo := c.cmdInfo(cmd.name())
firstKey := cmd.arg(cmdFirstKeyPos(cmd, cmdInfo))
return c.shardByKey(firstKey)
}
func (c *Ring) Process(cmd Cmder) error {
shard, err := c.cmdShard(cmd)
2015-05-25 16:22:27 +03:00
if err != nil {
cmd.setErr(err)
2016-06-17 15:09:38 +03:00
return err
2015-05-25 16:22:27 +03:00
}
return shard.Client.Process(cmd)
2015-05-25 16:22:27 +03:00
}
// rebalance removes dead shards from the Ring.
func (c *Ring) rebalance() {
hash := consistenthash.New(c.nreplicas, nil)
for name, shard := range c.shards {
2015-05-25 16:22:27 +03:00
if shard.IsUp() {
hash.Add(name)
2015-05-25 16:22:27 +03:00
}
}
c.mu.Lock()
c.hash = hash
c.mu.Unlock()
2015-05-25 16:22:27 +03:00
}
2016-07-02 11:07:27 +03:00
// heartbeat monitors state of each shard in the ring.
func (c *Ring) heartbeat() {
2016-08-09 16:32:08 +03:00
ticker := time.NewTicker(c.opt.HeartbeatFrequency)
2015-05-25 16:22:27 +03:00
defer ticker.Stop()
for _ = range ticker.C {
var rebalance bool
c.mu.RLock()
2015-05-25 16:22:27 +03:00
if c.closed {
c.mu.RUnlock()
2015-05-25 16:22:27 +03:00
break
}
for _, shard := range c.shards {
2015-05-25 16:22:27 +03:00
err := shard.Client.Ping().Err()
if shard.Vote(err == nil || err == pool.ErrPoolTimeout) {
2016-04-09 14:52:01 +03:00
internal.Logf("ring shard state changed: %s", shard)
2015-05-25 16:22:27 +03:00
rebalance = true
}
}
c.mu.RUnlock()
2015-05-25 16:22:27 +03:00
if rebalance {
c.rebalance()
2015-05-25 16:22:27 +03:00
}
}
}
// Close closes the ring client, releasing any open resources.
//
2015-09-12 09:36:03 +03:00
// It is rare to Close a Ring, as the Ring is meant to be long-lived
// and shared between many goroutines.
func (c *Ring) Close() error {
c.mu.Lock()
2017-01-28 11:53:10 +03:00
defer c.mu.Unlock()
2015-05-25 16:22:27 +03:00
if c.closed {
2015-05-25 16:22:27 +03:00
return nil
}
c.closed = true
2015-05-25 16:22:27 +03:00
var firstErr error
for _, shard := range c.shards {
if err := shard.Client.Close(); err != nil && firstErr == nil {
firstErr = err
2015-05-25 16:22:27 +03:00
}
}
c.hash = nil
c.shards = nil
2015-05-25 16:22:27 +03:00
return firstErr
2015-05-25 16:22:27 +03:00
}
2015-06-04 11:50:24 +03:00
func (c *Ring) Pipeline() *Pipeline {
pipe := Pipeline{
exec: c.pipelineExec,
2015-06-04 11:50:24 +03:00
}
pipe.cmdable.process = pipe.Process
pipe.statefulCmdable.process = pipe.Process
return &pipe
2015-06-04 11:50:24 +03:00
}
func (c *Ring) Pipelined(fn func(*Pipeline) error) ([]Cmder, error) {
return c.Pipeline().pipelined(fn)
2015-06-04 11:50:24 +03:00
}
func (c *Ring) pipelineExec(cmds []Cmder) (firstErr error) {
2015-06-04 11:50:24 +03:00
cmdsMap := make(map[string][]Cmder)
for _, cmd := range cmds {
2017-01-13 14:39:59 +03:00
cmdInfo := c.cmdInfo(cmd.name())
name := cmd.arg(cmdFirstKeyPos(cmd, cmdInfo))
if name != "" {
name = c.hash.Get(hashtag.Key(name))
}
2015-06-04 11:50:24 +03:00
cmdsMap[name] = append(cmdsMap[name], cmd)
}
for i := 0; i <= c.opt.MaxRetries; i++ {
var failedCmdsMap map[string][]Cmder
2015-06-04 11:50:24 +03:00
for name, cmds := range cmdsMap {
shard, err := c.shardByName(name)
if err != nil {
setCmdsErr(cmds, err)
if firstErr == nil {
firstErr = err
}
continue
}
cn, _, err := shard.Client.conn()
2015-06-04 11:50:24 +03:00
if err != nil {
setCmdsErr(cmds, err)
if firstErr == nil {
firstErr = err
2015-06-04 11:50:24 +03:00
}
continue
}
2016-12-13 18:28:39 +03:00
canRetry, err := shard.Client.pipelineProcessCmds(cn, cmds)
shard.Client.putConn(cn, err, false)
if err == nil {
continue
2015-06-04 11:50:24 +03:00
}
if firstErr == nil {
firstErr = err
}
2016-12-13 18:28:39 +03:00
if canRetry && internal.IsRetryableError(err) {
if failedCmdsMap == nil {
failedCmdsMap = make(map[string][]Cmder)
}
failedCmdsMap[name] = cmds
2015-06-04 11:50:24 +03:00
}
}
if len(failedCmdsMap) == 0 {
break
}
cmdsMap = failedCmdsMap
}
return firstErr
2015-06-04 11:50:24 +03:00
}