2022-10-11 15:37:34 +03:00
|
|
|
package redisotel
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
|
|
|
"net"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/go-redis/redis/v9"
|
|
|
|
"go.opentelemetry.io/otel"
|
|
|
|
"go.opentelemetry.io/otel/attribute"
|
|
|
|
"go.opentelemetry.io/otel/metric"
|
|
|
|
"go.opentelemetry.io/otel/metric/instrument"
|
2022-11-18 16:32:17 +03:00
|
|
|
"go.opentelemetry.io/otel/metric/instrument/syncfloat64"
|
2022-10-11 15:37:34 +03:00
|
|
|
)
|
|
|
|
|
|
|
|
// InstrumentMetrics starts reporting OpenTelemetry Metrics.
|
|
|
|
//
|
|
|
|
// Based on https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/metrics/semantic_conventions/database-metrics.md
|
|
|
|
func InstrumentMetrics(rdb redis.UniversalClient, opts ...MetricsOption) error {
|
|
|
|
baseOpts := make([]baseOption, len(opts))
|
|
|
|
for i, opt := range opts {
|
|
|
|
baseOpts[i] = opt
|
|
|
|
}
|
|
|
|
conf := newConfig(baseOpts...)
|
|
|
|
|
|
|
|
if conf.meter == nil {
|
|
|
|
conf.meter = conf.mp.Meter(
|
|
|
|
instrumName,
|
|
|
|
metric.WithInstrumentationVersion("semver:"+redis.Version()),
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
|
|
|
switch rdb := rdb.(type) {
|
|
|
|
case *redis.Client:
|
|
|
|
if conf.poolName == "" {
|
|
|
|
opt := rdb.Options()
|
|
|
|
conf.poolName = opt.Addr
|
|
|
|
}
|
|
|
|
conf.attrs = append(conf.attrs, attribute.String("pool.name", conf.poolName))
|
|
|
|
|
|
|
|
if err := reportPoolStats(rdb, conf); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err := addMetricsHook(rdb, conf); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
case *redis.ClusterClient:
|
|
|
|
rdb.OnNewNode(func(rdb *redis.Client) {
|
|
|
|
if conf.poolName == "" {
|
|
|
|
opt := rdb.Options()
|
|
|
|
conf.poolName = opt.Addr
|
|
|
|
}
|
|
|
|
conf.attrs = append(conf.attrs, attribute.String("pool.name", conf.poolName))
|
|
|
|
|
|
|
|
if err := reportPoolStats(rdb, conf); err != nil {
|
|
|
|
otel.Handle(err)
|
|
|
|
}
|
|
|
|
if err := addMetricsHook(rdb, conf); err != nil {
|
|
|
|
otel.Handle(err)
|
|
|
|
}
|
|
|
|
})
|
|
|
|
return nil
|
|
|
|
case *redis.Ring:
|
|
|
|
rdb.OnNewNode(func(rdb *redis.Client) {
|
2022-11-18 16:32:17 +03:00
|
|
|
if conf.poolName == "" {
|
|
|
|
opt := rdb.Options()
|
|
|
|
conf.poolName = opt.Addr
|
|
|
|
}
|
|
|
|
conf.attrs = append(conf.attrs, attribute.String("pool.name", conf.poolName))
|
|
|
|
|
2022-10-11 15:37:34 +03:00
|
|
|
if err := reportPoolStats(rdb, conf); err != nil {
|
|
|
|
otel.Handle(err)
|
|
|
|
}
|
|
|
|
if err := addMetricsHook(rdb, conf); err != nil {
|
|
|
|
otel.Handle(err)
|
|
|
|
}
|
|
|
|
})
|
|
|
|
return nil
|
|
|
|
default:
|
|
|
|
return fmt.Errorf("redisotel: %T not supported", rdb)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func reportPoolStats(rdb *redis.Client, conf *config) error {
|
|
|
|
labels := conf.attrs
|
|
|
|
idleAttrs := append(labels, attribute.String("state", "idle"))
|
|
|
|
usedAttrs := append(labels, attribute.String("state", "used"))
|
|
|
|
|
2022-11-17 17:24:16 +03:00
|
|
|
idleMax, err := conf.meter.AsyncInt64().UpDownCounter(
|
|
|
|
"db.client.connections.idle.max",
|
|
|
|
instrument.WithDescription("The maximum number of idle open connections allowed"),
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
idleMin, err := conf.meter.AsyncInt64().UpDownCounter(
|
|
|
|
"db.client.connections.idle.min",
|
|
|
|
instrument.WithDescription("The minimum number of idle open connections allowed"),
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
connsMax, err := conf.meter.AsyncInt64().UpDownCounter(
|
|
|
|
"db.client.connections.max",
|
|
|
|
instrument.WithDescription("The maximum number of open connections allowed"),
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2022-10-11 15:37:34 +03:00
|
|
|
usage, err := conf.meter.AsyncInt64().UpDownCounter(
|
|
|
|
"db.client.connections.usage",
|
|
|
|
instrument.WithDescription("The number of connections that are currently in state described by the state attribute"),
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
timeouts, err := conf.meter.AsyncInt64().UpDownCounter(
|
|
|
|
"db.client.connections.timeouts",
|
|
|
|
instrument.WithDescription("The number of connection timeouts that have occurred trying to obtain a connection from the pool"),
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2022-11-17 17:24:16 +03:00
|
|
|
redisConf := rdb.Options()
|
2022-10-11 15:37:34 +03:00
|
|
|
return conf.meter.RegisterCallback(
|
|
|
|
[]instrument.Asynchronous{
|
2022-11-17 17:24:16 +03:00
|
|
|
idleMax,
|
|
|
|
idleMin,
|
|
|
|
connsMax,
|
2022-10-11 15:37:34 +03:00
|
|
|
usage,
|
|
|
|
timeouts,
|
|
|
|
},
|
|
|
|
func(ctx context.Context) {
|
|
|
|
stats := rdb.PoolStats()
|
|
|
|
|
2022-11-18 16:32:17 +03:00
|
|
|
idleMax.Observe(ctx, int64(redisConf.MaxIdleConns), labels...)
|
|
|
|
idleMin.Observe(ctx, int64(redisConf.MinIdleConns), labels...)
|
|
|
|
connsMax.Observe(ctx, int64(redisConf.PoolSize), labels...)
|
2022-11-17 17:24:16 +03:00
|
|
|
|
2022-10-11 15:37:34 +03:00
|
|
|
usage.Observe(ctx, int64(stats.IdleConns), idleAttrs...)
|
|
|
|
usage.Observe(ctx, int64(stats.TotalConns-stats.IdleConns), usedAttrs...)
|
|
|
|
|
|
|
|
timeouts.Observe(ctx, int64(stats.Timeouts), labels...)
|
|
|
|
},
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
|
|
|
func addMetricsHook(rdb *redis.Client, conf *config) error {
|
2022-11-18 16:32:17 +03:00
|
|
|
createTime, err := conf.meter.SyncFloat64().Histogram(
|
2022-10-11 15:37:34 +03:00
|
|
|
"db.client.connections.create_time",
|
|
|
|
instrument.WithDescription("The time it took to create a new connection."),
|
|
|
|
instrument.WithUnit("ms"),
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2022-11-18 16:32:17 +03:00
|
|
|
useTime, err := conf.meter.SyncFloat64().Histogram(
|
2022-10-11 15:37:34 +03:00
|
|
|
"db.client.connections.use_time",
|
|
|
|
instrument.WithDescription("The time between borrowing a connection and returning it to the pool."),
|
|
|
|
instrument.WithUnit("ms"),
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
rdb.AddHook(&metricsHook{
|
|
|
|
createTime: createTime,
|
|
|
|
useTime: useTime,
|
2022-11-18 16:32:17 +03:00
|
|
|
attrs: conf.attrs,
|
2022-10-11 15:37:34 +03:00
|
|
|
})
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
type metricsHook struct {
|
2022-11-18 16:32:17 +03:00
|
|
|
createTime syncfloat64.Histogram
|
|
|
|
useTime syncfloat64.Histogram
|
|
|
|
attrs []attribute.KeyValue
|
2022-10-11 15:37:34 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
var _ redis.Hook = (*metricsHook)(nil)
|
|
|
|
|
|
|
|
func (mh *metricsHook) DialHook(hook redis.DialHook) redis.DialHook {
|
|
|
|
return func(ctx context.Context, network, addr string) (net.Conn, error) {
|
|
|
|
start := time.Now()
|
|
|
|
|
|
|
|
conn, err := hook(ctx, network, addr)
|
|
|
|
|
2022-12-23 15:40:07 +03:00
|
|
|
attrs := make([]attribute.KeyValue, 0, len(mh.attrs)+1)
|
|
|
|
attrs = append(attrs, mh.attrs...)
|
|
|
|
attrs = append(attrs, statusAttr(err))
|
|
|
|
|
|
|
|
mh.createTime.Record(ctx, milliseconds(time.Since(start)), attrs...)
|
2022-10-11 15:37:34 +03:00
|
|
|
return conn, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (mh *metricsHook) ProcessHook(hook redis.ProcessHook) redis.ProcessHook {
|
|
|
|
return func(ctx context.Context, cmd redis.Cmder) error {
|
|
|
|
start := time.Now()
|
|
|
|
|
|
|
|
err := hook(ctx, cmd)
|
|
|
|
|
2022-11-18 16:32:17 +03:00
|
|
|
dur := time.Since(start)
|
|
|
|
|
|
|
|
attrs := make([]attribute.KeyValue, 0, len(mh.attrs)+2)
|
|
|
|
attrs = append(attrs, mh.attrs...)
|
|
|
|
attrs = append(attrs, attribute.String("type", "command"))
|
|
|
|
attrs = append(attrs, statusAttr(err))
|
|
|
|
|
|
|
|
mh.useTime.Record(ctx, milliseconds(dur), attrs...)
|
2022-10-11 15:37:34 +03:00
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (mh *metricsHook) ProcessPipelineHook(
|
|
|
|
hook redis.ProcessPipelineHook,
|
|
|
|
) redis.ProcessPipelineHook {
|
|
|
|
return func(ctx context.Context, cmds []redis.Cmder) error {
|
|
|
|
start := time.Now()
|
|
|
|
|
|
|
|
err := hook(ctx, cmds)
|
|
|
|
|
2022-11-18 16:32:17 +03:00
|
|
|
dur := time.Since(start)
|
|
|
|
|
|
|
|
attrs := make([]attribute.KeyValue, 0, len(mh.attrs)+2)
|
|
|
|
attrs = append(attrs, mh.attrs...)
|
|
|
|
attrs = append(attrs, attribute.String("type", "pipeline"))
|
|
|
|
attrs = append(attrs, statusAttr(err))
|
|
|
|
|
|
|
|
mh.useTime.Record(ctx, milliseconds(dur), attrs...)
|
2022-10-11 15:37:34 +03:00
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-11-18 16:32:17 +03:00
|
|
|
func milliseconds(d time.Duration) float64 {
|
|
|
|
return float64(d) / float64(time.Millisecond)
|
|
|
|
}
|
|
|
|
|
2022-10-11 15:37:34 +03:00
|
|
|
func statusAttr(err error) attribute.KeyValue {
|
|
|
|
if err != nil {
|
|
|
|
return attribute.String("status", "error")
|
|
|
|
}
|
|
|
|
return attribute.String("status", "ok")
|
|
|
|
}
|