Skip to content

Commit

Permalink
Add native histogram support to remaining histograms
Browse files Browse the repository at this point in the history
  • Loading branch information
zalegrala committed Jul 19, 2024
1 parent 25abbc5 commit ce2a279
Show file tree
Hide file tree
Showing 11 changed files with 77 additions and 42 deletions.
11 changes: 7 additions & 4 deletions modules/distributor/distributor.go
Original file line number Diff line number Diff line change
Expand Up @@ -91,10 +91,13 @@ var (
Help: "The total number of proto bytes received per tenant",
}, []string{"tenant"})
metricTracesPerBatch = promauto.NewHistogram(prometheus.HistogramOpts{
Namespace: "tempo",
Name: "distributor_traces_per_batch",
Help: "The number of traces in each batch",
Buckets: prometheus.ExponentialBuckets(2, 2, 10),
Namespace: "tempo",
Name: "distributor_traces_per_batch",
Help: "The number of traces in each batch",
Buckets: prometheus.ExponentialBuckets(2, 2, 10),
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
})
metricIngesterClients = promauto.NewGauge(prometheus.GaugeOpts{
Namespace: "tempo",
Expand Down
11 changes: 7 additions & 4 deletions modules/distributor/receiver/shim.go
Original file line number Diff line number Diff line change
Expand Up @@ -49,10 +49,13 @@ const (

var (
metricPushDuration = promauto.NewHistogram(prom_client.HistogramOpts{
Namespace: "tempo",
Name: "distributor_push_duration_seconds",
Help: "Records the amount of time to push a batch to the ingester.",
Buckets: prom_client.DefBuckets,
Namespace: "tempo",
Name: "distributor_push_duration_seconds",
Help: "Records the amount of time to push a batch to the ingester.",
Buckets: prom_client.DefBuckets,
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
})

statReceiverOtlp = usagestats.NewInt("receiver_enabled_otlp")
Expand Down
12 changes: 8 additions & 4 deletions modules/frontend/pipeline/sync_handler_retry.go
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ import (
"io"
"net/http"
"strings"
"time"

"github.com/grafana/dskit/httpgrpc"
"github.com/grafana/tempo/modules/frontend/queue"
Expand All @@ -18,10 +19,13 @@ import (

func NewRetryWare(maxRetries int, registerer prometheus.Registerer) Middleware {
retriesCount := promauto.With(registerer).NewHistogram(prometheus.HistogramOpts{
Namespace: "tempo",
Name: "query_frontend_retries",
Help: "Number of times a request is retried.",
Buckets: []float64{0, 1, 2, 3, 4, 5},
Namespace: "tempo",
Name: "query_frontend_retries",
Help: "Number of times a request is retried.",
Buckets: []float64{0, 1, 2, 3, 4, 5},
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
})

return MiddlewareFunc(func(next http.RoundTripper) http.RoundTripper {
Expand Down
11 changes: 7 additions & 4 deletions modules/frontend/slos.go
Original file line number Diff line number Diff line change
Expand Up @@ -44,10 +44,13 @@ var (
metricsCounter = queriesPerTenant.MustCurryWith(prometheus.Labels{"op": metricsOp})

queryThroughput = promauto.NewHistogramVec(prometheus.HistogramOpts{
Namespace: "tempo",
Name: "query_frontend_bytes_processed_per_second",
Help: "Bytes processed per second in the query per tenant",
Buckets: prometheus.ExponentialBuckets(8*1024*1024, 2, 12), // from 8MB up to 16GB
Namespace: "tempo",
Name: "query_frontend_bytes_processed_per_second",
Help: "Bytes processed per second in the query per tenant",
Buckets: prometheus.ExponentialBuckets(8*1024*1024, 2, 12), // from 8MB up to 16GB
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
}, []string{"tenant", "op"})

searchThroughput = queryThroughput.MustCurryWith(prometheus.Labels{"op": searchOp})
Expand Down
9 changes: 6 additions & 3 deletions modules/frontend/v1/frontend.go
Original file line number Diff line number Diff line change
Expand Up @@ -100,9 +100,12 @@ func New(cfg Config, limits Limits, log log.Logger, registerer prometheus.Regist
Help: "Total number of query requests discarded.",
}, []string{"user"}),
queueDuration: promauto.With(registerer).NewHistogram(prometheus.HistogramOpts{
Name: "tempo_query_frontend_queue_duration_seconds",
Help: "Time spend by requests queued.",
Buckets: prometheus.DefBuckets,
Name: "tempo_query_frontend_queue_duration_seconds",
Help: "Time spend by requests queued.",
Buckets: prometheus.DefBuckets,
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
}),
actualBatchSize: promauto.With(registerer).NewHistogram(prometheus.HistogramOpts{
Name: "tempo_query_frontend_actual_batch_size",
Expand Down
11 changes: 7 additions & 4 deletions modules/ingester/flush.go
Original file line number Diff line number Diff line change
Expand Up @@ -45,10 +45,13 @@ var (
Help: "The total number of failed retries after a failed flush",
})
metricFlushDuration = promauto.NewHistogram(prometheus.HistogramOpts{
Namespace: "tempo",
Name: "ingester_flush_duration_seconds",
Help: "Records the amount of time to flush a complete block.",
Buckets: prometheus.ExponentialBuckets(1, 2, 10),
Namespace: "tempo",
Name: "ingester_flush_duration_seconds",
Help: "Records the amount of time to flush a complete block.",
Buckets: prometheus.ExponentialBuckets(1, 2, 10),
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
})
metricFlushSize = promauto.NewHistogram(prometheus.HistogramOpts{
Namespace: "tempo",
Expand Down
11 changes: 7 additions & 4 deletions modules/querier/external/client.go
Original file line number Diff line number Diff line change
Expand Up @@ -21,10 +21,13 @@ import (

var (
metricEndpointDuration = promauto.NewHistogramVec(prometheus.HistogramOpts{
Namespace: "tempo",
Name: "querier_external_endpoint_duration_seconds",
Help: "The duration of the external endpoints.",
Buckets: prometheus.DefBuckets,
Namespace: "tempo",
Name: "querier_external_endpoint_duration_seconds",
Help: "The duration of the external endpoints.",
Buckets: prometheus.DefBuckets,
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
}, []string{"endpoint"})
metricExternalHedgedRequests = promauto.NewGauge(
prometheus.GaugeOpts{
Expand Down
7 changes: 5 additions & 2 deletions pkg/cache/memcached.go
Original file line number Diff line number Diff line change
Expand Up @@ -60,8 +60,11 @@ func NewMemcached(cfg MemcachedConfig, client MemcachedClient, name string, reg
Name: "memcache_request_duration_seconds",
Help: "Total time spent in seconds doing memcache requests.",
// Memcached requests are very quick: smallest bucket is 16us, biggest is 1s
Buckets: prometheus.ExponentialBuckets(0.000016, 4, 8),
ConstLabels: prometheus.Labels{"name": name},
Buckets: prometheus.ExponentialBuckets(0.000016, 4, 8),
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
ConstLabels: prometheus.Labels{"name": name},
}, []string{"method", "status_code"}),
),
}
Expand Down
14 changes: 9 additions & 5 deletions pkg/cache/redis_cache.go
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@ package cache

import (
"context"
"time"

"github.com/go-kit/log"
"github.com/go-kit/log/level"
Expand Down Expand Up @@ -31,11 +32,14 @@ func NewRedisCache(name string, redisClient *RedisClient, reg prometheus.Registe
logger: logger,
requestDuration: instr.NewHistogramCollector(
promauto.With(reg).NewHistogramVec(prometheus.HistogramOpts{
Namespace: "tempo",
Name: "rediscache_request_duration_seconds",
Help: "Total time spent in seconds doing Redis requests.",
Buckets: prometheus.ExponentialBuckets(0.000016, 4, 8),
ConstLabels: prometheus.Labels{"name": name},
Namespace: "tempo",
Name: "rediscache_request_duration_seconds",
Help: "Total time spent in seconds doing Redis requests.",
Buckets: prometheus.ExponentialBuckets(0.000016, 4, 8),
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
ConstLabels: prometheus.Labels{"name": name},
}, []string{"method", "status_code"}),
),
}
Expand Down
11 changes: 7 additions & 4 deletions tempodb/backend/instrumentation/backend_transports.go
Original file line number Diff line number Diff line change
Expand Up @@ -10,10 +10,13 @@ import (
)

var requestDuration = promauto.NewHistogramVec(prometheus.HistogramOpts{
Namespace: "tempodb",
Name: "backend_request_duration_seconds",
Help: "Time spent doing backend storage requests.",
Buckets: prometheus.ExponentialBuckets(0.005, 4, 6),
Namespace: "tempodb",
Name: "backend_request_duration_seconds",
Help: "Time spent doing backend storage requests.",
Buckets: prometheus.ExponentialBuckets(0.005, 4, 6),
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
}, []string{"operation", "status_code"})

type instrumentedTransport struct {
Expand Down
11 changes: 7 additions & 4 deletions tempodb/tempodb.go
Original file line number Diff line number Diff line change
Expand Up @@ -45,10 +45,13 @@ const (

var (
metricRetentionDuration = promauto.NewHistogram(prometheus.HistogramOpts{
Namespace: "tempodb",
Name: "retention_duration_seconds",
Help: "Records the amount of time to perform retention tasks.",
Buckets: prometheus.ExponentialBuckets(.25, 2, 6),
Namespace: "tempodb",
Name: "retention_duration_seconds",
Help: "Records the amount of time to perform retention tasks.",
Buckets: prometheus.ExponentialBuckets(.25, 2, 6),
NativeHistogramBucketFactor: 1.1,
NativeHistogramMaxBucketNumber: 100,
NativeHistogramMinResetDuration: 1 * time.Hour,
})
metricRetentionErrors = promauto.NewCounter(prometheus.CounterOpts{
Namespace: "tempodb",
Expand Down

0 comments on commit ce2a279

Please sign in to comment.