pkg/traceql/engine_metrics_compare.go

package traceql

import (
	"fmt"
	"math"
	"sort"
	"time"

	"github.com/grafana/tempo/pkg/tempopb"
)

const (
	internalMetaTypeBaseline       = "baseline"
	internalMetaTypeSelection      = "selection"
	internalMetaTypeBaselineTotal  = "baseline_total"
	internalMetaTypeSelectionTotal = "selection_total"

	// internalLabelBaseline      = "__baseline"
	internalLabelError         = "__meta_error"
	internalErrorTooManyValues = "__too_many_values__"
)

var (
	internalLabelTypeBaseline       = Label{Name: internalLabelMetaType, Value: NewStaticString(internalMetaTypeBaseline)}
	internalLabelTypeBaselineTotal  = Label{Name: internalLabelMetaType, Value: NewStaticString(internalMetaTypeBaselineTotal)}
	internalLabelTypeSelection      = Label{Name: internalLabelMetaType, Value: NewStaticString(internalMetaTypeSelection)}
	internalLabelTypeSelectionTotal = Label{Name: internalLabelMetaType, Value: NewStaticString(internalMetaTypeSelectionTotal)}
	internalLabelErrorTooManyValues = Label{Name: internalLabelError, Value: NewStaticString(internalErrorTooManyValues)}
)

type MetricsCompare struct {
	f                   *SpansetFilter
	qstart, qend, qstep uint64
	len                 int
	start, end          int
	topN                int
	baselines           map[Attribute]map[StaticMapKey]staticWithCounts
	selections          map[Attribute]map[StaticMapKey]staticWithCounts
	baselineTotals      map[Attribute][]float64
	selectionTotals     map[Attribute][]float64
	baselineExemplars   []Exemplar
	selectionExemplars  []Exemplar
	seriesAgg           SeriesAggregator
}

type staticWithCounts struct {
	val    Static
	counts []float64
}

func newMetricsCompare(f *SpansetFilter, topN, start, end int) *MetricsCompare {
	return &MetricsCompare{
		f:     f,
		topN:  topN,
		start: start,
		end:   end,
	}
}

func (m *MetricsCompare) extractConditions(request *FetchSpansRequest) {
	request.SecondPassSelectAll = true
	if !request.HasAttribute(IntrinsicSpanStartTimeAttribute) {
		request.SecondPassConditions = append(request.SecondPassConditions, Condition{Attribute: IntrinsicSpanStartTimeAttribute})
	}
	// We don't need to extract conditions from the comparison expression
	// because we're already selecting all.
}

func (m *MetricsCompare) init(q *tempopb.QueryRangeRequest, mode AggregateMode) {
	switch mode {
	case AggregateModeRaw:
		m.qstart = q.Start
		m.qend = q.End
		m.qstep = q.Step
		m.len = IntervalCount(q.Start, q.End, q.Step)
		m.baselines = make(map[Attribute]map[StaticMapKey]staticWithCounts)
		m.selections = make(map[Attribute]map[StaticMapKey]staticWithCounts)
		m.baselineTotals = make(map[Attribute][]float64)
		m.selectionTotals = make(map[Attribute][]float64)

	case AggregateModeSum:
		m.seriesAgg = NewSimpleCombiner(q, sumAggregation)
		return

	case AggregateModeFinal:
		m.seriesAgg = NewBaselineAggregator(q, m.topN)
		return
	}
}

func (m *MetricsCompare) isSelection(span Span) Static {
	st := span.StartTimeUnixNanos()

	// Determine if this span is inside the selection
	isSelection := StaticFalse
	if m.start > 0 && m.end > 0 {
		// Timestamp filtering
		if st >= uint64(m.start) && st < uint64(m.end) {
			isSelection, _ = m.f.Expression.execute(span)
		}
	} else {
		// No timestamp filtering
		isSelection, _ = m.f.Expression.execute(span)
	}
	return isSelection
}

func (m *MetricsCompare) observe(span Span) {
	// For performance, MetricsCompare doesn't use the Range/StepAggregator abstractions.
	// This lets us:
	// * Include the same attribute value in multiple series. This doesn't fit within
	//   the existing by() grouping or even the potential byeach() (which was in this branch and then deleted)
	// * Avoid reading the span start time twice, once for the selection window filter, and
	//   then again instead of StepAggregator.
	// TODO - It would be nice to use those abstractions, area for future improvement
	st := span.StartTimeUnixNanos()

	// Determine if this span is inside the selection
	isSelection := m.isSelection(span)

	// Choose destination buffers
	dest := m.baselines
	destTotals := m.baselineTotals
	if isSelection.Equals(&StaticTrue) {
		dest = m.selections
		destTotals = m.selectionTotals
	}

	i := IntervalOf(st, m.qstart, m.qend, m.qstep)
	// Increment values for all attributes of this span
	span.AllAttributesFunc(func(a Attribute, v Static) {
		// We don't group by attributes of these types because the
		// cardinality isn't useful.
		switch v.Type {
		case TypeDuration:
			return
		}

		// These attributes get pulled back by select all but we never
		// group by them because the cardinality isn't useful.
		switch a {
		case IntrinsicSpanStartTimeAttribute,
			IntrinsicTraceIDAttribute:
			return
		}

		values, ok := dest[a]
		if !ok {
			values = make(map[StaticMapKey]staticWithCounts, m.len)
			dest[a] = values
		}

		vk := v.MapKey()
		sc, ok := values[vk]
		if !ok {
			sc = staticWithCounts{val: v, counts: make([]float64, m.len)}
			values[vk] = sc
		}
		sc.counts[i]++

		// TODO - It's probably faster to aggregate these at the end
		// instead of incrementing in the hotpath twice
		totals, ok := destTotals[a]
		if !ok {
			totals = make([]float64, m.len)
			destTotals[a] = totals
		}
		totals[i]++
	})
}

func (m *MetricsCompare) observeExemplar(span Span) {
	isSelection := m.isSelection(span)

	// Exemplars
	if len(m.baselineExemplars) >= maxExemplars || len(m.selectionExemplars) >= maxExemplars {
		return
	}

	all := span.AllAttributes()
	lbls := make(Labels, 0, len(all))
	for a, v := range all {
		lbls = append(lbls, Label{Name: a.String(), Value: v})
	}
	exemplar := Exemplar{
		Labels:      lbls,
		Value:       math.NaN(), // TODO: What value?
		TimestampMs: span.StartTimeUnixNanos() / uint64(time.Millisecond),
	}
	if isSelection.Equals(&StaticTrue) {
		m.selectionExemplars = append(m.selectionExemplars, exemplar)
	} else {
		m.baselineExemplars = append(m.baselineExemplars, exemplar)
	}
}

func (m *MetricsCompare) observeSeries(ss []*tempopb.TimeSeries) {
	m.seriesAgg.Combine(ss)
}

func (m *MetricsCompare) result() SeriesSet {
	// In the other modes return these results
	if m.seriesAgg != nil {
		return m.seriesAgg.Results()
	}

	var (
		top   = topN[Static]{}
		ss    = make(SeriesSet)
		erred = make(map[Attribute]struct{})
	)

	add := func(ls Labels, counts []float64) {
		ss[ls.String()] = TimeSeries{
			Labels: ls,
			Values: counts,
		}
	}

	addValues := func(prefix Label, data map[Attribute]map[StaticMapKey]staticWithCounts) {
		for a, values := range data {
			// Compute topN values for this attribute
			top.reset()
			for _, sc := range values {
				top.add(sc.val, sc.counts)
			}

			top.get(m.topN, func(v Static) {
				add(Labels{
					prefix,
					{Name: a.String(), Value: v},
				}, values[v.MapKey()].counts)
			})

			if len(values) > m.topN {
				erred[a] = struct{}{}
			}
		}
	}

	addValues(internalLabelTypeBaseline, m.baselines)
	addValues(internalLabelTypeSelection, m.selections)

	// Add errors for attributes that hit the limit in either area
	for a := range erred {
		add(Labels{
			internalLabelErrorTooManyValues,
			{Name: a.String()},
		}, nil)
	}

	addTotals := func(prefix Label, data map[Attribute][]float64) {
		for a, counts := range data {
			add(Labels{
				prefix,
				{Name: a.String()},
			}, counts)
		}
	}

	addTotals(internalLabelTypeBaselineTotal, m.baselineTotals)
	addTotals(internalLabelTypeSelectionTotal, m.selectionTotals)

	// Add exemplars
	addExemplar := func(prefix Label, e Exemplar) {
		for _, l := range e.Labels {
			seriesLabels := Labels{
				prefix,
				{Name: l.Name},
			}
			if ts, ok := ss[seriesLabels.String()]; ok {
				ts.Exemplars = append(ts.Exemplars, e)
				ss[seriesLabels.String()] = ts
			}
		}
	}

	for _, e := range m.baselineExemplars {
		addExemplar(internalLabelTypeBaselineTotal, e)
	}
	for _, e := range m.selectionExemplars {
		addExemplar(internalLabelTypeSelectionTotal, e)
	}

	return ss
}

func (m *MetricsCompare) validate() error {
	err := m.f.validate()
	if err != nil {
		return err
	}

	if m.topN <= 0 {
		return fmt.Errorf("compare() top number of values must be integer greater than 0")
	}

	if m.start == 0 && m.end == 0 {
		return nil
	}

	if m.start <= 0 || m.end <= 0 {
		return fmt.Errorf("compare() timestamps must be positive integer unix nanoseconds")
	}
	if m.end <= m.start {
		return fmt.Errorf("compare() end timestamp must be greater than start timestamp")
	}
	return nil
}

func (m *MetricsCompare) String() string {
	return "compare(" + m.f.String() + "}"
}

var _ metricsFirstStageElement = (*MetricsCompare)(nil)

// BaselineAggregator is a special series combiner for the compare() function.
// It resplits job-level results into baseline and selection buffers, and if
// an attribute reached max cardinality at the job-level, it will be marked
// as such at the query-level.
type BaselineAggregator struct {
	topN             int
	len              int
	start, end, step uint64
	baseline         map[string]map[StaticMapKey]staticWithTimeSeries
	selection        map[string]map[StaticMapKey]staticWithTimeSeries
	baselineTotals   map[string]map[StaticMapKey]staticWithTimeSeries
	selectionTotals  map[string]map[StaticMapKey]staticWithTimeSeries
	maxed            map[string]struct{}
	exemplarBuckets  *bucketSet
}

type staticWithTimeSeries struct {
	val    Static
	series TimeSeries
}

func NewBaselineAggregator(req *tempopb.QueryRangeRequest, topN int) *BaselineAggregator {
	l := IntervalCount(req.Start, req.End, req.Step)
	return &BaselineAggregator{
		baseline:        make(map[string]map[StaticMapKey]staticWithTimeSeries),
		selection:       make(map[string]map[StaticMapKey]staticWithTimeSeries),
		baselineTotals:  make(map[string]map[StaticMapKey]staticWithTimeSeries),
		selectionTotals: make(map[string]map[StaticMapKey]staticWithTimeSeries),
		maxed:           make(map[string]struct{}),
		len:             l,
		start:           req.Start,
		end:             req.End,
		step:            req.Step,
		topN:            topN,
		exemplarBuckets: newBucketSet(l),
	}
}

func (b *BaselineAggregator) Combine(ss []*tempopb.TimeSeries) {
	for _, s := range ss {
		var metaType string
		var err string
		var a string
		var v Static

		// Scan all labels
		for _, l := range s.Labels {
			switch l.Key {
			case internalLabelMetaType:
				metaType = l.Value.GetStringValue()
			case internalLabelError:
				err = l.Value.GetStringValue()
			default:
				a = l.Key
				v = StaticFromAnyValue(l.Value)
			}
		}

		// Check for errors on this attribute
		if err != "" {
			if err == internalErrorTooManyValues {
				// A sub-job reached max values for this attribute.
				// Record the error
				b.maxed[a] = struct{}{}
			}
			// Skip remaining processing regardless of error type
			continue
		}

		// Merge this time series into the destination buffer
		// based on meta type
		var dest map[string]map[StaticMapKey]staticWithTimeSeries
		switch metaType {
		case internalMetaTypeBaseline:
			dest = b.baseline
		case internalMetaTypeSelection:
			dest = b.selection
		case internalMetaTypeBaselineTotal:
			dest = b.baselineTotals
		case internalMetaTypeSelectionTotal:
			dest = b.selectionTotals
		default:
			// Unknown type, ignore
			continue
		}

		attr, ok := dest[a]
		if !ok {
			attr = make(map[StaticMapKey]staticWithTimeSeries)
			dest[a] = attr
		}

		vk := v.MapKey()
		ts, ok := attr[vk]
		if !ok {
			ts = staticWithTimeSeries{val: v, series: TimeSeries{Values: make([]float64, b.len)}}
			attr[vk] = ts
		}

		if len(attr) > b.topN {
			// This attribute just reached max cardinality overall (not within a sub-job)
			// Record the error
			b.maxed[a] = struct{}{}
		}

		for _, sample := range s.Samples {
			j := IntervalOfMs(sample.TimestampMs, b.start, b.end, b.step)
			if j >= 0 && j < len(ts.series.Values) {
				ts.series.Values[j] += sample.Value
			}
		}

		for _, exemplar := range s.Exemplars {
			if b.exemplarBuckets.testTotal() {
				break
			}
			interval := IntervalOfMs(exemplar.TimestampMs, b.start, b.end, b.step)
			if b.exemplarBuckets.addAndTest(interval) {
				continue
			}

			lbls := make(Labels, 0, len(exemplar.Labels))
			for _, l := range exemplar.Labels {
				lbls = append(lbls, Label{Name: l.Key, Value: StaticFromAnyValue(l.Value)})
			}
			ts.series.Exemplars = append(ts.series.Exemplars, Exemplar{
				Labels:      lbls,
				Value:       exemplar.Value,
				TimestampMs: uint64(exemplar.TimestampMs),
			})
		}
		attr[vk] = ts
	}
}

func (b *BaselineAggregator) Results() SeriesSet {
	output := make(SeriesSet)
	topN := &topN[Static]{}

	addSeries := func(prefix Label, name string, value Static, samples []float64, exemplars []Exemplar) {
		ls := Labels{
			prefix,
			{Name: name, Value: value},
		}
		output[ls.String()] = TimeSeries{
			Labels:    ls,
			Values:    samples,
			Exemplars: exemplars,
		}
	}

	do := func(buffer map[string]map[StaticMapKey]staticWithTimeSeries, prefix Label) {
		for a, m := range buffer {

			topN.reset()
			for _, ts := range m {
				topN.add(ts.val, ts.series.Values)
			}

			topN.get(b.topN, func(key Static) {
				ts := m[key.MapKey()]
				addSeries(prefix, a, key, ts.series.Values, ts.series.Exemplars)
			})
		}
	}

	do(b.baseline, internalLabelTypeBaseline)
	do(b.selection, internalLabelTypeSelection)
	do(b.baselineTotals, internalLabelTypeBaselineTotal)
	do(b.selectionTotals, internalLabelTypeSelectionTotal)

	// Add series for every attribute that exceeded max value.
	for a := range b.maxed {
		addSeries(internalLabelErrorTooManyValues, a, NewStaticNil(), nil, nil)
	}

	return output
}

var _ SeriesAggregator = (*BaselineAggregator)(nil)

// topN is a helper struct that gets the topN keys based on total sum
type topN[T any] struct {
	entries []struct {
		key   T
		total float64
	}
}

func (t *topN[T]) add(key T, values []float64) {
	sum := 0.0
	for _, v := range values {
		sum += v
	}
	t.entries = append(t.entries, struct {
		key   T
		total float64
	}{key, sum})
}

// get the top N values. Given as a callback to avoid allocating.
// bool result indicates if there were more than N values
func (t *topN[T]) get(n int, cb func(key T)) {
	if len(t.entries) <= n {
		// <= N, no need to sort
		for _, e := range t.entries {
			cb(e.key)
		}
		return
	}

	sort.Slice(t.entries, func(i, j int) bool {
		return t.entries[i].total > t.entries[j].total // Sort descending
	})

	for i := 0; i < n; i++ {
		cb(t.entries[i].key)
	}
}

func (t *topN[T]) reset() {
	t.entries = t.entries[:0]
}