Like Prometheus, but for logs.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
loki/pkg/querier/queryrange/volume.go

215 lines
5.9 KiB

package queryrange
import (
"context"
"sort"
"time"
"github.com/grafana/dskit/concurrency"
"github.com/prometheus/common/model"
"github.com/prometheus/prometheus/model/labels"
"github.com/grafana/loki/v3/pkg/loghttp"
"github.com/grafana/loki/v3/pkg/logproto"
"github.com/grafana/loki/v3/pkg/logql/syntax"
"github.com/grafana/loki/v3/pkg/logqlmodel/stats"
"github.com/grafana/loki/v3/pkg/querier/queryrange/queryrangebase"
"github.com/grafana/loki/v3/pkg/querier/queryrange/queryrangebase/definitions"
"github.com/grafana/loki/v3/pkg/storage/stores/index/seriesvolume"
"github.com/grafana/loki/v3/pkg/util"
)
// NewVolumeMiddleware creates a middleware that splits a VolumeRequest into
// one sub-request per step interval, fans the sub-requests out concurrently
// to the next handler, and merges the per-bucket results into a single
// Prometheus-style response. Non-volume requests pass through unchanged.
func NewVolumeMiddleware() queryrangebase.Middleware {
	return queryrangebase.MiddlewareFunc(func(next queryrangebase.Handler) queryrangebase.Handler {
		return queryrangebase.HandlerFunc(func(ctx context.Context, req queryrangebase.Request) (queryrangebase.Response, error) {
			volReq, ok := req.(*logproto.VolumeRequest)
			if !ok {
				// Not a volume request; let the next handler deal with it.
				return next.Do(ctx, req)
			}

			// One sub-request per step bucket, keyed by the bucket's end time.
			reqs := map[time.Time]queryrangebase.Request{}
			startTS := volReq.From.Time()
			endTS := volReq.Through.Time()
			// Step is in milliseconds; multiply by 1e6 to get nanoseconds
			// for time.Duration.
			interval := time.Duration(volReq.Step * 1e6)

			util.ForInterval(interval, startTS, endTS, true, func(start, end time.Time) {
				// Always align to the end of the requested range
				// For range queries, this aligns to the end of the period we're returning a bytes aggregation for
				// For instant queries, which are for "this instant", this aligns to the end of the requested range
				reqs[end] = &logproto.VolumeRequest{
					From:         model.TimeFromUnix(start.Unix()),
					Through:      model.TimeFromUnix(end.Unix()),
					Matchers:     volReq.Matchers,
					Limit:        volReq.Limit,
					Step:         volReq.Step,
					TargetLabels: volReq.TargetLabels,
					AggregateBy:  volReq.AggregateBy,
				}
			})

			// Each job returns the bucket end time alongside the response so
			// results can be matched back to their bucket after the fan-out.
			type f func(context.Context) (time.Time, definitions.Response, error)
			var jobs []f

			for bucket, req := range reqs {
				// Capture loop variables for the closure (pre-Go 1.22 semantics).
				b, r := bucket, req
				jobs = append(jobs, f(func(ctx context.Context) (time.Time, definitions.Response, error) {
					resp, err := next.Do(ctx, r)
					if err != nil {
						return b, nil, err
					}
					return b, resp, nil
				}))
			}

			// Update middleware stats
			queryStatsCtx := stats.FromContext(ctx)
			queryStatsCtx.AddSplitQueries(int64(len(jobs)))

			// Buffered to hold one result per job, so no job ever blocks on
			// send even if ForEachJob returns early on error.
			collector := make(chan *bucketedVolumeResponse, len(jobs))
			err := concurrency.ForEachJob(
				ctx,
				len(jobs),
				len(jobs), // run all jobs concurrently
				func(ctx context.Context, i int) error {
					bucket, resp, err := jobs[i](ctx)
					if resp == nil {
						// Send a nil sentinel so the channel still carries
						// exactly one value per job; the merger skips nils.
						collector <- nil
						return err
					}
					collector <- &bucketedVolumeResponse{
						bucket, resp.(*VolumeResponse),
					}
					return err
				})
			// All jobs have finished (ForEachJob waits), so it is safe to
			// close before draining the channel in ToPrometheusResponse.
			close(collector)

			if err != nil {
				return nil, err
			}

			promResp := ToPrometheusResponse(collector, seriesvolume.AggregateBySeries(volReq.AggregateBy))
			return promResp, nil
		})
	})
}
// bucketedVolumeResponse pairs a volume response with the end time of the
// step bucket it was computed for.
type bucketedVolumeResponse struct {
	bucket   time.Time
	response *VolumeResponse
}
// ToPrometheusResponse drains respsCh and merges the per-bucket volume
// responses into a single Prometheus-style response. Nil entries (pushed by
// failed jobs) are skipped. Samples are grouped by series name, and response
// headers are copied from the first non-nil response seen. When
// aggregateBySeries is true, series names are parsed as label sets downstream
// in toPrometheusData.
func ToPrometheusResponse(respsCh chan *bucketedVolumeResponse, aggregateBySeries bool) *LokiPromResponse {
	var headers []*definitions.PrometheusResponseHeader
	samplesByName := make(map[string][]logproto.LegacySample)

	for bucketedVolumeResponse := range respsCh {
		if bucketedVolumeResponse == nil {
			continue
		}
		bucket, resp := bucketedVolumeResponse.bucket, bucketedVolumeResponse.response

		if headers == nil {
			// Copy headers from the first response. Assign with `=` (not `:=`):
			// the original `:=` shadowed the outer headers variable, so the
			// copied headers were discarded and the merged response never
			// carried any headers.
			headers = make([]*definitions.PrometheusResponseHeader, len(resp.Headers))
			for i, header := range resp.Headers {
				h := header
				headers[i] = &h
			}
		}

		// Accumulate one sample per bucket for each series name.
		for _, volume := range resp.Response.Volumes {
			if _, ok := samplesByName[volume.Name]; !ok {
				samplesByName[volume.Name] = make([]logproto.LegacySample, 0, 1)
			}
			samplesByName[volume.Name] = append(samplesByName[volume.Name], toPrometheusSample(volume, bucket))
		}
	}

	promResponse := queryrangebase.PrometheusResponse{
		Status:  loghttp.QueryStatusSuccess,
		Data:    toPrometheusData(samplesByName, aggregateBySeries),
		Headers: headers,
	}

	return &LokiPromResponse{
		Response:   &promResponse,
		Statistics: stats.Result{},
	}
}
// toPrometheusSample converts a volume entry into a legacy Prometheus sample
// stamped with t at millisecond resolution.
func toPrometheusSample(volume logproto.Volume, t time.Time) logproto.LegacySample {
	stamp := model.TimeFromUnixNano(t.UnixNano())
	sample := logproto.LegacySample{
		Value:       float64(volume.Volume),
		TimestampMs: stamp.UnixNano() / 1e6,
	}
	return sample
}
// sortableSampleStream holds one series' samples together with its name and
// labels, so result streams can be sorted before being converted into
// Prometheus sample streams.
type sortableSampleStream struct {
	name    string
	labels  labels.Labels
	samples []logproto.LegacySample
}
// toPrometheusData converts the per-series sample map into Prometheus
// response data. Any series with more than one sample promotes the result
// type from vector to matrix. When aggregateBySeries is true, each series
// name is parsed as a label set (unparseable names are skipped); otherwise
// the name itself becomes a single label with an empty value. Streams are
// ordered by first-sample value descending, breaking ties by name.
func toPrometheusData(series map[string][]logproto.LegacySample, aggregateBySeries bool) queryrangebase.PrometheusData {
	resultType := loghttp.ResultTypeVector
	streams := make([]sortableSampleStream, 0, len(series))

	for name, samples := range series {
		// Multiple samples per series means we're covering several step
		// buckets, i.e. a range (matrix) rather than an instant (vector).
		if len(samples) > 1 {
			resultType = loghttp.ResultTypeMatrix
		}

		var lbls labels.Labels
		if aggregateBySeries {
			parsed, err := syntax.ParseLabels(name)
			if err != nil {
				// Name isn't a valid label set; drop this series.
				continue
			}
			lbls = parsed
		} else {
			lbls = labels.Labels{{
				Name:  name,
				Value: "",
			}}
		}

		// Samples within a stream must be in timestamp order.
		sort.Slice(samples, func(a, b int) bool {
			return samples[a].TimestampMs < samples[b].TimestampMs
		})

		streams = append(streams, sortableSampleStream{
			name:    name,
			labels:  lbls,
			samples: samples,
		})
	}

	sort.Slice(streams, func(a, b int) bool {
		// Sorting by value only helps instant queries so just grab the first value
		left, right := streams[a], streams[b]
		if left.samples[0].Value == right.samples[0].Value {
			return left.name < right.name
		}
		return left.samples[0].Value > right.samples[0].Value
	})

	result := make([]queryrangebase.SampleStream, 0, len(streams))
	for _, s := range streams {
		result = append(result, queryrangebase.SampleStream{
			Labels:  logproto.FromLabelsToLabelAdapters(s.labels),
			Samples: s.samples,
		})
	}

	return queryrangebase.PrometheusData{
		ResultType: resultType,
		Result:     result,
	}
}