knylander-grafana
diff --git a/‎CHANGELOG.md
Lines changed: 1 addition & 0 deletions b/‎CHANGELOG.md
Lines changed: 1 addition & 0 deletions
diff --git a/‎modules/frontend/metrics_query_range_sharder.go
Lines changed: 3 additions & 3 deletions b/‎modules/frontend/metrics_query_range_sharder.go
Lines changed: 3 additions & 3 deletions
diff --git a/‎modules/frontend/metrics_query_range_sharder_test.go
Lines changed: 194 additions & 0 deletions b/‎modules/frontend/metrics_query_range_sharder_test.go
Lines changed: 194 additions & 0 deletions
diff --git a/‎modules/frontend/search_sharder.go
Lines changed: 4 additions & 0 deletions b/‎modules/frontend/search_sharder.go
Lines changed: 4 additions & 0 deletions
@@ -109,6 +109,7 @@ configurable via the throughput_bytes_slo field, and it will populate op="traces
 * [BUGFIX] Fix `TempoBlockListRisingQuickly` alert grouping. [#4876](https://github.com/grafana/tempo/pull/4876) (@mapno)
 * [BUGFIX] Reset `SkipMetricsGeneration` before reuse. [#5117](https://github.com/grafana/tempo/pull/5117) (@flxbk)
 * [BUGFIX] Fix metrics generator host info processor overrides config. [#5118](https://github.com/grafana/tempo/pull/5118) (@rlankfo)
+* [BUGFIX] Fix the number of exemplars requested per shard in TraceQL metrics queries. [#5115](https://github.com/grafana/tempo/pull/5115) (@ruslan-mikhailov)
 
 # v2.7.2
 
 
@@ -166,10 +166,10 @@ func (s queryRangeSharder) RoundTrip(pipelineRequest pipeline.Request) (pipeline
 }
 
 func (s *queryRangeSharder) exemplarsPerShard(total uint32, exemplars uint32) uint32 {
-	if exemplars == 0 {
+	if exemplars == 0 || total == 0 {
 		return 0
 	}
-	return uint32(math.Ceil(float64(exemplars)*1.2)) / total
+	return max(uint32(math.Ceil(float64(exemplars)*1.2))/total, 1) // require at least 1 exemplar per shard
 }
 
 func (s *queryRangeSharder) backendRequests(ctx context.Context, tenantID string, parent pipeline.Request, searchReq tempopb.QueryRangeRequest, cutoff time.Time, targetBytesPerRequest int, reqCh chan pipeline.Request) (totalJobs, totalBlocks uint32, totalBlockBytes uint64) {
@@ -244,7 +244,7 @@ func (s *queryRangeSharder) buildBackendRequests(ctx context.Context, tenantID s
 		if exemplars > 0 {
 			// Scale the number of exemplars per block to match the size
 			// of each sub request on this block. For very small blocks or other edge cases, return at least 1.
-			exemplars = max(uint32(float64(exemplars)*float64(m.TotalRecords)/float64(pages)), 1)
+			exemplars = max(uint32(float64(exemplars)*float64(pages)/float64(m.TotalRecords)), 1)
 		}
 
 		dedColsJSON, err := colsToJSON.JSONForDedicatedColumns(m.DedicatedColumns)
 
@@ -0,0 +1,194 @@
+package frontend
+
+import (
+	"net/http/httptest"
+	"strconv"
+	"strings"
+	"testing"
+	"time"
+
+	"github.com/go-kit/log"
+	"github.com/google/uuid"
+	"github.com/stretchr/testify/assert"
+	"github.com/stretchr/testify/require"
+
+	"github.com/grafana/tempo/modules/frontend/pipeline"
+	"github.com/grafana/tempo/pkg/tempopb"
+	"github.com/grafana/tempo/tempodb/backend"
+)
+
+// FuzzExemplarsPerShard checks two invariants of exemplarsPerShard for
+// arbitrary inputs: the result is 0 when either argument is 0, and it is at
+// least 1 otherwise.
+func FuzzExemplarsPerShard(f *testing.F) {
+	// Seed corpus. Without -fuzz only the seed corpus is executed, so every
+	// edge case that must be covered by a plain `go test` needs its own seed.
+	f.Add(uint32(1), uint32(10))  // total = 1, exemplars = 10
+	f.Add(uint32(100), uint32(1)) // total = 100, exemplars = 1
+	f.Add(uint32(10), uint32(0))  // total = 10, exemplars = 0
+	f.Add(uint32(0), uint32(10))  // total = 0, exemplars = 10: must not divide by zero
+	f.Add(uint32(0), uint32(0))   // total = 0, exemplars = 0
+
+	s := &queryRangeSharder{}
+
+	f.Fuzz(func(t *testing.T, total uint32, exemplars uint32) {
+		result := s.exemplarsPerShard(total, exemplars)
+
+		if exemplars == 0 || total == 0 {
+			assert.Equal(t, uint32(0), result, "if exemplars is 0 or total is 0, result should be 0")
+			return
+		}
+		assert.Greater(t, result, uint32(0), "result should be greater than 0")
+	})
+}
+
+// TestBuildBackendRequestsExemplarsOneBlock feeds a single block to
+// buildBackendRequests and checks, per table entry, how many backend requests
+// are emitted, that every request carries an `exemplars` value of at least 1,
+// and that those values sum to the expected total.
+func TestBuildBackendRequestsExemplarsOneBlock(t *testing.T) {
+	// Create the test sharder with exemplars enabled
+	sharder := &queryRangeSharder{
+		logger: log.NewNopLogger(),
+		cfg: QueryRangeSharderConfig{
+			MaxExemplars: 100,
+		},
+	}
+	tenantID := "test-tenant"
+	targetBytesPerRequest := 1000
+
+	// Subtest names must be unique: t.Run silently renames duplicates, which
+	// makes failures and `-run` filters ambiguous.
+	testCases := []struct {
+		name              string
+		totalRecords      uint32
+		blockSize         uint64
+		exemplars         uint32
+		expectedBatches   int
+		expectedExemplars int
+	}{
+		{
+			name:              "basic",
+			totalRecords:      100,
+			blockSize:         uint64(targetBytesPerRequest),
+			exemplars:         5,
+			expectedExemplars: 6, // 5 * 1.2
+			expectedBatches:   1,
+		},
+		{
+			name:              "two batches",
+			totalRecords:      100,
+			blockSize:         uint64(2 * targetBytesPerRequest),
+			exemplars:         5,
+			expectedExemplars: 6, // 5 * 1.2
+			expectedBatches:   2,
+		},
+		{
+			name:              "high record count",
+			totalRecords:      10000,
+			blockSize:         50000,
+			exemplars:         10,
+			expectedExemplars: 50, // 1 per batch
+			expectedBatches:   50,
+		},
+		{
+			name:              "totalRecords == blockSize == targetBytesPerRequest",
+			totalRecords:      uint32(targetBytesPerRequest),
+			blockSize:         uint64(targetBytesPerRequest),
+			exemplars:         10,
+			expectedExemplars: 12, // 10 * 1.2
+			expectedBatches:   1,
+		},
+		{
+			name:              "large block size",
+			totalRecords:      500,
+			blockSize:         50000,
+			exemplars:         20,
+			expectedExemplars: 50, // 1 per batch
+			expectedBatches:   50,
+		},
+		{
+			name:              "small block",
+			totalRecords:      10,
+			blockSize:         100,
+			exemplars:         1,
+			expectedExemplars: 2, // 1 * 1.2 -> rounded up to 2
+			expectedBatches:   1,
+		},
+		{
+			name:              "single record, block 2x target size",
+			totalRecords:      1,
+			blockSize:         uint64(2 * targetBytesPerRequest),
+			exemplars:         1,
+			expectedExemplars: 2, // 1 * 1.2 -> rounded up to 2
+			expectedBatches:   1,
+		},
+		{
+			name:              "single record, block 1.5x target size",
+			totalRecords:      1,
+			blockSize:         uint64(1.5 * float64(targetBytesPerRequest)),
+			exemplars:         1,
+			expectedExemplars: 2, // 1 * 1.2 -> rounded up to 2
+			expectedBatches:   1,
+		},
+		{
+			name:              "block with 2 records",
+			totalRecords:      2,
+			blockSize:         uint64(2 * targetBytesPerRequest),
+			exemplars:         1,
+			expectedExemplars: 2, // 1 * 1.2 -> rounded up to 2
+			expectedBatches:   2,
+		},
+	}
+
+	for _, tc := range testCases {
+		t.Run(tc.name, func(t *testing.T) {
+			// One clock reading keeps the query window and the block's time
+			// range identical.
+			now := time.Now()
+			hourAgo := now.Add(-1 * time.Hour)
+
+			// Create a test request with exemplars enabled
+			httpReq := httptest.NewRequest("GET", "/test", nil)
+			parentReq := pipeline.NewHTTPRequest(httpReq)
+			searchReq := tempopb.QueryRangeRequest{
+				Query:     "test_query",
+				Start:     uint64(hourAgo.UnixNano()),
+				End:       uint64(now.UnixNano()),
+				Step:      uint64(60 * time.Second.Nanoseconds()),
+				Exemplars: tc.exemplars,
+			}
+
+			// Create mock block metadata
+			blockMeta := &backend.BlockMeta{
+				BlockID:      backend.MustParse(uuid.NewString()),
+				TotalRecords: tc.totalRecords,
+				Size_:        tc.blockSize,
+				StartTime:    hourAgo,
+				EndTime:      now,
+			}
+
+			reqCh := make(chan pipeline.Request, 10)
+
+			// The producer runs concurrently because some cases emit more
+			// requests than the channel buffer holds.
+			go func() {
+				sharder.buildBackendRequests(t.Context(), tenantID, parentReq, searchReq, []*backend.BlockMeta{blockMeta}, targetBytesPerRequest, reqCh)
+			}()
+
+			// Collect requests.
+			// NOTE(review): this loop ends only when reqCh is closed; presumably
+			// buildBackendRequests closes it on return - confirm.
+			var generatedRequests []pipeline.Request
+			for r := range reqCh {
+				generatedRequests = append(generatedRequests, r)
+			}
+			assert.Len(t, generatedRequests, tc.expectedBatches, "Number of generated requests should match expected value")
+
+			var totalExemplars int
+			for _, r := range generatedRequests {
+				uri := r.HTTPRequest().URL.String()
+				exemplarsValue := extractExemplarsValue(t, uri)
+				assert.Greater(t, exemplarsValue, 0, "Exemplars per batch should be at least 1")
+				totalExemplars += exemplarsValue
+			}
+			assert.Equal(t, tc.expectedExemplars, totalExemplars, "Total exemplars should match expected value")
+		})
+	}
+}
+
+// extractExemplarsValue returns the integer value of the "exemplars" query
+// parameter found in uri. It fails the test immediately if the parameter is
+// missing, empty, or not an integer.
+func extractExemplarsValue(t *testing.T, uri string) int {
+	t.Helper()
+
+	// Look only at the query string: splitting the whole URI on "&" would leave
+	// the path glued to the first parameter ("/path?exemplars=1") and miss it.
+	_, query, _ := strings.Cut(uri, "?")
+	query, _, _ = strings.Cut(query, "#") // drop a trailing fragment, if any
+
+	exemplarsParam, found := "", false
+	for param := range strings.SplitSeq(query, "&") {
+		if value, ok := strings.CutPrefix(param, "exemplars="); ok {
+			exemplarsParam, found = value, true
+			break
+		}
+	}
+	require.True(t, found, "Request should contain exemplars parameter")
+	require.NotEmpty(t, exemplarsParam, "Exemplars parameter should not be empty")
+
+	exemplarsValue, err := strconv.Atoi(exemplarsParam)
+	require.NoError(t, err, "Should be able to parse exemplars value")
+
+	return exemplarsValue
+}
@@ -374,6 +374,10 @@ func pagesPerRequest(m *backend.BlockMeta, bytesPerRequest int) int {
 	if m.Size_ == 0 || m.TotalRecords == 0 {
 		return 0
 	}
+	// if the block is smaller than the bytesPerRequest, we can search the entire block
+	if m.Size_ < uint64(bytesPerRequest) {
+		return int(m.TotalRecords)
+	}
 
 	bytesPerPage := m.Size_ / uint64(m.TotalRecords)
 	if bytesPerPage == 0 {
Original file line number	Diff line number	Diff line change
`@@ -166,10 +166,10 @@ func (s queryRangeSharder) RoundTrip(pipelineRequest pipeline.Request) (pipeline`
`166`	`166`	`}`
`167`	`167`
`168`	`168`	`func (s *queryRangeSharder) exemplarsPerShard(total uint32, exemplars uint32) uint32 {`
`169`		`- if exemplars == 0 {`
	`169`	`+ if exemplars == 0 \|\| total == 0 {`
`170`	`170`	`return 0`
`171`	`171`	`}`
`172`		`- return uint32(math.Ceil(float64(exemplars)*1.2)) / total`
	`172`	`+ return max(uint32(math.Ceil(float64(exemplars)*1.2))/total, 1) // require at least 1 exemplar per shard`
`173`	`173`	`}`
`174`	`174`
`175`	`175`	`func (s *queryRangeSharder) backendRequests(ctx context.Context, tenantID string, parent pipeline.Request, searchReq tempopb.QueryRangeRequest, cutoff time.Time, targetBytesPerRequest int, reqCh chan pipeline.Request) (totalJobs, totalBlocks uint32, totalBlockBytes uint64) {`
`@@ -244,7 +244,7 @@ func (s *queryRangeSharder) buildBackendRequests(ctx context.Context, tenantID s`
`244`	`244`	`if exemplars > 0 {`
`245`	`245`	`// Scale the number of exemplars per block to match the size`
`246`	`246`	`// of each sub request on this block. For very small blocks or other edge cases, return at least 1.`
`247`		`- exemplars = max(uint32(float64(exemplars)*float64(m.TotalRecords)/float64(pages)), 1)`
	`247`	`+ exemplars = max(uint32(float64(exemplars)*float64(pages)/float64(m.TotalRecords)), 1)`
`248`	`248`	`}`
`249`	`249`
`250`	`250`	`dedColsJSON, err := colsToJSON.JSONForDedicatedColumns(m.DedicatedColumns)`