microbench-ci: only compare the last run

herkolategan · herkolategan · commit 21a2ce4a8409 · 2025-04-14T10:47:43.000+02:00
Previously, if a regression occurred, the comparison step would compare all
the runs instead of just the last one. The assumption was that if all runs show
a regression, the combined result would also show a regression, but since the
baseline case shifts with each run, there's a small chance this does not always
hold true. Hence, we revert here to only comparing the last run.

Epic: None
Release note: None
diff --git a/pkg/cmd/microbench-ci/compare.go b/pkg/cmd/microbench-ci/compare.go
@@ -86,18 +86,6 @@ func (c *CompareResult) status(metricName string) Status {
 	return status
 }
 
-// top returns the top status of all metrics in the comparison.
-func (c *CompareResult) top() Status {
-	topStatus := NoChange
-	for metric := range c.MetricMap {
-		status := c.status(metric)
-		if status > topStatus {
-			topStatus = status
-		}
-	}
-	return topStatus
-}
-
 // compare compares the metrics of a benchmark between two revisions. Only the
 // specified last number of lines of the benchmark logs are considered. If lines
 // is 0, it considers the entire logs.
@@ -153,12 +141,6 @@ func (b Benchmarks) compareBenchmarks() (CompareResults, error) {
 		if err != nil {
 			return nil, err
 		}
-		if compareResult.top() != NoChange {
-			compareResult, err = benchmark.compare(0)
-			if err != nil {
-				return nil, err
-			}
-		}
 		compareResults = append(compareResults, compareResult)
 	}
 	return compareResults, nil
diff --git a/pkg/cmd/microbench-ci/testdata/regression.txt b/pkg/cmd/microbench-ci/testdata/regression.txt
@@ -94,8 +94,8 @@ run group=1
 
 | Metric                      | Old Commit     | New Commit     | Delta      | Note         |
 |-----------------------------|----------------|----------------|------------|--------------|
-| 🔴 **sec/op** | 9.862m ±0% | 9.952m ±0% | +0.91% | p=0.000 n=30    |
-| ⚪ **allocs/op** | 10.38k ±0% | 10.38k ±0% | ~ | p=1.000 n=30    |
+| 🔴 **sec/op** | 9.862m ±1% | 9.952m ±0% | +0.91% | p=0.001 n=10    |
+| ⚪ **allocs/op** | 10.38k ±1% | 10.38k ±1% | ~ | p=1.000 n=10    |
 
 <details><summary>Reproduce</summary>
 
@@ -182,42 +182,22 @@ json
             "Metric": "B/op",
             "Summary": {
               "Center": 2367667,
-              "Lo": 2365463,
-              "Hi": 2368213,
-              "Confidence": 0.95723,
+              "Lo": 2358650,
+              "Hi": 2370670,
+              "Confidence": 0.97852,
               "Warnings": null
             },
             "Sample": {
               "Values": [
                 2352326,
-                2352326,
-                2352326,
-                2358650,
                 2358650,
-                2358650,
-                2364281,
                 2364281,
-                2364281,
-                2365463,
                 2365463,
-                2365463,
-                2367582,
                 2367582,
-                2367582,
-                2367752,
                 2367752,
-                2367752,
-                2368213,
                 2368213,
-                2368213,
-                2369187,
                 2369187,
-                2369187,
-                2370670,
                 2370670,
-                2370670,
-                2375306,
-                2375306,
                 2375306
               ],
               "Thresholds": {
@@ -230,42 +210,22 @@ json
             "Metric": "allocs/op",
             "Summary": {
               "Center": 10378.50000,
-              "Lo": 10377,
-              "Hi": 10386,
-              "Confidence": 0.95723,
+              "Lo": 10287,
+              "Hi": 10398,
+              "Confidence": 0.97852,
               "Warnings": null
             },
             "Sample": {
               "Values": [
                 10246,
-                10246,
-                10246,
-                10287,
                 10287,
-                10287,
-                10361,
                 10361,
-                10361,
-                10377,
                 10377,
-                10377,
-                10378,
                 10378,
-                10378,
-                10379,
                 10379,
-                10379,
-                10386,
                 10386,
-                10386,
-                10392,
                 10392,
-                10392,
-                10398,
                 10398,
-                10398,
-                10411,
-                10411,
                 10411
               ],
               "Thresholds": {
@@ -278,42 +238,22 @@ json
             "Metric": "sec/op",
             "Summary": {
               "Center": 0.00995,
-              "Lo": 0.00995,
-              "Hi": 0.00997,
-              "Confidence": 0.95723,
+              "Lo": 0.00993,
+              "Hi": 0.00998,
+              "Confidence": 0.97852,
               "Warnings": null
             },
             "Sample": {
               "Values": [
                 0.00991,
-                0.00991,
-                0.00991,
-                0.00993,
                 0.00993,
-                0.00993,
-                0.00995,
                 0.00995,
                 0.00995,
                 0.00995,
                 0.00995,
-                0.00995,
-                0.00995,
-                0.00995,
-                0.00995,
-                0.00995,
-                0.00995,
-                0.00995,
-                0.00997,
                 0.00997,
-                0.00997,
-                0.00998,
-                0.00998,
-                0.00998,
                 0.00998,
                 0.00998,
-                0.00998,
-                0.01000,
-                0.01000,
                 0.01000
               ],
               "Thresholds": {
@@ -328,42 +268,22 @@ json
             "Metric": "B/op",
             "Summary": {
               "Center": 2367667,
-              "Lo": 2365463,
-              "Hi": 2368213,
-              "Confidence": 0.95723,
+              "Lo": 2358650,
+              "Hi": 2370670,
+              "Confidence": 0.97852,
               "Warnings": null
             },
             "Sample": {
               "Values": [
                 2352326,
-                2352326,
-                2352326,
-                2358650,
                 2358650,
-                2358650,
-                2364281,
                 2364281,
-                2364281,
-                2365463,
                 2365463,
-                2365463,
-                2367582,
                 2367582,
-                2367582,
-                2367752,
                 2367752,
-                2367752,
-                2368213,
-                2368213,
                 2368213,
                 2369187,
-                2369187,
-                2369187,
                 2370670,
-                2370670,
-                2370670,
-                2375306,
-                2375306,
                 2375306
               ],
               "Thresholds": {
@@ -376,42 +296,22 @@ json
             "Metric": "allocs/op",
             "Summary": {
               "Center": 10378.50000,
-              "Lo": 10377,
-              "Hi": 10386,
-              "Confidence": 0.95723,
+              "Lo": 10287,
+              "Hi": 10398,
+              "Confidence": 0.97852,
               "Warnings": null
             },
             "Sample": {
               "Values": [
-                10246,
-                10246,
                 10246,
                 10287,
-                10287,
-                10287,
-                10361,
-                10361,
                 10361,
                 10377,
-                10377,
-                10377,
-                10378,
-                10378,
                 10378,
                 10379,
-                10379,
-                10379,
-                10386,
-                10386,
                 10386,
                 10392,
-                10392,
-                10392,
-                10398,
-                10398,
                 10398,
-                10411,
-                10411,
                 10411
               ],
               "Thresholds": {
@@ -426,31 +326,11 @@ json
               "Center": 0,
               "Lo": 0,
               "Hi": 0,
-              "Confidence": 0.95723,
+              "Confidence": 0.97852,
               "Warnings": null
             },
             "Sample": {
               "Values": [
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
-                0,
                 0,
                 0,
                 0,
@@ -473,41 +353,21 @@ json
             "Summary": {
               "Center": 0.00986,
               "Lo": 0.00985,
-              "Hi": 0.00988,
-              "Confidence": 0.95723,
+              "Hi": 0.00993,
+              "Confidence": 0.97852,
               "Warnings": null
             },
             "Sample": {
               "Values": [
                 0.00981,
-                0.00981,
-                0.00981,
-                0.00985,
-                0.00985,
                 0.00985,
                 0.00985,
                 0.00985,
                 0.00985,
-                0.00985,
-                0.00985,
-                0.00985,
-                0.00985,
-                0.00985,
-                0.00985,
-                0.00987,
-                0.00987,
                 0.00987,
                 0.00988,
-                0.00988,
-                0.00988,
-                0.00990,
-                0.00990,
                 0.00990,
                 0.00993,
-                0.00993,
-                0.00993,
-                0.00998,
-                0.00998,
                 0.00998
               ],
               "Thresholds": {