wip

lukaszcl · lukaszcl · commit 21bc9278f67d · 2025-02-24T17:47:53.000+01:00
diff --git a/tools/flakeguard/runner/example_test_package/example_tests_test.go b/tools/flakeguard/runner/example_test_package/example_tests_test.go
@@ -212,3 +212,107 @@ func TestTimeout(t *testing.T) {
 	time.Sleep(time.Until(deadline))
 	t.Logf("This test should have timed out")
 }
+
+// TestParentNoSubtests is fixture 1: a parallel test with no subtests that only logs and never fails.
+func TestParentNoSubtests(t *testing.T) {
+	t.Parallel()
+
+	t.Log("No subtests, just a single test that passes.")
+	// (Optional) swap in t.Fail() or t.Fatal() here to make this fixture produce a failure instead.
+}
+
+// TestParentAllPassSubtests is fixture 2: the parent never fails itself and both parallel subtests only log.
+func TestParentAllPassSubtests(t *testing.T) {
+	t.Parallel()
+	t.Log("Parent does not fail, subtests all pass")
+
+	t.Run("SubtestA", func(t *testing.T) {
+		t.Parallel()
+		t.Log("passes")
+	})
+	t.Run("SubtestB", func(t *testing.T) {
+		t.Parallel()
+		t.Log("passes")
+	})
+}
+
+// TestParentAllFailSubtests is fixture 3: the parent never fails itself, but both parallel subtests call t.Fatal.
+func TestParentAllFailSubtests(t *testing.T) {
+	t.Parallel()
+	t.Log("Parent does not fail, subtests all fail => typically the parent is marked fail by Go")
+
+	t.Run("FailA", func(t *testing.T) {
+		t.Parallel()
+		t.Fatal("This subtest always fails")
+	})
+	t.Run("FailB", func(t *testing.T) {
+		t.Parallel()
+		t.Fatal("This subtest always fails")
+	})
+}
+
+// TestParentSomeFailSubtests is fixture 4: subtest "Pass" only logs, subtest "Fail" calls t.Fatal, and the parent never fails itself.
+func TestParentSomeFailSubtests(t *testing.T) {
+	t.Parallel()
+	t.Log("Parent does not fail, subtests partially pass/fail => parent is typically fail unless 'zeroOutParentFailsIfSubtestOnlyFails' modifies it")
+
+	t.Run("Pass", func(t *testing.T) {
+		t.Parallel()
+		t.Log("This subtest passes")
+	})
+	t.Run("Fail", func(t *testing.T) {
+		t.Parallel()
+		t.Fatal("This subtest fails")
+	})
+}
+
+// TestParentOwnFailAfterSubtests is fixture 5: both subtests only log, and the parent itself calls t.Fatal after the t.Run calls.
+func TestParentOwnFailAfterSubtests(t *testing.T) {
+	t.Parallel()
+	t.Log("Parent fails after subtests pass => genuine parent-level failure")
+
+	t.Run("Pass1", func(t *testing.T) {
+		t.Parallel()
+		t.Log("This subtest always passes")
+	})
+	t.Run("Pass2", func(t *testing.T) {
+		t.Parallel()
+		t.Log("This subtest always passes")
+	})
+
+	// Parent-level failure. t.Run returns once a subtest calls t.Parallel (see testing docs), so this may execute before the subtest bodies complete.
+	t.Fatal("Parent test fails after subtests pass")
+}
+
+// TestParentOwnFailBeforeSubtests is fixture 6: the parent calls t.Fatal (which stops the test function) before its only t.Run, so that subtest is declared but never reached.
+func TestParentOwnFailBeforeSubtests(t *testing.T) {
+	t.Parallel()
+	t.Log("Parent fails before subtests => subtests might not even run in real usage, or still get reported, depending on concurrency")
+
+	t.Fatal("Parent test fails immediately")
+
+	t.Run("WouldPassButNeverRuns", func(t *testing.T) {
+		t.Parallel()
+		t.Log("Normally passes, but might not even run now.")
+	})
+}
+
+// TestNestedSubtests is fixture 7: parent -> Level1 -> {Level2Pass, Level2Fail}; only the grandchild Level2Fail calls t.Fatal.
+func TestNestedSubtests(t *testing.T) {
+	t.Parallel()
+	t.Log("Deep nesting example")
+
+	t.Run("Level1", func(t *testing.T) {
+		t.Parallel()
+
+		t.Run("Level2Pass", func(t *testing.T) {
+			t.Parallel()
+			t.Log("This sub-subtest passes")
+		})
+
+		t.Run("Level2Fail", func(t *testing.T) {
+			t.Parallel()
+			t.Fatal("This sub-subtest fails")
+		})
+	})
+}
diff --git a/tools/flakeguard/runner/runner.go b/tools/flakeguard/runner/runner.go
@@ -565,6 +565,10 @@ func (r *Runner) parseTestResults(filePaths []string) ([]reports.TestResult, err
 			log.Warn().Str("parent test", parentTestKey).Msg("expected parent test not found")
 		}
 	}
+
+	// Zero out parent test's failures if they are purely caused by subtest fails
+	zeroOutParentFailsIfSubtestOnlyFails(testDetails, testsWithSubTests)
+
 	for _, result := range testDetails {
 		if result.Runs > expectedRuns { // Panics can introduce double-counting test failures, this is a correction for it
 			if result.Panic {
@@ -595,6 +599,87 @@ func (r *Runner) parseTestResults(filePaths []string) ([]reports.TestResult, err
 	return results, nil
 }
 
+// zeroOutParentFailsIfSubtestOnlyFails clears failures recorded against parent tests
+// when every failure line attributed to the parent points at one of its subtests.
+//
+// testsWithSubTests maps a key of testDetails to the names of that parent's subtests;
+// keys with no entry in testDetails, and parents with zero Failures, are left untouched.
+// testDetails entries are modified in place and nothing is returned.
+//
+// A line in the parent's FailedOutputs counts as a genuine parent-level failure only if it
+// contains the parent's TestName, is not the parent's own "--- FAIL: <name> (" summary, and
+// does not contain "<name>/<subtest>" for any listed subtest. When no such line exists the
+// failed runs are removed from Runs, Failures becomes 0, Successes is capped at Runs,
+// PassRatio is recomputed (1 when no runs remain) and FailedOutputs is emptied.
+//
+// NOTE(review): lines without the parent's name are skipped, so a parent-level message such
+// as "file_test.go:78: some failure" never counts as a genuine failure; confirm intent.
+func zeroOutParentFailsIfSubtestOnlyFails(
+	testDetails map[string]*reports.TestResult,
+	testsWithSubTests map[string][]string,
+) {
+	for key, children := range testsWithSubTests {
+		parent, found := testDetails[key]
+		if !found || parent.Failures == 0 {
+			continue // unknown parent, or nothing to correct
+		}
+
+		// The parent's own result line, e.g. "--- FAIL: TestNestedSubtests (0.00s)".
+		summaryPrefix := "--- FAIL: " + parent.TestName + " ("
+
+		// namesChild reports whether line mentions "<parent>/<subtest>" for a listed subtest,
+		// e.g. "TestNestedSubtests/Level1".
+		namesChild := func(line string) bool {
+			for _, child := range children {
+				if strings.Contains(line, parent.TestName+"/"+child) {
+					return true
+				}
+			}
+			return false
+		}
+
+		// Look through every run's captured lines; one genuine parent line is enough to stop.
+		ownFailure := false
+	scan:
+		for _, lines := range parent.FailedOutputs {
+			for _, line := range lines {
+				switch {
+				case !strings.Contains(line, parent.TestName):
+					// No mention of the parent at all: treated as subtest detail.
+				case strings.HasPrefix(line, summaryPrefix):
+					// The summary line alone does not prove a parent-level failure.
+				case namesChild(line):
+					// Explicitly attributed to one of the subtests.
+				default:
+					ownFailure = true
+					break scan
+				}
+			}
+		}
+		if ownFailure {
+			continue // keep the parent's failures as recorded
+		}
+
+		// Drop the failed runs from the totals rather than converting them to successes.
+		parent.Runs -= parent.Failures
+		parent.Failures = 0
+
+		// Cap Successes at the remaining run count.
+		if parent.Successes > parent.Runs {
+			parent.Successes = parent.Runs
+		}
+
+		// With no runs left the parent is reported as fully passing.
+		parent.PassRatio = 1
+		if parent.Runs > 0 {
+			parent.PassRatio = float64(parent.Successes) / float64(parent.Runs)
+		}
+
+		// Replace the map so none of the old failure output remains.
+		parent.FailedOutputs = make(map[string][]string)
+	}
+}
+
 // attributePanicToTest properly attributes panics to the test that caused them.
 func attributePanicToTest(panicPackage string, panicEntries []entry) (test string, timeout bool, err error) {
 	regexSanitizePanicPackage := filepath.Base(panicPackage)
diff --git a/tools/flakeguard/runner/runner_test.go b/tools/flakeguard/runner/runner_test.go