Add integration tests for the runner package in Flakeguard

lukaszcl · lukaszcl · commit e0487f829b9e · 2025-04-11T11:52:40.000+02:00
diff --git a/tools/flakeguard/runner/runner_integration_test.go b/tools/flakeguard/runner/runner_integration_test.go
@@ -0,0 +1,361 @@
+//go:build integration_tests
+// +build integration_tests
+
+// Integration tests for the runner package, executing real tests.
+package runner_test
+
+import (
+	"encoding/json"
+	"fmt"
+	"os"
+	"path/filepath"
+	"strings"
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+	"github.com/stretchr/testify/require"
+
+	"github.com/smartcontractkit/chainlink-testing-framework/tools/flakeguard/reports"
+	"github.com/smartcontractkit/chainlink-testing-framework/tools/flakeguard/runner"
+	// These tests exercise the real runner, executor, and parser implementations.
+)
+
+// flakyTestPackagePath is the example test package, given relative to the runner directory.
+var flakyTestPackagePath = "./example_test_package"
+
+// debugDir is the relative directory (a subdirectory of runner when the tests run there)
+// that receives the JSON results of failing subtests.
+var debugDir = "_debug_outputs_integration"
+
+// expectedTestResult describes what checkTestResults should find for one test name.
+// Pointer fields are optional: a nil pointer disables the corresponding assertion.
+type expectedTestResult struct {
+	// Outcome expectations.
+	allSuccesses, someSuccesses bool
+	allFailures, someFailures   bool
+	allSkips                    bool
+	testPanic, packagePanic     bool
+	race                        bool
+
+	// Run-count expectations; maximumRuns applies only when exactRuns is nil.
+	maximumRuns            int
+	exactRuns, minimumRuns *int
+
+	// Pass-ratio expectations.
+	exactPassRate, minimumPassRate, maximumPassRate *float64
+
+	// seen is set by checkTestResults once a result with this name has been checked.
+	seen bool
+}
+
+// TestRunIntegration runs the real runner on ./runner/example_test_package once per table entry and checks the results.
+func TestRunIntegration(t *testing.T) {
+	var (
+		zeroRuns        = 0
+		oneCount        = 1
+		defaultRunCount = 3 // Use a smaller count for faster integration tests
+		successPassRate = 1.0
+		failPassRate    = 0.0
+	)
+	testCases := []struct {
+		name           string
+		cfg            runnerConfig // arguments forwarded to runner.NewRunner
+		expectedTests  map[string]*expectedTestResult
+		expectBuildErr bool
+	}{
+		{
+			name: "default (integration)",
+			cfg: runnerConfig{
+				ProjectPath:      "../",
+				RunCount:         defaultRunCount,
+				SkipTests:        []string{"TestPanic", "TestFlakyPanic", "TestSubTestsSomePanic", "TestTimeout"},
+				GoTestCountFlag:  &oneCount, // Force count=1 internally for predictability
+				OmitOutputs:      true,
+				IgnoreSubtestErr: false,
+			},
+			expectedTests: map[string]*expectedTestResult{
+				"TestFlaky":                           {exactRuns: &defaultRunCount, someSuccesses: true, someFailures: true},
+				"TestFail":                            {exactRuns: &defaultRunCount, allFailures: true, exactPassRate: &failPassRate},
+				"TestFailLargeOutput":                 {exactRuns: &defaultRunCount, allFailures: true, exactPassRate: &failPassRate},
+				"TestPass":                            {exactRuns: &defaultRunCount, allSuccesses: true, exactPassRate: &successPassRate},
+				"TestSkipped":                         {exactRuns: &zeroRuns, allSkips: true, exactPassRate: &successPassRate},
+				"TestRace":                            {exactRuns: &defaultRunCount, allSuccesses: true, exactPassRate: &successPassRate},
+				"TestSubTestsAllPass":                 {exactRuns: &defaultRunCount, allSuccesses: true},
+				"TestSubTestsAllPass/Pass1":           {exactRuns: &defaultRunCount, allSuccesses: true},
+				"TestSubTestsAllPass/Pass2":           {exactRuns: &defaultRunCount, allSuccesses: true},
+				"TestFailInParentAfterSubTests":       {exactRuns: &defaultRunCount, allFailures: true},
+				"TestFailInParentAfterSubTests/Pass1": {exactRuns: &defaultRunCount, allSuccesses: true},
+				"TestFailInParentAfterSubTests/Pass2": {exactRuns: &defaultRunCount, allSuccesses: true},
+				"TestFailInParentBeforeSubTests":      {exactRuns: &defaultRunCount, allFailures: true},
+				"TestSubTestsAllFail":                 {exactRuns: &defaultRunCount, allFailures: true},
+				"TestSubTestsAllFail/Fail1":           {exactRuns: &defaultRunCount, allFailures: true},
+				"TestSubTestsAllFail/Fail2":           {exactRuns: &defaultRunCount, allFailures: true},
+				"TestSubTestsSomeFail":                {exactRuns: &defaultRunCount, allFailures: true},
+				"TestSubTestsSomeFail/Pass":           {exactRuns: &defaultRunCount, allSuccesses: true},
+				"TestSubTestsSomeFail/Fail":           {exactRuns: &defaultRunCount, allFailures: true},
+			},
+		},
+		{
+			name: "race (integration)",
+			cfg: runnerConfig{
+				ProjectPath:      "../", // Set ProjectPath relative to runner dir -> flakeguard dir
+				RunCount:         defaultRunCount,
+				SelectTests:      []string{"TestRace"},
+				GoTestRaceFlag:   true,
+				OmitOutputs:      true,
+				IgnoreSubtestErr: false,
+			},
+			expectedTests: map[string]*expectedTestResult{
+				"TestRace": {race: true, maximumRuns: defaultRunCount, allFailures: true}, // Races cause failures
+			},
+		},
+		// Panic, flaky-panic, subtest-panic and fail-fast scenarios follow.
+		{
+			name: "always panic (integration)",
+			cfg: runnerConfig{
+				ProjectPath:     "../",
+				RunCount:        defaultRunCount,
+				SelectTests:     []string{"TestPanic"},
+				GoTestCountFlag: &oneCount, // Force count=1 for predictability
+				OmitOutputs:     true,
+			},
+			expectedTests: map[string]*expectedTestResult{
+				"TestPanic": {packagePanic: true, testPanic: true, maximumRuns: defaultRunCount, allFailures: true},
+			},
+		},
+		{
+			name: "flaky panic (integration)",
+			cfg: runnerConfig{
+				ProjectPath:     "../",
+				RunCount:        defaultRunCount,
+				SelectTests:     []string{"TestFlakyPanic"},
+				GoTestCountFlag: &oneCount,
+				OmitOutputs:     true,
+			},
+			expectedTests: map[string]*expectedTestResult{
+				// This test panics on first run, passes on second. We run 3 times.
+				// Expect PackagePanic=true, TestPanic=true (as it panicked at least once)
+				// Expect some failures (at least 1), some successes (at least 1).
+				// Exact runs should be defaultRunCount.
+				"TestFlakyPanic": {exactRuns: &defaultRunCount, packagePanic: true, testPanic: true, someSuccesses: true, someFailures: true},
+			},
+		},
+		{
+			name: "subtest panic (integration)",
+			cfg: runnerConfig{
+				ProjectPath:     "../",
+				RunCount:        defaultRunCount,
+				SelectTests:     []string{"TestSubTestsSomePanic"},
+				GoTestCountFlag: &oneCount,
+				OmitOutputs:     true,
+			},
+			expectedTests: map[string]*expectedTestResult{
+				"TestSubTestsSomePanic":       {exactRuns: &defaultRunCount, packagePanic: true, testPanic: true, allFailures: true}, // Parent fails due to subtest panic
+				"TestSubTestsSomePanic/Pass":  {exactRuns: &defaultRunCount, packagePanic: true, testPanic: true, allFailures: true}, // Inherits panic, successes become failures
+				"TestSubTestsSomePanic/Panic": {exactRuns: &defaultRunCount, packagePanic: true, testPanic: true, allFailures: true}, // Panics directly
+			},
+		},
+		{
+			name: "failfast (integration)",
+			cfg: runnerConfig{
+				ProjectPath:     "../",
+				RunCount:        defaultRunCount, // Will try 3 times, but fail-fast stops early
+				SelectTests:     []string{"TestFail", "TestPass"},
+				GoTestCountFlag: &oneCount,
+				FailFast:        true,
+				OmitOutputs:     true,
+			},
+			expectedTests: map[string]*expectedTestResult{
+				// Only one execution attempt happens because FailFast=true and TestFail fails.
+				"TestFail": {exactRuns: &oneCount, allFailures: true},
+				"TestPass": {exactRuns: &oneCount, allSuccesses: true},
+			},
+		},
+	}
+
+	for _, tc := range testCases {
+		tc := tc // Capture range variable
+		t.Run(tc.name, func(t *testing.T) {
+			// Integration tests cannot run in parallel as they modify shared state (files),
+			// so t.Parallel() is deliberately not called here.
+
+			// Resolve the configured project path against the current working directory
+			absProjectPath, err := filepath.Abs(tc.cfg.ProjectPath)
+			require.NoError(t, err)
+
+			// Initialize runner using the constructor
+			testRunner := runner.NewRunner(
+				absProjectPath,
+				false, // Verbose off for integration tests unless debugging
+				tc.cfg.RunCount,
+				tc.cfg.GoTestCountFlag,
+				tc.cfg.GoTestRaceFlag,
+				tc.cfg.GoTestTimeoutFlag,
+				tc.cfg.Tags,
+				tc.cfg.UseShuffle,
+				tc.cfg.ShuffleSeed,
+				tc.cfg.FailFast,
+				tc.cfg.SkipTests,
+				tc.cfg.SelectTests,
+				tc.cfg.IgnoreSubtestErr,
+				tc.cfg.OmitOutputs,
+				nil, // Use default executor
+				nil, // Use default parser
+			)
+
+			// Use package path relative to the ProjectPath (flakeguard dir)
+			testResults, err := testRunner.RunTestPackages([]string{"./runner/example_test_package"})
+
+			if tc.expectBuildErr {
+				require.Error(t, err)
+				// TODO: assert the specific build error once it is known how to reach it from this package,
+				// e.g. require.ErrorIs(t, err, runner.ErrBuild) (unverified that runner exports it).
+				return
+			}
+			require.NoError(t, err)
+
+			t.Cleanup(func() { // When the subtest failed, dump the results as JSON under debugDir
+				if !t.Failed() {
+					return
+				}
+				if err := os.MkdirAll(debugDir, 0755); err != nil {
+					t.Logf("error creating directory: %v", err)
+					return
+				}
+				saniTName := strings.ReplaceAll(t.Name(), "/", "_")
+				resultsFileName := filepath.Join(debugDir, fmt.Sprintf("test_results_%s.json", saniTName))
+				jsonResults, err := json.MarshalIndent(testResults, "", "  ")
+				if err != nil {
+					t.Logf("error marshalling test report: %v", err)
+					return
+				}
+				err = os.WriteFile(resultsFileName, jsonResults, 0644) //nolint:gosec
+				if err != nil {
+					t.Logf("error writing test results: %v", err)
+					return
+				}
+				t.Logf("Saved failing test results to %s", resultsFileName)
+			})
+
+			// Compare the collected results with this case's expectations
+			checkTestResults(t, tc.expectedTests, testResults)
+		})
+	}
+}
+
+// checkTestResults compares the runner's results with the expectations of one test case.
+// Every result is checked in its own subtest and must match exactly one expectedTests entry;
+// afterwards each expectation that no result matched is reported as a failure.
+func checkTestResults(t *testing.T, expectedTests map[string]*expectedTestResult, actualResults []reports.TestResult) {
+	t.Helper()
+	assert.Equal(t, len(expectedTests), len(actualResults), "unexpected number of test results recorded")
+
+	// Names are collected in result order so the final failure message is stable across runs.
+	allTestsRun := make([]string, 0, len(actualResults))
+	for _, result := range actualResults {
+		allTestsRun = append(allTestsRun, result.TestName)
+		t.Run(fmt.Sprintf("checking results of %s", result.TestName), func(t *testing.T) {
+			expected, ok := expectedTests[result.TestName]
+			require.True(t, ok, "unexpected test name found in results: %s", result.TestName)
+			// Guard the looked-up pointer; result is a struct value and can never be nil.
+			require.NotNil(t, expected, "no expectations defined for test '%s'", result.TestName)
+			require.False(t, expected.seen, "test '%s' was seen multiple times", result.TestName)
+			expected.seen = true
+
+			if !expected.testPanic { // Panics end up wrecking durations
+				// Can't reliably assert duration length == runs if some runs panicked and didn't report duration
+				assert.False(t, result.Panic, "test '%s' should not have panicked", result.TestName)
+			}
+
+			// Run counts: maximumRuns is only enforced when exactRuns is nil.
+			if expected.minimumRuns != nil {
+				assert.GreaterOrEqual(t, result.Runs, *expected.minimumRuns, "test '%s' had fewer runs (%d) than expected minimum (%d)", result.TestName, result.Runs, *expected.minimumRuns)
+			}
+			if expected.exactRuns != nil {
+				assert.Equal(t, *expected.exactRuns, result.Runs, "test '%s' had an unexpected number of runs", result.TestName)
+			} else {
+				assert.LessOrEqual(t, result.Runs, expected.maximumRuns, "test '%s' had more runs (%d) than expected maximum (%d)", result.TestName, result.Runs, expected.maximumRuns)
+			}
+
+			// Pass ratio: minimum and maximum are inclusive bounds, like the run-count bounds above.
+			if expected.exactPassRate != nil {
+				assert.InDelta(t, *expected.exactPassRate, result.PassRatio, 0.001, "test '%s' had an unexpected pass ratio", result.TestName)
+			}
+			if expected.minimumPassRate != nil {
+				assert.GreaterOrEqual(t, result.PassRatio, *expected.minimumPassRate, "test '%s' had a pass ratio below the minimum", result.TestName)
+			}
+			if expected.maximumPassRate != nil {
+				assert.LessOrEqual(t, result.PassRatio, *expected.maximumPassRate, "test '%s' had a pass ratio above the maximum", result.TestName)
+			}
+
+			if expected.allSuccesses {
+				assert.Equal(t, result.Runs, result.Successes, "test '%s' has %d runs and should have passed all, only passed %d", result.TestName, result.Runs, result.Successes)
+				assert.Zero(t, result.Failures, "test '%s' has %d runs and should have passed all, but failed %d", result.TestName, result.Runs, result.Failures)
+				assert.False(t, result.Panic, "test '%s' should not have panicked", result.TestName)
+				assert.False(t, result.Race, "test '%s' should not have raced", result.TestName)
+			}
+			if expected.someSuccesses {
+				assert.Greater(t, result.Successes, 0, "test '%s' has %d runs and should have passed some runs, passed none", result.TestName, result.Runs)
+			}
+			if expected.allFailures {
+				assert.Equal(t, result.Runs, result.Failures, "test '%s' has %d runs and should have failed all, only failed %d", result.TestName, result.Runs, result.Failures)
+				assert.Zero(t, result.Successes, "test '%s' has %d runs and should have failed all, but succeeded %d", result.TestName, result.Runs, result.Successes)
+				// Do not assert Race == false here, a test could fail for other reasons even if race detector was on
+			}
+			if expected.packagePanic {
+				assert.True(t, result.PackagePanic, "test '%s' should have package panicked", result.TestName)
+			}
+			if expected.testPanic {
+				assert.True(t, result.Panic, "test '%s' should have panicked", result.TestName)
+				assert.True(t, result.PackagePanic, "test '%s' should have package panicked", result.TestName)
+			}
+			// A panic implies at least one failure; evaluated locally so the caller's expectation is not mutated.
+			if expected.someFailures || expected.testPanic {
+				assert.Greater(t, result.Failures, 0, "test '%s' has %d runs and should have failed some runs, failed none", result.TestName, result.Runs)
+			}
+			if expected.allSkips {
+				assert.Equal(t, 0, result.Runs, "test '%s' has %d runs and should have skipped all of them, no runs expected", result.TestName, result.Runs)
+				assert.True(t, result.Skipped, "test '%s' should be marked skipped", result.TestName)
+				assert.Zero(t, result.Successes, "test '%s' should have skipped all runs, but succeeded some", result.TestName)
+				assert.Zero(t, result.Failures, "test '%s' should have skipped all runs, but failed some", result.TestName)
+				assert.False(t, result.Panic, "test '%s' should not have panicked", result.TestName)
+				assert.False(t, result.Race, "test '%s' should not have raced", result.TestName)
+			}
+			if expected.race {
+				assert.True(t, result.Race, "test '%s' should have a data race", result.TestName)
+				// A race condition implies a failure in Go's test output
+				assert.GreaterOrEqual(t, result.Failures, 1, "test '%s' should have failed due to race", result.TestName)
+			}
+		})
+	}
+
+	// Report every expectation that no result matched. assert (not require) is used so that all
+	// missing tests are listed instead of only the first one the map iteration happens to visit.
+	for testName, expected := range expectedTests {
+		assert.True(t, expected.seen, "expected test '%s' not found in test runs\nAll tests run: %s", testName, strings.Join(allTestsRun, ", "))
+	}
+}
+
+// resultsString helper (copied from old test)
+func resultsString(result reports.TestResult) string {
+	resultCounts := result.Successes + result.Failures + result.Skips
+	return fmt.Sprintf("Runs: %d\nPanicked: %t\nRace: %t\nSuccesses: %d\nFailures: %d\nSkips: %d\nTotal Results: %d",
+		result.Runs, result.Panic, result.Race, result.Successes, result.Failures, result.Skips, resultCounts)
+}
+
+// runnerConfig bundles the runner.NewRunner arguments that vary between test cases;
+// TestRunIntegration forwards each field to the constructor.
+type runnerConfig struct {
+	ProjectPath       string // made absolute before being handed to the runner
+	RunCount          int
+	GoTestCountFlag   *int
+	GoTestRaceFlag    bool
+	GoTestTimeoutFlag string
+	Tags              []string
+	UseShuffle        bool
+	ShuffleSeed       string
+	FailFast          bool
+
+	SkipTests, SelectTests        []string
+	OmitOutputs, IgnoreSubtestErr bool
+}