Skip to content

Commit e1d8fe0

Browse files
Merge pull request #259 from codeflash-ai/increase-the-min-test-case-passed
increase the min number of test cases passed
2 parents e18dcde + 9080051 commit e1d8fe0

File tree

3 files changed

+13
-9
lines changed

3 files changed

+13
-9
lines changed

codeflash/code_utils/config_consts.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -8,3 +8,4 @@
88
N_TESTS_TO_GENERATE = 2
99
TOTAL_LOOPING_TIME = 10.0 # 10 second candidate benchmarking budget
1010
COVERAGE_THRESHOLD = 60.0
11+
MIN_TESTCASE_PASSED_THRESHOLD = 6

codeflash/result/critic.py

Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,11 @@
44

55
from codeflash.cli_cmds.console import logger
66
from codeflash.code_utils import env_utils
7-
from codeflash.code_utils.config_consts import COVERAGE_THRESHOLD, MIN_IMPROVEMENT_THRESHOLD
7+
from codeflash.code_utils.config_consts import (
8+
COVERAGE_THRESHOLD,
9+
MIN_IMPROVEMENT_THRESHOLD,
10+
MIN_TESTCASE_PASSED_THRESHOLD,
11+
)
812
from codeflash.models.models import TestType
913

1014
if TYPE_CHECKING:
@@ -50,7 +54,7 @@ def quantity_of_tests_critic(candidate_result: OptimizedCandidateResult) -> bool
5054
for test_type in report:
5155
pass_count += report[test_type]["passed"]
5256

53-
if pass_count >= 4:
57+
if pass_count >= MIN_TESTCASE_PASSED_THRESHOLD:
5458
return True
5559
# If only one test passed, check if it's a REPLAY_TEST
5660
return bool(pass_count == 1 and report[TestType.REPLAY_TEST]["passed"] == 1)

tests/test_critic.py

Lines changed: 6 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -195,8 +195,7 @@ def test_generated_test_critic() -> None:
195195
timed_out=False,
196196
loop_index=1,
197197
)
198-
199-
test_results = [test_1, test_2, test_3, test_7]
198+
test_results = [test_1, test_2, test_3, test_4, test_5, test_6, test_7, test_1]
200199

201200
candidate_result = OptimizedCandidateResult(
202201
max_loop_count=5,
@@ -209,7 +208,7 @@ def test_generated_test_critic() -> None:
209208

210209
assert quantity_of_tests_critic(candidate_result)
211210

212-
test_results = [test_1, test_2, test_3, test_6, test_7]
211+
test_results = [test_1, test_2, test_3, test_6, test_7, test_1, test_4, test_1]
213212

214213
candidate_result = OptimizedCandidateResult(
215214
max_loop_count=5,
@@ -222,7 +221,7 @@ def test_generated_test_critic() -> None:
222221

223222
assert quantity_of_tests_critic(candidate_result)
224223

225-
test_results = [test_1, test_3, test_4, test_2, test_7]
224+
test_results = [test_1, test_3, test_4, test_2, test_7, test_1, test_6, test_1]
226225

227226
candidate_result = OptimizedCandidateResult(
228227
max_loop_count=5,
@@ -248,7 +247,7 @@ def test_generated_test_critic() -> None:
248247

249248
assert not quantity_of_tests_critic(candidate_result)
250249

251-
test_results = [test_1, test_2, test_3, test_4, test_5]
250+
test_results = [test_1, test_2, test_3, test_4, test_5, test_1, test_1, test_1]
252251

253252
candidate_result = OptimizedCandidateResult(
254253
max_loop_count=5,
@@ -287,7 +286,7 @@ def test_generated_test_critic() -> None:
287286

288287
assert quantity_of_tests_critic(candidate_result)
289288

290-
test_results = [test_1, test_2, test_3, test_4, test_5]
289+
test_results = [test_1, test_2, test_3, test_4, test_5, test_1, test_1, test_1]
291290

292291
candidate_result = OptimizedCandidateResult(
293292
max_loop_count=5,
@@ -328,7 +327,7 @@ def test_generated_test_critic() -> None:
328327

329328
assert not quantity_of_tests_critic(candidate_result)
330329

331-
test_results = [test_1, test_2, test_3, test_5]
330+
test_results = [test_1, test_2, test_3, test_5, test_1, test_1, test_1, test_1]
332331

333332
candidate_result = OptimizedCandidateResult(
334333
max_loop_count=5,

0 commit comments

Comments
 (0)