We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent e34a1be, commit 7ce1e13 (Copy full SHA for 7ce1e13)
examples/scaffolding/run_majority_vote_aime24.py
@@ -116,10 +116,15 @@ def main():
116
print(
117
f'Controller {controller_name} Accuracy: {correct_count} out of {total_count}'
118
)
119
+
120
if args.threshold is not None:
- assert correct_count >= args.threshold * total_count, \
121
+ accuracy = correct_count / total_count
122
+ if accuracy < args.threshold:
123
+ print(
124
f'Accuracy check failed with {correct_count}/{total_count} < {args.threshold}'
- print(f'Accuracy check passed with threshold={args.threshold}')
125
+ )
126
+ else:
127
+ print(f'Accuracy check passed with threshold={args.threshold}')
128
129
if args.static_with_benchmark:
130
print(f'Total time: {total_time}')
0 commit comments