Skip to content

Commit 50ac90e

Browse files
committed
Update eval_aime_benchmark.py
1 parent 120ad87 commit 50ac90e

File tree

1 file changed

+1
-5
lines changed

1 file changed

+1
-5
lines changed

scripts/eval_aime_benchmark.py

Lines changed: 1 addition & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -781,11 +781,7 @@ def main(model: str, n_attempts: int, analyze_thoughts: bool = False, analyze_lo
781 781 |
782 782 |   suffix = "_" + "_".join(suffix_parts) if suffix_parts else ""
783 783 |   results_file = f"results/evaluation_results_{model.replace('/', '_')}_pass_at_{n_attempts}{suffix}.json"
784     | -
785     | - # Create raw data directory if analyzing logits
786     | - if analyze_logits:
787     | - os.makedirs("results/raw", exist_ok=True)
788     | -
    784 | +
789 785 |   dataset = load_2024_dataset()
790 786 |   existing_results = load_existing_results(results_file)
791 787 |

0 commit comments

Comments
 (0)