Skip to content

Commit 910d3b3

Browse files
committed
Update eval_aime_benchmark.py
1 parent eb9ca3a commit 910d3b3

File tree

1 file changed

+1
-2
lines changed

1 file changed

+1
-2
lines changed

scripts/eval_aime_benchmark.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -104,11 +104,10 @@ def get_llm_response(problem: str, model: str) -> Union[str, List[Dict]]:
104 104       try:
105 105           response = client.with_options(timeout=1000.0).chat.completions.create(
106 106               model=model,
107     -             temperature=0.2,
108 107               messages=[
109 108                   {"role": "user", "content": SYSTEM_PROMPT + problem}
110 109               ],
111     -             max_tokens=40000,
    110 +             max_tokens=8192,
112 111           )
113 112
114 113           # If there's more than one choice, format as attempts

0 commit comments

Comments (0)