Skip to content

Commit 5c8d627

Browse files
gasse and TLSDC authored
Max new tokens fix (#118)
* Lower max_new_tokens for OpenAI models
* updating configs

---------

Co-authored-by: Thibault LSDC <[email protected]>
Co-authored-by: ThibaultLSDC <[email protected]>
1 parent 1196455 commit 5c8d627

File tree

1 file changed

+21
-21
lines changed

1 file changed

+21
-21
lines changed

src/agentlab/llm/llm_configs.py

Lines changed: 21 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -20,41 +20,41 @@
2020
"openai/gpt-4o-mini-2024-07-18": OpenAIModelArgs(
2121
model_name="gpt-4o-mini-2024-07-18",
2222
max_total_tokens=128_000,
23-
max_input_tokens=100_000,
24-
max_new_tokens=28_000,
23+
max_input_tokens=128_000,
24+
max_new_tokens=16_384,
2525
vision_support=True,
2626
),
2727
"openai/gpt-4-1106-preview": OpenAIModelArgs(
2828
model_name="gpt-4-1106-preview",
2929
max_total_tokens=128_000,
30-
max_input_tokens=100_000,
31-
max_new_tokens=28_000,
30+
max_input_tokens=128_000,
31+
max_new_tokens=4_096,
3232
),
3333
"openai/gpt-4-vision-preview": OpenAIModelArgs(
3434
model_name="gpt-4-vision-preview",
3535
max_total_tokens=128_000,
36-
max_input_tokens=100_000,
37-
max_new_tokens=28_000, # I think this model has very small default value if we don't set max_new_tokens
36+
max_input_tokens=128_000,
37+
max_new_tokens=16_384, # I think this model has very small default value if we don't set max_new_tokens
3838
vision_support=True,
3939
),
4040
"openai/gpt-4o-2024-05-13": OpenAIModelArgs(
4141
model_name="gpt-4o-2024-05-13",
4242
max_total_tokens=128_000,
43-
max_input_tokens=100_000,
44-
max_new_tokens=28_000, # I think this model has very small default value if we don't set max_new_tokens
43+
max_input_tokens=128_000,
44+
max_new_tokens=4_096, # I think this model has very small default value if we don't set max_new_tokens
4545
vision_support=True,
4646
),
4747
"openai/gpt-3.5-turbo-0125": OpenAIModelArgs(
4848
model_name="gpt-3.5-turbo-0125",
4949
max_total_tokens=16_384,
50-
max_input_tokens=15_000,
51-
max_new_tokens=1_000,
50+
max_input_tokens=16_384,
51+
max_new_tokens=4096,
5252
),
5353
"openai/gpt-3.5-turbo-1106": OpenAIModelArgs(
5454
model_name="gpt-3.5-turbo-1106",
5555
max_total_tokens=16_384,
56-
max_input_tokens=15_000,
57-
max_new_tokens=1_000,
56+
max_input_tokens=16_384,
57+
max_new_tokens=4096,
5858
),
5959
"azure/gpt-35-turbo/gpt-35-turbo": AzureModelArgs(
6060
model_name="gpt-35-turbo",
@@ -68,23 +68,23 @@
6868
deployment_name="gpt-4o-2024-05-13",
6969
max_total_tokens=128_000,
7070
max_input_tokens=100_000,
71-
max_new_tokens=28_000,
71+
max_new_tokens=16_384,
7272
vision_support=True,
7373
),
7474
"azure/gpt-4o-2024-08-06": AzureModelArgs(
7575
model_name="gpt-4o",
7676
deployment_name="gpt-4o-2024-08-06",
7777
max_total_tokens=128_000,
78-
max_input_tokens=100_000,
79-
max_new_tokens=28_000,
78+
max_input_tokens=128_000,
79+
max_new_tokens=16_384,
8080
vision_support=True,
8181
),
8282
"azure/gpt-4o-mini-2024-07-18": AzureModelArgs(
8383
model_name="gpt-4o-mini",
8484
deployment_name="gpt-4o-mini-2024-07-18",
8585
max_total_tokens=128_000,
86-
max_input_tokens=100_000,
87-
max_new_tokens=28_000,
86+
max_input_tokens=128_000,
87+
max_new_tokens=16_384,
8888
vision_support=True,
8989
),
9090
# ---------------- OSS LLMs ----------------#
@@ -151,8 +151,8 @@
151151
"openrouter/anthropic/claude-3.5-sonnet:beta": OpenRouterModelArgs(
152152
model_name="anthropic/claude-3.5-sonnet:beta",
153153
max_total_tokens=200_000,
154-
max_input_tokens=160_000,
155-
max_new_tokens=40_000,
154+
max_input_tokens=200_000,
155+
max_new_tokens=8_192,
156156
temperature=1e-1,
157157
vision_support=True,
158158
),
@@ -166,8 +166,8 @@
166166
"openrouter/openai/o1-mini-2024-09-12": OpenRouterModelArgs(
167167
model_name="openai/o1-mini-2024-09-12",
168168
max_total_tokens=128_000,
169-
max_input_tokens=100_000,
170-
max_new_tokens=28_000,
169+
max_input_tokens=128_000,
170+
max_new_tokens=64_000,
171171
temperature=1e-1,
172172
),
173173
}

0 commit comments

Comments
 (0)