|
20 | 20 | "openai/gpt-4o-mini-2024-07-18": OpenAIModelArgs( |
21 | 21 | model_name="gpt-4o-mini-2024-07-18", |
22 | 22 | max_total_tokens=128_000, |
23 | | - max_input_tokens=100_000, |
24 | | - max_new_tokens=28_000, |
| 23 | + max_input_tokens=128_000, |
| 24 | + max_new_tokens=16_384, |
25 | 25 | vision_support=True, |
26 | 26 | ), |
27 | 27 | "openai/gpt-4-1106-preview": OpenAIModelArgs( |
28 | 28 | model_name="gpt-4-1106-preview", |
29 | 29 | max_total_tokens=128_000, |
30 | | - max_input_tokens=100_000, |
31 | | - max_new_tokens=28_000, |
| 30 | + max_input_tokens=128_000, |
| 31 | + max_new_tokens=4_096, |
32 | 32 | ), |
33 | 33 | "openai/gpt-4-vision-preview": OpenAIModelArgs( |
34 | 34 | model_name="gpt-4-vision-preview", |
35 | 35 | max_total_tokens=128_000, |
36 | | - max_input_tokens=100_000, |
37 | | - max_new_tokens=28_000, # I think this model has very small default value if we don't set max_new_tokens |
| 36 | + max_input_tokens=128_000, |
| 37 | + max_new_tokens=16_384, # I think this model has very small default value if we don't set max_new_tokens |
38 | 38 | vision_support=True, |
39 | 39 | ), |
40 | 40 | "openai/gpt-4o-2024-05-13": OpenAIModelArgs( |
41 | 41 | model_name="gpt-4o-2024-05-13", |
42 | 42 | max_total_tokens=128_000, |
43 | | - max_input_tokens=100_000, |
44 | | - max_new_tokens=28_000, # I think this model has very small default value if we don't set max_new_tokens |
| 43 | + max_input_tokens=128_000, |
| 44 | + max_new_tokens=4_096, # I think this model has very small default value if we don't set max_new_tokens |
45 | 45 | vision_support=True, |
46 | 46 | ), |
47 | 47 | "openai/gpt-3.5-turbo-0125": OpenAIModelArgs( |
48 | 48 | model_name="gpt-3.5-turbo-0125", |
49 | 49 | max_total_tokens=16_384, |
50 | | - max_input_tokens=15_000, |
51 | | - max_new_tokens=1_000, |
| 50 | + max_input_tokens=16_384, |
| 51 | + max_new_tokens=4096, |
52 | 52 | ), |
53 | 53 | "openai/gpt-3.5-turbo-1106": OpenAIModelArgs( |
54 | 54 | model_name="gpt-3.5-turbo-1106", |
55 | 55 | max_total_tokens=16_384, |
56 | | - max_input_tokens=15_000, |
57 | | - max_new_tokens=1_000, |
| 56 | + max_input_tokens=16_384, |
| 57 | + max_new_tokens=4096, |
58 | 58 | ), |
59 | 59 | "azure/gpt-35-turbo/gpt-35-turbo": AzureModelArgs( |
60 | 60 | model_name="gpt-35-turbo", |
|
68 | 68 | deployment_name="gpt-4o-2024-05-13", |
69 | 69 | max_total_tokens=128_000, |
70 | 70 | max_input_tokens=100_000, |
71 | | - max_new_tokens=28_000, |
| 71 | + max_new_tokens=16_384, |
72 | 72 | vision_support=True, |
73 | 73 | ), |
74 | 74 | "azure/gpt-4o-2024-08-06": AzureModelArgs( |
75 | 75 | model_name="gpt-4o", |
76 | 76 | deployment_name="gpt-4o-2024-08-06", |
77 | 77 | max_total_tokens=128_000, |
78 | | - max_input_tokens=100_000, |
79 | | - max_new_tokens=28_000, |
| 78 | + max_input_tokens=128_000, |
| 79 | + max_new_tokens=16_384, |
80 | 80 | vision_support=True, |
81 | 81 | ), |
82 | 82 | "azure/gpt-4o-mini-2024-07-18": AzureModelArgs( |
83 | 83 | model_name="gpt-4o-mini", |
84 | 84 | deployment_name="gpt-4o-mini-2024-07-18", |
85 | 85 | max_total_tokens=128_000, |
86 | | - max_input_tokens=100_000, |
87 | | - max_new_tokens=28_000, |
| 86 | + max_input_tokens=128_000, |
| 87 | + max_new_tokens=16_384, |
88 | 88 | vision_support=True, |
89 | 89 | ), |
90 | 90 | # ---------------- OSS LLMs ----------------# |
|
151 | 151 | "openrouter/anthropic/claude-3.5-sonnet:beta": OpenRouterModelArgs( |
152 | 152 | model_name="anthropic/claude-3.5-sonnet:beta", |
153 | 153 | max_total_tokens=200_000, |
154 | | - max_input_tokens=160_000, |
155 | | - max_new_tokens=40_000, |
| 154 | + max_input_tokens=200_000, |
| 155 | + max_new_tokens=8_192, |
156 | 156 | temperature=1e-1, |
157 | 157 | vision_support=True, |
158 | 158 | ), |
|
166 | 166 | "openrouter/openai/o1-mini-2024-09-12": OpenRouterModelArgs( |
167 | 167 | model_name="openai/o1-mini-2024-09-12", |
168 | 168 | max_total_tokens=128_000, |
169 | | - max_input_tokens=100_000, |
170 | | - max_new_tokens=28_000, |
| 169 | + max_input_tokens=128_000, |
| 170 | + max_new_tokens=64_000, |
171 | 171 | temperature=1e-1, |
172 | 172 | ), |
173 | 173 | } |
0 commit comments