Skip to content

Commit 82ec9bc

Browse files
committed
adding new models R1 and o3-mini
1 parent 1e19949 commit 82ec9bc

File tree

1 file changed

+16
-6
lines changed

1 file changed

+16
-6
lines changed

src/agentlab/llm/llm_configs.py

Lines changed: 16 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,9 +1,5 @@
1-
from agentlab.llm.chat_api import (
2-
AzureModelArgs,
3-
OpenAIModelArgs,
4-
OpenRouterModelArgs,
5-
SelfHostedModelArgs,
6-
)
1+
from agentlab.llm.chat_api import (AzureModelArgs, OpenAIModelArgs,
2+
OpenRouterModelArgs, SelfHostedModelArgs)
73

84
default_oss_llms_args = {
95
"n_retry_server": 4,
@@ -17,6 +13,13 @@
1713
]
1814

1915
CHAT_MODEL_ARGS_DICT = {
16+
"openai/o3-mini-2025-01-31": OpenAIModelArgs(
17+
model_name="o3-mini-2025-01-31",
18+
max_total_tokens=200_000,
19+
max_input_tokens=200_000,
20+
max_new_tokens=100_000,
21+
vision_support=False,
22+
),
2023
"openai/gpt-4o-mini-2024-07-18": OpenAIModelArgs(
2124
model_name="gpt-4o-mini-2024-07-18",
2225
max_total_tokens=128_000,
@@ -113,6 +116,13 @@
113116
**default_oss_llms_args,
114117
),
115118
# ---------------- OPENROUTER ----------------#
119+
"openrouter/deepseek/deepseek-r1": OpenRouterModelArgs(
120+
model_name="deepseek/deepseek-r1",
121+
max_total_tokens=128_000,
122+
max_input_tokens=100_000,
123+
max_new_tokens=128_000,
124+
temperature=1e-1,
125+
),
116126
"openrouter/meta-llama/llama-3.1-405b-instruct": OpenRouterModelArgs(
117127
model_name="meta-llama/llama-3.1-405b-instruct",
118128
max_total_tokens=128_000,

0 commit comments

Comments
 (0)