Skip to content

Commit 5f675ba

Browse files
committed
Merge branch 'main' of github.com:ServiceNow/AgentLab into tlsdc/tool_use_agent
2 parents 8a17470 + f041e64 commit 5f675ba

File tree

7 files changed

+30
-4
lines changed

7 files changed

+30
-4
lines changed

README.md

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -275,6 +275,15 @@ dynamic benchmarks.
275275
between the two executions. **Note**: this is a beta feature and will need some adaptation for your
276276
own agent.
277277

278+
## Variables
279+
Here's a list of the relevant environment variables used by AgentLab:
280+
- `OPENAI_API_KEY`, used by default for OpenAI LLMs.
281+
- `AZURE_OPENAI_API_KEY`, used by default for AzureOpenAI LLMs.
282+
- `AZURE_OPENAI_ENDPOINT` to specify your Azure endpoint.
283+
- `OPENAI_API_VERSION` for the Azure API.
284+
- `OPENROUTER_API_KEY` for the OpenRouter API.
285+
- `AGENTLAB_EXP_ROOT`, desired path for your experiments to be stored, defaults to `~/agentlab-results`.
286+
- `AGENTXRAY_SHARE_GRADIO`, which prompts AgentXRay to open a public tunnel on launch.
278287

279288
## Misc
280289

pyproject.toml

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -13,10 +13,11 @@ authors = [
1313
{name = "Alex Lacoste", email = "[email protected]"},
1414
{name = "Tom Marty", email = "[email protected]"},
1515
{name = "Massimo Caccia", email = "[email protected]"},
16-
{name = "Thibault Le Sellier de Chezelles", email = "[email protected]"}
16+
{name = "Thibault Le Sellier de Chezelles", email = "[email protected]"},
17+
{name = "Aman Jaiswal", email = "[email protected]"},
1718
]
1819
readme = "README.md"
19-
requires-python = ">3.7"
20+
requires-python = ">3.10"
2021
license = {text = "Apache-2.0"}
2122
classifiers = [
2223
"Development Status :: 2 - Pre-Alpha",

reproducibility_journal.csv

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -74,3 +74,5 @@ Leo Boisvert,GenericAgent-openai_o1-mini-2024-09-12,workarena_l1,0.4.1,2025-02-0
7474
M: src/agentlab/analyze/agent_xray.py
7575
M: src/agentlab/llm/llm_configs.py",0.13.3,1d2d7160e5b7ec9954ecb48988f71eb56288dd29,"
7676
Leo Boisvert,GenericAgent-anthropic_claude-3.7-sonnet,workarena_l1,0.4.1,2025-02-25_02-32-09,d4f900c2-1de1-4e4b-a3ab-495ff2675fff,0.515,0.028,0,330/330,None,Linux (#68-Ubuntu SMP Mon Oct 7 14:34:20 UTC 2024),3.12.3,1.44.0,v0.4.0,c9d2ef9648435ef1119950ecb1a0734497ccc33b,,0.13.3,1d2d7160e5b7ec9954ecb48988f71eb56288dd29,
77+
agentlabtraces,GenericAgent-meta-llama_llama-4-maverick,workarena_l1,0.4.1,2025-04-14_17-15-56,a6dc4022-2bb7-4b46-8b37-f62c010defc1,0.27,0.024,0,330/330,None,Linux (#135-Ubuntu SMP Fri Sep 27 13:53:58 UTC 2024),3.12.7,1.39.0,v0.4.0,5eb2ecb5e5b293170230bcbed8b17fe192af214a,,0.13.3,70dac253628c476aff1af6a975f27f8563453ad2,
78+
agentlabtraces,GenericAgent-meta-llama_llama-4-maverick,workarena_l2_agent_curriculum_eval,0.4.1,2025-04-22_15-38-44,d62fed39-caac-4ef3-92ac-b29897c69f88,0.085,0.018,1,235/235,None,Linux (#68-Ubuntu SMP Mon Oct 7 14:34:20 UTC 2024),3.12.7,1.39.0,v0.4.0,43bafbcfbe398fca39e4ffdc57b2f226d2c6d3e1,,0.13.3,70dac253628c476aff1af6a975f27f8563453ad2,

src/agentlab/agents/generic_agent/__init__.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,7 @@
1010
AGENT_3_5,
1111
AGENT_8B,
1212
AGENT_CUSTOM,
13+
AGENT_LLAMA4_17B_INSTRUCT,
1314
AGENT_LLAMA3_70B,
1415
AGENT_LLAMA31_70B,
1516
RANDOM_SEARCH_AGENT,
@@ -31,6 +32,7 @@
3132
"AGENT_4o_VISION",
3233
"AGENT_o3_MINI",
3334
"AGENT_o1_MINI",
35+
"AGENT_LLAMA4_17B_INSTRUCT",
3436
"AGENT_LLAMA3_70B",
3537
"AGENT_LLAMA31_70B",
3638
"AGENT_8B",

src/agentlab/agents/generic_agent/agent_configs.py

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,7 @@
1111

1212
from .generic_agent import GenericAgentArgs
1313
from .generic_agent_prompt import GenericPromptFlags
14+
from .tmlr_config import BASE_FLAGS
1415

1516
FLAGS_CUSTOM = GenericPromptFlags(
1617
obs=dp.ObsFlags(
@@ -297,7 +298,10 @@
297298
chat_model_args=CHAT_MODEL_ARGS_DICT["openrouter/anthropic/claude-3.5-sonnet:beta"],
298299
flags=FLAGS_GPT_4o_VISION,
299300
)
300-
301+
AGENT_LLAMA4_17B_INSTRUCT = GenericAgentArgs(
302+
chat_model_args=CHAT_MODEL_ARGS_DICT["openrouter/meta-llama/llama-4-maverick"],
303+
flags=BASE_FLAGS,
304+
)
301305

302306
DEFAULT_RS_FLAGS = GenericPromptFlags(
303307
flag_group="default_rs",

src/agentlab/analyze/agent_xray.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -551,7 +551,7 @@ def tag_screenshot_with_action(screenshot: Image, action: str) -> Image:
551551
try:
552552
coords = action[action.index("(") + 1 : action.index(")")].split(",")
553553
coords = [c.strip() for c in coords]
554-
if len(coords) != 2:
554+
if len(coords) not in [2, 3]:
555555
raise ValueError(f"Invalid coordinate format: {coords}")
556556
if coords[0].startswith("x="):
557557
coords[0] = coords[0][2:]

src/agentlab/llm/llm_configs.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -155,6 +155,14 @@
155155
max_new_tokens=28_000,
156156
temperature=1e-1,
157157
),
158+
"openrouter/meta-llama/llama-4-maverick": OpenRouterModelArgs(
159+
model_name="meta-llama/llama-4-maverick",
160+
max_total_tokens=128_000,
161+
max_input_tokens=100_000,
162+
max_new_tokens=28_000,
163+
temperature=1e-1,
164+
vision_support=True,
165+
),
158166
"openrouter/meta-llama/llama-3.1-8b-instruct:free": OpenRouterModelArgs(
159167
model_name="meta-llama/llama-3.1-8b-instruct:free",
160168
max_total_tokens=128_000,

0 commit comments

Comments
 (0)