|
4 | 4 | from bgym import DEFAULT_BENCHMARKS |
5 | 5 | from dotenv import load_dotenv |
6 | 6 |
|
7 | | -from agentlab.agents.generic_agent.agent_configs import FLAGS_GPT_4o |
| 7 | +from agentlab.agents.generic_agent.agent_configs import GPT5_MINI_FLAGS |
8 | 8 | from agentlab.agents.generic_agent.generic_agent import GenericAgentArgs |
9 | 9 | from agentlab.agents.tapeagent.agent import TapeAgentArgs, load_config |
10 | 10 | from agentlab.backends.browser.mcp_playwright import MCPPlaywright |
11 | | -from agentlab.backends.browser.playwright import PlaywrightSyncBackend |
| 11 | +from agentlab.backends.browser.playwright import AsyncPlaywright |
12 | 12 | from agentlab.benchmarks.miniwob import MiniWobBenchmark |
13 | 13 | from agentlab.experiments.study import make_study |
14 | 14 | from agentlab.llm.llm_configs import CHAT_MODEL_ARGS_DICT |
|
22 | 22 | config = load_config("miniwob") |
23 | 23 |
|
24 | 24 | # benchmark = DEFAULT_BENCHMARKS["miniwob"](n_repeats=1) |
25 | | - benchmark = MiniWobBenchmark(backend=MCPPlaywright()) |
| 25 | + # benchmark = MiniWobBenchmark(backend=MCPPlaywright()) |
| 26 | + benchmark = MiniWobBenchmark(backend=AsyncPlaywright()) |
26 | 27 |
|
27 | 28 | # agent_args = GenericAgentArgs( |
28 | | - # chat_model_args=CHAT_MODEL_ARGS_DICT["openrouter/openai/gpt-5-mini"], |
29 | | - # flags=FLAGS_GPT_4o, |
| 29 | + # chat_model_args=CHAT_MODEL_ARGS_DICT["azure/gpt-5-mini-2025-08-07"], |
| 30 | + # flags=GPT5_MINI_FLAGS, |
30 | 31 | # ) |
31 | 32 | # agent_args.flags.obs.use_ax_tree = False |
32 | 33 | # agent_args.flags.obs.use_html = True |
|
0 commit comments