File tree Expand file tree Collapse file tree 5 files changed +30
-5
lines changed Expand file tree Collapse file tree 5 files changed +30
-5
lines changed Original file line number Diff line number Diff line change 2121 - name : Set up Python
2222 uses : actions/setup-python@v5
2323 with :
24- python-version : ' 3.10 '
24+ python-version : ' 3.11 '
2525 cache : ' pip' # caching pip dependencies
2626
2727 - name : Pip install
3131 run : pip list
3232
3333 - name : Code Formatting
34- run : black . --check
34+ run : black . --check --diff
Original file line number Diff line number Diff line change 1515 RANDOM_SEARCH_AGENT ,
1616 AGENT_4o ,
1717 AGENT_4o_MINI ,
18+ AGENT_CLAUDE_SONNET_35 ,
1819 AGENT_4o_VISION ,
20+ AGENT_4o_MINI_VISION ,
21+ AGENT_CLAUDE_SONNET_35_VISION ,
1922)
2023
2124__all__ = [
2831 "AGENT_8B" ,
2932 "RANDOM_SEARCH_AGENT" ,
3033 "AGENT_CUSTOM" ,
34+ "AGENT_CLAUDE_SONNET_35" ,
35+ "AGENT_4o_VISION" ,
36+ "AGENT_4o_MINI_VISION" ,
37+ "AGENT_CLAUDE_SONNET_35_VISION" ,
3138]
Original file line number Diff line number Diff line change 260260 chat_model_args = CHAT_MODEL_ARGS_DICT ["openai/gpt-4o-mini-2024-07-18" ],
261261 flags = FLAGS_GPT_4o ,
262262)
263+ AGENT_CLAUDE_SONNET_35 = GenericAgentArgs (
264+ chat_model_args = CHAT_MODEL_ARGS_DICT ["openrouter/anthropic/claude-3.5-sonnet:beta" ],
265+ flags = FLAGS_GPT_4o ,
266+ )
263267
264268# GPT-4o vision default config
265269FLAGS_GPT_4o_VISION = FLAGS_GPT_4o .copy ()
271275 flags = FLAGS_GPT_4o_VISION ,
272276)
273277
278+ AGENT_4o_MINI_VISION = GenericAgentArgs (
279+ chat_model_args = CHAT_MODEL_ARGS_DICT ["openai/gpt-4o-mini-2024-07-18" ],
280+ flags = FLAGS_GPT_4o_VISION ,
281+ )
282+
283+ AGENT_CLAUDE_SONNET_35_VISION = GenericAgentArgs (
284+ chat_model_args = CHAT_MODEL_ARGS_DICT ["openrouter/anthropic/claude-3.5-sonnet:beta" ],
285+ flags = FLAGS_GPT_4o_VISION ,
286+ )
287+
274288
275289DEFAULT_RS_FLAGS = GenericPromptFlags (
276290 flag_group = "default_rs" ,
Original file line number Diff line number Diff line change 55This module contains the classes and functions to reproduce the results of a
66study. It is used to create a new study that will run the same experiments as
77the original study, but with a reproducibility agent that will mimic the same
8- answers as the original agent.
8+ answers as the original agent.
99
1010Stats are collected to compare the original agent's answers with the new agent's
1111answers. Load this reproducibility study in agent-xray to compare the results.
Original file line number Diff line number Diff line change 1- from agentlab .llm .chat_api import (AzureModelArgs , OpenAIModelArgs ,
2- OpenRouterModelArgs , SelfHostedModelArgs )
1+ from agentlab .llm .chat_api import (
2+ AzureModelArgs ,
3+ OpenAIModelArgs ,
4+ OpenRouterModelArgs ,
5+ SelfHostedModelArgs ,
6+ )
37
48default_oss_llms_args = {
59 "n_retry_server" : 4 ,
You can’t perform that action at this time.
0 commit comments