1- from abc import ABC , abstractmethod
21import gzip
32import logging
43import pickle
1817from agentlab .experiments .exp_utils import RESULTS_DIR , add_dependencies
1918from agentlab .experiments .launch_exp import find_incomplete , non_dummy_count , run_experiments
2019
21-
2220logger = logging .getLogger (__name__ )
2321
2422
@@ -186,7 +184,15 @@ def load_exp_args_list(self):
186184 def set_reproducibility_info (self , strict_reproducibility = False , comment = None ):
187185 """Gather relevant information that may affect the reproducibility of the experiment
188186
189- e.g.: versions of BrowserGym, benchmark, AgentLab..."""
187+ e.g.: versions of BrowserGym, benchmark, AgentLab...
188+
189+ Args:
190+ strict_reproducibility: bool
191+ If True, all modifications have to be committed before running the experiments.
192+ Also, relaunching a study will not be possible if the code has changed.
193+ comment: str
194+ Extra comment to add to the reproducibility information.
195+ """
190196 agent_names = [a .agent_name for a in self .agent_args ]
191197 info = repro .get_reproducibility_info (
192198 agent_names ,
@@ -252,13 +258,14 @@ def _run(self, n_jobs=1, parallel_backend="joblib", strict_reproducibility=False
252258 Args:
253259 n_jobs: int
254260 Number of parallel jobs.
255-
256261 parallel_backend: str
257262 Parallel backend to use. Either "joblib", "dask" or "sequential".
258-
259263 strict_reproducibility: bool
260264 If True, all modifications have to be committed before running the experiments.
261265 Also, relaunching a study will not be possible if the code has changed.
266+
267+ Raises:
268+ ValueError: If the exp_args_list is None.
262269 """
263270
264271 if self .exp_args_list is None :
@@ -276,10 +283,6 @@ def append_to_journal(self, strict_reproducibility=True):
276283 Args:
277284 strict_reproducibility: bool
278285 If True, incomplete experiments will raise an error.
279-
280- Raises:
281- ValueError: If the reproducibility information is not compatible
282- with the report.
283286 """
284287 _ , summary_df , _ = self .get_results ()
285288 repro .append_to_journal (
@@ -447,9 +450,16 @@ def _agents_on_benchmark(
447450 If True, the experiments will be run in demo mode.
448451 logging_level: int
449452 The logging level for individual jobs.
453+ logging_level_stdout: int
454+ The logging level for stdout.
455+ ignore_dependencies: bool
456+ If True, the dependencies will be ignored and all experiments can be run in parallel.
450457
451458 Returns:
452459 list[ExpArgs]: The list of experiments to run.
460+
461+ Raises:
462+ ValueError: If multiple agents are run on a benchmark that requires manual reset.
453463 """
454464
455465 if not isinstance (agents , (list , tuple )):
0 commit comments