|
| 1 | +import os |
| 2 | + |
| 3 | +from dotenv import load_dotenv |
| 4 | + |
| 5 | +from paperbench.utils import find_dotenv |
| 6 | + |
| 7 | +load_dotenv(find_dotenv()) |
| 8 | + |
| 9 | +from alcatraz.clusters.local import LocalConfig |
| 10 | +from preparedness_turn_completer.oai_turn_completer import OpenAITurnCompleter |
| 11 | + |
| 12 | +from paperbench.nano.eval import ( |
| 13 | + ExternalPythonCodingSolver, |
| 14 | +) |
| 15 | +from paperbench.nano.structs import ( |
| 16 | + JudgeConfig, |
| 17 | + ReproductionConfig, |
| 18 | +) |
| 19 | +from paperbench.solvers.dummy.solver import PaperBenchDummySolver |
| 20 | + |
# Credentials are read once, at import time. `load_dotenv(find_dotenv())` runs
# earlier in this module, so values from a discovered .env file are visible.
# OPENAI_API_KEY is None when the variable is not set.
OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")

# The grader may use its own key. `or` (rather than a getenv default) makes an
# empty value -- e.g. a blank `GRADER_OPENAI_API_KEY=` line in .env -- fall
# back to OPENAI_API_KEY as well, instead of yielding an unusable "" key.
GRADER_OPENAI_API_KEY = os.getenv("GRADER_OPENAI_API_KEY") or OPENAI_API_KEY

# Azure VM size name; not referenced within this section of the file.
DEFAULT_AZURE_VM_SKU = "Standard_D2as_v4"
| 24 | + |
# Dummy solver instance, constructed with no arguments (constructor defaults).
LOCAL_DUMMY_SOLVER_CONFIG = PaperBenchDummySolver()
| 26 | + |
# Solver that runs the "aisi-basic-agent-openai-dev" agent on a local cluster
# using the "aisi-basic-agent:latest" image.
# pull_from_registry=False: presumably the image must already exist locally --
# confirm against LocalConfig.
LOCAL_AISI_SOLVER_CONFIG = ExternalPythonCodingSolver(
    cluster_config=LocalConfig(pull_from_registry=False, image="aisi-basic-agent:latest"),
    agent_id="aisi-basic-agent-openai-dev",
)
| 34 | + |
# Reproduction settings for local runs with skip_reproduction=True, using the
# "pb-reproducer:latest" image on a local cluster. Existing output is not
# overwritten.
LOCAL_REPRODUCTION_CONFIG = ReproductionConfig(
    cluster_config=LocalConfig(pull_from_registry=False, image="pb-reproducer:latest"),
    skip_reproduction=True,
    overwrite_existing_output=False,
    retry_threshold=600,
    timeout=100 * 60 * 60,  # 360000; presumably seconds (100 h) -- confirm
)
| 45 | + |
# Reproduction settings for local runs with skip_reproduction=False, using the
# "pb-reproducer:latest" image on a local cluster. Existing output is not
# overwritten. Built independently: it gets its own LocalConfig instance.
LOCAL_REPRODUCTION_WITHOUT_SKIP_CONFIG = ReproductionConfig(
    cluster_config=LocalConfig(pull_from_registry=False, image="pb-reproducer:latest"),
    skip_reproduction=False,
    overwrite_existing_output=False,
    retry_threshold=600,
    timeout=100 * 60 * 60,  # 360000; presumably seconds (100 h) -- confirm
)
| 56 | + |
# Judge settings for local grading: grading enabled and run locally, using the
# "dummy" scaffold and a "gpt-4o-mini" OpenAI turn completer. Existing output
# is not overwritten.
LOCAL_JUDGE_CONFIG = JudgeConfig(
    cluster_config=LocalConfig(
        # The grader key is handed to the cluster under the name OPENAI_API_KEY.
        # NOTE(review): the value is None when neither GRADER_OPENAI_API_KEY nor
        # OPENAI_API_KEY is set -- confirm LocalConfig tolerates that.
        environment={"OPENAI_API_KEY": GRADER_OPENAI_API_KEY},
        pull_from_registry=False,
        image="pb-env:latest",
    ),
    completer_config=OpenAITurnCompleter.Config(model="gpt-4o-mini"),
    scaffold="dummy",
    grade=True,
    grade_locally=True,
    grade_id=0,
    overwrite_existing_output=False,
    code_only=False,
    resources_provided=False,
)
0 commit comments