|
18 | 18 | get_default_on_result_writer, |
19 | 19 | ) |
20 | 20 | from benchmarks.utils.fake_user_response import run_conversation_with_fake_user_response |
21 | | -from benchmarks.utils.image_utils import image_exists |
| 21 | +from benchmarks.utils.image_utils import create_docker_workspace, image_exists |
22 | 22 | from benchmarks.utils.llm_config import load_llm_config |
23 | 23 | from benchmarks.utils.models import ( |
24 | 24 | EvalInstance, |
|
31 | 31 | from openhands.sdk.workspace import RemoteWorkspace |
32 | 32 | from openhands.tools.delegate import DelegateTool |
33 | 33 | from openhands.tools.preset.default import get_default_tools |
34 | | -from openhands.workspace import APIRemoteWorkspace, DockerDevWorkspace, DockerWorkspace |
| 34 | +from openhands.workspace import APIRemoteWorkspace |
35 | 35 |
|
36 | 36 |
|
37 | 37 | logger = get_logger(__name__) |
@@ -171,30 +171,12 @@ def prepare_workspace( |
171 | 171 | agent_server_image = ( |
172 | 172 | f"{EVAL_AGENT_SERVER_IMAGE}:{SDK_SHORT_SHA}-{custom_tag}{suffix}" |
173 | 173 | ) |
174 | | - SKIP_BUILD = os.getenv("SKIP_BUILD", "1").lower() in ("1", "true", "yes") |
175 | | - logger.info(f"SKIP_BUILD={SKIP_BUILD}") |
176 | | - if not SKIP_BUILD: |
177 | | - logger.info( |
178 | | - f"Building workspace from {official_docker_image} " |
179 | | - f"for instance {instance.id}. " |
180 | | - "This may take a while...\n" |
181 | | - "You can run benchmarks/swtbench/build_images.py and set " |
182 | | - "SKIP_BUILD=1 to skip building and use pre-built " |
183 | | - "agent-server image." |
184 | | - ) |
185 | | - # For SWT-bench, we use DockerDevWorkspace with base_image |
186 | | - workspace = DockerDevWorkspace( |
187 | | - base_image=official_docker_image, |
188 | | - working_dir="/workspace", |
189 | | - target=build_target, |
190 | | - forward_env=forward_env or [], |
191 | | - ) |
192 | | - else: |
193 | | - workspace = DockerWorkspace( |
194 | | - server_image=agent_server_image, |
195 | | - working_dir="/workspace", |
196 | | - forward_env=forward_env or [], |
197 | | - ) |
| 174 | + workspace = create_docker_workspace( |
| 175 | + agent_server_image=agent_server_image, |
| 176 | + base_image=official_docker_image, |
| 177 | + build_target=build_target, |
| 178 | + forward_env=forward_env, |
| 179 | + ) |
198 | 180 | elif self.metadata.workspace_type == "remote": |
199 | 181 | runtime_api_key = os.getenv("RUNTIME_API_KEY") |
200 | 182 | sdk_short_sha = os.getenv("SDK_SHORT_SHA", SDK_SHORT_SHA) |
|
0 commit comments