diff --git a/packages/evals/.docker/entrypoints/runner.sh b/packages/evals/.docker/entrypoints/runner.sh index 5445bf335e..84f35c3f2a 100644 --- a/packages/evals/.docker/entrypoints/runner.sh +++ b/packages/evals/.docker/entrypoints/runner.sh @@ -1,5 +1,8 @@ #!/bin/bash +# Set environment variable to suppress WSL install prompt for VS Code +export DONT_PROMPT_WSL_INSTALL=1 + if [ $# -eq 0 ]; then exec bash else diff --git a/packages/evals/Dockerfile.runner b/packages/evals/Dockerfile.runner index ec3277461c..b718b9cd7b 100644 --- a/packages/evals/Dockerfile.runner +++ b/packages/evals/Dockerfile.runner @@ -59,11 +59,11 @@ ARG PYTHON_EXT_VERSION=2025.6.1 ARG RUST_EXT_VERSION=0.3.2482 RUN mkdir -p /roo/.vscode-template \ - && code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension golang.go@${GOLANG_EXT_VERSION} \ - && code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension dbaeumer.vscode-eslint@${ESLINT_EXT_VERSION} \ - && code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension redhat.java@${JAVA_EXT_VERSION} \ - && code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension ms-python.python@${PYTHON_EXT_VERSION} \ - && code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension rust-lang.rust-analyzer@${RUST_EXT_VERSION} + && yes | code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension golang.go@${GOLANG_EXT_VERSION} \ + && yes | code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension dbaeumer.vscode-eslint@${ESLINT_EXT_VERSION} \ + && yes | code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension redhat.java@${JAVA_EXT_VERSION} \ + && yes | code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension ms-python.python@${PYTHON_EXT_VERSION} \ + && yes | code --no-sandbox --user-data-dir /roo/.vscode-template --install-extension rust-lang.rust-analyzer@${RUST_EXT_VERSION} # Copy evals ARG 
EVALS_COMMIT=main @@ -128,7 +128,7 @@ RUN cp -r /roo/.vscode-template /roo/.vscode # Build the Roo Code extension RUN pnpm vsix -- --out ../bin/roo-code.vsix \ - && code --no-sandbox --user-data-dir /roo/.vscode --install-extension bin/roo-code.vsix + && yes | code --no-sandbox --user-data-dir /roo/.vscode --install-extension bin/roo-code.vsix # Copy entrypoint script COPY packages/evals/.docker/entrypoints/runner.sh /usr/local/bin/entrypoint.sh diff --git a/packages/evals/README.md b/packages/evals/README.md index 95ef52bb49..a33c7a81cf 100644 --- a/packages/evals/README.md +++ b/packages/evals/README.md @@ -35,7 +35,7 @@ The initial build process can take a minute or two. Upon success you should see Additionally, you'll find in Docker Desktop that database and redis services are running: Screenshot 2025-06-05 at 12 07 09 PM -Navigate to [localhost:3000](http://localhost:3000/) in your browser and click the 🚀 button. +Navigate to [localhost:3446](http://localhost:3446/) in your browser and click the 🚀 button. By default, an evals run executes all programming exercises in the [Roo Code Evals](https://github.com/RooCodeInc/Roo-Code-Evals) repository with the Claude Sonnet 4 model and default settings. For basic configuration you can specify the LLM to use and any subset of the exercises you'd like. For advanced configuration you can import a Roo Code settings file which will allow you to run the evals with Roo Code configured any way you'd like (this includes custom modes, a footgun prompt, etc.). 
diff --git a/packages/evals/docker-compose.yml b/packages/evals/docker-compose.yml index 93e643e44b..3b251f8f95 100644 --- a/packages/evals/docker-compose.yml +++ b/packages/evals/docker-compose.yml @@ -56,7 +56,7 @@ services: context: ../../ dockerfile: packages/evals/Dockerfile.web ports: - - "${EVALS_WEB_PORT:-3000}:3000" + - "${EVALS_WEB_PORT:-3446}:3000" environment: - HOST_EXECUTION_METHOD=docker volumes: diff --git a/packages/evals/scripts/setup.sh b/packages/evals/scripts/setup.sh index d95b6e2514..cca6f9ce95 100755 --- a/packages/evals/scripts/setup.sh +++ b/packages/evals/scripts/setup.sh @@ -386,5 +386,5 @@ if ! nc -z localhost 3000; then echo "💡 You can start it anytime with 'pnpm --filter @roo-code/web-evals dev'." fi else - echo "👟 The evals web app is running at http://localhost:3000" + echo "👟 The evals web app is running at http://localhost:3000 (or http://localhost:3446 if using Docker)" fi