diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 204d37ef..ed96a64e 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -75,6 +75,13 @@ jobs:
         run: npm run lint
         continue-on-error: true
 
+      - name: Webview Tests
+        id: webview_test
+        if: always() && steps.install_webview.outcome == 'success'
+        working-directory: webview-ui
+        run: npm test
+        continue-on-error: true
+
       - name: Format Check
         id: format_check
         if: always() && steps.install_root.outcome == 'success'
@@ -118,6 +125,7 @@ jobs:
           TYPE_CHECK: ${{ steps.type_check.outcome }}
           ROOT_LINT: ${{ steps.root_lint.outcome }}
           WEBVIEW_LINT: ${{ steps.webview_lint.outcome }}
+          WEBVIEW_TEST: ${{ steps.webview_test.outcome }}
           FORMAT_CHECK: ${{ steps.format_check.outcome }}
           BUILD: ${{ steps.build.outcome }}
           AUDIT_ROOT: ${{ steps.audit_root.outcome }}
@@ -138,6 +146,7 @@ jobs:
             echo "| **Type check** | $(status "$TYPE_CHECK") |"
             echo "| **Root lint** | $(status "$ROOT_LINT") |"
             echo "| **Webview lint** | $(status "$WEBVIEW_LINT") |"
+            echo "| **Webview tests** | $(status "$WEBVIEW_TEST") |"
             echo "| **Format check** | $(status "$FORMAT_CHECK") |"
             echo "| **Build** | $(status "$BUILD") |"
             echo "| Audit root _(advisory)_ | $(status "$AUDIT_ROOT") |"
@@ -156,13 +165,14 @@ jobs:
           TYPE_CHECK: ${{ steps.type_check.outcome }}
           ROOT_LINT: ${{ steps.root_lint.outcome }}
           WEBVIEW_LINT: ${{ steps.webview_lint.outcome }}
+          WEBVIEW_TEST: ${{ steps.webview_test.outcome }}
           FORMAT_CHECK: ${{ steps.format_check.outcome }}
           BUILD: ${{ steps.build.outcome }}
         run: |
           failed=0
           for step in CHECKOUT SETUP_NODE INSTALL_ROOT INSTALL_WEBVIEW \
-                      TYPE_CHECK ROOT_LINT WEBVIEW_LINT FORMAT_CHECK \
-                      BUILD; do
+                      TYPE_CHECK ROOT_LINT WEBVIEW_LINT \
+                      WEBVIEW_TEST FORMAT_CHECK BUILD; do
             eval "val=\$$step"
             if [ "$val" != "success" ]; then
               echo "::error::$step failed"
@@ -170,3 +180,106 @@ jobs:
             fi
           done
           exit "$failed"
+
+  # End-to-end job: builds the extension and the webview, then runs
+  # `npm run e2e` once per OS in the matrix. Starts only after `ci` succeeds.
+  e2e:
+    needs: ci
+    strategy:
+      # Let every OS finish even when another matrix entry fails.
+      fail-fast: false
+      matrix:
+        os: [ubuntu-latest, macos-latest, windows-latest]
+    runs-on: ${{ matrix.os }}
+    timeout-minutes: 15
+    env:
+      # Same directory as the "Playwright Cache" restore/save steps below.
+      PLAYWRIGHT_BROWSERS_PATH: .playwright-browsers
+
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v6
+        with:
+          fetch-depth: 0
+
+      - name: Setup Node
+        uses: actions/setup-node@v6
+        with:
+          node-version-file: .nvmrc
+          cache: npm
+          cache-dependency-path: |
+            package-lock.json
+            webview-ui/package-lock.json
+
+      # Caches use separate restore/save actions so that saving can be made
+      # conditional (see the two "Save ... Cache" steps further down).
+      - name: Restore VS Code Cache
+        id: cache_vscode_restore
+        uses: actions/cache/restore@v4
+        with:
+          path: .vscode-test
+          key: vscode-test-${{ runner.os }}-${{ hashFiles('e2e/global-setup.ts') }}-v2
+          restore-keys: |
+            vscode-test-${{ runner.os }}-
+
+      - name: Restore Playwright Cache
+        id: cache_playwright_restore
+        uses: actions/cache/restore@v4
+        with:
+          path: .playwright-browsers
+          key: playwright-browsers-${{ runner.os }}-${{ hashFiles('package-lock.json') }}-v1
+          restore-keys: |
+            playwright-browsers-${{ runner.os }}-
+
+      - name: Install Root Dependencies
+        run: npm ci
+
+      - name: Install Webview Dependencies
+        working-directory: webview-ui
+        run: npm ci
+
+      - name: Build
+        run: node esbuild.js
+
+      - name: Build Webview
+        working-directory: webview-ui
+        run: npm run build
+
+      # continue-on-error: a failure here does not fail the job by itself; the
+      # recorded `outcome` is read by the steps that follow.
+      - name: Install Playwright Dependencies
+        id: install_playwright_deps
+        run: npx playwright install --with-deps chromium
+        continue-on-error: true
+
+      # Runs only when the Playwright install succeeded; otherwise the step is
+      # skipped and its outcome is not 'success'.
+      - name: E2E Tests
+        id: e2e_test
+        if: steps.install_playwright_deps.outcome == 'success'
+        run: npm run e2e
+        continue-on-error: true
+
+      # Save only on an exact-key cache miss, after a successful test run, and
+      # when the executable-path marker file exists in the cache directory.
+      - name: Save VS Code Cache
+        if: always() && steps.cache_vscode_restore.outputs.cache-hit != 'true' && steps.e2e_test.outcome == 'success' && hashFiles('.vscode-test/vscode-executable.txt') != ''
+        uses: actions/cache/save@v4
+        with:
+          path: .vscode-test
+          key: ${{ steps.cache_vscode_restore.outputs.cache-primary-key }}
+
+      # Save only on an exact-key cache miss, after a successful install, and
+      # when the browsers directory is non-empty.
+      - name: Save Playwright Cache
+        if: always() && steps.cache_playwright_restore.outputs.cache-hit != 'true' && steps.install_playwright_deps.outcome == 'success' && hashFiles('.playwright-browsers/**') != ''
+        uses: actions/cache/save@v4
+        with:
+          path: .playwright-browsers
+          key: ${{ steps.cache_playwright_restore.outputs.cache-primary-key }}
+
+      # Publish a per-OS results table to the job summary page.
+      - name: Write Step Summary
+        if: always()
+        shell: bash
+        env:
+          OS: ${{ matrix.os }}
+          INSTALL_PLAYWRIGHT_DEPS: ${{ steps.install_playwright_deps.outcome }}
+          E2E_TEST: ${{ steps.e2e_test.outcome }}
+        run: |
+          status() {
+            if [ "$1" = "success" ]; then echo "✅ PASS"; else echo "❌ FAIL"; fi
+          }
+          {
+            echo "## E2E Results ($OS)"
+            echo
+            echo "| Check | Result |"
+            echo "| --- | --- |"
+            echo "| Install Playwright deps | $(status "$INSTALL_PLAYWRIGHT_DEPS") |"
+            echo "| E2E tests | $(status "$E2E_TEST") |"
+          } >> "$GITHUB_STEP_SUMMARY"
+
+      # Gate: the install and test steps above use continue-on-error, so
+      # without this step the job is reported green even when the E2E tests
+      # fail or are skipped. `outcome` is the result before continue-on-error
+      # is applied, so it still reflects the real failure.
+      - name: Check E2E Results
+        if: always()
+        shell: bash
+        env:
+          INSTALL_PLAYWRIGHT_DEPS: ${{ steps.install_playwright_deps.outcome }}
+          E2E_TEST: ${{ steps.e2e_test.outcome }}
+        run: |
+          failed=0
+          for step in INSTALL_PLAYWRIGHT_DEPS E2E_TEST; do
+            val="${!step}"
+            if [ "$val" != "success" ]; then
+              echo "::error::$step did not succeed (outcome: ${val:-unknown})"
+              failed=1
+            fi
+          done
+          exit "$failed"
diff --git a/.github/workflows/pr-title.yml b/.github/workflows/pr-title.yml
index bed821cd..ee43fc0a 100644
--- a/.github/workflows/pr-title.yml
+++ b/.github/workflows/pr-title.yml
@@ -10,6 +10,7 @@ permissions:
 jobs:
   check:
     runs-on: ubuntu-latest
+    if: ${{ github.actor != 'dependabot[bot]' }}
     steps:
       - uses: amannn/action-semantic-pull-request@v6
         env:
diff --git a/.github/workflows/update-badges.yml b/.github/workflows/update-badges.yml
index a44d0d7f..c24c208b 100644
--- a/.github/workflows/update-badges.yml
+++ b/.github/workflows/update-badges.yml
@@ -8,6 +8,7 @@ on:
 jobs:
   update-badges:
     runs-on: ubuntu-latest
+    if: ${{ github.repository == 'pablodelucca/pixel-agents' }}
 
     steps:
       - name: Fetch VS Code Marketplace stats
diff --git a/.gitignore b/.gitignore
index aacf3d32..0452a69f 100644
--- a/.gitignore
+++ b/.gitignore
@@ -17,6 +17,10 @@ Thumbs.db
 .vscode-test/
 /.idea
 
+# E2E test artifacts
+test-results/
+playwright-report/
+
 # Build artifacts
 *.vsix
 *.map
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 9a48084a..54fa623b 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -94,6 +94,49 @@ These conventions are enforced by custom ESLint rules (`eslint-rules/pixel-agent
 
 These rules are set to `warn` — they won't block your PR but will flag violations for cleanup.
 
+## End-to-End Tests
+
+The `e2e/` directory contains Playwright tests that launch a real VS Code instance with the extension loaded in development mode.
+
+### Running e2e tests locally
+
+```bash
+# Build the extension first (tests load the compiled output)
+npm run build
+
+# Run the e2e tests
+npm run e2e
+
+# Step-by-step debug mode
+npm run e2e:debug
+```
+
+On the first run, `@vscode/test-electron` will download a stable VS Code release into `.vscode-test/` (≈200 MB). Subsequent runs reuse the cache.
+
+### Artifacts
+
+Test artifacts are written to `test-results/e2e/`; the Playwright HTML report is written to `playwright-report/e2e/`:
+
+| Path | Contents |
+|---|---|
+| `test-results/e2e/videos/<test-name>/` | `.webm` screen recording for every test (not recorded on Windows) |
+| `playwright-report/e2e/` | Playwright HTML report (`npx playwright show-report playwright-report/e2e`) |
+| `test-results/e2e/*.png` | Screenshot of the final state, saved at the end of every test (pass or fail) |
+
+On failure, the test output prints the path to the video for that run.
+
+### Mock claude
+
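+Tests never invoke the real `claude` CLI. Instead, a mock script — `e2e/fixtures/mock-claude` (bash) on macOS/Linux, `e2e/fixtures/mock-claude.cmd` on Windows — is copied into an isolated `bin/` directory as `claude` (or `claude.cmd`), and that directory is prepended to `PATH` before VS Code starts.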
+
+The mock:
+1. Parses `--session-id <uuid>` from its arguments.
+2. Appends a line to `$HOME/.claude-mock/invocations.log` so tests can assert it was called.
+3. Creates `$HOME/.claude/projects/<project-hash>/<session-id>.jsonl` with a minimal init line so the extension's file-watcher can detect the session.
+4. Sleeps for 30 s (keeps the terminal alive) then exits.
+
+Each test runs with an isolated `HOME` and `--user-data-dir`, so no test state leaks between runs or into your real VS Code profile.
+
 ## Submitting a Pull Request
 
 1. Fork the repo and create a feature branch from `main`
diff --git a/e2e/fixtures/mock-claude b/e2e/fixtures/mock-claude
new file mode 100755
index 00000000..f8d6d4c7
--- /dev/null
+++ b/e2e/fixtures/mock-claude
@@ -0,0 +1,47 @@
+#!/usr/bin/env bash
+# Mock 'claude' executable for Pixel Agents e2e tests.
+#
+# Behaviour:
+#   1. Parses --session-id <id> from args.
+#   2. Appends an invocation record to $HOME/.claude-mock/invocations.log.
+#   3. Creates the expected JSONL file under $HOME/.claude/projects/<hash>/<id>.jsonl
+#      using the same path-hash algorithm as agentManager.ts
+#      (replace every non-[a-zA-Z0-9-] char with '-').
+#   4. Writes a minimal valid JSONL line so the extension file-watcher can proceed.
+#   5. Stays alive for up to 30 s (tests can kill it once assertions pass).
+
+set -euo pipefail
+
+# Install the signal handler before anything runs in the background, so a
+# SIGTERM/SIGINT arriving at any point stops the sleeper (if started) and exits 0.
+# `|| true` keeps errexit from turning a failed kill into a non-zero exit.
+SLEEP_PID=""
+trap 'if [ -n "$SLEEP_PID" ]; then kill "$SLEEP_PID" 2>/dev/null || true; fi; exit 0' SIGTERM SIGINT
+
+# The session id is the argument that directly follows --session-id.
+SESSION_ID=""
+PREV=""
+for arg in "$@"; do
+  if [ "$PREV" = "--session-id" ]; then
+    SESSION_ID="$arg"
+  fi
+  PREV="$arg"
+done
+
+LOG_DIR="${HOME}/.claude-mock"
+mkdir -p "$LOG_DIR"
+# Explicit format string instead of `date -Iseconds`, which not every
+# BSD/macOS `date` accepts. Timestamp is UTC, ISO 8601.
+TIMESTAMP="$(date -u +%Y-%m-%dT%H:%M:%SZ)"
+echo "${TIMESTAMP} session-id=${SESSION_ID} cwd=$(pwd) args=$*" >> "${LOG_DIR}/invocations.log"
+
+if [ -n "$SESSION_ID" ]; then
+  CWD="$(pwd)"
+  # Replicate agentManager.ts: workspacePath.replace(/[^a-zA-Z0-9-]/g, '-')
+  DIR_NAME="$(printf '%s' "$CWD" | tr -c 'a-zA-Z0-9-' '-')"
+  PROJECT_DIR="${HOME}/.claude/projects/${DIR_NAME}"
+  mkdir -p "$PROJECT_DIR"
+  JSONL_FILE="${PROJECT_DIR}/${SESSION_ID}.jsonl"
+
+  # Write a minimal system init line so the extension watcher sees the file.
+  printf '{"type":"system","subtype":"init","content":"mock-claude-ready"}\n' >> "$JSONL_FILE"
+fi
+
+# Stay alive so the VS Code terminal doesn't immediately close. The sleep runs
+# in the background so that `wait` can be interrupted by the trap above.
+sleep 30 &
+SLEEP_PID=$!
+
+wait "$SLEEP_PID" || true
diff --git a/e2e/fixtures/mock-claude.cmd b/e2e/fixtures/mock-claude.cmd
new file mode 100644
index 00000000..754a3634
--- /dev/null
+++ b/e2e/fixtures/mock-claude.cmd
@@ -0,0 +1,49 @@
+@echo off
+REM Mock 'claude' executable for Pixel Agents e2e tests (Windows).
+REM
+REM Behaviour:
+REM   1. Parses --session-id <id> from args.
+REM   2. Appends an invocation record to %HOME%\.claude-mock\invocations.log.
+REM   3. Creates the expected JSONL file under %HOME%\.claude\projects\<hash>\<id>.jsonl
+REM   4. Stays alive for up to 30 s (tests can kill it once assertions pass).
+
+REM Delayed expansion is needed so !PREV! is re-read on every pass of the
+REM argument loop below.
+setlocal enabledelayedexpansion
+
+set "SESSION_ID="
+set "PREV="
+
+REM Walk the arguments with SHIFT; the value following --session-id is the id.
+:parse_args
+if "%~1"=="" goto done_args
+if "!PREV!"=="--session-id" set "SESSION_ID=%~1"
+set "PREV=%~1"
+shift
+goto parse_args
+:done_args
+
+REM Use HOME if set (our e2e sets it), fall back to USERPROFILE
+if defined HOME (
+  set "MOCK_HOME=%HOME%"
+) else (
+  set "MOCK_HOME=%USERPROFILE%"
+)
+
+REM Record the invocation so tests can assert that the mock was called.
+set "LOG_DIR=%MOCK_HOME%\.claude-mock"
+if not exist "%LOG_DIR%" mkdir "%LOG_DIR%"
+echo %DATE% %TIME% session-id=%SESSION_ID% cwd=%CD% args=%* >> "%LOG_DIR%\invocations.log"
+
+REM Without a session id there is no JSONL file to create.
+if "%SESSION_ID%"=="" goto stay_alive
+
+REM Replicate agentManager.ts: workspacePath.replace(/[^a-zA-Z0-9-]/g, '-')
+REM PowerShell one-liner to do the regex replace
+REM NOTE(review): %CD% is spliced into a single-quoted PowerShell string, so a
+REM working directory containing an apostrophe would break this command.
+for /f "delims=" %%D in ('powershell -NoProfile -Command "[regex]::Replace('%CD%', '[^a-zA-Z0-9-]', '-')"') do set "DIR_NAME=%%D"
+
+set "PROJECT_DIR=%MOCK_HOME%\.claude\projects\%DIR_NAME%"
+if not exist "%PROJECT_DIR%" mkdir "%PROJECT_DIR%"
+
+REM Append a minimal init line so the extension's file watcher sees the file.
+set "JSONL_FILE=%PROJECT_DIR%\%SESSION_ID%.jsonl"
+echo {"type":"system","subtype":"init","content":"mock-claude-ready"} >> "%JSONL_FILE%"
+
+:stay_alive
+REM Stay alive so the VS Code terminal doesn't immediately close.
+REM Use ping to localhost as a sleep substitute (the timeout command requires a
+REM console); 31 echo requests take roughly 30 s.
+ping -n 31 127.0.0.1 > nul 2>&1
diff --git a/e2e/global-setup.ts b/e2e/global-setup.ts
new file mode 100644
index 00000000..d71dcd7e
--- /dev/null
+++ b/e2e/global-setup.ts
@@ -0,0 +1,18 @@
+import { downloadAndUnzipVSCode } from '@vscode/test-electron';
+import fs from 'fs';
+import path from 'path';
+
+export const VSCODE_CACHE_DIR = path.join(__dirname, '../.vscode-test');
+export const VSCODE_PATH_FILE = path.join(VSCODE_CACHE_DIR, 'vscode-executable.txt');
+
+/**
+ * Playwright global setup: make sure a stable VS Code build is present in the
+ * cache directory and record the path of its executable in VSCODE_PATH_FILE.
+ */
+export default async function globalSetup(): Promise<void> {
+  console.log('[e2e] Ensuring VS Code is downloaded...');
+
+  const downloadOptions = { version: 'stable', cachePath: VSCODE_CACHE_DIR };
+  const executablePath = await downloadAndUnzipVSCode(downloadOptions);
+  console.log(`[e2e] VS Code executable: ${executablePath}`);
+
+  // Persist the resolved executable path next to the downloaded build.
+  fs.mkdirSync(VSCODE_CACHE_DIR, { recursive: true });
+  fs.writeFileSync(VSCODE_PATH_FILE, executablePath, 'utf8');
+}
diff --git a/e2e/helpers/launch.ts b/e2e/helpers/launch.ts
new file mode 100644
index 00000000..809efa4e
--- /dev/null
+++ b/e2e/helpers/launch.ts
@@ -0,0 +1,227 @@
+import { _electron as electron } from '@playwright/test';
+import type { ElectronApplication, Page } from '@playwright/test';
+import fs from 'fs';
+import os from 'os';
+import path from 'path';
+
+const REPO_ROOT = path.join(__dirname, '../..');
+const VSCODE_PATH_FILE = path.join(REPO_ROOT, '.vscode-test/vscode-executable.txt');
+const MOCK_CLAUDE_PATH = path.join(REPO_ROOT, 'e2e/fixtures/mock-claude');
+const MOCK_CLAUDE_CMD_PATH = path.join(REPO_ROOT, 'e2e/fixtures/mock-claude.cmd');
+const ARTIFACTS_DIR = path.join(REPO_ROOT, 'test-results/e2e');
+const IS_WINDOWS = process.platform === 'win32';
+const PATH_SEP = IS_WINDOWS ? ';' : ':';
+
+/** Everything a test needs to drive and tear down one launched VS Code instance. */
+export interface VSCodeSession {
+  /** Electron application handle returned by Playwright's `electron.launch()`. */
+  app: ElectronApplication;
+  /** First window opened by the application. */
+  window: Page;
+  /** Isolated HOME directory for this test session. */
+  tmpHome: string;
+  /** Workspace directory opened in VS Code. */
+  workspaceDir: string;
+  /** Path to the mock invocations log. */
+  mockLogFile: string;
+  /**
+   * Closes the app, removes the temporary macOS keychain and deletes the temp
+   * directory tree. Errors in any of these steps are swallowed.
+   */
+  cleanup: () => Promise<void>;
+}
+
+/**
+ * Launch VS Code with the Pixel Agents extension loaded in development mode.
+ *
+ * Uses an isolated temp HOME and injects the mock `claude` binary at the
+ * front of PATH so no real Claude CLI is needed.
+ *
+ * @param testTitle Title of the running test; sanitised and used as the name
+ *   of the per-test video directory under `test-results/e2e/videos/`.
+ * @returns The launched session. Callers must `await session.cleanup()` when done.
+ * @throws If the VS Code executable path file cannot be read, or if setup or
+ *   launch fails. In the latter case the temp directories are removed before
+ *   the error is rethrown.
+ */
+export async function launchVSCode(testTitle: string): Promise<VSCodeSession> {
+  const vscodePath = fs.readFileSync(VSCODE_PATH_FILE, 'utf8').trim();
+
+  // --- Isolated temp directories ---
+  const tmpBase = fs.mkdtempSync(path.join(os.tmpdir(), 'pixel-e2e-'));
+  const tmpHome = path.join(tmpBase, 'home');
+  const workspaceDir = path.join(tmpBase, 'workspace');
+  const userDataDir = path.join(tmpBase, 'userdata');
+  const mockBinDir = path.join(tmpBase, 'bin');
+  const keychainPath = path.join(tmpHome, 'Library', 'Keychains', 'login.keychain-db');
+
+  // Declared before `cleanup` so the closure never reads an uninitialised
+  // binding, even when setup fails before the app is launched.
+  let app: ElectronApplication | undefined;
+
+  const cleanup = async (): Promise<void> => {
+    try {
+      if (app) {
+        await app.close();
+      }
+    } catch {
+      // ignore close errors
+    }
+    // macOS: deregister the temporary keychain to avoid orphaned references
+    if (process.platform === 'darwin') {
+      try {
+        const { execFileSync } = require('child_process');
+        execFileSync('security', ['delete-keychain', keychainPath], { stdio: 'ignore' });
+      } catch {
+        // keychain may not exist or already be removed
+      }
+    }
+    try {
+      fs.rmSync(tmpBase, { recursive: true, force: true });
+    } catch {
+      // ignore cleanup errors
+    }
+  };
+
+  // Everything after mkdtemp runs inside this try so that a failure during
+  // setup (not only during launch) still removes the temp directory tree.
+  try {
+    fs.mkdirSync(tmpHome, { recursive: true });
+    fs.mkdirSync(workspaceDir, { recursive: true });
+    fs.mkdirSync(userDataDir, { recursive: true });
+    fs.mkdirSync(mockBinDir, { recursive: true });
+
+    // On Windows, os.tmpdir() may return an 8.3 short path (e.g. RUNNER~1) while
+    // child processes see the long path (e.g. runneradmin) via %CD%. Normalize to
+    // the canonical long path so the project hash computed here matches mock-claude.
+    // fs.realpathSync only resolves symlinks; .native uses GetFinalPathNameByHandleW
+    // which also resolves 8.3 short names to their full form.
+    const resolvedWorkspaceDir = IS_WINDOWS ? fs.realpathSync.native(workspaceDir) : workspaceDir;
+
+    // macOS: create a temporary keychain so the OS doesn't show "Keychain Not Found" dialog.
+    // The isolated HOME has no keychain, and VS Code/Electron's safeStorage triggers a system prompt.
+    if (process.platform === 'darwin') {
+      fs.mkdirSync(path.dirname(keychainPath), { recursive: true });
+      try {
+        // execFileSync passes arguments as an array, so the keychain path is
+        // never interpreted by a shell.
+        const { execFileSync } = require('child_process');
+        execFileSync('security', ['create-keychain', '-p', '', keychainPath], {
+          stdio: 'ignore',
+        });
+        execFileSync('security', ['default-keychain', '-s', keychainPath], {
+          stdio: 'ignore',
+          env: { ...process.env, HOME: tmpHome },
+        });
+      } catch {
+        // keychain creation failure is non-fatal, test may still work
+      }
+    }
+
+    // Copy mock-claude into an isolated bin dir
+    if (IS_WINDOWS) {
+      // Windows: copy the .cmd batch file as 'claude.cmd'
+      fs.copyFileSync(MOCK_CLAUDE_CMD_PATH, path.join(mockBinDir, 'claude.cmd'));
+    } else {
+      const mockDest = path.join(mockBinDir, 'claude');
+      fs.copyFileSync(MOCK_CLAUDE_PATH, mockDest);
+      fs.chmodSync(mockDest, 0o755);
+    }
+
+    // macOS: VS Code's integrated terminal resolves PATH from the login shell,
+    // ignoring the process env. Define a custom terminal profile that uses a
+    // non-login shell with our mock bin dir in PATH. On Linux the process env
+    // propagates directly, so no custom profile is needed.
+    if (process.platform === 'darwin') {
+      const userSettingsDir = path.join(userDataDir, 'User');
+      fs.mkdirSync(userSettingsDir, { recursive: true });
+      fs.writeFileSync(
+        path.join(userSettingsDir, 'settings.json'),
+        JSON.stringify(
+          {
+            'terminal.integrated.profiles.osx': {
+              e2e: {
+                path: '/bin/zsh',
+                args: ['--no-globalrcs'],
+                env: {
+                  PATH: `${mockBinDir}:/usr/local/bin:/usr/bin:/bin`,
+                  HOME: tmpHome,
+                  ZDOTDIR: tmpHome,
+                },
+              },
+            },
+            'terminal.integrated.defaultProfile.osx': 'e2e',
+            'terminal.integrated.inheritEnv': false,
+          },
+          null,
+          2,
+        ),
+      );
+    }
+
+    const mockLogFile = path.join(tmpHome, '.claude-mock', 'invocations.log');
+
+    // --- Video output dir ---
+    const safeTitle = testTitle.replace(/[^a-z0-9]+/gi, '-').toLowerCase();
+    const videoDir = path.join(ARTIFACTS_DIR, 'videos', safeTitle);
+    fs.mkdirSync(videoDir, { recursive: true });
+
+    // --- Environment for VS Code process ---
+    const env: Record<string, string> = {
+      ...(process.env as Record<string, string>),
+      HOME: tmpHome,
+      // Prepend mock bin so 'claude' resolves to our mock
+      PATH: `${mockBinDir}${PATH_SEP}${process.env['PATH'] ?? '/usr/local/bin:/usr/bin:/bin'}`,
+      // Prevent VS Code from trying to talk to real accounts / telemetry
+      VSCODE_TELEMETRY_DISABLED: '1',
+    };
+
+    // --- VS Code launch args ---
+    const args = [
+      // Load our extension in dev mode (this overrides the installed version)
+      `--extensionDevelopmentPath=${REPO_ROOT}`,
+      // Disable all other extensions so tests are isolated
+      '--disable-extensions',
+      // Isolated user-data (settings, state, etc.)
+      `--user-data-dir=${userDataDir}`,
+      // Skip interactive prompts
+      '--disable-workspace-trust',
+      '--skip-release-notes',
+      '--skip-welcome',
+      '--no-sandbox',
+      // Disable GPU acceleration: prevents Electron GPU-sandbox stalls in headless
+      // CI environments (required on macOS arm64 runners, harmless elsewhere).
+      '--disable-gpu',
+      // On Linux, use the Ozone headless platform so Electron runs without a
+      // display server (equivalent to what --disable-gpu achieves on macOS/Windows).
+      ...(process.platform === 'linux' ? ['--ozone-platform=headless'] : []),
+      // Open the workspace folder
+      resolvedWorkspaceDir,
+    ];
+
+    // Playwright's video recording freezes VS Code's renderer on Windows,
+    // so only enable it on non-Windows platforms.
+    const launchOptions: Parameters<typeof electron.launch>[0] = {
+      executablePath: vscodePath,
+      args,
+      env,
+      cwd: resolvedWorkspaceDir,
+      timeout: 60_000,
+    };
+    if (!IS_WINDOWS) {
+      launchOptions.recordVideo = {
+        dir: videoDir,
+        size: { width: 1280, height: 800 },
+      };
+    }
+
+    app = await electron.launch(launchOptions);
+
+    const window = await app.firstWindow();
+
+    // The Ozone headless backend ignores --window-size CLI flags, so VS Code
+    // opens at a tiny default size on Linux. Resize via the Electron API after
+    // the window exists — getAllWindows() is empty before firstWindow() resolves.
+    if (process.platform === 'linux') {
+      await app.evaluate(({ BrowserWindow }) => {
+        BrowserWindow.getAllWindows()[0]?.setSize(1280, 800);
+      });
+      // Give VS Code's layout system time to respond to the resize before tests
+      // start measuring panel heights.
+      await window.waitForTimeout(500);
+    }
+
+    return { app, window, tmpHome, workspaceDir: resolvedWorkspaceDir, mockLogFile, cleanup };
+  } catch (error) {
+    await cleanup();
+    throw error;
+  }
+}
+
+/**
+ * Wait for VS Code's workbench to be fully ready before interacting.
+ *
+ * @param window The VS Code window to watch.
+ * @throws If `.monaco-workbench` does not appear within 60 seconds.
+ */
+export async function waitForWorkbench(window: Page): Promise<void> {
+  // VS Code renders a div.monaco-workbench when the shell is ready
+  await window.waitForSelector('.monaco-workbench', { timeout: 60_000 });
+}
diff --git a/e2e/helpers/webview.ts b/e2e/helpers/webview.ts
new file mode 100644
index 00000000..8c964861
--- /dev/null
+++ b/e2e/helpers/webview.ts
@@ -0,0 +1,128 @@
+import type { Frame, Page } from '@playwright/test';
+import { expect } from '@playwright/test';
+
+const WEBVIEW_TIMEOUT_MS = 30_000;
+const PANEL_OPEN_TIMEOUT_MS = 15_000;
+const MIN_PANEL_HEIGHT_PX = 320;
+
+/**
+ * Run a command through the VS Code Command Palette (F1).
+ *
+ * Opens the palette, types `command`, waits for a matching result row and
+ * presses Enter. The open/type/match sequence is retried up to three times.
+ *
+ * @param window The VS Code window.
+ * @param command Command title exactly as shown in the palette.
+ * @throws If no matching row appears after three attempts; the last
+ *   underlying error is attached as `cause`.
+ */
+async function runCommand(window: Page, command: string): Promise<void> {
+  const MAX_ATTEMPTS = 3;
+  // Quote the command as a string literal so a quote or backslash in it
+  // cannot break out of the attribute selector.
+  const rowSelector = `.quick-input-list .monaco-list-row[aria-label*=${JSON.stringify(command)}]`;
+
+  // Retry the full command palette interaction up to 3 times.
+  // macOS CI can swallow keypresses or fail to populate results.
+  for (let attempt = 1; attempt <= MAX_ATTEMPTS; attempt++) {
+    // Dismiss any previous quick-input state
+    await window.keyboard.press('Escape');
+    await window.waitForTimeout(300);
+
+    try {
+      await window.keyboard.press('F1');
+      await window.waitForSelector('.quick-input-widget .quick-input-filter input', {
+        state: 'visible',
+        timeout: 5_000,
+      });
+      await window.keyboard.type(command);
+      // Wait for a list row matching the typed command (not stale results)
+      await window.waitForSelector(rowSelector, {
+        timeout: 5_000,
+      });
+      break;
+    } catch (error) {
+      if (attempt === MAX_ATTEMPTS) {
+        // Keep the underlying timeout error so the failing stage is visible.
+        throw new Error(
+          `Command palette failed after ${MAX_ATTEMPTS} attempts for "${command}"`,
+          { cause: error },
+        );
+      }
+    }
+  }
+  await window.keyboard.press('Enter');
+  await window
+    .waitForSelector('.quick-input-widget', {
+      state: 'hidden',
+      timeout: PANEL_OPEN_TIMEOUT_MS,
+    })
+    .catch(() => {
+      // Some commands update layout without immediately dismissing quick input.
+    });
+}
+
+/**
+ * Measure the bottom panel's rendered height in whole pixels.
+ *
+ * Looks up `#workbench.panel.bottom` first and falls back to `.part.panel`.
+ * Resolves to 0 when neither element exists.
+ */
+async function getPanelHeight(window: Page): Promise<number> {
+  const measure = (): number => {
+    const byId = document.querySelector<HTMLElement>('[id="workbench.panel.bottom"]');
+    const target = byId ?? document.querySelector<HTMLElement>('.part.panel');
+    if (!target) {
+      return 0;
+    }
+    return Math.round(target.getBoundingClientRect().height);
+  };
+
+  return window.evaluate(measure);
+}
+
+/**
+ * Make sure the bottom panel is taller than MIN_PANEL_HEIGHT_PX.
+ *
+ * When it is not, runs "View: Toggle Maximized Panel" and polls the panel
+ * height until it exceeds the minimum or PANEL_OPEN_TIMEOUT_MS elapses.
+ */
+async function ensurePanelIsLarge(window: Page): Promise<void> {
+  const initialHeight = await getPanelHeight(window);
+  const alreadyLarge = initialHeight > MIN_PANEL_HEIGHT_PX;
+
+  if (!alreadyLarge) {
+    await runCommand(window, 'View: Toggle Maximized Panel');
+
+    const readHeight = (): Promise<number> => getPanelHeight(window);
+    const pollOptions = {
+      message: 'Expected the bottom panel to be resized for the Pixel Agents webview',
+      timeout: PANEL_OPEN_TIMEOUT_MS,
+      intervals: [250, 500, 1000],
+    };
+    await expect.poll(readHeight, pollOptions).toBeGreaterThan(MIN_PANEL_HEIGHT_PX);
+  }
+}
+
+/**
+ * Open the Pixel Agents panel via the Command Palette.
+ *
+ * Runs "Pixel Agents: Show Panel", waits (best effort) for the bottom panel
+ * container to appear, then makes sure the panel is tall enough for the webview.
+ *
+ * @param window The VS Code window.
+ */
+export async function openPixelAgentsPanel(window: Page): Promise<void> {
+  await runCommand(window, 'Pixel Agents: Show Panel');
+
+  // Wait for the panel container to appear
+  await window
+    .waitForSelector('[id="workbench.panel.bottom"], .part.panel', {
+      timeout: PANEL_OPEN_TIMEOUT_MS,
+    })
+    .catch(() => {
+      // Panel might not use this id; just continue
+    });
+
+  await ensurePanelIsLarge(window);
+}
+
+/**
+ * Find and return the Pixel Agents webview frame.
+ *
+ * VS Code renders WebviewViewProvider content in an <iframe> whose URL
+ * starts with "vscode-webview://". Because VS Code can have multiple
+ * webviews, we wait until one frame exposes the "+ Agent" button before
+ * returning it.
+ *
+ * @param window The VS Code window whose frames are scanned.
+ * @returns The first webview frame in which the "+ Agent" button appears.
+ * @throws If no such frame is found within WEBVIEW_TIMEOUT_MS.
+ */
+export async function getPixelAgentsFrame(window: Page): Promise<Frame> {
+  const PER_FRAME_TIMEOUT_MS = 2_000;
+  const deadline = Date.now() + WEBVIEW_TIMEOUT_MS;
+
+  while (Date.now() < deadline) {
+    for (const frame of window.frames()) {
+      const url = frame.url();
+      if (!url.startsWith('vscode-webview://')) continue;
+
+      // Cap each probe at the time left so several candidate frames cannot
+      // push the total wait past the overall deadline. A timeout of 0 would
+      // disable Playwright's timeout, so stop probing once no time is left.
+      const remaining = deadline - Date.now();
+      if (remaining <= 0) break;
+
+      try {
+        const btn = await frame.waitForSelector('button:has-text("+ Agent")', {
+          timeout: Math.min(PER_FRAME_TIMEOUT_MS, remaining),
+        });
+        if (btn) return frame;
+      } catch {
+        // not this frame, keep looking
+      }
+    }
+
+    // Wait for a new frame to be attached
+    await window.waitForTimeout(500);
+  }
+
+  throw new Error('Timed out waiting for Pixel Agents webview frame with "+ Agent" button');
+}
+
+/**
+ * Click the "+ Agent" button in the webview once it is visible.
+ *
+ * Returns as soon as the click has been performed; it does not wait for any
+ * effect of the click, so callers must poll for the results they expect.
+ *
+ * @param frame The Pixel Agents webview frame.
+ */
+export async function clickAddAgent(frame: Frame): Promise<void> {
+  const btn = frame.locator('button', { hasText: '+ Agent' });
+  await expect(btn).toBeVisible({ timeout: WEBVIEW_TIMEOUT_MS });
+  await btn.click();
+}
diff --git a/e2e/playwright.config.ts b/e2e/playwright.config.ts
new file mode 100644
index 00000000..3ab7310d
--- /dev/null
+++ b/e2e/playwright.config.ts
@@ -0,0 +1,30 @@
+import path from 'path';
+
+import { defineConfig } from '@playwright/test';
+
+const artifactsDir = path.join(__dirname, '../test-results/e2e');
+
+// Playwright configuration for the VS Code (Electron) end-to-end tests.
+export default defineConfig({
+  testDir: path.join(__dirname, 'tests'),
+  // Per-test timeout in milliseconds.
+  timeout: 120_000,
+  globalSetup: path.join(__dirname, 'global-setup.ts'),
+  reporter: [
+    ['list'],
+    [
+      'html',
+      {
+        // Must be outside outputDir to avoid Playwright clearing artifacts
+        outputFolder: path.join(__dirname, '../playwright-report/e2e'),
+        open: 'never',
+      },
+    ],
+  ],
+  outputDir: artifactsDir,
+  // NOTE: `use` is intentionally left empty. Its artifact settings are no-ops
+  // for Electron tests launched via electron.launch(), because Playwright's
+  // built-in artifact handling only applies to browser contexts.
+  // Video is configured in launch.ts (recordVideo option) and screenshots are
+  // handled manually in the test's afterEach/finally blocks.
+  use: {},
+  // Single worker: VS Code windows don't share well in parallel on one display
+  workers: 1,
+});
diff --git a/e2e/tests/agent-spawn.spec.ts b/e2e/tests/agent-spawn.spec.ts
new file mode 100644
index 00000000..2f53c860
--- /dev/null
+++ b/e2e/tests/agent-spawn.spec.ts
@@ -0,0 +1,141 @@
+/**
+ * E2E: Clicking "+ Agent" in the Pixel Agents webview spawns a mock Claude terminal.
+ *
+ * Assertions:
+ *   1. The mock `claude` binary was invoked (invocations.log exists and is non-empty).
+ *   2. The expected JSONL session file was created in the isolated HOME.
+ *   3. A VS Code terminal named "Claude Code #1" appears in the workbench.
+ *
+ * NOTE FOR NEW TESTS: As more specs are added, refactor session setup into a
+ * Playwright fixture using test.extend<{ session: VSCodeSession }>() so that
+ * launch/cleanup is automatic and tests stay focused on assertions. See:
+ * https://playwright.dev/docs/test-fixtures
+ */
+import { test, expect } from '@playwright/test';
+import fs from 'fs';
+import path from 'path';
+
+import { launchVSCode, waitForWorkbench } from '../helpers/launch';
+import { clickAddAgent, getPixelAgentsFrame, openPixelAgentsPanel } from '../helpers/webview';
+
+// launchVSCode() removes its own temp directories if it throws, so it is safe
+// to call it outside the try/finally below.
+test('clicking + Agent spawns mock claude and creates a JSONL session file', async ({}, testInfo) => {
+  const session = await launchVSCode(testInfo.title);
+  const { window, tmpHome, mockLogFile } = session;
+  // Video handle for this window. launch.ts does not enable recording on
+  // Windows, hence the `if (runVideo)` guard in the finally block.
+  const runVideo = window.video();
+
+  test.setTimeout(120_000);
+
+  try {
+    // 1. Wait for VS Code workbench to be ready
+    await waitForWorkbench(window);
+
+    // 2. Open the Pixel Agents panel
+    await openPixelAgentsPanel(window);
+
+    // 3. Find the webview frame and click + Agent
+    const frame = await getPixelAgentsFrame(window);
+    await clickAddAgent(frame);
+
+    // 4. Assert: mock claude was invoked
+    //    The mock script writes to $HOME/.claude-mock/invocations.log
+    await expect
+      .poll(
+        () => {
+          try {
+            const content = fs.readFileSync(mockLogFile, 'utf8');
+            return content.trim().length > 0;
+          } catch {
+            // The log does not exist until the mock has run; keep polling.
+            return false;
+          }
+        },
+        {
+          message: `Expected invocations.log at ${mockLogFile} to be non-empty`,
+          timeout: 20_000,
+          intervals: [500, 1000],
+        },
+      )
+      .toBe(true);
+
+    const invocationLog = fs.readFileSync(mockLogFile, 'utf8');
+    expect(invocationLog).toContain('session-id=');
+    await testInfo.attach('mock-claude-invocations', {
+      body: invocationLog,
+      contentType: 'text/plain',
+    });
+
+    // 5. Assert: JSONL session file was created.
+    //    Scan all subdirectories under .claude/projects/ rather than hard-coding a
+    //    specific hash. On Windows, os.tmpdir() may return an 8.3 short path while
+    //    the VS Code terminal sees the long path, making the hashes differ even after
+    //    normalisation attempts.
+    const projectsDir = path.join(tmpHome, '.claude', 'projects');
+
+    // Returns the names of all .jsonl files one level below projectsDir;
+    // any filesystem error is treated as "nothing found yet".
+    const findJsonlFiles = (): string[] => {
+      try {
+        if (!fs.existsSync(projectsDir)) return [];
+        return fs.readdirSync(projectsDir).flatMap((entry) => {
+          const sub = path.join(projectsDir, entry);
+          try {
+            return fs.statSync(sub).isDirectory()
+              ? fs.readdirSync(sub).filter((f) => f.endsWith('.jsonl'))
+              : [];
+          } catch {
+            return [];
+          }
+        });
+      } catch {
+        return [];
+      }
+    };
+
+    await expect
+      .poll(findJsonlFiles, {
+        message: `Expected at least one .jsonl file under ${projectsDir}`,
+        timeout: 20_000,
+        intervals: [500, 1000],
+      })
+      .not.toHaveLength(0);
+
+    await testInfo.attach('jsonl-files', {
+      body: findJsonlFiles().join('\n'),
+      contentType: 'text/plain',
+    });
+
+    // 6. Assert: terminal "Claude Code #1" is visible in VS Code UI
+    //    VS Code renders the terminal name as visible text in the tab bar.
+    const terminalTab = window.getByText(/Claude Code #\d+/);
+    await expect(terminalTab.first()).toBeVisible({ timeout: 15_000 });
+  } finally {
+    // Save a screenshot of the final state regardless of outcome
+    const screenshotPath = path.join(
+      __dirname,
+      '../../test-results/e2e',
+      `agent-spawn-final-${Date.now()}.png`,
+    );
+    try {
+      fs.mkdirSync(path.dirname(screenshotPath), { recursive: true });
+      await window.screenshot({ path: screenshotPath });
+      await testInfo.attach('final-screenshot', {
+        path: screenshotPath,
+        contentType: 'image/png',
+      });
+    } catch {
+      // screenshot failure is non-fatal
+    }
+
+    // The screenshot above needs the window, so the app is closed only now.
+    await session.cleanup();
+
+    // The video is saved after the app has been closed by cleanup().
+    if (runVideo) {
+      try {
+        const videoPath = testInfo.outputPath('run-video.webm');
+        await runVideo.saveAs(videoPath);
+        await testInfo.attach('run-video', {
+          path: videoPath,
+          contentType: 'video/webm',
+        });
+      } catch {
+        // video attachment failure is non-fatal
+      }
+    }
+  }
+});
diff --git a/e2e/tsconfig.json b/e2e/tsconfig.json
new file mode 100644
index 00000000..a577e155
--- /dev/null
+++ b/e2e/tsconfig.json
@@ -0,0 +1,18 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "CommonJS",
+    "moduleResolution": "node",
+    "lib": ["ES2022", "DOM"],
+    "strict": true,
+    "noUnusedLocals": true,
+    "noUnusedParameters": true,
+    "esModuleInterop": true,
+    "sourceMap": true,
+    "outDir": "../dist/e2e",
+    "rootDir": ".",
+    "types": ["node"]
+  },
+  "include": ["./**/*.ts"],
+  "exclude": ["../node_modules", "../dist"]
+}
diff --git a/package-lock.json b/package-lock.json
index e312b621..09f26d0c 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -10,9 +10,11 @@
       "license": "MIT",
       "devDependencies": {
         "@anthropic-ai/sdk": "^0.80.0",
+        "@playwright/test": "^1.58.2",
         "@types/node": "25.x",
         "@types/pngjs": "^6.0.5",
         "@types/vscode": "^1.105.0",
+        "@vscode/test-electron": "^2.5.2",
         "esbuild": "^0.27.2",
         "eslint": "^10.0.3",
         "eslint-config-prettier": "^10.1.8",
@@ -662,6 +664,22 @@
         "url": "https://github.com/sponsors/nzakas"
       }
     },
+    "node_modules/@playwright/test": {
+      "version": "1.58.2",
+      "resolved": "https://registry.npmjs.org/@playwright/test/-/test-1.58.2.tgz",
+      "integrity": "sha512-akea+6bHYBBfA9uQqSYmlJXn61cTa+jbO87xVLCWbTqbWadRVmhxlXATaOjOgcBaWU4ePo0wB41KMFv3o35IXA==",
+      "dev": true,
+      "license": "Apache-2.0",
+      "dependencies": {
+        "playwright": "1.58.2"
+      },
+      "bin": {
+        "playwright": "cli.js"
+      },
+      "engines": {
+        "node": ">=18"
+      }
+    },
     "node_modules/@types/esrecurse": {
       "version": "4.3.1",
       "resolved": "https://registry.npmjs.org/@types/esrecurse/-/esrecurse-4.3.1.tgz",
@@ -940,6 +958,23 @@
         "url": "https://opencollective.com/typescript-eslint"
       }
     },
+    "node_modules/@vscode/test-electron": {
+      "version": "2.5.2",
+      "resolved": "https://registry.npmjs.org/@vscode/test-electron/-/test-electron-2.5.2.tgz",
+      "integrity": "sha512-8ukpxv4wYe0iWMRQU18jhzJOHkeGKbnw7xWRX3Zw1WJA4cEKbHcmmLPdPrPtL6rhDcrlCZN+xKRpv09n4gRHYg==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "http-proxy-agent": "^7.0.2",
+        "https-proxy-agent": "^7.0.5",
+        "jszip": "^3.10.1",
+        "ora": "^8.1.0",
+        "semver": "^7.6.2"
+      },
+      "engines": {
+        "node": ">=16"
+      }
+    },
     "node_modules/acorn": {
       "version": "8.16.0",
       "resolved": "https://registry.npmjs.org/acorn/-/acorn-8.16.0.tgz",
@@ -963,6 +998,16 @@
         "acorn": "^6.0.0 || ^7.0.0 || ^8.0.0"
       }
     },
+    "node_modules/agent-base": {
+      "version": "7.1.4",
+      "resolved": "https://registry.npmjs.org/agent-base/-/agent-base-7.1.4.tgz",
+      "integrity": "sha512-MnA+YT8fwfJPgBx3m60MNqakm30XOkyIoH1y6huTQvC0PwZG7ki8NacLBcrPbNoo8vEZy7Jpuk7+jMO+CUovTQ==",
+      "dev": true,
+      "license": "MIT",
+      "engines": {
+        "node": ">= 14"
+      }
+    },
     "node_modules/ajv": {
       "version": "6.14.0",
       "resolved": "https://registry.npmjs.org/ajv/-/ajv-6.14.0.tgz",
@@ -1154,6 +1199,19 @@
         "url": "https://github.com/sponsors/ljharb"
       }
     },
+    "node_modules/chalk": {
+      "version": "5.6.2",
+      "resolved": "https://registry.npmjs.org/chalk/-/chalk-5.6.2.tgz",
+      "integrity": "sha512-7NzBL0rN6fMUW+f7A6Io4h40qQlG+xGmtMxfbnH/K7TAtt8JQWVQK+6g0UXKMeVJoyV5EkkNsErQ8pVD3bLHbA==",
+      "dev": true,
+      "license": "MIT",
+      "engines": {
+        "node": "^12.17.0 || ^14.13 || >=16.0.0"
+      },
+      "funding": {
+        "url": "https://github.com/chalk/chalk?sponsor=1"
+      }
+    },
     "node_modules/cli-cursor": {
       "version": "5.0.0",
       "resolved": "https://registry.npmjs.org/cli-cursor/-/cli-cursor-5.0.0.tgz",
@@ -1170,6 +1228,19 @@
         "url": "https://github.com/sponsors/sindresorhus"
       }
     },
+    "node_modules/cli-spinners": {
+      "version": "2.9.2",
+      "resolved": "https://registry.npmjs.org/cli-spinners/-/cli-spinners-2.9.2.tgz",
+      "integrity": "sha512-ywqV+5MmyL4E7ybXgKys4DugZbX0FC6LnwrhjuykIjnK9k8OQacQ7axGKnjDXWNhns0xot3bZI5h55H8yo9cJg==",
+      "dev": true,
+      "license": "MIT",
+      "engines": {
+        "node": ">=6"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/cli-truncate": {
       "version": "5.2.0",
       "resolved": "https://registry.npmjs.org/cli-truncate/-/cli-truncate-5.2.0.tgz",
@@ -1211,6 +1282,13 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/core-util-is": {
+      "version": "1.0.3",
+      "resolved": "https://registry.npmjs.org/core-util-is/-/core-util-is-1.0.3.tgz",
+      "integrity": "sha512-ZQBvi1DcpJ4GDqanjucZ2Hj3wEO5pZDS89BWbkcrvdxksJorwUDDZamX9ldFkp9aw2lmBDLgkObEA4DWNJ9FYQ==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/cross-spawn": {
       "version": "7.0.6",
       "resolved": "https://registry.npmjs.org/cross-spawn/-/cross-spawn-7.0.6.tgz",
@@ -1859,9 +1937,9 @@
       }
     },
     "node_modules/flatted": {
-      "version": "3.3.3",
-      "resolved": "https://registry.npmjs.org/flatted/-/flatted-3.3.3.tgz",
-      "integrity": "sha512-GX+ysw4PBCz0PzosHDepZGANEuFCMLrnRTiEy9McGjmkCQYwRq4A/X786G/fjM/+OjsWSU1ZrY5qyARZmO/uwg==",
+      "version": "3.4.2",
+      "resolved": "https://registry.npmjs.org/flatted/-/flatted-3.4.2.tgz",
+      "integrity": "sha512-PjDse7RzhcPkIJwy5t7KPWQSZ9cAbzQXcafsetQoD7sOJRQlGikNbx7yZp2OotDnJyrDcbyRq3Ttb18iYOqkxA==",
       "dev": true,
       "license": "ISC"
     },
@@ -2158,6 +2236,34 @@
       "dev": true,
       "license": "ISC"
     },
+    "node_modules/http-proxy-agent": {
+      "version": "7.0.2",
+      "resolved": "https://registry.npmjs.org/http-proxy-agent/-/http-proxy-agent-7.0.2.tgz",
+      "integrity": "sha512-T1gkAiYYDWYx3V5Bmyu7HcfcvL7mUrTWiM6yOfa3PIphViJ/gFPbvidQ+veqSOHci/PxBcDabeUNCzpOODJZig==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "agent-base": "^7.1.0",
+        "debug": "^4.3.4"
+      },
+      "engines": {
+        "node": ">= 14"
+      }
+    },
+    "node_modules/https-proxy-agent": {
+      "version": "7.0.6",
+      "resolved": "https://registry.npmjs.org/https-proxy-agent/-/https-proxy-agent-7.0.6.tgz",
+      "integrity": "sha512-vK9P5/iUfdl95AI+JVyUuIcVtd4ofvtrOr3HNtM2yxC9bnMbEdp3x01OhQNnjb8IJYi38VlTE3mBXwcfvywuSw==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "agent-base": "^7.1.2",
+        "debug": "4"
+      },
+      "engines": {
+        "node": ">= 14"
+      }
+    },
     "node_modules/husky": {
       "version": "9.1.7",
       "resolved": "https://registry.npmjs.org/husky/-/husky-9.1.7.tgz",
@@ -2184,6 +2290,13 @@
         "node": ">= 4"
       }
     },
+    "node_modules/immediate": {
+      "version": "3.0.6",
+      "resolved": "https://registry.npmjs.org/immediate/-/immediate-3.0.6.tgz",
+      "integrity": "sha512-XXOFtyqDjNDAQxVfYxuF7g9Il/IbWmmlQg2MYKOH8ExIT1qg6xc4zyS3HaEEATgs1btfzxq15ciUiY7gjSXRGQ==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/imurmurhash": {
       "version": "0.1.4",
       "resolved": "https://registry.npmjs.org/imurmurhash/-/imurmurhash-0.1.4.tgz",
@@ -2194,6 +2307,13 @@
         "node": ">=0.8.19"
       }
     },
+    "node_modules/inherits": {
+      "version": "2.0.4",
+      "resolved": "https://registry.npmjs.org/inherits/-/inherits-2.0.4.tgz",
+      "integrity": "sha512-k/vGaX4/Yla3WzyMCvTQOXYeIHvqOKtnqBduzTHpzpQZzAskKMhZ2K+EnBiSM9zGSoIFeMpXKxa4dYeZIQqewQ==",
+      "dev": true,
+      "license": "ISC"
+    },
     "node_modules/internal-slot": {
       "version": "1.1.0",
       "resolved": "https://registry.npmjs.org/internal-slot/-/internal-slot-1.1.0.tgz",
@@ -2426,6 +2546,19 @@
         "node": ">=0.10.0"
       }
     },
+    "node_modules/is-interactive": {
+      "version": "2.0.0",
+      "resolved": "https://registry.npmjs.org/is-interactive/-/is-interactive-2.0.0.tgz",
+      "integrity": "sha512-qP1vozQRI+BMOPcjFzrjXuQvdak2pHNUMZoeG2eRbiSqyvbEf/wQtEOTOX1guk6E3t36RkaqiSt8A/6YElNxLQ==",
+      "dev": true,
+      "license": "MIT",
+      "engines": {
+        "node": ">=12"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/is-map": {
       "version": "2.0.3",
       "resolved": "https://registry.npmjs.org/is-map/-/is-map-2.0.3.tgz",
@@ -2568,6 +2701,19 @@
         "url": "https://github.com/sponsors/ljharb"
       }
     },
+    "node_modules/is-unicode-supported": {
+      "version": "2.1.0",
+      "resolved": "https://registry.npmjs.org/is-unicode-supported/-/is-unicode-supported-2.1.0.tgz",
+      "integrity": "sha512-mE00Gnza5EEB3Ds0HfMyllZzbBrmLOX3vfWoj9A9PEnTfratQ/BcaJOuMhnkhjXvb2+FkY3VuHqtAGpTPmglFQ==",
+      "dev": true,
+      "license": "MIT",
+      "engines": {
+        "node": ">=18"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/is-weakmap": {
       "version": "2.0.2",
       "resolved": "https://registry.npmjs.org/is-weakmap/-/is-weakmap-2.0.2.tgz",
@@ -2614,6 +2760,13 @@
         "url": "https://github.com/sponsors/ljharb"
       }
     },
+    "node_modules/isarray": {
+      "version": "1.0.0",
+      "resolved": "https://registry.npmjs.org/isarray/-/isarray-1.0.0.tgz",
+      "integrity": "sha512-VLghIWNM6ELQzo7zwmcg0NmTVyWKYjvIeM83yjp0wRDTmUnrM678fQbcKBo6n2CJEF0szoG//ytg+TKla89ALQ==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/isexe": {
       "version": "2.0.0",
       "resolved": "https://registry.npmjs.org/isexe/-/isexe-2.0.0.tgz",
@@ -2663,6 +2816,19 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/jszip": {
+      "version": "3.10.1",
+      "resolved": "https://registry.npmjs.org/jszip/-/jszip-3.10.1.tgz",
+      "integrity": "sha512-xXDvecyTpGLrqFrvkrUSoxxfJI5AH7U8zxxtVclpsUtMCq4JQ290LY8AW5c7Ggnr/Y/oK+bQMbqK2qmtk3pN4g==",
+      "dev": true,
+      "license": "(MIT OR GPL-3.0-or-later)",
+      "dependencies": {
+        "lie": "~3.3.0",
+        "pako": "~1.0.2",
+        "readable-stream": "~2.3.6",
+        "setimmediate": "^1.0.5"
+      }
+    },
     "node_modules/keyv": {
       "version": "4.5.4",
       "resolved": "https://registry.npmjs.org/keyv/-/keyv-4.5.4.tgz",
@@ -2687,6 +2853,16 @@
         "node": ">= 0.8.0"
       }
     },
+    "node_modules/lie": {
+      "version": "3.3.0",
+      "resolved": "https://registry.npmjs.org/lie/-/lie-3.3.0.tgz",
+      "integrity": "sha512-UaiMJzeWRlEujzAuw5LokY1L5ecNQYZKfmyZ9L7wDHb/p5etKaxXhohBcrw0EYby+G/NA52vRSN4N39dxHAIwQ==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "immediate": "~3.0.5"
+      }
+    },
     "node_modules/lint-staged": {
       "version": "16.4.0",
       "resolved": "https://registry.npmjs.org/lint-staged/-/lint-staged-16.4.0.tgz",
@@ -2761,6 +2937,36 @@
         "url": "https://github.com/sponsors/sindresorhus"
       }
     },
+    "node_modules/log-symbols": {
+      "version": "6.0.0",
+      "resolved": "https://registry.npmjs.org/log-symbols/-/log-symbols-6.0.0.tgz",
+      "integrity": "sha512-i24m8rpwhmPIS4zscNzK6MSEhk0DUWa/8iYQWxhffV8jkI4Phvs3F+quL5xvS0gdQR0FyTCMMH33Y78dDTzzIw==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "chalk": "^5.3.0",
+        "is-unicode-supported": "^1.3.0"
+      },
+      "engines": {
+        "node": ">=18"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
+    "node_modules/log-symbols/node_modules/is-unicode-supported": {
+      "version": "1.3.0",
+      "resolved": "https://registry.npmjs.org/is-unicode-supported/-/is-unicode-supported-1.3.0.tgz",
+      "integrity": "sha512-43r2mRvz+8JRIKnWJ+3j8JtjRKZ6GmjzfaE/qiBJnikNnYv/6bagRJ1kUhNk8R5EX/GkobD+r+sfxCPJsiKBLQ==",
+      "dev": true,
+      "license": "MIT",
+      "engines": {
+        "node": ">=12"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/log-update": {
       "version": "6.1.0",
       "resolved": "https://registry.npmjs.org/log-update/-/log-update-6.1.0.tgz",
@@ -3023,9 +3229,9 @@
       }
     },
     "node_modules/npm-run-all/node_modules/minimatch": {
-      "version": "3.1.2",
-      "resolved": "https://registry.npmjs.org/minimatch/-/minimatch-3.1.2.tgz",
-      "integrity": "sha512-J7p63hRiAjw1NDEww1W7i37+ByIrOWO5XQQAzZ3VOcL0PNybwpfmV/N05zFAzwQ9USyEcX6t3UO+K5aqBQOIHw==",
+      "version": "3.1.5",
+      "resolved": "https://registry.npmjs.org/minimatch/-/minimatch-3.1.5.tgz",
+      "integrity": "sha512-VgjWUsnnT6n+NUk6eZq77zeFdpW2LWDzP6zFGrCbHXiYNul5Dzqk2HHQ5uFH2DNW5Xbp8+jVzaeNt94ssEEl4w==",
       "dev": true,
       "license": "ISC",
       "dependencies": {
@@ -3182,6 +3388,48 @@
         "node": ">= 0.8.0"
       }
     },
+    "node_modules/ora": {
+      "version": "8.2.0",
+      "resolved": "https://registry.npmjs.org/ora/-/ora-8.2.0.tgz",
+      "integrity": "sha512-weP+BZ8MVNnlCm8c0Qdc1WSWq4Qn7I+9CJGm7Qali6g44e/PUzbjNqJX5NJ9ljlNMosfJvg1fKEGILklK9cwnw==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "chalk": "^5.3.0",
+        "cli-cursor": "^5.0.0",
+        "cli-spinners": "^2.9.2",
+        "is-interactive": "^2.0.0",
+        "is-unicode-supported": "^2.0.0",
+        "log-symbols": "^6.0.0",
+        "stdin-discarder": "^0.2.2",
+        "string-width": "^7.2.0",
+        "strip-ansi": "^7.1.0"
+      },
+      "engines": {
+        "node": ">=18"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
+    "node_modules/ora/node_modules/string-width": {
+      "version": "7.2.0",
+      "resolved": "https://registry.npmjs.org/string-width/-/string-width-7.2.0.tgz",
+      "integrity": "sha512-tsaTIkKW9b4N+AEj+SVA+WhJzV7/zMhcSu78mLKWSk7cXMOSHsBKFWUs0fWwq8QyK3MgJBQRX6Gbi4kYbdvGkQ==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "emoji-regex": "^10.3.0",
+        "get-east-asian-width": "^1.0.0",
+        "strip-ansi": "^7.1.0"
+      },
+      "engines": {
+        "node": ">=18"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/own-keys": {
       "version": "1.0.1",
       "resolved": "https://registry.npmjs.org/own-keys/-/own-keys-1.0.1.tgz",
@@ -3232,6 +3480,13 @@
         "url": "https://github.com/sponsors/sindresorhus"
       }
     },
+    "node_modules/pako": {
+      "version": "1.0.11",
+      "resolved": "https://registry.npmjs.org/pako/-/pako-1.0.11.tgz",
+      "integrity": "sha512-4hLB8Py4zZce5s4yd9XzopqwVv/yGNhV1Bl8NTmCq1763HeK2+EwVTv+leGeL13Dnh2wfbqowVPXCIO0z4taYw==",
+      "dev": true,
+      "license": "(MIT AND Zlib)"
+    },
     "node_modules/parse-json": {
       "version": "4.0.0",
       "resolved": "https://registry.npmjs.org/parse-json/-/parse-json-4.0.0.tgz",
@@ -3322,6 +3577,53 @@
         "node": ">=4"
       }
     },
+    "node_modules/playwright": {
+      "version": "1.58.2",
+      "resolved": "https://registry.npmjs.org/playwright/-/playwright-1.58.2.tgz",
+      "integrity": "sha512-vA30H8Nvkq/cPBnNw4Q8TWz1EJyqgpuinBcHET0YVJVFldr8JDNiU9LaWAE1KqSkRYazuaBhTpB5ZzShOezQ6A==",
+      "dev": true,
+      "license": "Apache-2.0",
+      "dependencies": {
+        "playwright-core": "1.58.2"
+      },
+      "bin": {
+        "playwright": "cli.js"
+      },
+      "engines": {
+        "node": ">=18"
+      },
+      "optionalDependencies": {
+        "fsevents": "2.3.2"
+      }
+    },
+    "node_modules/playwright-core": {
+      "version": "1.58.2",
+      "resolved": "https://registry.npmjs.org/playwright-core/-/playwright-core-1.58.2.tgz",
+      "integrity": "sha512-yZkEtftgwS8CsfYo7nm0KE8jsvm6i/PTgVtB8DL726wNf6H2IMsDuxCpJj59KDaxCtSnrWan2AeDqM7JBaultg==",
+      "dev": true,
+      "license": "Apache-2.0",
+      "bin": {
+        "playwright-core": "cli.js"
+      },
+      "engines": {
+        "node": ">=18"
+      }
+    },
+    "node_modules/playwright/node_modules/fsevents": {
+      "version": "2.3.2",
+      "resolved": "https://registry.npmjs.org/fsevents/-/fsevents-2.3.2.tgz",
+      "integrity": "sha512-xiqMQR4xAeHTuB9uWm+fFRcIOgKBMiOBP+eXiyT7jsgVCq1bkVygt00oASowB7EdtpOHaaPgKt812P9ab+DDKA==",
+      "dev": true,
+      "hasInstallScript": true,
+      "license": "MIT",
+      "optional": true,
+      "os": [
+        "darwin"
+      ],
+      "engines": {
+        "node": "^8.16.0 || ^10.6.0 || >=11.0.0"
+      }
+    },
     "node_modules/pngjs": {
       "version": "7.0.0",
       "resolved": "https://registry.npmjs.org/pngjs/-/pngjs-7.0.0.tgz",
@@ -3368,6 +3670,13 @@
         "url": "https://github.com/prettier/prettier?sponsor=1"
       }
     },
+    "node_modules/process-nextick-args": {
+      "version": "2.0.1",
+      "resolved": "https://registry.npmjs.org/process-nextick-args/-/process-nextick-args-2.0.1.tgz",
+      "integrity": "sha512-3ouUOpQhtgrbOa17J7+uxOTpITYWaGP7/AhoR3+A+/1e9skrzelGi/dXzEYyvbxubEF6Wn2ypscTKiKJFFn1ag==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/punycode": {
       "version": "2.3.1",
       "resolved": "https://registry.npmjs.org/punycode/-/punycode-2.3.1.tgz",
@@ -3393,6 +3702,22 @@
         "node": ">=4"
       }
     },
+    "node_modules/readable-stream": {
+      "version": "2.3.8",
+      "resolved": "https://registry.npmjs.org/readable-stream/-/readable-stream-2.3.8.tgz",
+      "integrity": "sha512-8p0AUk4XODgIewSi0l8Epjs+EVnWiK7NoDIEGU0HhE7+ZyY8D1IMY7odu5lRrFXGg71L15KG8QrPmum45RTtdA==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "core-util-is": "~1.0.0",
+        "inherits": "~2.0.3",
+        "isarray": "~1.0.0",
+        "process-nextick-args": "~2.0.0",
+        "safe-buffer": "~5.1.1",
+        "string_decoder": "~1.1.1",
+        "util-deprecate": "~1.0.1"
+      }
+    },
     "node_modules/reflect.getprototypeof": {
       "version": "1.0.10",
       "resolved": "https://registry.npmjs.org/reflect.getprototypeof/-/reflect.getprototypeof-1.0.10.tgz",
@@ -3519,6 +3844,13 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/safe-buffer": {
+      "version": "5.1.2",
+      "resolved": "https://registry.npmjs.org/safe-buffer/-/safe-buffer-5.1.2.tgz",
+      "integrity": "sha512-Gd2UZBJDkXlY7GbJxfsE8/nvKkUEU1G38c1siN6QP6a9PT9MmHB8GnpscSmMJSoF8LOIrt8ud/wPtojys4G6+g==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/safe-push-apply": {
       "version": "1.0.0",
       "resolved": "https://registry.npmjs.org/safe-push-apply/-/safe-push-apply-1.0.0.tgz",
@@ -3623,6 +3955,13 @@
         "node": ">= 0.4"
       }
     },
+    "node_modules/setimmediate": {
+      "version": "1.0.5",
+      "resolved": "https://registry.npmjs.org/setimmediate/-/setimmediate-1.0.5.tgz",
+      "integrity": "sha512-MATJdZp8sLqDl/68LfQmbP8zKPLQNV6BIZoIgrscFDQ+RsvK/BxeDQOgyxKKoh0y/8h3BqVFnCqQ/gd+reiIXA==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/shebang-command": {
       "version": "2.0.0",
       "resolved": "https://registry.npmjs.org/shebang-command/-/shebang-command-2.0.0.tgz",
@@ -3814,6 +4153,19 @@
       "dev": true,
       "license": "CC0-1.0"
     },
+    "node_modules/stdin-discarder": {
+      "version": "0.2.2",
+      "resolved": "https://registry.npmjs.org/stdin-discarder/-/stdin-discarder-0.2.2.tgz",
+      "integrity": "sha512-UhDfHmA92YAlNnCfhmq0VeNL5bDbiZGg7sZ2IvPsXubGkiNa9EC+tUTsjBRsYUAz87btI6/1wf4XoVvQ3uRnmQ==",
+      "dev": true,
+      "license": "MIT",
+      "engines": {
+        "node": ">=18"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/stop-iteration-iterator": {
       "version": "1.1.0",
       "resolved": "https://registry.npmjs.org/stop-iteration-iterator/-/stop-iteration-iterator-1.1.0.tgz",
@@ -3828,6 +4180,16 @@
         "node": ">= 0.4"
       }
     },
+    "node_modules/string_decoder": {
+      "version": "1.1.1",
+      "resolved": "https://registry.npmjs.org/string_decoder/-/string_decoder-1.1.1.tgz",
+      "integrity": "sha512-n/ShnvDi6FHbbVfviro+WojiFzv+s8MPMHBczVePfUpDJLwoLT0ht1l4YwBCbi8pJAveEEdnkHyPyTP/mzRfwg==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "safe-buffer": "~5.1.0"
+      }
+    },
     "node_modules/string-argv": {
       "version": "0.3.2",
       "resolved": "https://registry.npmjs.org/string-argv/-/string-argv-0.3.2.tgz",
@@ -4204,6 +4566,13 @@
         "punycode": "^2.1.0"
       }
     },
+    "node_modules/util-deprecate": {
+      "version": "1.0.2",
+      "resolved": "https://registry.npmjs.org/util-deprecate/-/util-deprecate-1.0.2.tgz",
+      "integrity": "sha512-EPD5q1uXyFxJpCrLnCc1nHnq3gOa6DZBocAIiI2TaSCA7VCJ1UJDMagCzIkXNsUYfD1daK//LTEQ8xiIbrHtcw==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/validate-npm-package-license": {
       "version": "3.0.4",
       "resolved": "https://registry.npmjs.org/validate-npm-package-license/-/validate-npm-package-license-3.0.4.tgz",
diff --git a/package.json b/package.json
index f381a99f..a55a4938 100644
--- a/package.json
+++ b/package.json
@@ -65,13 +65,17 @@
     "lint:webview:fix": "cd webview-ui && eslint . --fix",
     "import-tileset": "tsx scripts/import-tileset-cli.ts",
     "format": "prettier --write \"src/**/*.ts\" \"webview-ui/src/**/*.{ts,tsx,css}\" \"*.{js,mjs}\" \"webview-ui/*.{js,ts}\"",
-    "format:check": "prettier --check \"src/**/*.ts\" \"webview-ui/src/**/*.{ts,tsx,css}\" \"*.{js,mjs}\" \"webview-ui/*.{js,ts}\""
+    "format:check": "prettier --check \"src/**/*.ts\" \"webview-ui/src/**/*.{ts,tsx,css}\" \"*.{js,mjs}\" \"webview-ui/*.{js,ts}\"",
+    "e2e": "playwright test --config e2e/playwright.config.ts",
+    "e2e:debug": "playwright test --config e2e/playwright.config.ts --debug"
   },
   "devDependencies": {
     "@anthropic-ai/sdk": "^0.80.0",
+    "@playwright/test": "^1.58.2",
     "@types/node": "25.x",
     "@types/pngjs": "^6.0.5",
     "@types/vscode": "^1.105.0",
+    "@vscode/test-electron": "^2.5.2",
     "esbuild": "^0.27.2",
     "eslint": "^10.0.3",
     "eslint-config-prettier": "^10.1.8",
diff --git a/webview-ui/package-lock.json b/webview-ui/package-lock.json
index 8351aff3..42691ce6 100644
--- a/webview-ui/package-lock.json
+++ b/webview-ui/package-lock.json
@@ -1820,9 +1820,9 @@
       }
     },
     "node_modules/caniuse-lite": {
-      "version": "1.0.30001780",
-      "resolved": "https://registry.npmjs.org/caniuse-lite/-/caniuse-lite-1.0.30001780.tgz",
-      "integrity": "sha512-llngX0E7nQci5BPJDqoZSbuZ5Bcs9F5db7EtgfwBerX9XGtkkiO4NwfDDIRzHTTwcYC8vC7bmeUEPGrKlR/TkQ==",
+      "version": "1.0.30001781",
+      "resolved": "https://registry.npmjs.org/caniuse-lite/-/caniuse-lite-1.0.30001781.tgz",
+      "integrity": "sha512-RdwNCyMsNBftLjW6w01z8bKEvT6e/5tpPVEgtn22TiLGlstHOVecsX2KHFkD5e/vRnIE4EGzpuIODb3mtswtkw==",
       "dev": true,
       "funding": [
         {
@@ -2346,9 +2346,9 @@
       }
     },
     "node_modules/get-tsconfig": {
-      "version": "4.13.6",
-      "resolved": "https://registry.npmjs.org/get-tsconfig/-/get-tsconfig-4.13.6.tgz",
-      "integrity": "sha512-shZT/QMiSHc/YBLxxOkMtgSid5HFoauqCE3/exfsEcwg1WkeqjG+V40yBbBrsD+jW2HDXcs28xOfcbm2jI8Ddw==",
+      "version": "4.13.7",
+      "resolved": "https://registry.npmjs.org/get-tsconfig/-/get-tsconfig-4.13.7.tgz",
+      "integrity": "sha512-7tN6rFgBlMgpBML5j8typ92BKFi2sFQvIdpAqLA2beia5avZDrMs0FLZiM5etShWq5irVyGcGMEA1jcDaK7A/Q==",
       "dev": true,
       "license": "MIT",
       "dependencies": {