digidem
diff --git a/‎.dockerignore‎
Lines changed: 152 additions & 0 deletions b/‎.dockerignore‎
Lines changed: 152 additions & 0 deletions
diff --git a/‎.env.example‎
Lines changed: 31 additions & 1 deletion b/‎.env.example‎
Lines changed: 31 additions & 1 deletion
diff --git a/‎.github/workflows/api-validate.yml‎
Lines changed: 135 additions & 0 deletions b/‎.github/workflows/api-validate.yml‎
Lines changed: 135 additions & 0 deletions
diff --git a/‎.github/workflows/clean-content.yml‎
Lines changed: 25 additions & 7 deletions b/‎.github/workflows/clean-content.yml‎
Lines changed: 25 additions & 7 deletions
@@ -0,0 +1,152 @@
+# ============================================
+# .dockerignore for Comapeo Docs API Server
+# Minimizes Docker context size. Patterns are root-relative: use **/ to match at any depth.
+# ============================================
+
+# Dependencies (installed in container via package.json)
+**/node_modules
+**/npm-debug.log*
+**/yarn-error.log*
+package-lock.json
+yarn.lock
+pnpm-lock.yaml
+
+# Build outputs and caches
+build/
+dist/
+.out/
+.docusaurus/
+.cache-loader/
+**/*.tsbuildinfo
+
+# ============================================
+# Content Generation (not needed for API server)
+# ============================================
+# Generated content from Notion (synced from content branch)
+docs/
+i18n/
+static/images/
+
+# ============================================
+# Development & Testing (not needed in production)
+# ============================================
+# Test files and coverage (**/ so co-located tests in any directory are excluded)
+coverage/
+test-results*.json
+test-results*.html
+**/*.test.ts
+**/*.test.tsx
+**/*.spec.ts
+vitest.config.ts
+**/__tests__/
+
+# Development configuration
+.eslintrc*
+.prettierrc*
+.prettierignore
+lefthook.yml
+
+# CI/CD
+.github/
+.gitlab-ci.yml
+.azure-pipelines.yml
+.circleci/
+
+# ============================================
+# Documentation & Assets (not needed for API)
+# ============================================
+# Project documentation
+README.md
+CONTRIBUTING.md
+CHANGELOG.md
+LICENSE
+context/
+NOTION_FETCH_ARCHITECTURE.md
+
+# Assets not needed for API server
+assets/
+favicon.*
+robots.txt
+
+# ============================================
+# Development Directories (not needed in container)
+# ============================================
+# Git
+.git/
+.gitignore
+.gitattributes
+
+# IDE (editor swap/backup files can appear in any directory)
+.vscode/
+.idea/
+**/*.swp
+**/*.swo
+**/*~
+.marscode/
+.eclipse/
+
+# Worktrees and development directories
+worktrees/
+.dev-docs/
+
+# ============================================
+# Environment & Secrets (use env vars or mounted secrets; **/ keeps nested .env files out too)
+# ============================================
+**/.env
+**/.env.*
+!**/.env.example
+
+# ============================================
+# Temporary & Generated Files
+# ============================================
+# Temporary files
+**/*.tmp
+**/*.temp
+*-preview-*.md
+.cache/
+screenshots/
+
+# Notion exports and emoji files (not needed for API)
+notion_*.json
+
+# Runtime metrics and cache files
+retry-metrics.json
+image-cache.json
+image-failures.json
+
+# Job persistence data (mounted as volume)
+.jobs-data/
+
+# Audit data (development only)
+.audit-data/
+
+# Development planning
+TASK.md
+NEXT_STEPS.md
+PRD.md
+TODO.md
+
+# ============================================
+# Docker Files (don't include Docker files in image)
+# ============================================
+Dockerfile*
+docker-compose*
+.dockerignore
+
+# ============================================
+# Misc (OS files, logs)
+# ============================================
+**/.DS_Store
+**/Thumbs.db
+**/*.log
+
+# ============================================
+# Test Directories under scripts/ and api-server/ (explicit; overlaps the **/ test globs above)
+# ============================================
+scripts/test-docker/
+scripts/test-scaffold/
+scripts/test-utils/
+scripts/**/__tests__/
+scripts/**/*.test.ts
+api-server/**/__tests__/
+api-server/**/*.test.ts
@@ -50,11 +50,41 @@ MAX_IMAGE_RETRIES=3
 # TEST_DATA_SOURCE_ID=test-database-id-here
 # TEST_MODE=true
 
-# OpenAI API Configuration
+# OpenAI Configuration (Required for translation jobs)
+OPENAI_API_KEY=your_openai_api_key_here
+OPENAI_MODEL=gpt-4o-mini
 # Optional: Use alternative OpenAI-compatible APIs (like Deepseek)
 # OPENAI_BASE_URL=https://api.deepseek.com
 # OPENAI_MODEL=deepseek-chat
 
+# API Server Configuration (for Docker deployment; 0.0.0.0 listens on all interfaces)
+NODE_ENV=production
+API_HOST=0.0.0.0
+API_PORT=3001
+
+# Content Repository Configuration (required for mutating jobs in API server)
+# Required for: notion:fetch, notion:fetch-all, notion:translate
+# GitHub repository URL must be HTTPS and must not embed credentials (the token is set separately below)
+GITHUB_REPO_URL=https://github.com/digidem/comapeo-docs.git
+# GitHub token with permissions to push to the content branch (see GITHUB_CONTENT_BRANCH)
+GITHUB_TOKEN=your_github_token_here
+# Git author identity used for content commits created by jobs (replace the example.com address)
+GIT_AUTHOR_NAME=CoMapeo Content Bot
+GIT_AUTHOR_EMAIL=content-bot@example.com
+
+# Content repository behavior (optional)
+GITHUB_CONTENT_BRANCH=content
+WORKDIR=/workspace/repo
+COMMIT_MESSAGE_PREFIX=content-bot:
+ALLOW_EMPTY_COMMITS=false
+
+# API Authentication (Optional - generate secure keys with: openssl rand -base64 32)
+# API_KEY_DEPLOYMENT=your_secure_api_key_here
+# API_KEY_GITHUB_ACTIONS=your_github_actions_key_here
+# Dedicated key for POST /notion-trigger (sent in the x-api-key header)
+# Required if you expose/use the Notion trigger endpoint; replace this placeholder with a generated secret.
+NOTION_TRIGGER_API_KEY=your_notion_trigger_key_here
+
 # URL Handling
 # Fallback URL used when an invalid URL is encountered in blocks (e.g., bookmark, embed)
 # This is used to replace invalid/removed URLs during translation
 
@@ -0,0 +1,135 @@
+name: API Validate
+
+on:
+  workflow_dispatch:  # manual runs
+  push:
+    branches:
+      - 'main'
+      - 'feat/**'
+    paths:  # only when this workflow, the API server, or package.json changes
+      - '.github/workflows/api-validate.yml'
+      - 'api-server/**'
+      - 'package.json'
+  pull_request:
+    paths:  # same path filter as push
+      - '.github/workflows/api-validate.yml'
+      - 'api-server/**'
+      - 'package.json'
+
+jobs:
+  api-validate:
+    runs-on: ubuntu-latest
+    timeout-minutes: 20
+    env:
+      API_HOST: '127.0.0.1'  # loopback address; API_BASE_URL below targets the same host and port
+      API_PORT: '3001'
+      API_BASE_URL: 'http://127.0.0.1:3001'
+      API_KEY_CI: ${{ secrets.API_KEY_GITHUB_ACTIONS || 'ci-fallback-api-key-1234567890abcdef' }}  # fixed fallback when the secret is unset
+      NOTION_API_KEY: ${{ secrets.NOTION_API_KEY }}
+      DATABASE_ID: ${{ secrets.DATABASE_ID }}
+      DATA_SOURCE_ID: ${{ secrets.DATA_SOURCE_ID }}
+      OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
+      DEFAULT_DOCS_PAGE: 'overview'
+      CI_FETCH_HOLD_MS: '3000'  # holds the job lock so the smoke step's 409 assertion is reliable
+      GITHUB_REPO_URL: 'https://github.com/${{ github.repository }}.git'
+      GITHUB_TOKEN: ${{ github.token }}
+      GIT_AUTHOR_NAME: 'github-actions[bot]'
+      GIT_AUTHOR_EMAIL: '41898282+github-actions[bot]@users.noreply.github.com'
+      WORKDIR: ${{ github.workspace }}  # use the checked-out repository as the working directory
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Setup Bun
+        uses: oven-sh/setup-bun@v2
+        with:
+          bun-version: "1"
+
+      - name: Install dependencies
+        run: bun i --frozen-lockfile
+
+      - name: Rebuild sharp for CI environment
+        run: npm rebuild sharp
+
+      - name: Start local API
+        run: |
+          set -euo pipefail
+          bun run api:server > /tmp/api-validate-server.log 2>&1 &  # run in background; the cleanup step tails this log
+          echo $! > /tmp/api-validate-server.pid  # record the PID so the cleanup step can stop the server
+
+      - name: Wait for health endpoint
+        run: |
+          set -euo pipefail
+          for i in $(seq 1 60); do  # up to 60 attempts, one second apart
+            if curl -sf --max-time 2 "${API_BASE_URL}/health" >/dev/null; then  # --max-time: a hung request must not stall the loop
+              exit 0
+            fi
+            sleep 1
+          done
+          echo "API health endpoint did not become ready in time"
+          exit 1
+
+      - name: Run API smoke assertions
+        run: |
+          set -euo pipefail
+          test -n "${API_KEY_CI}"
+
+          # 401 envelope for missing auth on create-job endpoint.
+          HTTP_CODE=$(curl -sS -o /tmp/api-validate-unauthorized.json -w "%{http_code}" \
+            -X POST "${API_BASE_URL}/jobs" \
+            -H "Content-Type: application/json" \
+            -d '{"type":"fetch-ready","options":{"dryRun":true,"maxPages":1}}')
+          test "${HTTP_CODE}" = "401"
+          jq -e '.status == "failed" and .error.code == "UNAUTHORIZED" and (.jobId | not)' /tmp/api-validate-unauthorized.json >/dev/null
+
+          # Sequential 202 (accepted) then immediate 409 (lock held by CI_FETCH_HOLD_MS).
+          HTTP_CODE=$(curl -sS -o /tmp/api-validate-job-1.json -w "%{http_code}" \
+            -X POST "${API_BASE_URL}/jobs" \
+            -H "Authorization: Bearer ${API_KEY_CI}" \
+            -H "Content-Type: application/json" \
+            -d '{"type":"fetch-ready","options":{"dryRun":true,"maxPages":1}}')
+          test "${HTTP_CODE}" = "202"
+          JOB_ID=$(jq -r '.jobId' /tmp/api-validate-job-1.json)
+          test -n "${JOB_ID}"
+          test "${JOB_ID}" != "null"
+          jq -e '.status == "pending"' /tmp/api-validate-job-1.json >/dev/null
+
+          HTTP_CODE=$(curl -sS -o /tmp/api-validate-job-2.json -w "%{http_code}" \
+            -X POST "${API_BASE_URL}/jobs" \
+            -H "Authorization: Bearer ${API_KEY_CI}" \
+            -H "Content-Type: application/json" \
+            -d '{"type":"fetch-all","options":{"dryRun":true,"maxPages":1}}')
+          test "${HTTP_CODE}" = "409"
+          jq -e '.status == "failed" and .error.code == "CONFLICT" and (.jobId | not)' /tmp/api-validate-job-2.json >/dev/null
+
+          # Poll the accepted fetch-ready job to terminal state (up to 180 attempts; each request capped at 30 s).
+          STATUS=""
+          for i in $(seq 1 180); do
+            curl -sS --max-time 30 \
+              -H "Authorization: Bearer ${API_KEY_CI}" \
+              "${API_BASE_URL}/jobs/${JOB_ID}" > /tmp/api-validate-job-status.json
+            STATUS=$(jq -r '.status' /tmp/api-validate-job-status.json)
+            if [ "${STATUS}" = "completed" ] || [ "${STATUS}" = "failed" ]; then
+              break
+            fi
+            sleep 1
+          done
+
+          test "${STATUS}" = "completed" || { echo "Job ${JOB_ID} ended with status '${STATUS}':"; cat /tmp/api-validate-job-status.json; exit 1; }
+          jq -e '.dryRun == true and .commitHash == null and (.pagesProcessed | type == "number")' /tmp/api-validate-job-status.json >/dev/null
+
+      - name: Cleanup local API
+        if: always()
+        run: |
+          set +e
+          PID_FILE=/tmp/api-validate-server.pid
+          LOG_FILE=/tmp/api-validate-server.log
+          SERVER_PID="$(cat "${PID_FILE}" 2>/dev/null)"  # empty when the PID file was never written
+          if [ -n "${SERVER_PID}" ] && kill -0 "${SERVER_PID}" 2>/dev/null; then
+            kill "${SERVER_PID}" 2>/dev/null || true
+            sleep 1
+          fi
+          if [ -f "${LOG_FILE}" ]; then  # print the end of the server log for debugging
+            echo "=== api-validate-server.log ==="
+            tail -n 200 "${LOG_FILE}" || true
+          fi
@@ -23,9 +23,30 @@ jobs:
 
     steps:
       - name: Checkout content branch
-        uses: actions/checkout@v4
+        uses: actions/checkout@v6
         with:
           ref: content
+          fetch-depth: 0
+
+      - name: Configure git user  # set before the merge step, which may create a merge commit
+        run: |
+          git config user.name "github-actions[bot]"
+          git config user.email "41898282+github-actions[bot]@users.noreply.github.com"
+
+      - name: Sync content branch with main
+        run: |
+          set -e
+
+          # Refresh origin/main before merging it into the checked-out content branch.
+          echo "Fetching latest main branch..."
+          git fetch origin main
+
+          echo "Merging origin/main into content..."
+          if ! git merge --no-edit origin/main; then  # stop here; conflicts need a human
+            echo "Failed to merge main into content. Resolve conflicts manually."
+            exit 1
+          fi
+          echo "content branch synced with main"
 
       - name: Setup Bun
         uses: oven-sh/setup-bun@v2
@@ -49,14 +70,11 @@ jobs:
 
       - name: Commit cleanup results
         run: |
-          git config user.name "github-actions[bot]"
-          git config user.email "41898282+github-actions[bot]@users.noreply.github.com"
-
           # Stage all changes from the cleanup
           git add .
 
-          # Commit if there are changes
-          git diff --cached --quiet || git commit -m "(content-cleanup): remove all generated content from Notion"
+          # Commit if there are changes (skip pre-commit hooks in CI)
+          git diff --cached --quiet || git commit --no-verify -m "(content-cleanup): remove all generated content from Notion"
 
           # Push to content branch
           git push origin content
@@ -83,7 +101,7 @@ jobs:
               - type: "section"
                 text:
                   type: "mrkdwn"
-                  text: "*Generated content cleanup*: ${{ job.status }}\nConfirm flag: `${{ github.event.inputs.confirm }}`"
+                  text: "*Generated content cleanup*: ${{ job.status }}\nConfirm flag: `--confirm=yes` (hardcoded)"
               - type: "section"
                 text:
                   type: "mrkdwn"