platzhersh · platzhersh · Jan 6, 2026 · Jan 5, 2026 · Jan 5, 2026 · Jan 5, 2026
diff --git a/CLAUDE.md b/CLAUDE.md
@@ -71,6 +71,53 @@ cd api && prisma studio
 cd api && prisma migrate dev --create-only --name migration_name
 ```
 
+### Synthetic Data Seeding
+
+#### Local Development Seeding
+```bash
+# Seed basic patient demographics (original script)
+python scripts/seed.py
+
+# Seed staging data with synthetic vitals (requires API running)
+python scripts/seed_staging.py
+
+# Or with environment variable (mimics Railway staging)
+RAILWAY_ENVIRONMENT=staging python scripts/seed_staging.py
+```
+
+#### Railway Staging Deployment
+Synthetic data is **automatically seeded** on Railway staging deployments when `RAILWAY_ENVIRONMENT=staging` is set.
+
+**Configuration:**
+1. In the Railway staging project, set the environment variable:
+   ```
+   RAILWAY_ENVIRONMENT=staging
+   ```
+
+2. On deployment, the container's start command (the Dockerfile `CMD`) automatically:
+   - Runs `prisma migrate deploy`
+   - **Seeds synthetic data** (only when `RAILWAY_ENVIRONMENT=staging`, and only if patient count < 3)
+   - Starts the API
+
+**Seed Script Behavior:**
+- **Environment-aware**: Only runs when `RAILWAY_ENVIRONMENT=staging`
+- **Idempotent**: Safe to run multiple times (checks patient count threshold)
+- **Fast**: Completes in <10 seconds
+- **Generates**:
+  - 15 synthetic patients with realistic demographics (Faker)
+  - 2-5 vital signs readings per patient
+  - Clinically plausible values (BP: 90-140/60-90 mmHg, Pulse: 60-100 bpm)
+  - Timestamps spread over the past 1-4 weeks
+  - MRN prefix: `STAGING-` to distinguish from production data
+
+**Manual Trigger:**
+```bash
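+# Run the seed script via the Railway CLI if needed (note: `railway run` is not an SSH session; it runs the command with the Railway environment's variables)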
+railway run python /scripts/seed_staging.py
+```
+
+See [ADR-0005](./docs/adr/0005-synthetic-data-generation.md) for implementation details and decision rationale.
+
 ### Docker & Infrastructure
 ```bash
 # Check EHRBase status (wait 30-60s after docker compose up)

diff --git a/api/Dockerfile b/api/Dockerfile
@@ -23,11 +23,15 @@ COPY api/src ./src
 COPY api/prisma ./prisma
 COPY api/templates ./templates
 
+# Copy seed scripts (from repo root)
+COPY scripts /scripts
+
 # Generate Prisma client (binaries will be cached in PRISMA_BINARY_CACHE_DIR)
 RUN prisma generate
 
-# Grant non-root user ownership of app directory and Prisma binaries
+# Grant non-root user ownership of app directory, scripts, and Prisma binaries
 RUN chown -R appuser:appgroup /app && \
+    chown -R appuser:appgroup /scripts && \
     chown -R appuser:appgroup /home/appuser/.cache && \
     chown -R appuser:appgroup /usr/local/lib/python*/site-packages/prisma/
 
@@ -38,4 +42,11 @@ EXPOSE 8000
 # Use Railway's $PORT if available, otherwise default to 8000
 # Use shell form to allow environment variable substitution
 # Run migrations before starting the server
-CMD sh -c "echo 'Running database migrations...' && prisma migrate deploy && echo 'Starting uvicorn on port ${PORT:-8000}...' && uvicorn src.main:app --host 0.0.0.0 --port ${PORT:-8000}"
+# Seed staging data only when RAILWAY_ENVIRONMENT=staging; `exec` makes uvicorn replace the shell so it receives stop signals (SIGTERM) directly
+CMD sh -c "echo 'Running database migrations...' && \
+  prisma migrate deploy && \
+  if [ \"$RAILWAY_ENVIRONMENT\" = \"staging\" ]; then \
+    echo 'Seeding staging data...' && python /scripts/seed_staging.py; \
+  fi && \
+  echo 'Starting uvicorn on port ${PORT:-8000}...' && \
+  exec uvicorn src.main:app --host 0.0.0.0 --port ${PORT:-8000}"
diff --git a/api/pyproject.toml b/api/pyproject.toml
@@ -13,6 +13,7 @@ dependencies = [
     "httpx>=0.26.0",
     "python-multipart>=0.0.6",
     "aiofiles>=23.2.0",
+    "faker>=22.0.0",
 ]
 
 [project.optional-dependencies]