smkwray
diff --git a/‎.env.example‎
Lines changed: 13 additions & 0 deletions b/‎.env.example‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎.github/workflows/ci.yml‎
Lines changed: 41 additions & 0 deletions b/‎.github/workflows/ci.yml‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎.github/workflows/pages.yml‎
Lines changed: 52 additions & 0 deletions b/‎.github/workflows/pages.yml‎
Lines changed: 52 additions & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 34 additions & 0 deletions b/‎.gitignore‎
Lines changed: 34 additions & 0 deletions
diff --git a/‎DATA_SOURCES.md‎
Lines changed: 52 additions & 0 deletions b/‎DATA_SOURCES.md‎
Lines changed: 52 additions & 0 deletions
diff --git a/‎LICENSE‎
Lines changed: 22 additions & 0 deletions b/‎LICENSE‎
Lines changed: 22 additions & 0 deletions
diff --git a/‎Makefile‎
Lines changed: 41 additions & 0 deletions b/‎Makefile‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 103 additions & 0 deletions b/‎README.md‎
Lines changed: 103 additions & 0 deletions
diff --git a/‎data_final/.gitkeep‎
Lines changed: 1 addition & 0 deletions b/‎data_final/.gitkeep‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎data_intermediate/.gitkeep‎
Lines changed: 1 addition & 0 deletions b/‎data_intermediate/.gitkeep‎
Lines changed: 1 addition & 0 deletions
@@ -0,0 +1,13 @@
+# External environment settings for geoluck.
+# Copy to `.env` and point everything at paths outside the repo.
+
+PROJECT_VENV_ROOT=$HOME/venvs/<project-name>
+UV_PROJECT_ENVIRONMENT=$PROJECT_VENV_ROOT
+PYTHONDONTWRITEBYTECODE=1
+PYTHONPYCACHEPREFIX=$PROJECT_VENV_ROOT/.cache/pycache
+PYTEST_ADDOPTS="-p no:cacheprovider"
+UV_CACHE_DIR=$PROJECT_VENV_ROOT/.cache/uv
+RUFF_CACHE_DIR=$PROJECT_VENV_ROOT/.cache/ruff
+NPM_CONFIG_CACHE=$PROJECT_VENV_ROOT/.cache/npm
+PLAYWRIGHT_BROWSERS_PATH=$PROJECT_VENV_ROOT/.cache/playwright
+WINEPREFIX=$PROJECT_VENV_ROOT/.cache/wine
@@ -0,0 +1,41 @@
+# Continuous integration: Python tests followed by a frontend build.
+name: CI
+
+on:
+  push:
+    branches: ["**"]
+  pull_request:
+
+# Least privilege: no step in this workflow writes to the repository.
+permissions:
+  contents: read
+
+jobs:
+  build:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - uses: actions/setup-python@v5
+        with:
+          python-version: "3.12"
+
+      # The uv version is pinned explicitly.
+      - uses: astral-sh/setup-uv@v5
+        with:
+          version: "0.6.6"
+
+      - name: Sync Python environment
+        run: uv sync --all-extras
+
+      # -B keeps Python from writing .pyc files during the test run.
+      - name: Run tests
+        run: uv run python -B -m pytest
+
+      # npm cache is keyed on the frontend lockfile.
+      - uses: actions/setup-node@v4
+        with:
+          node-version: "20"
+          cache: "npm"
+          cache-dependency-path: web/package-lock.json
+
+      - name: Install web dependencies
+        working-directory: web
+        run: npm ci
+
+      - name: Build web app
+        working-directory: web
+        run: npm run build
+
@@ -0,0 +1,52 @@
+# Build the static frontend in web/ and publish web/dist to GitHub Pages.
+name: Deploy Pages
+
+# Runs on every push to main, or on manual dispatch.
+on:
+  workflow_dispatch:
+  push:
+    branches:
+      - main
+
+# Token permissions granted to the jobs in this workflow.
+permissions:
+  id-token: write
+  pages: write
+  contents: read
+
+# All runs share one concurrency group; a newer run cancels one in progress.
+concurrency:
+  cancel-in-progress: true
+  group: pages
+
+jobs:
+  build:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - uses: actions/setup-node@v4
+        with:
+          cache: npm
+          cache-dependency-path: web/package-lock.json
+          node-version: '20'
+
+      - name: Install web dependencies
+        run: npm ci
+        working-directory: web
+
+      - name: Build web app
+        run: npm run build
+        working-directory: web
+
+      - uses: actions/configure-pages@v5
+
+      - uses: actions/upload-pages-artifact@v3
+        with:
+          path: web/dist
+
+  # Publishes the artifact uploaded by the build job.
+  deploy:
+    needs: build
+    runs-on: ubuntu-latest
+    environment:
+      url: ${{ steps.deployment.outputs.page_url }}
+      name: github-pages
+    steps:
+      - uses: actions/deploy-pages@v4
+        id: deployment
+
@@ -0,0 +1,34 @@
+# OS noise and log files
+.DS_Store
+*.log
+
+# Local environment files
+.env
+.env.local
+.python-version
+
+# Python bytecode, tool caches, and coverage data
+__pycache__/
+*.py[cod]
+.cache/
+.mypy_cache/
+.pytest_cache/
+.ruff_cache/
+.coverage
+
+# Virtual environments
+.venv/
+venv/
+env/
+
+# Private local agent/project planning files and workflow state
+AGENTS.md
+geoluck_codex_plan.md
+do/
+
+# Local/generated data artifacts: ignore everything except the .gitkeep placeholders
+data_raw/**
+data_intermediate/**
+data_final/**
+!data_raw/.gitkeep
+!data_intermediate/.gitkeep
+!data_final/.gitkeep
+
+# Frontend dependencies and build output
+web/node_modules/
+web/dist/
@@ -0,0 +1,22 @@
+MIT License
+
+Copyright (c) 2026
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+
@@ -0,0 +1,41 @@
+# Developer task runner for geoluck. Every target is a command, not a file.
+SHELL := /bin/bash
+
+# The recipes below are multi-line shell scripts and rely on .ONESHELL, which
+# older GNU Make releases silently ignore. Fail early with a clear message.
+ifeq ($(filter oneshell,$(.FEATURES)),)
+$(error GNU Make 3.82 or newer is required for .ONESHELL - found $(MAKE_VERSION))
+endif
+
+.ONESHELL:
+# With .ONESHELL only the last command's exit status reaches make; -e stops the
+# recipe at the first failing command (a failed `cd web`, a broken .env, ...).
+.SHELLFLAGS := -ec
+
+.PHONY: sync test lint fmt web-install web-build check
+
+# Shell snippet: export every variable assigned in ./.env, if the file exists.
+define load_env
+if [ -f .env ]; then
+  set -a
+  source ./.env
+  set +a
+fi
+endef
+
+# Install/sync the Python environment with uv.
+sync:
+	$(load_env)
+	uv sync
+
+# Run the Python test suite (-B: do not write .pyc files).
+test:
+	$(load_env)
+	uv run python -B -m pytest
+
+# Lint the repository with ruff.
+lint:
+	$(load_env)
+	uv run ruff check .
+
+# Format the repository with ruff.
+fmt:
+	$(load_env)
+	uv run ruff format .
+
+# Install frontend dependencies inside web/.
+web-install:
+	$(load_env)
+	cd web
+	npm install
+
+# Build the frontend inside web/.
+web-build:
+	$(load_env)
+	cd web
+	npm run build
+
+# Aggregate gate: Python tests plus a frontend build.
+check: test web-build
+
@@ -0,0 +1,103 @@
+# geoluck &nbsp; <img src="logo/geoduck.png" alt="" width="36" />
+
+**How much of relative country prosperity can be predicted from geography, natural endowments, resource development, and social structure — and who beats their geography?**
+
+Geoluck is an open-source research project that builds a country-decade panel (1900–2020) and trains machine learning models to predict four prosperity outcomes from tiered feature sets. The results are published as an interactive static site.
+
+This is explicitly about **predictive association**, not causal effect.
+
+**[View the live site →](https://smkwray.github.io/geoluck/)**
+
+---
+
+## What the site shows
+
+The static site models four outcome metrics, each converted to within-decade percentile ranks:
+
+| Outcome | Definition | Source |
+|---|---|---|
+| **Income** | Log GDP per capita rank | Maddison Project Database 2023 |
+| **Wealth** | Produced capital per capita rank | World Bank Changing Wealth of Nations |
+| **Life expectancy** | Life expectancy at birth rank | World Bank WDI / UN Population Division |
+| **Inequality** | Disposable-income Gini rank (higher = more equal) | SWIID |
+
+Predictor features are organized into three independently toggleable tiers:
+
+- **Nature** — Pure geography: latitude, climate normals, terrain, soil, malaria ecology, seismic activity, wind/solar potential, ocean productivity, cyclone exposure.
+- **Infrastructure** — Resource development: dams, irrigation, oil/gas/coal/mineral extraction, agricultural land use, energy assets.
+- **Society** — Social and institutional structure: governance, democracy, trade openness, colonial history, ethnic/religious fractionalization, gender inequality, demographics.
+
+All seven non-empty tier combinations are modeled independently for each outcome (28 model bundles). The site supports interactive choropleth maps, model comparison, country-level SHAP feature contributions, country-vs-country comparison, feature exploration by data source, full sortable rankings with CSV export, and shareable deep links.
+
+---
+
+## Repository structure
+
+```
+src/           Python pipeline — ETL, feature building, modeling, export
+web/           Static frontend — TypeScript, Vite, Leaflet, Chart.js
+docs/          Methodology and payload documentation
+web/public/data/   Precomputed JSON payloads consumed by the frontend
+```
+
+---
+
+## Data policy
+
+Raw and intermediate research data are **not** stored in the public repository. Only compact, precomputed JSON payloads required by the static site are committed under `web/public/data/`. These are generated by the Python pipeline's export commands.
+
+---
+
+## Modeling notes
+
+- Models are evaluated **out of sample** using cross-validated R², RMSE, MAE, and Spearman rank correlation.
+- User-facing predictions and residuals use **cross-validated exports**, not in-sample fits.
+- Feature contributions use SHAP values from fold-trained estimators.
+- Results should be interpreted as **predictive structure**, not causal effects. A high R² for Nature-only features means geography is a strong statistical predictor — likely because it correlates with deeper causal channels — not that geography *causes* prosperity.
+
+---
+
+## GitHub Pages deployment
+
+The site is deployed through **GitHub Actions**, not "Deploy from a branch."
+
+In repository Settings → Pages, set the source to **GitHub Actions**. The workflow builds the frontend from `web/` and publishes the contents of `web/dist/`.
+
+---
+
+## Local development
+
+```bash
+# Python pipeline
+make sync        # Install/sync Python dependencies
+make test        # Run tests
+
+# Frontend
+make web-install # Install frontend dependencies (runs npm install in web/)
+make web-build   # Build the static site (output: web/dist/)
+```
+
+The frontend expects JSON data under `web/public/data/`. These payloads are committed to the repository and are generated by:
+
+```bash
+uv run geoluck export-web-data
+```
+
+For frontend development with hot reload:
+
+```bash
+cd web && npm run dev
+```
+
+---
+
+## Documentation
+
+- [`DATA_SOURCES.md`](DATA_SOURCES.md) — Source registry and licensing notes
+- [`docs/MODEL_SPECS.md`](docs/MODEL_SPECS.md) — Model families, feature-set variants, evaluation design
+- [`docs/UI_DATA_PAYLOADS.md`](docs/UI_DATA_PAYLOADS.md) — Frontend JSON payload schemas
+
+---
+
+## License
+
+MIT
@@ -0,0 +1 @@
+
@@ -0,0 +1 @@
+