semcod
diff --git a/‎Dockerfile.test‎
Lines changed: 138 additions & 0 deletions b/‎Dockerfile.test‎
Lines changed: 138 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 80 additions & 26 deletions b/‎README.md‎
Lines changed: 80 additions & 26 deletions
diff --git a/‎TODO.md‎
Lines changed: 23 additions & 6 deletions b/‎TODO.md‎
Lines changed: 23 additions & 6 deletions
@@ -0,0 +1,138 @@
+# Multi-stage Dockerfile for testing vallm across distributions; stages are independent, so build one with `--target <stage>`
+
+# Stage 1: Ubuntu 22.04
+# Installs vallm with all extras into a Python 3.11 virtualenv and smoke-tests the CLI.
+FROM ubuntu:22.04 AS ubuntu-22
+# Build-time only: keeps apt non-interactive without persisting into the image environment.
+ARG DEBIAN_FRONTEND=noninteractive
+# Ubuntu has no python3.11-pip package; pip is bootstrapped inside the virtualenv
+# by python3.11-venv, so only the interpreter packages are installed here.
+RUN apt-get update && apt-get install -y \
+    curl \
+    git \
+    python3.11 \
+    python3.11-dev \
+    python3.11-venv \
+    && rm -rf /var/lib/apt/lists/*
+
+WORKDIR /app
+COPY . .
+RUN python3.11 -m venv /opt/venv
+# Quote the requirement so the shell cannot glob-expand ".[all]"; skip the pip cache to keep the layer small.
+RUN . /opt/venv/bin/activate && pip install --no-cache-dir -e ".[all]"
+# Smoke tests: the build fails if the CLI entry point is missing or broken.
+RUN . /opt/venv/bin/activate && vallm --help
+RUN . /opt/venv/bin/activate && vallm info
+
+# Stage 2: Ubuntu 24.04
+# Installs vallm with all extras into a Python 3.12 virtualenv and smoke-tests the CLI.
+FROM ubuntu:24.04 AS ubuntu-24
+# Build-time only: keeps apt non-interactive without persisting into the image environment.
+ARG DEBIAN_FRONTEND=noninteractive
+# Ubuntu has no python3.12-pip package; pip is bootstrapped inside the virtualenv
+# by python3.12-venv, so only the interpreter packages are installed here.
+RUN apt-get update && apt-get install -y \
+    curl \
+    git \
+    python3.12 \
+    python3.12-dev \
+    python3.12-venv \
+    && rm -rf /var/lib/apt/lists/*
+
+WORKDIR /app
+COPY . .
+RUN python3.12 -m venv /opt/venv
+# Quote the requirement so the shell cannot glob-expand ".[all]"; skip the pip cache to keep the layer small.
+RUN . /opt/venv/bin/activate && pip install --no-cache-dir -e ".[all]"
+# Smoke tests: the build fails if the CLI entry point is missing or broken.
+RUN . /opt/venv/bin/activate && vallm --help
+RUN . /opt/venv/bin/activate && vallm info
+
+# Stage 3: Debian 12 (Bookworm)
+# Installs vallm with all extras into a virtualenv built from the distro python3 and smoke-tests the CLI.
+FROM debian:bookworm AS debian-12
+# Build-time only: keeps apt non-interactive without persisting into the image environment.
+ARG DEBIAN_FRONTEND=noninteractive
+RUN apt-get update && apt-get install -y \
+    curl \
+    git \
+    python3-dev \
+    python3-pip \
+    python3-venv \
+    python3.11 \
+    && rm -rf /var/lib/apt/lists/*
+
+WORKDIR /app
+COPY . .
+# NOTE(review): the venv uses the unversioned python3; presumably this is the 3.11 installed above — confirm.
+RUN python3 -m venv /opt/venv
+# Quote the requirement so the shell cannot glob-expand ".[all]"; skip the pip cache to keep the layer small.
+RUN . /opt/venv/bin/activate && pip install --no-cache-dir -e ".[all]"
+# Smoke tests: the build fails if the CLI entry point is missing or broken.
+RUN . /opt/venv/bin/activate && vallm --help
+RUN . /opt/venv/bin/activate && vallm info
+
+# Stage 4: Alpine Linux
+# Installs vallm with all extras into a virtualenv on a musl-based system and smoke-tests the CLI.
+FROM alpine:3.19 AS alpine
+# gcc, musl-dev and linux-headers are here so packages without prebuilt wheels can compile.
+# NOTE(review): py3-virtualenv is installed but the venv below is created with the stdlib `venv` module.
+RUN apk add --no-cache \
+    curl \
+    gcc \
+    git \
+    linux-headers \
+    musl-dev \
+    py3-pip \
+    py3-virtualenv \
+    python3-dev
+
+WORKDIR /app
+COPY . .
+RUN python3 -m venv /opt/venv
+# Quote the requirement so the shell cannot glob-expand ".[all]"; skip the pip cache to keep the layer small.
+RUN . /opt/venv/bin/activate && pip install --no-cache-dir -e ".[all]"
+# Smoke tests: the build fails if the CLI entry point is missing or broken.
+RUN . /opt/venv/bin/activate && vallm --help
+RUN . /opt/venv/bin/activate && vallm info
+
+# Stage 5: Fedora 39
+# Installs vallm with all extras into a Python 3.11 virtualenv and smoke-tests the CLI.
+FROM fedora:39 AS fedora-39
+# NOTE(review): python3-pip and python3-devel belong to the distro's default interpreter,
+# which may not be 3.11 — confirm 3.11 headers are available if extensions must compile.
+RUN dnf install -y \
+    curl \
+    git \
+    python3-devel \
+    python3-pip \
+    python3.11 \
+    && dnf clean all
+
+WORKDIR /app
+COPY . .
+RUN python3.11 -m venv /opt/venv
+# Quote the requirement so the shell cannot glob-expand ".[all]"; skip the pip cache to keep the layer small.
+RUN . /opt/venv/bin/activate && pip install --no-cache-dir -e ".[all]"
+# Smoke tests: the build fails if the CLI entry point is missing or broken.
+RUN . /opt/venv/bin/activate && vallm --help
+RUN . /opt/venv/bin/activate && vallm info
+
+# Stage 6: CentOS Stream 9
+# Installs vallm with all extras into a Python 3.9 virtualenv and smoke-tests the CLI.
+FROM quay.io/centos/centos:stream9 AS centos-9
+# --allowerasing: the base image ships curl-minimal, which conflicts with the full
+# curl package; without the flag dnf aborts instead of swapping the two.
+RUN dnf install -y --allowerasing \
+    curl \
+    git \
+    python3-devel \
+    python3-pip \
+    python3.9 \
+    && dnf clean all
+
+WORKDIR /app
+COPY . .
+RUN python3.9 -m venv /opt/venv
+# Quote the requirement so the shell cannot glob-expand ".[all]"; skip the pip cache to keep the layer small.
+RUN . /opt/venv/bin/activate && pip install --no-cache-dir -e ".[all]"
+# Smoke tests: the build fails if the CLI entry point is missing or broken.
+RUN . /opt/venv/bin/activate && vallm --help
+RUN . /opt/venv/bin/activate && vallm info
+
+# Stage 7: Python Slim (Debian-based)
+# Installs vallm with all extras into the image's own Python 3.11 (no virtualenv) and smoke-tests the CLI.
+FROM python:3.11-slim AS python-slim
+RUN apt-get update && apt-get install -y \
+    curl \
+    git \
+    && rm -rf /var/lib/apt/lists/*
+
+WORKDIR /app
+COPY . .
+# Quote the requirement so the shell cannot glob-expand ".[all]"; skip the pip cache to keep the layer small.
+RUN pip install --no-cache-dir -e ".[all]"
+# Smoke tests: the build fails if the CLI entry point is missing or broken.
+RUN vallm --help
+RUN vallm info
+
+# Stage 8: Python Alpine
+# Installs vallm with all extras into the image's own Python 3.11 on musl (no virtualenv) and smoke-tests the CLI.
+FROM python:3.11-alpine AS python-alpine
+# gcc and musl-dev are here so packages without prebuilt wheels can compile.
+RUN apk add --no-cache \
+    curl \
+    gcc \
+    git \
+    musl-dev
+
+WORKDIR /app
+COPY . .
+# Quote the requirement so the shell cannot glob-expand ".[all]"; skip the pip cache to keep the layer small.
+RUN pip install --no-cache-dir -e ".[all]"
+# Smoke tests: the build fails if the CLI entry point is missing or broken.
+RUN vallm --help
+RUN vallm info
@@ -42,7 +42,7 @@ vallm validates code proposals through a **four-tier pipeline** — from millise
 
 | Language | Syntax | Imports | Complexity | Security |
 |----------|--------|---------|------------|----------|
-| Python | ✅ AST + tree-sitter | ✅ Full resolution | ✅ radon + lizard | ✅ bandit + patterns |
+| Python | ✅ AST + tree-sitter | ✅ Full resolution (22 methods) | ✅ radon + lizard | ✅ bandit + patterns |
 | JavaScript | ✅ tree-sitter | ✅ Node.js builtins | ✅ lizard | ✅ XSS, eval patterns |
 | TypeScript | ✅ tree-sitter | ✅ Node.js builtins | ✅ lizard | ✅ XSS, eval patterns |
 | Go | ✅ tree-sitter | ✅ stdlib + modules | ✅ lizard | ✅ SQL injection, exec |
@@ -73,6 +73,20 @@ pip install vallm[graph]      # NetworkX graph analysis
 
 ## Quick Start
 
+### Validate Entire Project
+
+```bash
+# Install with LLM support
+pip install vallm[llm]
+
+# Set up Ollama for semantic review (`ollama pull` needs a running server: start `ollama serve` first if Ollama is not already running)
+ollama pull qwen2.5-coder:7b
+ollama serve
+
+# Validate entire project recursively
+vallm batch . --recursive --semantic --model qwen2.5-coder:7b
+```
+
 ### Python API
 
 ```python
@@ -94,22 +108,23 @@ print(f"Verdict: {result.verdict.value}")  # pass / review / fail
 print(f"Score: {result.weighted_score:.2f}")
 ```
 
-### CLI
+### CLI Commands Reference
 
 ```bash
-# Validate a file
-vallm validate --file mycode.py
-
-# Quick syntax check
-vallm check mycode.py
+# Batch validation (best for entire projects)
+vallm batch . --recursive --semantic --model qwen2.5-coder:7b
+vallm batch src/ --recursive --include "*.py,*.js" --exclude "*/test/*"
+vallm batch . --recursive --format json --fail-fast
 
-# With LLM semantic review (requires Ollama)
+# Single file validation
 vallm validate --file mycode.py --semantic --model qwen2.5-coder:7b
+vallm validate --file app.js --security
 
-# JSON output
-vallm validate --file mycode.py --format json
+# Quick syntax check only
+vallm check mycode.py
+vallm check src/main.go
 
-# Show config and available validators
+# Configuration and info
 vallm info
 ```
 
@@ -253,31 +268,67 @@ cd examples && ./run.sh
 | `05_llm_semantic_review/` | Ollama Qwen 2.5 Coder 7B LLM-as-judge review |
 | `06_multilang_validation/` | JavaScript and C validation via tree-sitter |
 | `07_multi_language/` | **Comprehensive multi-language support** — 8+ languages with auto-detection |
+| `08_code2llm_integration/` | Project analysis integration with code2llm |
+| `09_code2logic_integration/` | Call graph analysis with code2logic |
+| `10_mcp_ollama_demo/` | MCP (Model Context Protocol) demo with Ollama |
+| `11_claude_code_autonomous/` | Autonomous refactoring with Claude Code |
+| `12_ollama_simple_demo/` | Simplified Ollama integration example |
 
 ## Architecture
 
 ```
 src/vallm/
-├── cli.py              # Typer CLI: validate, check, info, batch
-├── config.py           # pydantic-settings (VALLM_* env vars)
-├── hookspecs.py        # pluggy hook specifications
-├── scoring.py          # Weighted scoring + verdict engine
+├── cli.py                 # Typer CLI (401L, 8 methods, CC=42) - needs refactoring
+├── config.py              # pydantic-settings (VALLM_* env vars)
+├── hookspecs.py           # pluggy hook specifications
+├── scoring.py             # Weighted scoring + verdict engine (CC=18 validate function)
 ├── core/
-│   ├── languages.py    # Language enum, auto-detection, 30+ languages
-│   ├── proposal.py     # Proposal model
-│   ├── ast_compare.py  # tree-sitter + Python AST similarity
-│   ├── graph_builder.py # Import/call graph construction
-│   └── graph_diff.py   # Before/after graph comparison
+│   ├── languages.py       # Language enum, auto-detection, 30+ languages
+│   ├── proposal.py        # Proposal model
+│   ├── ast_compare.py     # tree-sitter + Python AST similarity
+│   ├── graph_builder.py   # Import/call graph construction
+│   └── graph_diff.py      # Before/after graph comparison
 ├── validators/
-│   ├── syntax.py       # Tier 1: ast.parse + tree-sitter (multi-lang)
-│   ├── imports.py      # Tier 1: module resolution (Python)
-│   ├── complexity.py   # Tier 2: radon (Python) + lizard (16+ langs)
-│   ├── security.py     # Tier 2: patterns + bandit
-│   └── semantic.py     # Tier 3: LLM-as-judge
+│   ├── syntax.py          # Tier 1: ast.parse + tree-sitter (multi-lang)
+│   ├── imports.py         # Tier 1: module resolution (653L, 22 methods) - god module
+│   ├── complexity.py      # Tier 2: radon (Python) + lizard (16+ langs)
+│   ├── security.py        # Tier 2: patterns + bandit
+│   └── semantic.py        # Tier 3: LLM-as-judge
 └── sandbox/
-    └── runner.py       # subprocess / Docker execution
+    └── runner.py          # subprocess / Docker execution
 ```
 
+### Code Health Metrics
+
+Current codebase metrics (generated by code2llm analysis):
+
+| Metric | Current | Target |
+|--------|---------|--------|
+| Avg Cyclomatic Complexity (CC̄) | 3.5 | ≤2.4 |
+| Max CC | 42 | ≤20 |
+| God Modules (>500L) | 2 | 0 |
+| High CC Functions (≥15) | 2 | ≤1 |
+| Total Functions | 91 | - |
+| Total Classes | 19 | - |
+
+**Critical Functions (CC ≥ 10)**:
+
+| Function | Location | CC | Fan-out | Priority |
+|----------|----------|-----|---------|----------|
+| `batch` | `cli.py:140` | **42** | 34 | 🔴 Split immediately |
+| `validate` | `scoring.py:122` | **18** | 20 | 🟡 Refactor |
+| `_check_lizard` | `complexity.py` | 12 | 9 | 🟡 Simplify |
+| `_parse_response` | `semantic.py` | 12 | 17 | 🟡 Simplify |
+
+**God Modules**:
+- `src/vallm/validators/imports.py` (653L, 22 methods, 22 dependent imports)
+- `src/vallm/cli.py` (401L, 8 methods, CC=42)
+
+See `project/` directory for full analysis files:
+- `analysis.toon` - Health diagnostics and complexity metrics
+- `evolution.toon` - Refactoring queue with ranked priorities
+- `context.md` - Architecture summary for LLM assistance
+
 ## Roadmap
 
 **v0.2 — Completeness**
@@ -286,13 +337,16 @@ src/vallm/
 - TOML config loading (`vallm.toml`, `[tool.vallm]`)
 - Pre-commit hook integration
 - GitHub Actions CI/CD
+- **Refactoring: Split `batch` function (CC=42)**
+- **Refactoring: Modularize `imports.py` god module**
 
 **v0.3 — Depth**
 - AST edit distance via apted/zss
 - CodeBERTScore embedding similarity
 - NetworkX cycle detection and centrality in graph analysis
 - RegressionValidator (Tier 4) with pytest-json-report
 - TypeCheckValidator (mypy/pyright)
+- **Refactoring: Extract output formatters**
 
 **v0.4 — Intelligence**
 - `--fix` auto-repair mode (LLM-based retry loop)
 
@@ -1,17 +1,34 @@
 # TODO
 
-## Refactoring — reduce complexity (from analysis.toon)
+## Refactoring — reduce complexity (current status: 2026-03-22)
 
-5 functions have CC≥10 (target: max-CC ≤7, CC̄ ≤2.8):
+**Current Metrics (from code2llm analysis):**
+- CC̄ = 3.5 (target: ≤2.4)
+- Max CC = 42 (target: ≤20)
+- God modules = 2 (target: 0)
+- High CC (≥15) = 2 functions (target: ≤1)
+- Critical functions (CC≥10) = 8 functions
+
+**Priority 1: Critical Functions (CC≥15)**
+
+- [ ] **`cli.batch` CC=42, fan=34** — SPLIT: extract file discovery, filtering, validation loop, result aggregation, and output formatting into separate modules
+- [ ] **`scoring.validate` CC=18, fan=20** — REFACTOR: extract validator sorting and fail-fast execution logic
+
+**Priority 2: High Complexity (CC 10–14)**
 
-- [ ] **`cli.validate` CC=14, fan=18** — extract settings build, proposal build, and output dispatch into separate functions
-- [ ] **`cli.batch` CC=high** — newly added, needs refactoring (inline: extract file filtering, result aggregation)
 - [ ] **`SemanticValidator._parse_response` CC=12, fan=17** — split JSON extraction, score normalization, and issue parsing into 3 methods
 - [ ] **`ComplexityValidator._check_python_complexity` CC=11** — extract radon block analysis and MI check into helpers
 - [ ] **`_output_rich` CC=11, fan=8** — extract verdict panel, results table, and issues list into separate renderers
-- [ ] **`ImportValidator.validate` CC=11** — extract AST walking into `_extract_imports()` generator
+- [ ] **`ImportValidator._validate_python` CC=10, fan=13** — extract AST walking into `_extract_imports()` generator
+- [ ] **`cli.validate` CC=high** — extract settings build, proposal build, and output dispatch
+
+**Priority 3: God Modules**
+
+- [ ] **`validators/imports.py` (653L, 22 methods)** — SPLIT into language-specific submodules: python.py, javascript.py, go.py, rust.py, java.py, c_cpp.py
+  - Risk: 22 import paths depend on this — maintain backward compatibility via `__init__.py` re-exports
+- [ ] **`cli.py` (401L, 8 methods, CC=42)** — SPLIT: extract output formatters to `output.py`, batch logic to `batch.py`
 
-9 more functions at CC 5–10 to review after critical ones are resolved.
+**Priority 4: Medium Complexity (CC 5–9)** — 19 functions to review after the critical ones are resolved
 
 ## Multi-Language Support (Completed ✓)