refactoring

tom-sapletta-com · tom-sapletta-com · commit 2e145ed6a541 · 2026-02-25T10:25:03.000+01:00
diff --git a/Makefile b/Makefile
@@ -1,4 +1,5 @@
 .PHONY: help install install-dev install-full clean build test lint format typecheck publish publish-test docs docker
+.PHONY: benchmark benchmark-format benchmark-function benchmark-project benchmark-token benchmark-compare benchmark-toon examples
 
 POETRY := $(shell command -v poetry 2>/dev/null)
 ifeq ($(POETRY),)
@@ -298,6 +299,162 @@ run-compare: ## Compare sizes of all formats
 status: ## Show library status
 	code2logic --status
 
+# ============================================================================
+# Benchmarks
+# ============================================================================
+
+# Inputs, output directory and limits shared by the benchmark-* targets below.
+BENCH_SAMPLES := tests/samples
+BENCH_OUTPUT  := examples/output
+BENCH_LIMIT   := 20
+BENCH_FORMATS := yaml toon logicml json
+
+# benchmark-compare summarises the JSON written by the other targets, so it is
+# invoked from the recipe (after every prerequisite has finished) instead of
+# being a prerequisite that `make -j` could start before the results exist.
+# The closing `ls` is informational only and must not fail the target.
+benchmark: benchmark-format benchmark-function benchmark-token benchmark-project benchmark-toon ## Run all benchmarks (no LLM)
+	@$(MAKE) --no-print-directory benchmark-compare
+	@echo ""
+	@echo "$(GREEN)All benchmarks completed!$(NC)"
+	@echo "Results in $(BENCH_OUTPUT)/"
+	@ls -lhS $(BENCH_OUTPUT)/*.json 2>/dev/null || true
+
+benchmark-format: ## Benchmark format reproduction (yaml/toon/logicml/json)
+	@echo "$(BLUE)━━━ Format Benchmark ━━━$(NC)"
+	@mkdir -p $(BENCH_OUTPUT)
+	$(PYTHON) examples/15_unified_benchmark.py \
+		--no-llm --type format \
+		--folder $(BENCH_SAMPLES)/ \
+		--formats $(BENCH_FORMATS) \
+		--limit $(BENCH_LIMIT) --verbose \
+		--output $(BENCH_OUTPUT)/benchmark_format.json
+
+benchmark-function: ## Benchmark function-level reproduction
+	@echo "$(BLUE)━━━ Function Benchmark ━━━$(NC)"
+	@mkdir -p $(BENCH_OUTPUT)
+	$(PYTHON) examples/15_unified_benchmark.py \
+		--no-llm --type function \
+		--file $(BENCH_SAMPLES)/sample_functions.py \
+		--limit 10 --verbose \
+		--output $(BENCH_OUTPUT)/benchmark_function.json
+
+benchmark-token: ## Benchmark token efficiency across formats
+	@echo "$(BLUE)━━━ Token Efficiency Benchmark ━━━$(NC)"
+	@mkdir -p $(BENCH_OUTPUT)
+	$(PYTHON) examples/11_token_benchmark.py \
+		--no-llm \
+		--folder $(BENCH_SAMPLES)/ \
+		--formats $(BENCH_FORMATS) \
+		--limit $(BENCH_LIMIT) --verbose \
+		--output $(BENCH_OUTPUT)/benchmark_token.json
+
+benchmark-project: ## Benchmark project-level reproduction
+	@echo "$(BLUE)━━━ Project Benchmark ━━━$(NC)"
+	@mkdir -p $(BENCH_OUTPUT)
+	$(PYTHON) examples/15_unified_benchmark.py \
+		--no-llm --type project \
+		--folder $(BENCH_SAMPLES)/ \
+		--formats $(BENCH_FORMATS) \
+		--limit $(BENCH_LIMIT) --verbose \
+		--output $(BENCH_OUTPUT)/benchmark_project.json
+
+# The TOON outputs go to the repository root (-o ./); the other formats go to
+# $(BENCH_OUTPUT). Token counts in the table are estimated as bytes / 4.
+benchmark-toon: ## Generate TOON + function-logic for self-analysis
+	@echo "$(BLUE)━━━ TOON Self-Analysis ━━━$(NC)"
+	@mkdir -p $(BENCH_OUTPUT)
+	$(PYTHON) -m code2logic ./ -f toon --compact --name project -o ./
+	$(PYTHON) -m code2logic ./ -f toon --compact --no-repeat-module --function-logic --with-schema --name project -o ./
+	$(PYTHON) -m code2logic ./ -f yaml --compact --name project -o $(BENCH_OUTPUT)/
+	$(PYTHON) -m code2logic ./ -f json --name project -o $(BENCH_OUTPUT)/
+	$(PYTHON) -m code2logic ./ -f markdown --name project -o $(BENCH_OUTPUT)/
+	$(PYTHON) -m code2logic ./ -f compact --name project -o $(BENCH_OUTPUT)/
+	$(PYTHON) -m code2logic ./ -f csv -d standard --name project -o $(BENCH_OUTPUT)/
+	@echo ""
+	@echo "$(BLUE)Format size comparison (self-analysis):$(NC)"
+	@printf "  %-25s %10s %10s\n" "Format" "Size" "~Tokens"
+	@printf "  %-25s %10s %10s\n" "-------------------------" "----------" "----------"
+	@for f in project.toon project.functions.toon $(BENCH_OUTPUT)/project.yaml $(BENCH_OUTPUT)/project.json $(BENCH_OUTPUT)/project.md $(BENCH_OUTPUT)/project.txt $(BENCH_OUTPUT)/project.csv; do \
+		if [ -f "$$f" ]; then \
+			sz=$$(wc -c < "$$f"); \
+			tok=$$((sz / 4)); \
+			printf "  %-25s %8s B %8s\n" "$$(basename "$$f")" "$$sz" "$$tok"; \
+		fi; \
+	done
+	@echo ""
+	@echo "$(GREEN)TOON files:$(NC)"
+	@ls -lh project.toon project.functions.toon project.toon-schema.json project.functions-schema.json 2>/dev/null || true
+
+benchmark-compare: ## Show summary comparison of all benchmark results
+	@echo ""
+	@echo "$(BLUE)━━━ Benchmark Summary ━━━$(NC)"
+	@$(PYTHON) examples/benchmark_summary.py $(BENCH_OUTPUT)
+
+# ============================================================================
+# Examples (step by step)
+# ============================================================================
+
+# Runs each example script in sequence; make stops at the first one that fails.
+examples: ## Run all examples step by step (no LLM required)
+	@mkdir -p $(BENCH_OUTPUT)
+	@echo "$(BLUE)━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━$(NC)"
+	@echo "$(BLUE)  Running all code2logic examples (--no-llm where needed)$(NC)"
+	@echo "$(BLUE)━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━$(NC)"
+	@echo ""
+	@echo "$(YELLOW)[1/16] Quick Start — basic analysis$(NC)"
+	$(PYTHON) examples/01_quick_start.py
+	@echo ""
+	@echo "$(YELLOW)[2/16] Refactoring — suggest improvements$(NC)"
+	$(PYTHON) examples/02_refactoring.py
+	@echo ""
+	@echo "$(YELLOW)[3/16] Reproduction — code ↔ spec round-trip$(NC)"
+	$(PYTHON) examples/03_reproduction.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[4/16] Project Analysis — multi-file$(NC)"
+	$(PYTHON) examples/04_project.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[5/16] LLM Integration — provider detection$(NC)"
+	$(PYTHON) examples/05_llm_integration.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[6/16] Metrics — reproduction quality$(NC)"
+	$(PYTHON) examples/06_metrics.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[7/16] Format Benchmark — compare formats$(NC)"
+	$(PYTHON) examples/08_format_benchmark.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[8/16] Async Benchmark — async code analysis$(NC)"
+	$(PYTHON) examples/09_async_benchmark.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[9/16] Function Reproduction — per-function$(NC)"
+	$(PYTHON) examples/10_function_reproduction.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[10/16] Token Benchmark — token efficiency$(NC)"
+	$(PYTHON) examples/11_token_benchmark.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[11/16] Comprehensive Analysis — full pipeline$(NC)"
+	$(PYTHON) examples/12_comprehensive_analysis.py --no-llm --limit 3
+	@echo ""
+	@echo "$(YELLOW)[12/16] Project Benchmark — project-level scores$(NC)"
+	$(PYTHON) examples/13_project_benchmark.py --no-llm
+	@echo ""
+	@echo "$(YELLOW)[13/16] Repeatability Test — determinism check$(NC)"
+	$(PYTHON) examples/14_repeatability_test.py --no-llm --file $(BENCH_SAMPLES)/sample_functions.py --runs 2
+	@echo ""
+	@echo "$(YELLOW)[14/16] Unified Benchmark — all-in-one$(NC)"
+	$(PYTHON) examples/15_unified_benchmark.py --no-llm --verbose
+	@echo ""
+	@echo "$(YELLOW)[15/16] Terminal Demo — rich output$(NC)"
+	$(PYTHON) examples/16_terminal_demo.py
+	@echo ""
+	@echo "$(YELLOW)[16/16] Duplicate Detection$(NC)"
+	$(PYTHON) examples/duplicate_detection.py
+	@echo ""
+	@echo "$(GREEN)━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━$(NC)"
+	@echo "$(GREEN)  All 16 examples completed successfully!$(NC)"
+	@echo "$(GREEN)━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━$(NC)"
+	@echo "  Output: $(BENCH_OUTPUT)/"
+
 # ============================================================================
 # LLM Integration
 # ============================================================================
diff --git a/README.md b/README.md
@@ -49,7 +49,9 @@ pip install code2logic[nlp]         # Enhanced intents
 ## 📖 Quick Start
 ```bash
 code2logic ./ -f yaml --compact --function-logic --with-schema -o project.yaml
-code2logic ./ -f toon --ultra-compact --function-logic --with-schema -o project.toon
+code2logic ./ -f toon --function-logic --with-schema --name project -o ./
+# Optional: include function intent/purpose column in project.functions.toon
+code2logic ./ -f toon --function-logic --does --name project -o ./
 ```
     
 ### Command Line
diff --git a/code2logic/cli.py b/code2logic/cli.py
@@ -668,6 +668,11 @@ def _maybe_print_pretty_help() -> bool:
         action='store_true',
         help='Reduce repeated directory prefixes in function-logic TOON section function_details by using ./file for consecutive entries in the same folder.'
     )
+    parser.add_argument(
+        '--does',
+        action='store_true',
+        help='Include the does/intent column in function-logic TOON output. Without this flag, the does column is omitted to save tokens.'
+    )
     parser.add_argument(
         '--no-install',
         action='store_true',
@@ -1038,6 +1043,7 @@ def _maybe_print_pretty_help() -> bool:
                 detail=args.detail,
                 no_repeat_name=args.no_repeat_module,
                 no_repeat_details=args.no_repeat_details,
+                include_does=args.does,
             )
         else:
             logic_out = logic_gen.generate(project, detail=args.detail)
diff --git a/code2logic/function_logic.py b/code2logic/function_logic.py
@@ -65,6 +65,7 @@ def generate_toon(
         detail: str = 'full',
         no_repeat_name: bool = False,
         no_repeat_details: bool = False,
+        include_does: bool = False,
     ) -> str:
         if detail == 'detailed':
             detail = 'full'
@@ -110,7 +111,7 @@ def generate_toon(
             lines.append(f"  {toon._quote(details_key)}:")
 
             header = f"line{dm}name{dm}sig"
-            if detail in ('standard', 'full'):
+            if include_does and detail in ('standard', 'full'):
                 header += f"{dm}does"
             if detail == 'full':
                 header += f"{dm}decorators{dm}calls{dm}raises"
@@ -135,7 +136,7 @@ def generate_toon(
                     toon._quote(sig),
                 ]
 
-                if detail in ('standard', 'full'):
+                if include_does and detail in ('standard', 'full'):
                     does = self._build_does(func)
                     row.append(toon._quote(does))
 
diff --git a/code2logic/generators.py b/code2logic/generators.py
@@ -209,7 +209,8 @@ def _gen_module(self, lines: List[str], m: ModuleInfo,
             lines.append(f"imports: [{imps}]")
 
         if m.constants:
-            lines.append(f"constants: [{', '.join(m.constants[:5])}]")
+            cnames = [c.name if hasattr(c, 'name') else str(c) for c in m.constants[:5]]
+            lines.append(f"constants: [{', '.join(cnames)}]")
         lines.append("```")
         lines.append("")
 
diff --git a/docs/03-cli-reference.md b/docs/03-cli-reference.md
@@ -46,6 +46,7 @@ If `CODE2LOGIC_DEFAULT_PROVIDER=auto`, Code2Logic tries providers in priority or
 | `--ultra-compact` | | Use ultra-compact TOON format (71% smaller) |
 | `--no-repeat-module` | | Reduce repeated directory prefixes in TOON `modules[...]` tables by using `./file` for consecutive entries in the same folder |
 | `--no-repeat-details` | | Reduce repeated directory prefixes in function-logic TOON `function_details` section by using `./file` for consecutive entries in the same folder |
+| `--does` | | Include the `does` (intent/purpose) column in function-logic TOON output. Omitted by default to save tokens |
 | `--with-schema` | | Generate JSON schema alongside output |
 | `--verbose` | `-v` | Verbose output with timing |
 | `--debug` | | Debug output (very verbose) |
@@ -130,6 +131,12 @@ code2logic /path/to/project -f toon --ultra-compact --with-schema
 
 # Generate function-logic as TOON + compress function_details module keys
 code2logic /path/to/project -f toon --function-logic --name project -o ./ --no-repeat-details
+
+# Generate function-logic TOON with intent descriptions (does column)
+code2logic /path/to/project -f toon --function-logic --does --name project -o ./
+
+# Generate function-logic TOON + schema (project.functions.toon + project.functions-schema.json)
+code2logic /path/to/project -f toon --function-logic --with-schema --name project -o ./
 ```
 
 Token-oriented object notation - most efficient format for LLM consumption.
diff --git a/docs/07-toon.md b/docs/07-toon.md
@@ -168,22 +168,81 @@ modules[4]{path,lang,lines,kb}:
 **Example (function-logic TOON, function_details):**
 
 ```bash
-code2logic /path/to/project -f toon --function-logic --name project -o ./ --no-repeat-details
+code2logic /path/to/project -f toon --function-logic --with-schema --name project -o ./ --no-repeat-details
 ```
 
 Output fragment:
 
 ```toon
+# myproject function-logic | 3 modules
+# Convention: name with . = method, ~name = async, cc:N shown only when >1
+project: myproject
+generated: "2026-02-25T09:00:00"
+modules[3]{path,lang,items}:
+  firmware/main.py,py,4
+  ./test_main.py,py,15
+  db/config.py,py,5
+
 function_details:
   firmware/main.py:
-    functions[2]{line,name,kind,sig,async,cc,does}:
-      77,index_page,function,(),true,2,Serve the firmware UI
-      85,health_check,function,(),true,1,Health check endpoint
+    functions[4]{line,name,sig}:
+      77,~index_page cc:2,()
+      85,~health_check,()
+      90,~status,()
+      96,"~websocket_endpoint cc:5","(websocket:WebSocket)"
   ./test_main.py:
-    functions[1]{line,name,kind,sig,async,cc,does}:
-      14,TestFirmwareSimulator.test_health_check,method,(),false,1,Test basic health endpoint
+    functions[15]{line,name,sig}:
+      14,TestFirmwareSimulator.test_health_check,()
+      20,TestFirmwareSimulator.test_scenarios_fetch,()
+```
+
+If you also want the intent/purpose column, add `--does`:
+
+```bash
+code2logic /path/to/project -f toon --function-logic --does --name project -o ./ --no-repeat-details
 ```
 
+### Format Conventions (function-logic TOON)
+
+| Convention | Meaning | Example |
+|---|---|---|
+| Name with `.` | Method | `Config.get_api_key` |
+| Name without `.` | Top-level function | `main` |
+| `~` prefix | Async | `~index_page` |
+| `cc:N` suffix | Cyclomatic complexity > 1 | `~index_page cc:2` |
+| `./file` | Same directory as previous entry | `./test_main.py` |
+
+Only modules with at least one function/method are listed. Empty modules (for example, an `__init__.py` or `models.py` with 0 items) are omitted.
+
+### The `--does` flag
+
+By default, the `does` (intent/purpose) column is **omitted** from function-logic TOON to save tokens. Use `--does` to include it:
+
+```bash
+# Without --does (default, compact):
+#   functions[2]{line,name,sig}:
+#     77,~index_page cc:2,()
+
+# With --does (adds intent column):
+#   functions[2]{line,name,sig,does}:
+#     77,~index_page cc:2,(),Serve the firmware UI
+
+code2logic /path/to/project -f toon --function-logic --does --name project -o ./
+```
+
+Use `--does` when you need the LLM to understand **what each function does**, not just its signature. Omit it when you only need structure/navigation.
+
+### Schema Generation
+
+When `--with-schema` is used with `--function-logic` and TOON format, a JSON schema is written alongside:
+
+```bash
+code2logic /path/to/project -f toon --function-logic --with-schema --name project -o ./
+# Produces: project.functions.toon + project.functions-schema.json
+```
+
+If using `--stdout`, the function-logic schema is printed under the `=== FUNCTION_LOGIC_SCHEMA ===` section marker.
+
 Notes:
 
 - `--no-repeat-module` affects TOON `modules[...]` tables (main TOON output and function-logic TOON modules table).
diff --git a/examples/benchmark_summary.py b/examples/benchmark_summary.py
@@ -0,0 +1,81 @@
+#!/usr/bin/env python3
+"""Print benchmark summary from JSON result files.
+
+Usage: benchmark_summary.py [OUTPUT_DIR]    (default: examples/output)
+"""
+import json
+import os
+import sys
+
+
+def _load(path):
+    """Return the JSON object stored at ``path``, or None if it is unusable."""
+    if not os.path.exists(path):
+        return None
+    try:
+        # Context manager closes the handle instead of leaking it to the GC.
+        with open(path, encoding="utf-8") as fh:
+            data = json.load(fh)
+    except (OSError, ValueError) as exc:
+        # A single corrupt result file must not hide the other benchmarks.
+        print(f"warning: skipping {path}: {exc}", file=sys.stderr)
+        return None
+    return data if isinstance(data, dict) else None
+
+
+def _num(value):
+    """Coerce ``value`` to float; non-numeric values (e.g. null) become 0.0."""
+    try:
+        return float(value)
+    except (TypeError, ValueError):
+        return 0.0
+
+
+def main():
+    """Print one summary row per available benchmark, then the format scores."""
+    out = sys.argv[1] if len(sys.argv) > 1 else "examples/output"
+
+    files = {
+        "Format": os.path.join(out, "benchmark_format.json"),
+        "Token": os.path.join(out, "benchmark_token.json"),
+        "Project": os.path.join(out, "benchmark_project.json"),
+        "Function": os.path.join(out, "benchmark_function.json"),
+    }
+    # Parse every result file once; the Format result is reused further down.
+    results = {name: _load(path) for name, path in files.items()}
+
+    print()
+    print(
+        f"{'Benchmark':<12} {'Files':>6} {'Avg Score':>10} "
+        f"{'Syntax OK':>10} {'Runs OK':>10} {'Best Format':>14} {'Time':>8}"
+    )
+    print("-" * 75)
+
+    for name, d in results.items():
+        if d is None:
+            continue
+        total = d.get("total_files", d.get("total_functions", "-"))
+        print(
+            f"{name:<12} {str(total):>6} "
+            f"{_num(d.get('avg_score')):>9.1f}% "
+            f"{_num(d.get('syntax_ok_rate')):>9.0f}% "
+            f"{_num(d.get('runs_ok_rate')):>9.0f}% "
+            f"{str(d.get('best_format') or '-'):>14} "
+            f"{_num(d.get('total_time')):>7.1f}s"
+        )
+
+    print()
+
+    scores = (results["Format"] or {}).get("format_scores")
+    if isinstance(scores, dict) and scores:
+        print("Format scores:")
+        ranked = sorted(scores.items(), key=lambda item: -_num(item[1]))
+        for fmt, raw in ranked:
+            sc = _num(raw)
+            bar = "\u2588" * int(sc / 2)
+            print(f"  {fmt:<10} {sc:>6.1f}%  {bar}")
+        print()
+
+
+if __name__ == "__main__":
+    main()
diff --git a/project.functions-schema.json b/project.functions-schema.json
diff --git a/project.functions.toon b/project.functions.toon
diff --git a/project.toon b/project.toon