1+ #!/usr/bin/env python3
2+ """
3+ Aggregate all test, coverage, LLM Judge, and performance results into a single Markdown report for CI/CD.
4+ """
import json
import os
from datetime import datetime, timezone
8+
def read_json(path):
    """Load and return the JSON document at *path*.

    Returns the parsed object, or None when the file is missing, contains
    invalid JSON, or cannot be read for any other reason.  Failures are
    reported on stdout so the CI log shows why a report section is empty.
    """
    try:
        # JSON is defined as UTF-8; don't depend on the platform default encoding.
        with open(path, 'r', encoding='utf-8') as f:
            return json.load(f)
    except FileNotFoundError:
        print(f"⚠️ File not found: {path}")
        return None
    except json.JSONDecodeError as e:
        print(f"⚠️ Failed to decode JSON from {path}: {e}")
        return None
    except Exception as e:
        # Best-effort: a broken results file must not abort report generation.
        print(f"⚠️ Unexpected error reading {path}: {e}")
        return None
22+
def read_coverage():
    """Best-effort lookup of the total line-coverage percentage.

    Checks htmlcov/index.html first (regex over the TOTAL row), then
    coverage.xml (Cobertura 'line-rate' root attribute); the XML value takes
    precedence when both are present.  Returns {'total': <percent>} on
    success, {} when neither source is readable.
    """
    import re
    import xml.etree.ElementTree as ET

    summary = {}
    if os.path.exists('htmlcov/index.html'):
        try:
            with open('htmlcov/index.html') as f:
                html = f.read()
            m = re.search(r'TOTAL.*?(\d+)%', html)
            if m:
                summary['total'] = int(m.group(1))
        except Exception:
            # Best-effort: fall through to coverage.xml.
            pass
    if os.path.exists('coverage.xml'):
        try:
            root = ET.parse('coverage.xml').getroot()
            rate = root.attrib.get('line-rate')
            # Only override the HTML-derived value when the attribute is
            # actually present; defaulting to 0 here would falsely report
            # 0% coverage.
            if rate is not None:
                summary['total'] = float(rate) * 100
        except Exception:
            pass
    return summary
46+
def read_pytest_results():
    """Parse the pytest run summary out of ci_build_doc_test.log.

    Returns None when the log file does not exist; otherwise a dict with
    whichever of the keys 'collected', 'passed', 'skipped' could be
    recovered (an empty dict when nothing matched, which callers render as
    "log found but no summary").
    """
    import re

    log_path = 'ci_build_doc_test.log'
    if not os.path.exists(log_path):
        return None
    summary = {}
    try:
        with open(log_path) as f:
            for line in f:
                # "collected 12 items" — 'items?' also matches the singular
                # "collected 1 item", which the old split-based parse missed.
                m = re.search(r'collected (\d+) items?', line)
                if m:
                    summary['collected'] = int(m.group(1))
                # "passed" and "skipped" counts may appear together or alone
                # (e.g. "5 passed in 0.3s"), so match each independently —
                # the old code required both words on the same line.
                m = re.search(r'(\d+) passed', line)
                if m:
                    summary['passed'] = int(m.group(1))
                m = re.search(r'(\d+) skipped', line)
                if m:
                    summary['skipped'] = int(m.group(1))
        return summary
    except Exception as e:
        print(f"⚠️ Error parsing pytest log: {e}")
        return {}
71+
def main():
    """Assemble final_test_report.md from all available CI artifacts.

    Each section (tests, coverage, LLM judge, performance) degrades to a
    warning bullet when its input artifact is missing, so a report is always
    produced.  Writes final_test_report.md in the current directory.
    """
    # datetime.utcnow() is deprecated since Python 3.12; use an aware UTC time.
    now = datetime.now(timezone.utc).strftime('%Y-%m-%d %H:%M UTC')
    report = [f"# 🧪 Final Test Report\n\n*Generated: {now}*\n"]

    # --- Test summary ----------------------------------------------------
    pytest_results = read_pytest_results()
    if pytest_results is not None:
        if pytest_results:
            report.append("## ✅ Test Results Summary\n")
            report.append(f"- Total tests collected: {pytest_results.get('collected', '?')}")
            report.append(f"- Passed: {pytest_results.get('passed', '?')}")
            report.append(f"- Skipped: {pytest_results.get('skipped', '?')}")
            report.append("")
        else:
            report.append("## ✅ Test Results Summary\n- ⚠️ Pytest log found but no summary could be parsed.\n")
    else:
        report.append("## ✅ Test Results Summary\n- ⚠️ No pytest summary found.\n")

    # --- Coverage summary ------------------------------------------------
    coverage = read_coverage()
    if coverage and 'total' in coverage:
        report.append(f"## 📊 Coverage Summary\n- Total coverage: **{coverage['total']}%**\n")
    else:
        report.append("## 📊 Coverage Summary\n- ⚠️ No coverage data found.\n")

    # --- LLM Judge results -----------------------------------------------
    llm_judge = read_json('llm_judge_results.json')
    if llm_judge:
        report.append("## 🤖 LLM Judge Results\n")
        score = llm_judge.get('overall_score', '?')
        report.append(f"- Overall Score: **{score}/10**")
        if 'scores' in llm_judge:
            report.append("- Score Breakdown:")
            for name, entry in llm_judge['scores'].items():
                if isinstance(entry, dict):
                    report.append(f"  - {name}: {entry.get('score', '?')}/10 — {entry.get('justification', '')}")
                else:
                    report.append(f"  - {name}: {entry}")
        if 'recommendations' in llm_judge:
            report.append("- Recommendations:")
            for rec in llm_judge['recommendations']:
                report.append(f"  - {rec}")
        if 'next_steps' in llm_judge:
            report.append("- Next Steps:")
            for step in llm_judge['next_steps']:
                report.append(f"  - {step}")
        report.append("")
    else:
        report.append("## 🤖 LLM Judge Results\n- ⚠️ No LLM Judge results found.\n")

    # --- Performance metrics ---------------------------------------------
    perf = read_json('performance_metrics.json')
    if perf:
        report.append("## 🚦 Performance Metrics\n")
        for key in ['elapsed_seconds', 'memory_mb', 'threshold_seconds', 'threshold_mb', 'status']:
            if key in perf:
                report.append(f"- {key.replace('_', ' ').title()}: {perf[key]}")
        report.append("")
    else:
        report.append("## 🚦 Performance Metrics\n- ⚠️ No performance metrics found.\n")

    # --- Recommendations (consolidated, no duplicates) --------------------
    report.append("## 📝 Recommendations\n")
    any_recommendation = False
    if llm_judge and llm_judge.get('recommendations'):
        for rec in llm_judge['recommendations']:
            report.append(f"- {rec}")
            any_recommendation = True
    if coverage and coverage.get('total', 0) < 50:
        report.append("- 🚨 Coverage is below 50%. Add more tests!")
        any_recommendation = True
    if perf and perf.get('status') == 'FAIL':
        report.append("- 🚨 Performance regression detected. Optimize code or dependencies.")
        any_recommendation = True
    if not any_recommendation:
        report.append("- No additional recommendations.\n")
    report.append("")

    # Comparison to previous run (stub)
    report.append("## 🔄 Comparison to Previous Run\n- (Comparison feature coming soon)\n")

    # Join with a plain newline: the previous '\n ' separator prefixed every
    # subsequent line with a space, which broke Markdown headings/lists.
    with open('final_test_report.md', 'w') as f:
        f.write('\n'.join(report))
    print("✅ Final test report generated: final_test_report.md")
157+
# Script entry point: generate the report only when run directly, so the
# module can be imported (e.g. by tests) without side effects.
if __name__ == "__main__":
    main()