init

codelion · codelion · commit 2c6298f571e5 · 2025-05-19T14:49:40.000+08:00
diff --git a/examples/circle_packing/README.md b/examples/circle_packing/README.md
@@ -0,0 +1,71 @@
+# Circle Packing Example
+
+This example attempts to replicate one of the results from the AlphaEvolve paper (Section B.12): packing circles inside a unit square to maximize the sum of their radii.
+
+## Problem Description
+
+Given a positive integer n, the problem is to pack n disjoint circles inside a unit square so as to maximize the sum of their radii. The circles must:
+- Lie entirely within the unit square [0,1] × [0,1]
+- Not overlap with each other
+
+This is a well-studied problem in computational geometry with applications in various fields including materials science, facility location, and computer graphics.
+
+## AlphaEvolve Results
+
+According to the paper, AlphaEvolve found new constructions improving the state of the art:
+- For n = 26, improved from 2.634 to 2.635
+- For n = 32, improved from 2.936 to 2.937
+
+## Running the Example
+
+```bash
+python openevolve-run.py examples/circle_packing/initial_program.py examples/circle_packing/evaluator.py --config examples/circle_packing/config.yaml --iterations 100
+```
+
+## Evaluation Metrics
+
+The evaluator calculates several metrics:
+- `sum_radii_26`: Sum of radii for n=26
+- `sum_radii_32`: Sum of radii for n=32
+- `target_ratio_26`: Ratio of achieved sum to target (2.635) for n=26
+- `target_ratio_32`: Ratio of achieved sum to target (2.937) for n=32
+- `validity`: 1.0 if solutions for both n=26 and n=32 are valid, 0.0 otherwise
+- `avg_target_ratio`: Average of target ratios
+- `combined_score`: avg_target_ratio * validity (main fitness metric)
+
+## Expected Results
+
+A successful run should find packing arrangements with sums approaching or exceeding the values reported in the AlphaEvolve paper:
+- n=26: 2.635
+- n=32: 2.937
+
+## Visualization
+
+You can visualize the best solution by adding a visualization function to the best program:
+
+```python
+def visualize(centers, radii):
+    """Plot the packed circles inside the unit square, labelled by index."""
+    import matplotlib.pyplot as plt
+    from matplotlib.patches import Circle
+
+    _, axes = plt.subplots(figsize=(8, 8))
+
+    # The axes limits are the unit square the circles must stay inside
+    axes.set_xlim(0, 1)
+    axes.set_ylim(0, 1)
+    axes.set_aspect('equal')
+    axes.grid(True)
+
+    # One translucent patch per circle, with its index printed at the center
+    for index, (position, size) in enumerate(zip(centers, radii)):
+        axes.add_patch(Circle(position, size, alpha=0.5))
+        axes.text(position[0], position[1], str(index), ha='center', va='center')
+
+    plt.title(f"Circle Packing (n={len(centers)}, sum={sum(radii):.6f})")
+    plt.show()
+    
+# Example usage:
+# centers, radii, sum_radii = run_packing(26)
+# visualize(centers, radii)
+```
diff --git a/examples/circle_packing/config.yaml b/examples/circle_packing/config.yaml
@@ -0,0 +1,44 @@
+# Configuration for circle packing example
+max_iterations: 100
+checkpoint_interval: 10
+log_level: "INFO"
+
+# LLM configuration
+llm:
+  # primary_model: "gemini-2.0-flash-lite"
+  primary_model: "llama3.1-8b"
+  primary_model_weight: 0.8
+  # secondary_model: "gemini-2.0-flash"
+  secondary_model: "llama-4-scout-17b-16e-instruct"
+  secondary_model_weight: 0.2
+  # api_base: "https://generativelanguage.googleapis.com/v1beta/openai/"
+  api_base: "https://api.cerebras.ai/v1"
+  temperature: 0.7
+  top_p: 0.95
+  max_tokens: 4096
+
+# Prompt configuration
+prompt:
+  system_message: "You are an expert programmer specializing in optimization algorithms and computational geometry. Your task is to improve a circle packing algorithm to maximize the sum of radii when packing n circles in a unit square without overlaps. The AlphaEvolve paper achieved a sum of 2.635 for n=26 and 2.937 for n=32. Focus on finding better optimization strategies to reach or exceed these values."
+  num_top_programs: 3
+  use_template_stochasticity: true
+
+# Database configuration
+database:
+  population_size: 50
+  archive_size: 20
+  num_islands: 3
+  elite_selection_ratio: 0.2
+  exploitation_ratio: 0.7
+
+# Evaluator configuration
+evaluator:
+  timeout: 60
+  cascade_evaluation: true
+  cascade_thresholds: [0.5, 0.75]
+  parallel_evaluations: 4
+  use_llm_feedback: false
+
+# Evolution settings
+diff_based_evolution: true
+allow_full_rewrites: false
diff --git a/examples/circle_packing/evaluator.py b/examples/circle_packing/evaluator.py
@@ -0,0 +1,257 @@
+"""
+Evaluator for circle packing example
+"""
+
+import importlib.util
+import numpy as np
+import time
+import concurrent.futures
+import threading
+import traceback
+import sys
+
+
+def run_with_timeout(func, args=(), kwargs=None, timeout_seconds=30):
+    """
+    Run a function in a worker thread and stop waiting for it after a timeout
+
+    A Python thread cannot be killed, so after a timeout the function keeps
+    running in the background; only the caller is released on time.
+
+    Args:
+        func: Function to run
+        args: Positional arguments to pass to the function
+        kwargs: Keyword arguments to pass to the function (None means none)
+        timeout_seconds: Timeout in seconds
+
+    Returns:
+        Result of the function
+
+    Raises:
+        TimeoutError: If the function does not finish within timeout_seconds
+    """
+    # A fresh dict per call; a `{}` default would be shared between calls
+    if kwargs is None:
+        kwargs = {}
+
+    # Deliberately not a `with` block: leaving one calls shutdown(wait=True),
+    # which blocks until func returns and therefore defeats the timeout.
+    executor = concurrent.futures.ThreadPoolExecutor(max_workers=1)
+    try:
+        future = executor.submit(func, *args, **kwargs)
+        try:
+            return future.result(timeout=timeout_seconds)
+        except concurrent.futures.TimeoutError:
+            # Callables such as functools.partial have no __name__
+            func_name = getattr(func, "__name__", repr(func))
+            raise TimeoutError(
+                f"Function {func_name} timed out after {timeout_seconds} seconds"
+            )
+    finally:
+        # Release the executor without waiting for a still-running worker
+        executor.shutdown(wait=False)
+
+
+def validate_packing(centers, radii, tolerance=1e-6):
+    """
+    Validate that circles don't overlap and are inside the unit square
+
+    Args:
+        centers: np.array of shape (n, 2) with (x, y) coordinates
+        radii: np.array of shape (n) with radius of each circle
+        tolerance: Slack allowed on every geometric check to absorb tiny
+            numerical errors
+
+    Returns:
+        True if valid, False otherwise (the reason is printed)
+    """
+    n = centers.shape[0]
+
+    # NaN compares False against every bound below, so without this check a
+    # packing containing NaN would be reported as valid
+    if not (np.all(np.isfinite(centers)) and np.all(np.isfinite(radii))):
+        print("Packing contains NaN or infinite values")
+        return False
+
+    # Check radii are non-negative and circles are inside the unit square
+    for i in range(n):
+        x, y = centers[i]
+        r = radii[i]
+        if r < 0:
+            print(f"Circle {i} has negative radius {r}")
+            return False
+        if (
+            x - r < -tolerance
+            or x + r > 1 + tolerance
+            or y - r < -tolerance
+            or y + r > 1 + tolerance
+        ):
+            print(f"Circle {i} at ({x}, {y}) with radius {r} is outside the unit square")
+            return False
+
+    # Check for overlaps between every unordered pair of circles
+    for i in range(n):
+        for j in range(i + 1, n):
+            dist = np.sqrt(np.sum((centers[i] - centers[j]) ** 2))
+            if dist < radii[i] + radii[j] - tolerance:  # Allow for tiny numerical errors
+                print(f"Circles {i} and {j} overlap: dist={dist}, r1+r2={radii[i]+radii[j]}")
+                return False
+
+    return True
+
+
+def _failed_metrics():
+    """
+    Build the all-zero metrics dictionary reported when evaluation cannot run
+    """
+    return {
+        "sum_radii_26": 0.0,
+        "sum_radii_32": 0.0,
+        "target_ratio_26": 0.0,
+        "target_ratio_32": 0.0,
+        "validity": 0.0,
+        "avg_target_ratio": 0.0,
+        "combined_score": 0.0,
+    }
+
+
+def evaluate(program_path):
+    """
+    Evaluate the program by running it for n=26 and n=32 and checking the sum of radii
+
+    Args:
+        program_path: Path to the program file
+
+    Returns:
+        Dictionary of metrics (higher is better) with the keys sum_radii_26,
+        sum_radii_32, target_ratio_26, target_ratio_32, validity,
+        avg_target_ratio and combined_score. The same keys, all 0.0, are
+        returned when the program cannot be loaded or lacks run_packing.
+    """
+    # Target values from the paper (AlphaEvolve results for n=26 and n=32)
+    TARGETS = {26: 2.635, 32: 2.937}
+    # Per-run time budget; also reported as the elapsed time of a timed-out run
+    timeout_seconds = 30
+
+    try:
+        # Load the program
+        spec = importlib.util.spec_from_file_location("program", program_path)
+        program = importlib.util.module_from_spec(spec)
+        spec.loader.exec_module(program)
+
+        # Check if the required function exists
+        if not hasattr(program, "run_packing"):
+            print("Error: program does not have 'run_packing' function")
+            return _failed_metrics()
+
+        # Run for two different n values
+        results = {}
+
+        for n in [26, 32]:
+            target = TARGETS[n]
+            try:
+                start_time = time.time()
+
+                # Run packing with timeout
+                centers, radii, sum_radii = run_with_timeout(
+                    program.run_packing, args=(n,), timeout_seconds=timeout_seconds
+                )
+
+                end_time = time.time()
+
+                # Ensure centers and radii are numpy arrays
+                if not isinstance(centers, np.ndarray):
+                    centers = np.array(centers)
+                if not isinstance(radii, np.ndarray):
+                    radii = np.array(radii)
+
+                # Check shape and size before the geometric validation, which
+                # indexes the arrays assuming exactly these shapes
+                shape_valid = centers.shape == (n, 2) and radii.shape == (n,)
+                if shape_valid:
+                    valid = validate_packing(centers, radii)
+                else:
+                    print(
+                        f"Invalid shapes: centers={centers.shape}, radii={radii.shape}, expected ({n}, 2) and ({n},)"
+                    )
+                    valid = False
+
+                # Recalculate sum to verify
+                actual_sum = np.sum(radii) if valid else 0.0
+
+                # A NaN/inf sum must never reach the fitness score
+                if valid and not np.isfinite(actual_sum):
+                    print(f"Sum of radii is not finite: {actual_sum}")
+                    valid = False
+                    actual_sum = 0.0
+
+                # Make sure sum_radii matches the actual sum; only meaningful
+                # for a valid packing, whose sum has not been zeroed out
+                if valid and abs(actual_sum - sum_radii) > 1e-6:
+                    print(
+                        f"Warning: Reported sum {sum_radii} doesn't match calculated sum {actual_sum}"
+                    )
+
+                target_ratio = actual_sum / target if valid else 0.0
+
+                # Store results
+                results[n] = {
+                    "valid": valid,
+                    "sum_radii": actual_sum,
+                    "time": end_time - start_time,
+                    "target_ratio": target_ratio,
+                }
+
+                print(
+                    f"n={n}: valid={valid}, sum_radii={actual_sum:.6f}, target={target}, ratio={target_ratio:.6f}"
+                )
+
+            except TimeoutError as e:
+                print(f"Timeout running for n={n}: {str(e)}")
+                results[n] = {
+                    "valid": False,
+                    "sum_radii": 0.0,
+                    "time": float(timeout_seconds),  # timeout value
+                    "target_ratio": 0.0,
+                }
+            except Exception as e:
+                # A failure for one n must not abort the run for the other n
+                print(f"Error running for n={n}: {str(e)}")
+                traceback.print_exc()
+                results[n] = {"valid": False, "sum_radii": 0.0, "time": 0.0, "target_ratio": 0.0}
+
+        # Calculate combined metrics
+        avg_ratio = (results[26]["target_ratio"] + results[32]["target_ratio"]) / 2
+        validity = 1.0 if results[26]["valid"] and results[32]["valid"] else 0.0
+
+        # Return metrics - higher values are better
+        return {
+            "sum_radii_26": float(results[26]["sum_radii"]),
+            "sum_radii_32": float(results[32]["sum_radii"]),
+            "target_ratio_26": float(results[26]["target_ratio"]),
+            "target_ratio_32": float(results[32]["target_ratio"]),
+            "validity": float(validity),
+            "avg_target_ratio": float(avg_ratio),
+            "combined_score": float(avg_ratio * validity),
+        }
+
+    except Exception as e:
+        # Top-level boundary: a broken candidate program scores zero
+        print(f"Evaluation failed completely: {str(e)}")
+        traceback.print_exc()
+        return _failed_metrics()
+
+
+# Stage-based evaluation for cascade evaluation
+def evaluate_stage1(program_path):
+    """
+    Cascade stage 1: quick validity check that runs the program for n=26 only
+
+    Args:
+        program_path: Path to the program file
+
+    Returns:
+        Dictionary with "validity", "sum_radii" and "target_ratio" when the
+        program ran, or "validity" 0.0 plus an "error" string when it did not
+    """
+    n_circles = 26
+    paper_target = 2.635  # Target from paper
+
+    # Step 1: import the candidate program and locate its entry point
+    try:
+        module_spec = importlib.util.spec_from_file_location("program", program_path)
+        candidate = importlib.util.module_from_spec(module_spec)
+        module_spec.loader.exec_module(candidate)
+
+        if not hasattr(candidate, "run_packing"):
+            print("Error: program does not have 'run_packing' function")
+            return {"validity": 0.0, "error": "Missing run_packing function"}
+    except Exception as e:
+        print(f"Stage 1 evaluation failed completely: {e}")
+        print(traceback.format_exc())
+        return {"validity": 0.0, "error": str(e)}
+
+    # Step 2: run it under a shorter time budget than the full evaluation
+    try:
+        centers, radii, sum_radii = run_with_timeout(
+            candidate.run_packing, args=(n_circles,), timeout_seconds=10
+        )
+
+        # Coerce plain sequences to numpy arrays
+        centers = centers if isinstance(centers, np.ndarray) else np.array(centers)
+        radii = radii if isinstance(radii, np.ndarray) else np.array(radii)
+
+        # Shapes are checked before the geometric constraints
+        if centers.shape != (n_circles, 2) or radii.shape != (n_circles,):
+            print(f"Invalid shapes: centers={centers.shape}, radii={radii.shape}")
+            return {"validity": 0.0, "error": "Invalid shapes"}
+
+        if validate_packing(centers, radii):
+            validity = 1.0
+            actual_sum = np.sum(radii)
+            target_ratio = actual_sum / paper_target
+        else:
+            validity = 0.0
+            actual_sum = 0.0
+            target_ratio = 0.0
+
+        return {
+            "validity": validity,
+            "sum_radii": float(actual_sum),
+            "target_ratio": float(target_ratio),
+        }
+    except TimeoutError as e:
+        print(f"Stage 1 evaluation timed out: {e}")
+        return {"validity": 0.0, "error": "Timeout"}
+    except Exception as e:
+        print(f"Stage 1 evaluation failed: {e}")
+        print(traceback.format_exc())
+        return {"validity": 0.0, "error": str(e)}
+
+
+def evaluate_stage2(program_path):
+    """
+    Cascade stage 2: run the complete evaluation for n=26 and n=32
+
+    Args:
+        program_path: Path to the program file
+
+    Returns:
+        The metrics dictionary produced by evaluate()
+    """
+    # This stage has no logic of its own; it reuses the main evaluator
+    full_metrics = evaluate(program_path)
+    return full_metrics
diff --git a/examples/circle_packing/initial_program.py b/examples/circle_packing/initial_program.py