tylerbessire
diff --git a/‎.DS_Store‎
0 Bytes b/‎.DS_Store‎
0 Bytes
diff --git a/‎arc_solver/__pycache__/enhanced_search.cpython-313.pyc‎
1.44 KB b/‎arc_solver/__pycache__/enhanced_search.cpython-313.pyc‎
1.44 KB
diff --git a/‎arc_solver/__pycache__/solver.cpython-313.pyc‎
21.1 KB b/‎arc_solver/__pycache__/solver.cpython-313.pyc‎
21.1 KB
diff --git a/‎arc_solver/behavioral_engine.py‎
Lines changed: 27 additions & 1 deletion b/‎arc_solver/behavioral_engine.py‎
Lines changed: 27 additions & 1 deletion
diff --git a/‎arc_solver/dsl.py‎
Lines changed: 0 additions & 71 deletions b/‎arc_solver/dsl.py‎
Lines changed: 0 additions & 71 deletions
@@ -58,6 +58,7 @@ class RewardBreakdown:
     shape_accuracy: float
     behaviour_bonus: float
     program_length_penalty: float
+    generalization_penalty: float
     reward: float
 
 
@@ -115,15 +116,38 @@ def grade(
             + shape_accuracy * self.shape_weight
             + behaviour_bonus * self.behaviour_weight
         )
-        reward = max(0.0, min(1.0, reward - penalty))
+        generalization_penalty = self._generalization_penalty(predictions, targets)
+        reward = max(0.0, min(1.0, reward - penalty - generalization_penalty))
         return RewardBreakdown(
             pixel_accuracy=pixel_accuracy,
             shape_accuracy=shape_accuracy,
             behaviour_bonus=behaviour_bonus,
             program_length_penalty=penalty,
+            generalization_penalty=generalization_penalty,
             reward=reward,
         )
 
+    def _generalization_penalty(self, predictions: Sequence[Array], targets: Sequence[Array]) -> float:
+        """Return a penalty (0.0, 0.1 or 0.2) for degenerate, non-generalising predictions.
+
+        Adds 0.1 when all predictions are identical but the targets are not, and
+        another 0.1 when every prediction is a single-valued grid but not every
+        target is. Zero-size grids count as single-valued instead of raising.
+        """
+        def all_same(grids: Sequence[Array]) -> bool:
+            return all(np.array_equal(grids[0], g) for g in grids[1:])
+
+        def all_constant(grids: Sequence[Array]) -> bool:
+            # Guard on size: ``flat[0]`` raises IndexError on a zero-size grid.
+            return len(grids) > 0 and all(g.size == 0 or bool(np.all(g == g.flat[0])) for g in grids)
+
+        penalty = 0.0
+        if len(predictions) > 1 and len(targets) > 1 and all_same(predictions) and not all_same(targets):
+            penalty += 0.1  # one output repeated for every example despite differing targets
+        if all_constant(predictions) and not all_constant(targets):
+            penalty += 0.1  # flat single-colour outputs where the targets have structure
+        return penalty
+
 
 @dataclass
 class BehaviouralMetrics:
@@ -231,6 +255,7 @@ def train(
                 continue
             solved = best_breakdown.reward > 0.999
             guidance.reinforce(train_pairs, best_program, best_breakdown.reward, inference)
+            search.intraverbal.reinforce(best_program, best_breakdown.reward)
             episodic.add_successful_solution(
                 train_pairs,
                 [best_program],
@@ -311,6 +336,7 @@ def _emit_metrics(
             "pixel_accuracy": breakdown.pixel_accuracy,
             "shape_accuracy": breakdown.shape_accuracy,
             "behaviour_bonus": breakdown.behaviour_bonus,
+            "generalization_penalty": breakdown.generalization_penalty,
             "program_length": len(program),
             "global": self.metrics.as_dict(),
         }
 
@@ -21,7 +21,6 @@
     pad_to,
     bg_color,
 )
-from .patterns import PlaceholderTemplate, PlaceholderTemplateEngine
 
 
 class Op:
@@ -628,69 +627,6 @@ def op_human_spatial_reasoning(a: Array, hypothesis_name: str = "",
     return a  # Will be replaced by the actual hypothesis result
 
 
-# Custom operations for placeholder reconstruction
-def op_create_pattern_fill(a: Array, pattern: List[int], target_bounds: Tuple[int, int, int, int], direction: str) -> Array:
-    """Create a grid with pattern filled in the target bounds."""
-    from .placeholder_reconstruction import create_pattern_fill
-    return create_pattern_fill(a, pattern, target_bounds, direction)
-
-
-def op_tile_pattern(a: Array, pattern: List[int], target_bounds: Tuple[int, int, int, int], direction: str) -> Array:
-    """Tile a pattern within the target bounds."""
-    from .placeholder_reconstruction import tile_pattern
-    return tile_pattern(a, pattern, target_bounds, direction)
-
-
-def op_paste_at(source: Array, target_top: int, target_left: int, *, target_grid: Optional[Array] = None) -> Array:
-    """Paste source grid into target at specified position."""
-    from .placeholder_reconstruction import paste_at
-    if target_grid is None:
-        # Create a target grid of appropriate size
-        target_grid = np.zeros((source.shape[0] + target_top, source.shape[1] + target_left), dtype=source.dtype)
-    return paste_at(source, target_grid, target_top, target_left)
-
-
-def op_apply_advanced_mirroring(a: Array, template: Any, strategy: str) -> Array:
-    """Apply advanced mirroring strategies."""
-    from .placeholder_reconstruction import apply_advanced_mirroring
-    return apply_advanced_mirroring(a, template, strategy)
-
-
-def op_derive_recolor_mapping(a: Array, template: Any, candidate_region: Array) -> Dict[int, int]:
-    """Derive recolor mapping from border analysis."""
-    from .placeholder_reconstruction import derive_recolor_mapping
-    return derive_recolor_mapping(a, template, candidate_region)
-
-
-def op_extract_stripe_patterns(a: Array, template: Any) -> Dict[str, Array]:
-    """Extract stripe patterns from borders."""
-    from .placeholder_reconstruction import extract_stripe_patterns
-    return extract_stripe_patterns(a, template)
-
-
-def op_apply_placeholder_template(a: Array, template_signature: str, template_shape: Tuple[int, int]) -> Array:
-    """Applies a placeholder template to reconstruct a grid."""
-    engine = PlaceholderTemplateEngine()
-    # This is a simplified version. We need to reconstruct the template object.
-    # For now, we'll rely on the engine's internal cache if it exists, 
-    # but this will likely fail if the template isn't already in memory.
-    # A proper implementation would need to deserialize the template fully.
-    template = PlaceholderTemplate(signature=template_signature, placeholder_shape=template_shape, fill_fn=lambda x: x) # Dummy fill_fn
-    result = engine.apply_template(a, template)
-    if result is None:
-        raise ValueError("Failed to apply placeholder template from macro.")
-    return result
-
-
-def op_extract_using_transformation(a: Array, **kwargs) -> Array:
-    """Placeholder for applying a transformation from a macro."""
-    # This is a complex operation that depends on the HumanGradeReasoner state.
-    # Implementing this as a pure function would require significant refactoring.
-    # For now, this will act as a placeholder and return the input grid.
-    print("WARNING: op_extract_using_transformation is not fully implemented and will not produce the correct output.")
-    return a
-
-
 # Registry of primitive operations ---------------------------------------------------------
 OPS: Dict[str, Op] = {
     "identity": Op("identity", op_identity, 1, []),
@@ -715,13 +651,6 @@ def op_extract_using_transformation(a: Array, **kwargs) -> Array:
     "extract_distinct_regions": Op("extract_distinct_regions", op_extract_distinct_regions, 1, []),
     "human_spatial_reasoning": Op("human_spatial_reasoning", op_human_spatial_reasoning, 1, 
                                   ["hypothesis_name", "hypothesis_id", "confidence", "verification_score"]),
-    
-    # Placeholder reconstruction operations
-    "create_pattern_fill": Op("create_pattern_fill", op_create_pattern_fill, 1, ["pattern", "target_bounds", "direction"]),
-    "tile_pattern": Op("tile_pattern", op_tile_pattern, 1, ["pattern", "target_bounds", "direction"]),
-    "paste_at": Op("paste_at", op_paste_at, 1, ["target_top", "target_left", "target_grid"]),
-    "apply_placeholder_template": Op("apply_placeholder_template", op_apply_placeholder_template, 1, ["template_signature", "template_shape"]),
-    "extract_using_transformation": Op("extract_using_transformation", op_extract_using_transformation, 1, ["target_shape", "translation", "subject_signature", "object_signature"]),
 }