PytorchConnectomics
diff --git a/‎connectomics/config/__init__.py‎
Lines changed: 2 additions & 0 deletions b/‎connectomics/config/__init__.py‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎connectomics/config/hydra_config.py‎
Lines changed: 25 additions & 13 deletions b/‎connectomics/config/hydra_config.py‎
Lines changed: 25 additions & 13 deletions
diff --git a/‎connectomics/config/hydra_utils.py‎
Lines changed: 90 additions & 0 deletions b/‎connectomics/config/hydra_utils.py‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎connectomics/data/process/distance.py‎
Lines changed: 1 addition & 1 deletion b/‎connectomics/data/process/distance.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎connectomics/lightning/lit_model.py‎
Lines changed: 101 additions & 23 deletions b/‎connectomics/lightning/lit_model.py‎
Lines changed: 101 additions & 23 deletions
@@ -15,6 +15,7 @@
     validate_config,
     get_config_hash,
     create_experiment_name,
+    resolve_data_paths,
 )
 
 # Auto-configuration system
@@ -47,6 +48,7 @@
     'validate_config',
     'get_config_hash',
     'create_experiment_name',
+    'resolve_data_paths',
     # Auto-configuration
     'auto_plan_config',
     'AutoConfigPlanner',
 
@@ -334,16 +334,23 @@ class DataConfig:
     # Dataset type
     dataset_type: Optional[str] = None  # Type of dataset: None (volume), 'filename', 'tile', etc.
 
+    # Base path (prepended to train_image, train_label, etc. if set)
+    train_path: str = ""  # Base path for training data (e.g., "/path/to/dataset/")
+    val_path: str = ""  # Base path for validation data
+    test_path: str = ""  # Base path for test data
+
     # Paths - Volume-based datasets
-    train_image: Optional[str] = None
-    train_label: Optional[str] = None
-    train_mask: Optional[str] = None  # Valid region mask for training
-    val_image: Optional[str] = None
-    val_label: Optional[str] = None
-    val_mask: Optional[str] = None  # Valid region mask for validation
-    test_image: Optional[str] = None
-    test_label: Optional[str] = None
-    test_mask: Optional[str] = None  # Valid region mask for testing
+    # These can be strings (single file), lists (multiple files), or None
+    # Using Any to support both str and List[str] (OmegaConf doesn't support Union of containers)
+    train_image: Any = None  # str, List[str], or None
+    train_label: Any = None  # str, List[str], or None
+    train_mask: Any = None  # str, List[str], or None (Valid region mask for training)
+    val_image: Any = None  # str, List[str], or None
+    val_label: Any = None  # str, List[str], or None
+    val_mask: Any = None  # str, List[str], or None (Valid region mask for validation)
+    test_image: Any = None  # str, List[str], or None
+    test_label: Any = None  # str, List[str], or None
+    test_mask: Any = None  # str, List[str], or None (Valid region mask for testing)
 
     # Paths - JSON/filename-based datasets
     train_json: Optional[str] = None  # JSON file with image/label file lists
@@ -413,6 +420,9 @@ class DataConfig:
         True  # Preload volumes into memory for fast random cropping (default: True)
     )
 
+    # Reject sampling configuration (for volumetric patch sampling)
+    reject_sampling: Optional[Dict[str, Any]] = None  # Dict with 'size_thres' and 'p' keys
+
     # Multi-channel label transformation (for affinity maps, distance transforms, etc.)
     label_transform: LabelTransformConfig = field(default_factory=LabelTransformConfig)
 
@@ -745,9 +755,9 @@ class AugmentationConfig:
 class InferenceDataConfig:
     """Inference data configuration."""
 
-    test_image: Optional[str] = None  # Singular form for compatibility
-    test_label: Optional[str] = None  # Singular form for compatibility
-    test_mask: Optional[str] = None  # Optional mask for inference
+    test_image: Any = None  # str, List[str], or None - Can be single file or list of files
+    test_label: Any = None  # str, List[str], or None - Can be single file or list of files
+    test_mask: Any = None  # str, List[str], or None - Optional mask for inference
     test_resolution: Optional[List[float]] = (
         None  # Test data resolution [z, y, x] in nm (e.g., [30, 6, 6])
     )
@@ -763,12 +773,14 @@ class SlidingWindowConfig:
 
     window_size: Optional[List[int]] = None
     sw_batch_size: Optional[int] = None  # If None, will use system.inference.batch_size
-    overlap: float = 0.5
+    overlap: Optional[float] = 0.5  # Overlap ratio (0-1), or None to use stride instead
+    stride: Optional[List[int]] = None  # Explicit stride (overrides overlap if set)
     blending: str = "gaussian"  # 'gaussian' or 'constant' - blending mode for overlapping patches
     sigma_scale: float = (
         0.125  # Gaussian sigma scale (only for blending='gaussian'); larger = smoother blending
     )
     padding_mode: str = "constant"  # Padding mode at volume boundaries
+    pad_size: Optional[List[int]] = None  # Padding size for context (e.g., [16, 32, 32])
 
 
 @dataclass
 
@@ -231,6 +231,95 @@ def create_experiment_name(cfg: Config) -> str:
     return "_".join(parts)
 
 
+def resolve_data_paths(cfg: Config) -> Config:
+    """
+    Resolve data paths by combining base paths (train_path, val_path, test_path)
+    with relative file paths (train_image, train_label, etc.).
+
+    For every split whose base path is non-empty, the ``*_image``, ``*_label``,
+    ``*_mask`` and ``*_json`` entries are rewritten in-place by:
+    1. Prepending the base path to relative file paths (absolute paths are kept)
+    2. Expanding glob patterns (``*`` / ``?``) to sorted lists of matching files;
+       a pattern without any match is kept unchanged
+    3. Flattening nested lists from glob expansion
+
+    Splits whose base path is empty are left untouched (no joining and no glob
+    expansion). ``cfg.inference.data.test_*`` is resolved against
+    ``cfg.data.test_path`` as well when ``cfg.inference.data`` is truthy.
+
+    Note:
+        Resolution is not idempotent for *relative* base paths: a second call
+        prepends the base path again. Call this once per config.
+
+    Args:
+        cfg: Config object to resolve paths for
+
+    Returns:
+        Config object with resolved paths (same object, modified in-place)
+
+    Example:
+        >>> cfg.data.train_path = "/data/barcode/"
+        >>> cfg.data.train_image = ["PT37/*_raw.tif", "file.tif"]
+        >>> resolve_data_paths(cfg)
+        >>> print(cfg.data.train_image)
+        ['/data/barcode/PT37/img1_raw.tif', '/data/barcode/PT37/img2_raw.tif', '/data/barcode/file.tif']
+    """
+    import os
+    from collections.abc import Sequence as _Sequence
+    from glob import glob
+
+    def _combine_path(base_path: str, file_path: Optional[Union[str, List[str]]]) -> Optional[Union[str, List[str]]]:
+        """Helper to combine base path with file path(s) and expand globs."""
+        if file_path is None:
+            return file_path
+
+        # Handle a collection of paths. Accept any non-string sequence rather than
+        # only `list`, so tuples and list-like config containers are resolved
+        # element-wise instead of being handed to os.path as a single path
+        # (which raises TypeError).
+        if isinstance(file_path, _Sequence) and not isinstance(file_path, (str, bytes)):
+            result = []
+            for entry in file_path:
+                resolved = _combine_path(base_path, entry)
+                # A list here comes from glob expansion (or a nested list): flatten it
+                if isinstance(resolved, list):
+                    result.extend(resolved)
+                else:
+                    result.append(resolved)
+            return result
+
+        # Handle string path: combine with base path if relative
+        if base_path and not os.path.isabs(file_path):
+            file_path = os.path.join(base_path, file_path)
+
+        # Expand glob patterns; sorted() keeps the file order deterministic
+        if "*" in file_path or "?" in file_path:
+            expanded = sorted(glob(file_path))
+            if expanded:
+                return expanded
+            # No matches - fall through and return the pattern itself
+            # (will be caught by validation)
+
+        return file_path
+
+    # Resolve training / validation / test paths. A split is skipped entirely
+    # when its base path is empty.
+    for split in ("train", "val", "test"):
+        base_path = getattr(cfg.data, f"{split}_path")
+        if not base_path:
+            continue
+        for kind in ("image", "label", "mask", "json"):
+            key = f"{split}_{kind}"
+            setattr(cfg.data, key, _combine_path(base_path, getattr(cfg.data, key)))
+
+    # Also resolve inference data paths (they share the test base path)
+    if cfg.data.test_path and cfg.inference.data:
+        for kind in ("image", "label", "mask"):
+            key = f"test_{kind}"
+            setattr(
+                cfg.inference.data,
+                key,
+                _combine_path(cfg.data.test_path, getattr(cfg.inference.data, key)),
+            )
+
+    return cfg
+
+
 __all__ = [
     "load_config",
     "save_config",
@@ -242,4 +331,5 @@ def create_experiment_name(cfg: Config) -> str:
     "validate_config",
     "get_config_hash",
     "create_experiment_name",
+    "resolve_data_paths",
 ]
@@ -232,7 +232,7 @@ def skeleton_aware_distance_transform(
     bg_value: float = -1.0,
     relabel: bool = True,
     padding: bool = False,
-    resolution: Tuple[float] = (1.0, 1.0),
+    resolution: Tuple[float] = (1.0, 1.0, 1.0),
     alpha: float = 0.8,
     smooth: bool = True,
     smooth_skeleton_only: bool = True,
 
@@ -1005,33 +1005,72 @@ def training_step(self, batch: Dict[str, torch.Tensor], batch_idx: int) -> STEP_
             ds_weights = [1.0] + [0.5 ** i for i in range(1, len(ds_outputs) + 1)]
             all_outputs = [main_output] + ds_outputs
 
+            # Check if multi-task learning is configured
+            is_multi_task = hasattr(self.cfg.model, 'multi_task_config') and self.cfg.model.multi_task_config is not None
+
             for scale_idx, (output, ds_weight) in enumerate(zip(all_outputs, ds_weights)):
                 # Match target to output size
                 target = self._match_target_to_output(labels, output)
 
                 # Compute loss for this scale
                 scale_loss = 0.0
-                for loss_fn, weight in zip(self.loss_functions, self.loss_weights):
-                    loss = loss_fn(output, target)
 
-                    # Check for NaN/Inf immediately after computing loss
-                    if self.enable_nan_detection and (torch.isnan(loss) or torch.isinf(loss)):
-                        print(f"\n{'='*80}")
-                        print(f"⚠️  NaN/Inf detected in loss computation!")
-                        print(f"{'='*80}")
-                        print(f"Loss function: {loss_fn.__class__.__name__}")
-                        print(f"Loss value: {loss.item()}")
-                        print(f"Scale: {scale_idx}, Weight: {weight}")
-                        print(f"Output shape: {output.shape}, range: [{output.min():.4f}, {output.max():.4f}]")
-                        print(f"Target shape: {target.shape}, range: [{target.min():.4f}, {target.max():.4f}]")
-                        print(f"Output contains NaN: {torch.isnan(output).any()}")
-                        print(f"Target contains NaN: {torch.isnan(target).any()}")
-                        if self.debug_on_nan:
-                            print(f"\nEntering debugger...")
-                            pdb.set_trace()
-                        raise ValueError(f"NaN/Inf in loss at scale {scale_idx}")
-
-                    scale_loss += loss * weight
+                if is_multi_task:
+                    # Multi-task learning with deep supervision:
+                    # Apply specific losses to specific channels at each scale
+                    for task_idx, task_config in enumerate(self.cfg.model.multi_task_config):
+                        start_ch, end_ch, task_name, loss_indices = task_config
+
+                        # Extract channels for this task
+                        task_output = output[:, start_ch:end_ch, ...]
+                        task_target = target[:, start_ch:end_ch, ...]
+
+                        # Apply specified losses for this task
+                        for loss_idx in loss_indices:
+                            loss_fn = self.loss_functions[loss_idx]
+                            weight = self.loss_weights[loss_idx]
+
+                            loss = loss_fn(task_output, task_target)
+
+                            # Check for NaN/Inf
+                            if self.enable_nan_detection and (torch.isnan(loss) or torch.isinf(loss)):
+                                print(f"\n{'='*80}")
+                                print(f"⚠️  NaN/Inf detected in deep supervision multi-task loss!")
+                                print(f"{'='*80}")
+                                print(f"Scale: {scale_idx}, Task: {task_name} (channels {start_ch}:{end_ch})")
+                                print(f"Loss function: {loss_fn.__class__.__name__} (index {loss_idx})")
+                                print(f"Loss value: {loss.item()}")
+                                print(f"Output shape: {task_output.shape}, range: [{task_output.min():.4f}, {task_output.max():.4f}]")
+                                print(f"Target shape: {task_target.shape}, range: [{task_target.min():.4f}, {task_target.max():.4f}]")
+                                if self.debug_on_nan:
+                                    print(f"\nEntering debugger...")
+                                    pdb.set_trace()
+                                raise ValueError(f"NaN/Inf in deep supervision loss at scale {scale_idx}, task {task_name}")
+
+                            scale_loss += loss * weight
+                else:
+                    # Standard deep supervision: apply all losses to all outputs
+                    for loss_fn, weight in zip(self.loss_functions, self.loss_weights):
+                        loss = loss_fn(output, target)
+
+                        # Check for NaN/Inf immediately after computing loss
+                        if self.enable_nan_detection and (torch.isnan(loss) or torch.isinf(loss)):
+                            print(f"\n{'='*80}")
+                            print(f"⚠️  NaN/Inf detected in loss computation!")
+                            print(f"{'='*80}")
+                            print(f"Loss function: {loss_fn.__class__.__name__}")
+                            print(f"Loss value: {loss.item()}")
+                            print(f"Scale: {scale_idx}, Weight: {weight}")
+                            print(f"Output shape: {output.shape}, range: [{output.min():.4f}, {output.max():.4f}]")
+                            print(f"Target shape: {target.shape}, range: [{target.min():.4f}, {target.max():.4f}]")
+                            print(f"Output contains NaN: {torch.isnan(output).any()}")
+                            print(f"Target contains NaN: {torch.isnan(target).any()}")
+                            if self.debug_on_nan:
+                                print(f"\nEntering debugger...")
+                                pdb.set_trace()
+                            raise ValueError(f"NaN/Inf in loss at scale {scale_idx}")
+
+                        scale_loss += loss * weight
 
                 total_loss += scale_loss * ds_weight
                 loss_dict[f'train_loss_scale_{scale_idx}'] = scale_loss.item()
@@ -1100,15 +1139,38 @@ def validation_step(self, batch: Dict[str, torch.Tensor], batch_idx: int) -> STE
             ds_weights = [1.0] + [0.5 ** i for i in range(1, len(ds_outputs) + 1)]
             all_outputs = [main_output] + ds_outputs
 
+            # Check if multi-task learning is configured
+            is_multi_task = hasattr(self.cfg.model, 'multi_task_config') and self.cfg.model.multi_task_config is not None
+
             for scale_idx, (output, ds_weight) in enumerate(zip(all_outputs, ds_weights)):
                 # Match target to output size
                 target = self._match_target_to_output(labels, output)
 
                 # Compute loss for this scale
                 scale_loss = 0.0
-                for loss_fn, weight in zip(self.loss_functions, self.loss_weights):
-                    loss = loss_fn(output, target)
-                    scale_loss += loss * weight
+
+                if is_multi_task:
+                    # Multi-task learning with deep supervision:
+                    # Apply specific losses to specific channels at each scale
+                    for task_idx, task_config in enumerate(self.cfg.model.multi_task_config):
+                        start_ch, end_ch, task_name, loss_indices = task_config
+
+                        # Extract channels for this task
+                        task_output = output[:, start_ch:end_ch, ...]
+                        task_target = target[:, start_ch:end_ch, ...]
+
+                        # Apply specified losses for this task
+                        for loss_idx in loss_indices:
+                            loss_fn = self.loss_functions[loss_idx]
+                            weight = self.loss_weights[loss_idx]
+
+                            loss = loss_fn(task_output, task_target)
+                            scale_loss += loss * weight
+                else:
+                    # Standard deep supervision: apply all losses to all outputs
+                    for loss_fn, weight in zip(self.loss_functions, self.loss_weights):
+                        loss = loss_fn(output, target)
+                        scale_loss += loss * weight
 
                 total_loss += scale_loss * ds_weight
                 loss_dict[f'val_loss_scale_{scale_idx}'] = scale_loss.item()
@@ -1367,6 +1429,10 @@ def _match_target_to_output(
         For segmentation masks, uses nearest-neighbor interpolation to preserve labels.
         For continuous targets, uses trilinear interpolation.
 
+        IMPORTANT: For continuous targets in range [-1, 1] (e.g., tanh-normalized SDT),
+        trilinear interpolation can cause overshooting beyond bounds. We clamp the
+        resized targets back to [-1, 1] to prevent loss explosion.
+
         Args:
             target: Target tensor of shape (B, C, D, H, W)
             output: Output tensor of shape (B, C, D', H', W')
@@ -1396,6 +1462,18 @@ def _match_target_to_output(
                 align_corners=False,
             )
 
+            # CRITICAL FIX: Clamp resized targets to prevent interpolation overshooting
+            # For targets in range [-1, 1] (e.g., tanh-normalized SDT), trilinear interpolation
+            # can produce values outside this range (e.g., -1.2, 1.3) which causes loss explosion
+            # when used with tanh-activated predictions.
+            # Check if targets are in typical normalized ranges:
+            if target.min() >= -1.5 and target.max() <= 1.5:
+                # Likely normalized to [-1, 1] (with some tolerance for existing overshoots)
+                target_resized = torch.clamp(target_resized, -1.0, 1.0)
+            elif target.min() >= 0.0 and target.max() <= 1.5:
+                # Likely normalized to [0, 1]
+                target_resized = torch.clamp(target_resized, 0.0, 1.0)
+
         return target_resized
 
     def configure_optimizers(self) -> Dict[str, Any]: