feat: add save_intermediate param to predictor to return output logits

okunator · okunator · commit f994c2e5f9a2 · 2025-11-14T11:25:22.000+02:00
diff --git a/cellseg_models_pytorch/inference/predictor.py b/cellseg_models_pytorch/inference/predictor.py
@@ -76,6 +76,7 @@ def predict(
         self,
         x: Union[torch.Tensor, np.ndarray, Image],
         apply_boundary_weight: bool = False,
+        save_intermediate: bool = False,
     ) -> Dict[str, torch.Tensor]:
         """Run the input through the model.
 
@@ -88,6 +89,10 @@ def predict(
             apply_boundary_weight (bool, default=True):
                 Whether to apply boundary weights to mitigate boundary artefacts
                 in aux predictions.
+            save_intermediate (bool, default=False):
+                Whether to also return the intermediate results (logits), i.e. the
+                raw model outputs before argmax. If True, the method returns a tuple
+                (final predictions, intermediate results) instead of a single dict.
 
         Returns:
             Dict[str, torch.Tensor]:
@@ -117,15 +122,22 @@ def predict(
                 .unsqueeze(0)
             )
 
+        intermediate = None
         with torch.no_grad():
             if self.mixed_precision:
                 with torch.autocast(self.device.type, dtype=torch.float16):
                     probs = self._predict(x)
+                    if save_intermediate:
+                        intermediate = probs
                     probs = self._argmax(probs)
             else:
                 probs = self._predict(x)
+                if save_intermediate:
+                    intermediate = probs
                 probs = self._argmax(probs)
 
+        if save_intermediate:
+            return probs, intermediate
         return probs
 
     def _to_tensor(self, x: Union[np.ndarray, Image]) -> torch.Tensor:
@@ -265,6 +277,7 @@ def predict_sliding_win(
         stride: int,
         padding: int = 20,
         apply_boundary_weight: bool = True,
+        save_intermediate: bool = False,
     ) -> Dict[str, torch.Tensor]:
         """Run the input through the model.
 
@@ -283,11 +296,14 @@ def predict_sliding_win(
             apply_boundary_weight (bool, default=True):
                 Whether to apply boundary weights to mitigate boundary artefacts
                 in aux predictions.
+            save_intermediate (bool, default=False):
+                Whether to also return the intermediate results (logits), i.e. the
+                raw model outputs before argmax. If True, the method returns a tuple
+                (final predictions, intermediate results) instead of a single dict.
 
         Returns:
             Dict[str, torch.Tensor]:
-                Dictionary containing the model predictions (probabilities).
-                Shapes: (B, C, H, W).
+                Dictionary containing the model predictions. Shapes: (B, C, H, W).
         """
         # check if the input is a tensor
         if not isinstance(x, torch.Tensor):
@@ -311,15 +327,23 @@ def predict_sliding_win(
                 .unsqueeze(0)
             )
 
+        intermediate = None
         with torch.no_grad():
             if self.mixed_precision:
                 with torch.autocast(self.device.type, dtype=torch.float16):
                     probs = self._predict_sliding_win(x, window_size, stride, padding)
+                    if save_intermediate:
+                        intermediate = probs
                     probs = self._argmax(probs)
             else:
                 probs = self._predict_sliding_win(x, window_size, stride, padding)
+                if save_intermediate:
+                    intermediate = probs
                 probs = self._argmax(probs)
 
+        if save_intermediate:
+            return probs, intermediate
+
         return probs
 
     @staticmethod
diff --git a/cellseg_models_pytorch/wsi/cucim_reader.py b/cellseg_models_pytorch/wsi/cucim_reader.py
@@ -13,10 +13,7 @@
     HAS_CUCIM = False
 
 
-CUCIM_READABLE_FORMATS = (
-    ".svs",
-    ".tiff",
-)
+CUCIM_READABLE_FORMATS = (".svs", ".tiff", ".tif")
 
 
 class CucimReader(SlideReaderBackend):