Commit e6f86fc (merge commit, 2 parents: 292e450 + 9c252ed)

background mask for unsupervised training

10 files changed: +414 additions, -33 deletions
Lines changed: 103 additions & 0 deletions (new file)

@@ -0,0 +1,103 @@
import os

import h5py
import numpy as np
import pandas as pd

from synapse_net.inference.inference import get_model
from synapse_net.inference.compartments import segment_compartments
from skimage.segmentation import find_boundaries

from elf.evaluation.matching import matching

from train_compartments import get_paths_3d
from sklearn.model_selection import train_test_split


def run_prediction(paths):
    """Run compartment prediction for the given tomograms and save segmentations and predictions."""
    output_folder = "./compartment_eval"
    os.makedirs(output_folder, exist_ok=True)

    model = get_model("compartments")
    for path in paths:
        with h5py.File(path, "r") as f:
            input_vol = f["raw"][:]
        seg, pred = segment_compartments(input_vol, model=model, return_predictions=True)
        fname = os.path.basename(path)
        out = os.path.join(output_folder, fname)
        with h5py.File(out, "a") as f:
            f.create_dataset("seg", data=seg, compression="gzip")
            f.create_dataset("pred", data=pred, compression="gzip")


def binary_recall(gt, pred):
    # Pixel-wise recall: TP / (TP + FN); returns 0 if the ground truth is empty.
    tp = np.logical_and(gt, pred).sum()
    fn = np.logical_and(gt, ~pred).sum()
    return float(tp) / (tp + fn) if (tp + fn) else 0.0


def run_evaluation(paths):
    output_folder = "./compartment_eval"

    results = {
        "name": [],
        "recall-pred": [],
        "recall-seg": [],
    }

    for path in paths:
        with h5py.File(path, "r") as f:
            labels = f["labels/compartments"][:]
        boundary_labels = find_boundaries(labels).astype("bool")

        fname = os.path.basename(path)
        out = os.path.join(output_folder, fname)
        with h5py.File(out, "a") as f:
            seg, pred = f["seg"][:], f["pred"][:]

        # Pixel-wise recall of the boundary prediction and instance-level recall of the segmentation.
        recall_pred = binary_recall(boundary_labels, pred > 0.5)
        recall_seg = matching(seg, labels)["recall"]

        results["name"].append(fname)
        results["recall-pred"].append(recall_pred)
        results["recall-seg"].append(recall_seg)

    results = pd.DataFrame(results)
    print(results)
    print(results[["recall-pred", "recall-seg"]].mean())


def check_predictions(paths):
    import napari
    output_folder = "./compartment_eval"

    for path in paths:
        with h5py.File(path, "r") as f:
            raw = f["raw"][:]
            labels = f["labels/compartments"][:]
        boundary_labels = find_boundaries(labels)

        fname = os.path.basename(path)
        out = os.path.join(output_folder, fname)
        with h5py.File(out, "a") as f:
            seg, pred = f["seg"][:], f["pred"][:]

        v = napari.Viewer()
        v.add_image(raw)
        v.add_image(pred)
        v.add_labels(labels)
        v.add_labels(boundary_labels)
        v.add_labels(seg)
        napari.run()


def main():
    paths = get_paths_3d()
    _, val_paths = train_test_split(paths, test_size=0.10, random_state=42)

    # run_prediction(val_paths)
    run_evaluation(val_paths)
    # check_predictions(val_paths)


if __name__ == "__main__":
    main()
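For reference, binary_recall above is plain pixel-wise recall, TP / (TP + FN), evaluated here on the boundary maps. A minimal sketch with made-up toy arrays illustrates the computation:

import numpy as np

# Hypothetical toy masks: 3 of the 4 ground-truth foreground pixels are predicted.
gt = np.array([1, 1, 1, 1, 0, 0], dtype=bool)
pred = np.array([1, 1, 1, 0, 0, 1], dtype=bool)

tp = np.logical_and(gt, pred).sum()   # true positives: 3
fn = np.logical_and(gt, ~pred).sum()  # false negatives: 1
print(tp / (tp + fn))                 # 0.75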

scripts/cooper/training/train_compartments.py

Lines changed: 0 additions & 1 deletion

@@ -14,7 +14,6 @@
 from synapse_net.training import supervised_training

 TRAIN_ROOT = "/mnt/lustre-emmy-hdd/projects/nim00007/data/synaptic-reconstruction/cooper/ground_truth/compartments"
-# TRAIN_ROOT = "/home/pape/Work/my_projects/synaptic-reconstruction/scripts/cooper/ground_truth/compartments/output/compartment_gt"  # noqa


 def get_paths_2d():

synapse_net/__version__.py

Lines changed: 1 addition & 1 deletion

@@ -1 +1 @@
-__version__ = "0.2.0"
+__version__ = "0.3.0"

synapse_net/ground_truth/vesicles.py

Lines changed: 1 addition & 1 deletion

@@ -227,7 +227,7 @@ def extract_vesicle_training_data(
         relative_path = os.path.relpath(file_path, data_folder)

         if to_label_path is None:
-            imod_path = os.path.join(gt_folder, relative_path.replace(Path(relative_path).suffix, ".imod"))
+            imod_path = os.path.join(gt_folder, relative_path.replace(Path(relative_path).suffix, ".mod"))
         else:
             imod_path = to_label_path(gt_folder, relative_path)
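For illustration, the fixed default now swaps the file suffix for the IMOD .mod extension; a quick sketch with hypothetical file names:

import os
from pathlib import Path

relative_path = "tomo_01/raw.h5"  # hypothetical relative path
gt_folder = "gt"                  # hypothetical ground-truth folder
imod_path = os.path.join(gt_folder, relative_path.replace(Path(relative_path).suffix, ".mod"))
print(imod_path)  # gt/tomo_01/raw.mod (on POSIX systems)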

synapse_net/inference/inference.py

Lines changed: 3 additions & 3 deletions

@@ -22,7 +22,7 @@

 def _get_model_registry():
     registry = {
-        "active_zone": "a18f29168aed72edec0f5c2cb1aa9a4baa227812db6082a6538fd38d9f43afb0",
+        "active_zone": "c23652a8fe06daa113546af6d3200c4c1dcc79917056c6ed7357b8c93548372a",
         "compartments": "527983720f9eb215c45c4f4493851fd6551810361eda7b79f185a0d304274ee1",
         "mitochondria": "24625018a5968b36f39fa9d73b121a32e8f66d0f2c0540d3df2e1e39b3d58186",
         "mitochondria2": "553decafaff4838fff6cc8347f22c8db3dee5bcbeffc34ffaec152f8449af673",
@@ -37,7 +37,7 @@ def _get_model_registry():
         "vesicles_3d_innerear": "924f0f7cfb648a3a6931c1d48d8b1fdc6c0c0d2cb3330fe2cae49d13e7c3b69d",
     }
     urls = {
-        "active_zone": "https://owncloud.gwdg.de/index.php/s/zvuY342CyQebPsX/download",
+        "active_zone": "https://owncloud.gwdg.de/index.php/s/wpea9FH9waG4zJd/download",
         "compartments": "https://owncloud.gwdg.de/index.php/s/DnFDeTmDDmZrDDX/download",
         "mitochondria": "https://owncloud.gwdg.de/index.php/s/1T542uvzfuruahD/download",
         "mitochondria2": "https://owncloud.gwdg.de/index.php/s/GZghrXagc54FFXd/download",
@@ -109,7 +109,7 @@ def get_model_training_resolution(model_type: str) -> Dict[str, float]:
         Mapping of axis (x, y, z) to the voxel size (in nm) of that axis.
     """
     resolutions = {
-        "active_zone": {"x": 1.44, "y": 1.44, "z": 1.44},
+        "active_zone": {"x": 1.38, "y": 1.38, "z": 1.38},
         "compartments": {"x": 3.47, "y": 3.47, "z": 3.47},
         "mitochondria": {"x": 2.07, "y": 2.07, "z": 2.07},
         "cristae": {"x": 1.44, "y": 1.44, "z": 1.44},
Lines changed: 137 additions & 0 deletions (new file)

@@ -0,0 +1,137 @@
import os
import tempfile
from typing import Dict, List, Optional

import elf.parallel as parallel
import numpy as np
import torch

from elf.io import open_file
from elf.wrapper import ThresholdWrapper, SimpleTransformationWrapper
from elf.wrapper.base import MultiTransformationWrapper
from elf.wrapper.resized_volume import ResizedVolume
from numpy.typing import ArrayLike
from synapse_net.inference.util import get_prediction


class SelectChannel(SimpleTransformationWrapper):
    """Wrapper to select a channel from an array-like dataset object.

    Args:
        volume: The array-like input dataset.
        channel: The channel that will be selected.
    """
    def __init__(self, volume: ArrayLike, channel: int):
        self.channel = channel
        super().__init__(volume, lambda x: x[self.channel], with_channels=True)

    @property
    def shape(self):
        return self._volume.shape[1:]

    @property
    def chunks(self):
        return self._volume.chunks[1:]

    @property
    def ndim(self):
        return self._volume.ndim - 1


def _run_segmentation(pred, output, seeds, chunks, seed_threshold, min_size, verbose, original_shape):
    # Create wrappers for selecting the foreground and the boundary channel.
    foreground = SelectChannel(pred, 0)
    boundaries = SelectChannel(pred, 1)

    # Create wrappers for subtracting the boundaries from the foreground and thresholding the result,
    # then compute the seeds via connected components on this seed input.
    seed_input = ThresholdWrapper(
        MultiTransformationWrapper(np.subtract, foreground, boundaries), seed_threshold
    )
    parallel.label(seed_input, seeds, verbose=verbose, block_shape=chunks)

    # Run a watershed to extend the seeds back to the boundaries, restricted to the foreground mask.
    mask = ThresholdWrapper(foreground, 0.5)

    # Resize if necessary.
    if original_shape is not None:
        boundaries = ResizedVolume(boundaries, original_shape, order=1)
        seeds = ResizedVolume(seeds, original_shape, order=0)
        mask = ResizedVolume(mask, original_shape, order=0)

    parallel.seeded_watershed(
        boundaries, seeds=seeds, out=output, verbose=verbose, mask=mask, block_shape=chunks, halo=3 * (16,)
    )

    # Run the size filter.
    if min_size > 0:
        parallel.size_filter(output, output, min_size=min_size, verbose=verbose, block_shape=chunks)


def scalable_segmentation(
    input_: ArrayLike,
    output: ArrayLike,
    model: torch.nn.Module,
    tiling: Optional[Dict[str, Dict[str, int]]] = None,
    scale: Optional[List[float]] = None,
    seed_threshold: float = 0.5,
    min_size: int = 500,
    prediction: Optional[ArrayLike] = None,
    verbose: bool = True,
    mask: Optional[ArrayLike] = None,
) -> None:
    """Run segmentation based on a prediction with a foreground and a boundary channel.

    This function first subtracts the boundary prediction from the foreground prediction,
    then applies a threshold, connected components, and a watershed to fit the components
    back to the foreground. All processing steps are implemented in a scalable fashion,
    so that the function runs for large input volumes.

    Args:
        input_: The input data.
        output: The array for storing the output segmentation.
            Can be a numpy array, a zarr array, or similar.
        model: The model for prediction.
        tiling: The tiling configuration for the prediction.
        scale: The scale factor to use for rescaling the input volume before prediction.
        seed_threshold: The threshold applied before computing connected components.
        min_size: The minimum size of a segmented object to be kept.
        prediction: The array for storing the prediction.
            If given, this can be a numpy array, a zarr array, or similar.
            If not given, the prediction will be stored in a temporary n5 array.
        verbose: Whether to print timing information.
        mask: An optional mask to restrict the segmentation. Currently not implemented.
    """
    if mask is not None:
        raise NotImplementedError
    assert model.out_channels == 2

    # Create a temporary directory for storing the predictions.
    chunks = (128,) * 3
    with tempfile.TemporaryDirectory() as tmp_dir:

        if scale is None or np.allclose(scale, 1.0, atol=1e-3):
            original_shape = None
        else:
            original_shape = input_.shape
            new_shape = tuple(int(sh * sc) for sh, sc in zip(input_.shape, scale))
            input_ = ResizedVolume(input_, shape=new_shape, order=1)

        if prediction is None:
            # Create the dataset for storing the prediction.
            tmp_pred = os.path.join(tmp_dir, "prediction.n5")
            f = open_file(tmp_pred, mode="a")
            pred_shape = (2,) + input_.shape
            pred_chunks = (1,) + chunks
            prediction = f.create_dataset("pred", shape=pred_shape, dtype="float32", chunks=pred_chunks)
        else:
            assert prediction.shape[0] == 2
            assert prediction.shape[1:] == input_.shape

        # Create temporary storage for the seeds.
        tmp_seeds = os.path.join(tmp_dir, "seeds.n5")
        f = open_file(tmp_seeds, mode="a")
        seeds = f.create_dataset("seeds", shape=input_.shape, dtype="uint64", chunks=chunks)

        # Run prediction and segmentation.
        get_prediction(input_, prediction=prediction, tiling=tiling, model=model, verbose=verbose)
        _run_segmentation(prediction, output, seeds, chunks, seed_threshold, min_size, verbose, original_shape)
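A possible way to call the new scalable segmentation on a large volume, as a sketch under stated assumptions: the module path synapse_net.inference.scalable_segmentation is a guess (the new file's path is not shown in this view), and the zarr container with a "raw" dataset is hypothetical:

import zarr

from synapse_net.inference.inference import get_model
from synapse_net.inference.scalable_segmentation import scalable_segmentation  # assumed module path

f = zarr.open("tomogram.zarr", mode="a")  # hypothetical container with a "raw" dataset
input_ = f["raw"]
output = f.create_dataset(
    "compartments", shape=input_.shape, dtype="uint64", chunks=(128, 128, 128), overwrite=True
)

model = get_model("compartments")
# Downscale by 2x before prediction; the segmentation is resized back to the input shape,
# and the prediction itself is kept in a temporary n5 file.
scalable_segmentation(input_, output, model, scale=[0.5, 0.5, 0.5], min_size=500)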
