Initial evaluation for NIS3D nucleus segmentation

schilling40 · schilling40 · commit f1098871f6fb · 2025-07-31T14:30:48.000+02:00
diff --git a/scripts/baselines/NIS3D_apply.py b/scripts/baselines/NIS3D_apply.py
@@ -0,0 +1,46 @@
+import os
+import sys
+# Apply the trained distance U-Net to the test images by calling the prediction script's main() in-process.
+script_dir = "/user/schilling40/u15000/flamingo-tools/scripts/prediction"
+sys.path.append(script_dir)
+# The import has to come after the sys.path change above.
+import run_prediction_distance_unet
+# Location of the trained model that is passed to the prediction script via --model.
+checkpoint_dir = "/mnt/vast-nhr/projects/nim00007/data/moser/cochlea-lightsheet/trained_models/nucleus"
+model_name = "NIS3D_supervised_2025-07-17"
+model_dir = os.path.join(checkpoint_dir, model_name)
+checkpoint = os.path.join(checkpoint_dir, model_name, "best.pt")  # NOTE(review): not referenced again in this script
+
+cochlea_dir = "/mnt/vast-nhr/projects/nim00007/data/moser/cochlea-lightsheet"
+# Folder that is scanned for the input images.
+image_dir = "/mnt/vast-nhr/projects/nim00007/data/moser/cochlea-lightsheet/training_data/nucleus/2025-07_NIS3D/test"
+
+out_dir = os.path.join(cochlea_dir, "predictions", "val_nucleus", "distance_unet_NIS3D")  # /distance_unet
+# Options forwarded to the prediction script.
+boundary_distance_threshold = 0.5
+seg_class = "ihc"  # NOTE(review): "ihc" is used for a nucleus model, confirm this is intended
+
+block_shape = (128, 128, 128)
+halo = (16, 32, 32)
+# Both tuples are passed as comma-separated text, wrapped in brackets when the arguments are built.
+block_shape_str = ",".join([str(b) for b in block_shape])
+halo_str = ",".join([str(h) for h in halo])
+# Only regular files whose path contains "iitest.tif" are processed.
+images = [entry.path for entry in os.scandir(image_dir) if entry.is_file() and "iitest.tif" in entry.path]
+# main() builds an argparse parser, so the command line is emulated by setting sys.argv before each call.
+for image in images:
+    sys.argv = [
+        os.path.join(script_dir, "run_prediction_distance_unet.py"),
+        f"--input={image}",
+        f"--output_folder={out_dir}",
+        f"--model={model_dir}",
+        f"--block_shape=[{block_shape_str}]",
+        f"--halo=[{halo_str}]",
+        "--memory",
+        "--time",
+        "--no_masking",
+        f"--seg_class={seg_class}",
+        f"--boundary_distance_threshold={boundary_distance_threshold}"
+    ]
+
+    run_prediction_distance_unet.main()
diff --git a/scripts/baselines/NIS3D_eval.py b/scripts/baselines/NIS3D_eval.py
@@ -0,0 +1,160 @@
+import argparse
+import json
+import multiprocessing as mp
+import os
+from concurrent import futures
+from typing import List
+
+import numpy as np
+import tifffile
+from tqdm import tqdm
+
+GT_DIR = "/mnt/vast-nhr/projects/nim00007/data/moser/cochlea-lightsheet/training_data/nucleus/2025-07_NIS3D/test"
+PRED_DIR = "/mnt/vast-nhr/projects/nim00007/data/moser/cochlea-lightsheet/predictions/val_nucleus/distance_unet_NIS3D"
+
+
+def find_overlapping_masks(
+    arr_base: np.ndarray,
+    arr_ref: np.ndarray,
+    label_id_base: int,
+    min_overlap: float = 0.5,
+) -> List[int]:
+    """Return the non-zero labels of `arr_ref` whose masks lie, by a fraction of at least
+    `min_overlap`, inside the region of `arr_base` equal to `label_id_base`.
+
+    Label 0 of `arr_ref` is treated as background and never reported.
+    """
+    arr_base_undefined = arr_base == label_id_base
+
+    # Count voxels per label once for the whole array and once inside the region,
+    # instead of rescanning the full array for every label.
+    ref_ids, ref_sizes = np.unique(arr_ref, return_counts=True)
+    hit_ids, hit_sizes = np.unique(arr_ref[arr_base_undefined], return_counts=True)
+    hits = dict(zip(hit_ids.tolist(), hit_sizes.tolist()))
+
+    # Exclude the background by value; cutting off the first unique entry drops a real label if 0 is absent.
+    sizes = zip(ref_ids.tolist(), ref_sizes.tolist())
+    return [i for i, size in sizes if i != 0 and hits.get(i, 0) / size >= min_overlap]
+
+
+def find_matching_masks(arr_gt, arr_ref, out_path, labels_undefined_mask=None):
+    """For each instance in the reference array, the corresponding mask of the ground truth array,
+    which has the biggest overlap, is identified and the matches are written to a JSON file.
+
+    Label 0 is treated as background in both arrays. Reference instances that only overlap
+    background are left out of the output.
+
+    Args:
+        arr_gt: Label array in which the best matching instance is searched.
+        arr_ref: Label array whose instances are matched; must have the same shape as arr_gt.
+        out_path: Output path for saving dictionary.
+        labels_undefined_mask: Labels of the reference array to exclude. Defaults to none.
+    """
+    # Use a set for O(1) exclusion checks; None avoids a shared mutable default argument.
+    excluded = set() if labels_undefined_mask is None else {int(i) for i in labels_undefined_mask}
+
+    # Remove the background by value: dropping the first unique entry would lose a real label
+    # whenever the array (or the voxels under a mask) contains no 0.
+    seg_ids_ref = [int(i) for i in np.unique(arr_ref) if i != 0]
+    print(f"total number of segmentation masks: {len(seg_ids_ref)}")
+    seg_ids_ref = [s for s in seg_ids_ref if s not in excluded]
+    print(f"number of segmentation masks after filtering undefined masks: {len(seg_ids_ref)}")
+
+    def compute_overlap(ref_id):
+        """Identify ID of segmentation mask with biggest overlap.
+        Return matched IDs and overlap, or None if only background is covered.
+        """
+        # Labels of arr_gt under the reference mask and how many voxels each one covers.
+        gt_under_mask = arr_gt[arr_ref == ref_id]
+        seg_ids_gt, counts = np.unique(gt_under_mask, return_counts=True)
+        is_instance = seg_ids_gt != 0
+        seg_ids_gt, counts = seg_ids_gt[is_instance], counts[is_instance]
+        if seg_ids_gt.size == 0:
+            return None
+
+        # argmax returns the first maximum, i.e. the smallest ID wins a tie.
+        best = int(np.argmax(counts))
+        return {
+            "ref_id": ref_id,
+            "gt_id": int(seg_ids_gt[best]),
+            "overlap": float(counts[best] / gt_under_mask.size),
+        }
+
+    n_threads = min(16, mp.cpu_count())
+    print(f"Parallelizing with {n_threads} Threads.")
+    with futures.ThreadPoolExecutor(n_threads) as pool:
+        results = list(tqdm(pool.map(compute_overlap, seg_ids_ref), total=len(seg_ids_ref)))
+
+    # Keyed by reference ID; json.dump stores the integer keys as strings.
+    matching_masks = {r['ref_id']: r for r in results if r is not None}
+
+    with open(out_path, "w") as f:
+        json.dump(matching_masks, f, indent='\t', separators=(',', ': '))
+
+
+def filter_true_positives(output_folder, prefixes, force_overwrite):
+    """Write the overlap-based matching dictionaries between prediction and ground truth.
+    For every prefix two JSON files are created: the best ground truth match for each
+    segmentation instance and the best segmentation match for each ground truth label.
+    Existing files are kept unless force_overwrite is set.
+
+    Args:
+        output_folder: Output folder for dictionaries. It is created if it does not exist.
+        prefixes: Prefixes to evaluate, out of ["Drosophila", "MusMusculus", "Zebrafish"]. None selects all three.
+        force_overwrite: Flag for forced overwrite of existing output files.
+    """
+    # PRED_DIR and GT_DIR are module-level constants; bind them directly so that a missing
+    # constant fails with a clear NameError. Create the output folder before any expensive work.
+    pred_dir, gt_dir = PRED_DIR, GT_DIR
+    os.makedirs(output_folder or ".", exist_ok=True)
+
+    if prefixes is None:
+        prefixes = ["Drosophila", "MusMusculus", "Zebrafish"]
+
+    for prefix in prefixes:
+        conf_file = os.path.join(gt_dir, f"{prefix}_1_iitest_confidence.tif")
+        annot_file = os.path.join(gt_dir, f"{prefix}_1_iitest_annotations.tif")
+        conf_arr = tifffile.imread(conf_file)
+        gt_arr = tifffile.imread(annot_file)
+
+        seg_file = os.path.join(pred_dir, f"{prefix}_1_iitest_seg.tif")
+        seg_arr = tifffile.imread(seg_file)
+
+        # find largest overlap of ground truth mask with each segmentation instance
+        out_path = os.path.join(output_folder, f"{prefix}_matching_ref_gt.json")
+        if os.path.isfile(out_path) and not force_overwrite:
+            print(f"Skipping the creation of {out_path}. File already exists.")
+        else:
+            # exclude detections with at least 50% of their pixels in the undefined category (value 1)
+            if np.any(conf_arr == 1):
+                labels_undefined_mask = find_overlapping_masks(conf_arr, seg_arr, label_id_base=1)
+            else:
+                labels_undefined_mask = []
+                print("Array does not contain undefined mask")
+
+            find_matching_masks(gt_arr, seg_arr, out_path, labels_undefined_mask=labels_undefined_mask)
+
+        # find largest overlap of segmentation instance with each ground truth mask
+        out_path = os.path.join(output_folder, f"{prefix}_matching_gt_ref.json")
+        if os.path.isfile(out_path) and not force_overwrite:
+            print(f"Skipping the creation of {out_path}. File already exists.")
+        else:
+            find_matching_masks(seg_arr, gt_arr, out_path)
+
+
+def main():
+    """Command line entry point: parse the arguments and run the mask matching."""
+    cli = argparse.ArgumentParser()
+    cli.add_argument("--output_folder", "-o", required=True)
+    cli.add_argument("--prefix", "-p", nargs="+", type=str, default=None)
+    cli.add_argument("--force", action="store_true", help="Forcefully overwrite output.")
+    options = cli.parse_args()
+
+    # --prefix stays None when it is not given on the command line.
+    filter_true_positives(
+        options.output_folder, options.prefix, options.force,
+    )
+
+
+if __name__ == "__main__":
+    main()
diff --git a/scripts/baselines/NIS3D_preprocessing.py b/scripts/baselines/NIS3D_preprocessing.py
diff --git a/scripts/baselines/NIS3D_train.sh b/scripts/baselines/NIS3D_train.sh
@@ -0,0 +1,10 @@
+#!/bin/bash
+# Train a distance U-Net with the data below IDIR; the model is registered under MODEL_NAME.
+export MODEL_NAME="nucleus_NIS3D_supervised_2025-07-17"
+
+export IDIR=/mnt/vast-nhr/projects/nim00007/data/moser/cochlea-lightsheet/training_data/nucleus/2025-07_NIS3D
+
+export SCRIPT_DIR=/user/schilling40/u15000/flamingo-tools/scripts/training
+# Quote the expansions so that paths with spaces or glob characters stay single arguments.
+python "$SCRIPT_DIR/train_distance_unet.py" -i "$IDIR" --name "$MODEL_NAME"
+
diff --git a/scripts/baselines/eval_baseline.py b/scripts/baselines/eval_baseline.py
@@ -154,7 +154,8 @@ def print_accuracy(eval_dir):
             recall = 0
         if precision + recall != 0:
             f1_score = 2 * precision * recall / (precision + recall)
-        else: f1_score = 0
+        else:
+            f1_score = 0
 
         precision_list.append(precision)
         recall_list.append(recall)
@@ -198,9 +199,9 @@ def print_accuracy_ihc():
 
 
 def main():
-    #eval_all_sgn()
-    #eval_all_ihc()
-    #print_accuracy_sgn()
+    eval_all_sgn()
+    eval_all_ihc()
+    print_accuracy_sgn()
     print_accuracy_ihc()
 
 
diff --git a/scripts/prediction/run_prediction_distance_unet.py b/scripts/prediction/run_prediction_distance_unet.py
@@ -27,6 +27,7 @@ def main():
     parser.add_argument("--halo", default=None, type=str)
     parser.add_argument("--memory", action="store_true", help="Perform prediction in memory and save output as tif.")
     parser.add_argument("--time", action="store_true", help="Time prediction process.")
+    parser.add_argument("--no_masking", action="store_true", help="Do not mask input.")
     parser.add_argument("--seg_class", default=None, type=str,
                         help="Segmentation class to load parameters for masking input.")
     parser.add_argument("--center_distance_threshold", default=0.4, type=float,
@@ -67,6 +68,8 @@ def main():
     else:
         halo = tuple(json.loads(args.halo))
 
+    use_mask = not args.no_masking  # logical negation: `~` on a bool yields -1 or -2, which are both truthy
+
     if args.time:
         start = time.perf_counter()
 
@@ -75,6 +78,7 @@ def main():
             args.input, args.input_key, output_folder=None, model_path=args.model,
             scale=scale, min_size=min_size,
             block_shape=block_shape, halo=halo,
+            use_mask=use_mask,
             seg_class=args.seg_class,
             center_distance_threshold=args.center_distance_threshold,
             boundary_distance_threshold=args.boundary_distance_threshold,
@@ -92,6 +96,7 @@ def main():
             args.input, args.input_key, output_folder=args.output_folder, model_path=args.model,
             scale=scale, min_size=min_size,
             block_shape=block_shape, halo=halo,
+            use_mask=use_mask,
             seg_class=args.seg_class,
             center_distance_threshold=args.center_distance_threshold,
             boundary_distance_threshold=args.boundary_distance_threshold,