computational-cell-analytics
diff --git a/‎scripts/cooper/revision/assort_new_az_data.py‎
Lines changed: 210 additions & 0 deletions b/‎scripts/cooper/revision/assort_new_az_data.py‎
Lines changed: 210 additions & 0 deletions
diff --git a/‎scripts/cooper/revision/check_training_data.py‎
Lines changed: 37 additions & 0 deletions b/‎scripts/cooper/revision/check_training_data.py‎
Lines changed: 37 additions & 0 deletions
diff --git a/‎scripts/cooper/revision/eval_AZ.sh‎
Lines changed: 8 additions & 0 deletions b/‎scripts/cooper/revision/eval_AZ.sh‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎scripts/cooper/revision/evaluate_result.py‎
Lines changed: 48 additions & 0 deletions b/‎scripts/cooper/revision/evaluate_result.py‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎scripts/cooper/revision/prediction.py‎
Lines changed: 90 additions & 0 deletions b/‎scripts/cooper/revision/prediction.py‎
Lines changed: 90 additions & 0 deletions
@@ -0,0 +1,210 @@
+import os
+from glob import glob
+
+import h5py
+import numpy as np
+from tqdm import tqdm
+from skimage.transform import resize
+
+ROOT = "/mnt/ceph-hdd/cold_store/projects/nim00007/AZ_data/training_data"  # input: h5 files read for "raw" and "labels/az"
+INTER_ROOT = "/mnt/ceph-hdd/cold_store/projects/nim00007/AZ_predictions"  # input: h5 files read for "labels/az_thin2"
+OUTPUT_ROOT = "/mnt/ceph-hdd/cold_store/projects/nim00007/new_AZ_train_data"  # output: one sub-folder per assorted dataset
+
+
+def _check_data(files, label_folder, check_thinned):
+    for ff in files:
+        with h5py.File(ff, "r") as f:
+            shape = f["raw"].shape
+            az = f["labels/az"][:]
+        n_az = az.max()
+
+        if check_thinned:
+            label_file = os.path.join(label_folder, os.path.basename(ff))
+            with h5py.File(label_file, "r") as f:
+                az_thin = f["labels/az_thin2"][:]
+            n_az_thin = az_thin.max()
+        else:
+            n_az_thin = None
+
+        print(os.path.basename(ff), ":", shape, ":", n_az, ":", n_az_thin)
+
+
+def assort_tem():
+    old_name = "01data_withoutInvertedFiles_minusSVseg_corrected"
+    new_name = "tem"
+
+    raw_folder = os.path.join(ROOT, old_name)
+    label_folder = os.path.join(INTER_ROOT, old_name)
+    output_folder = os.path.join(OUTPUT_ROOT, new_name)
+    os.makedirs(output_folder, exist_ok=True)
+
+    files = glob(os.path.join(raw_folder, "*.h5"))
+    for ff in tqdm(files):
+        with h5py.File(ff, "r") as f:
+            raw = f["raw"][:]
+            az = f["labels/az"][:]
+
+        label_path = os.path.join(label_folder, os.path.basename(ff))
+        with h5py.File(label_path, "r") as f:
+            az_thin = f["labels/az_thin2"][:]
+
+        z_range1 = np.where(az != 0)[0]
+        z_range2 = np.where(az != 0)[0]
+        z_range = slice(
+            np.min(np.concatenate([z_range1, z_range2])),
+            np.max(np.concatenate([z_range1, z_range2])) + 1,
+        )
+        raw, az, az_thin = raw[z_range], az[z_range], az_thin[z_range]
+
+        out_path = os.path.join(output_folder, os.path.basename(ff))
+        with h5py.File(out_path, "a") as f:
+            f.create_dataset("raw", data=raw, compression="lzf")
+            f.create_dataset("labels/az_thin", data=az_thin, compression="lzf")
+            f.create_dataset("labels/az", data=az, compression="lzf")
+
+
+def assort_chemical_fixation():
+    old_name = "12_chemical_fix_cryopreparation_minusSVseg_corrected"
+    new_name = "chemical_fixation"
+
+    raw_folder = os.path.join(ROOT, old_name)
+    label_folder = os.path.join(INTER_ROOT, old_name)
+    output_folder = os.path.join(OUTPUT_ROOT, new_name)
+    os.makedirs(output_folder, exist_ok=True)
+
+    label_key = "labels/az_thin2"
+
+    files = glob(os.path.join(raw_folder, "*.h5"))
+    for ff in tqdm(files):
+        with h5py.File(ff, "r") as f:
+            raw = f["raw"][:]
+            az = f["labels/az"][:]
+
+        label_path = os.path.join(label_folder, os.path.basename(ff))
+        with h5py.File(label_path, "r") as f:
+            az_thin = f[label_key][:]
+
+        z_range1 = np.where(az != 0)[0]
+        z_range2 = np.where(az != 0)[0]
+        z_range = slice(
+            np.min(np.concatenate([z_range1, z_range2])),
+            np.max(np.concatenate([z_range1, z_range2])) + 1,
+        )
+        raw, az, az_thin = raw[z_range], az[z_range], az_thin[z_range]
+
+        out_path = os.path.join(output_folder, os.path.basename(ff))
+        with h5py.File(out_path, "a") as f:
+            f.create_dataset("raw", data=raw, compression="lzf")
+            f.create_dataset("labels/az_thin", data=az_thin, compression="lzf")
+            f.create_dataset("labels/az", data=az, compression="lzf")
+
+
+def assort_stem():
+    old_names = [
+        "04_hoi_stem_examples_fidi_and_sarah_corrected",
+        "04_hoi_stem_examples_minusSVseg_cropped_corrected",
+        "06_hoi_wt_stem750_fm_minusSVseg_cropped_corrected",
+    ]
+    new_names = ["stem", "stem_cropped", "stem_cropped"]
+    for old_name, new_name in zip(old_names, new_names):
+        print(old_name)
+        raw_folder = os.path.join(ROOT, f"{old_name}_rescaled_tomograms")
+        label_folder = os.path.join(INTER_ROOT, old_name)
+        files = glob(os.path.join(raw_folder, "*.h5"))
+
+        # _check_data(files, label_folder, check_thinned=True)
+        # continue
+
+        output_folder = os.path.join(OUTPUT_ROOT, new_name)
+        os.makedirs(output_folder, exist_ok=True)
+        for ff in tqdm(files):
+            with h5py.File(ff, "r") as f:
+                raw = f["raw"][:]
+                az = f["labels/az"][:]
+
+            label_path = os.path.join(label_folder, os.path.basename(ff))
+            with h5py.File(label_path, "r") as f:
+                az_thin = f["labels/az_thin2"][:]
+            az_thin = resize(az_thin, az.shape, order=0, anti_aliasing=False, preserve_range=True).astype(az_thin.dtype)
+            assert az_thin.shape == az.shape
+
+            out_path = os.path.join(output_folder, os.path.basename(ff))
+            with h5py.File(out_path, "a") as f:
+                f.create_dataset("raw", data=raw, compression="lzf")
+                f.create_dataset("labels/az_thin", data=az_thin, compression="lzf")
+                f.create_dataset("labels/az", data=az, compression="lzf")
+
+
+def assort_wichmann():
+    old_name = "wichmann_withAZ_rescaled_tomograms"
+    new_name = "endbulb_of_held"
+
+    raw_folder = os.path.join(ROOT, old_name)
+    output_folder = os.path.join(OUTPUT_ROOT, new_name)
+    os.makedirs(output_folder, exist_ok=True)
+
+    files = glob(os.path.join(raw_folder, "*.h5"))
+
+    output_folder = os.path.join(OUTPUT_ROOT, new_name)
+    os.makedirs(output_folder, exist_ok=True)
+    for ff in tqdm(files):
+        with h5py.File(ff, "r") as f:
+            raw = f["raw"][:]
+            az = f["labels/az"][:]
+
+        output_file = os.path.join(output_folder, os.path.basename(ff))
+        with h5py.File(output_file, "a") as f:
+            f.create_dataset("raw", data=raw, compression="lzf")
+            f.create_dataset("labels/az", data=az, compression="lzf")
+            f.create_dataset("labels/az_thin", data=az, compression="lzf")
+
+
+def crop_wichmann():
+    input_name = "endbulb_of_held"
+    output_name = "endbulb_of_held_cropped"
+
+    input_folder = os.path.join(OUTPUT_ROOT, input_name)
+    output_folder = os.path.join(OUTPUT_ROOT, output_name)
+    os.makedirs(output_folder, exist_ok=True)
+    files = glob(os.path.join(input_folder, "*.h5"))
+
+    min_shape = (32, 512, 512)
+
+    for ff in tqdm(files):
+        with h5py.File(ff, "r") as f:
+            az = f["labels/az"][:]
+            bb = np.where(az != 0)
+            bb = tuple(slice(int(b.min()), int(b.max()) + 1) for b in bb)
+            pad_width = [max(sh - (b.stop - b.start), 0) // 2 for b, sh in zip(bb, min_shape)]
+            bb = tuple(
+                slice(max(b.start - pw, 0), min(b.stop + pw, sh)) for b, pw, sh in zip(bb, pad_width, az.shape)
+            )
+            az = az[bb]
+            raw = f["raw"][bb]
+
+        # import napari
+        # v = napari.Viewer()
+        # v.add_image(raw)
+        # v.add_labels(az)
+        # v.add_labels(az_thin)
+        # napari.run()
+
+        output_path = os.path.join(output_folder, os.path.basename(ff).replace(".h5", "_cropped.h5"))
+        with h5py.File(output_path, "a") as f:
+            f.create_dataset("raw", data=raw, compression="lzf")
+            f.create_dataset("labels/az", data=az, compression="lzf")
+            f.create_dataset("labels/az_thin", data=az, compression="lzf")
+
+
+def main():
+    # assort_tem()
+    # assort_chemical_fixation()
+
+    # assort_stem()
+
+    # assort_wichmann()
+    crop_wichmann()
+
+
+if __name__ == "__main__":
+    main()
@@ -0,0 +1,37 @@
+import argparse
+import os
+from glob import glob
+
+import napari
+import h5py
+
+ROOT = "/mnt/ceph-hdd/cold_store/projects/nim00007/new_AZ_train_data"
+all_names = [
+    "chemical_fixation",
+    "tem",
+    "stem",
+    "stem_cropped",
+    "endbulb_of_held",
+    "endbulb_of_held_cropped",
+]
+
+
+parser = argparse.ArgumentParser()
+parser.add_argument("-n", "--names", nargs="+", default=all_names)
+args = parser.parse_args()
+names = args.names
+
+
+for ds in names:
+    paths = glob(os.path.join(ROOT, ds, "*.h5"))
+    for p in paths:
+        with h5py.File(p, "r") as f:
+            raw = f["raw"][:]
+            az = f["labels/az"][:]
+            az_thin = f["labels/az_thin"][:]
+        v = napari.Viewer()
+        v.add_image(raw)
+        v.add_labels(az)
+        v.add_labels(az_thin)
+        v.title = os.path.basename(p)
+        napari.run()
@@ -0,0 +1,8 @@
+python run_az_evaluation.py \
+    -s /mnt/ceph-hdd/cold_store/projects/nim00007/AZ_data/segmentations \
+    -g /mnt/ceph-hdd/cold_store/projects/nim00007/AZ_data/training_data \
+    --seg_key /AZ/segment_from_AZmodel_TEM_STEM_ChemFix_v1 \
+    --criterion iop \
+    -o v1
+    # --dataset 01 \
+    # --seg_key AZ/segment_from_AZmodel_TEM_STEM_ChemFix_wichmann_v2 \
@@ -0,0 +1,48 @@
+import argparse
+import pandas as pd
+
+parser = argparse.ArgumentParser()
+parser.add_argument("result_path")  # path of the spreadsheet that is loaded with pd.read_excel below
+args = parser.parse_args()
+
+results = pd.read_excel(args.result_path)  # the columns dataset, dice, tp, fp and fn are used further down
+
+
+def summarize_results(res):
+    print("Dice-Score:", res["dice"].mean(), "+-", res["dice"].std())
+    tp, fp, fn = float(res["tp"].sum()), float(res["fp"].sum()), float(res["fn"].sum())
+    precision = tp / (tp + fp)
+    recall = tp / (tp + fn)
+    f1_score = 2 * tp / (2 * tp + fn + fp)
+    print("Precision:", precision)
+    print("Recall:", recall)
+    print("F1-Score:", f1_score)
+
+
+# # Compute the results for Chemical Fixation.
+results_chem_fix = results[results.dataset.str.startswith("12")]
+if results_chem_fix.size > 0:
+    print("Chemical Fixation Results:")
+    summarize_results(results_chem_fix)
+#
+# # Compute the results for STEM (=04).
+results_stem = results[results.dataset.str.startswith(("04", "06"))]
+if results_stem.size > 0:
+    print()
+    print("STEM Results:")
+    summarize_results(results_stem)
+#
+# # Compute the results for TEM (=01).
+results_tem = results[results.dataset.str.startswith("01")]
+if results_tem.size > 0:
+    print()
+    print("TEM Results:")
+    summarize_results(results_tem)
+
+#
+# Compute the results for Wichmann.
+results_wichmann = results[results.dataset.str.startswith("wichmann")]
+if results_wichmann.size > 0:
+    print()
+    print("Wichmann Results:")
+    summarize_results(results_wichmann)
@@ -0,0 +1,90 @@
+import os
+from glob import glob
+
+import h5py
+from synapse_net.inference.inference import get_model, compute_scale_from_voxel_size
+from synapse_net.inference.compartments import segment_compartments
+from synapse_net.inference.vesicles import segment_vesicles
+from tqdm import tqdm
+
+ROOT = "/mnt/ceph-hdd/cold_store/projects/nim00007/AZ_data/training_data"  # searched recursively for *.h5 input files
+OUTPUT_ROOT = "/mnt/ceph-hdd/cold_store/projects/nim00007/AZ_predictions"  # results go to <OUTPUT_ROOT>/<input folder name>/<file name>
+RESOLUTIONS = {  # voxel size per input folder name, passed to compute_scale_from_voxel_size; unit presumably nm - TODO confirm
+    "01data_withoutInvertedFiles_minusSVseg_corrected": {"x": 1.554, "y": 1.554, "z": 1.554},
+    "04_hoi_stem_examples_fidi_and_sarah_corrected": {"x": 0.8681, "y": 0.8681, "z": 0.8681},
+    "04_hoi_stem_examples_fidi_and_sarah_corrected_rescaled_tomograms": {"x": 1.554, "y": 1.554, "z": 1.554},
+    "04_hoi_stem_examples_minusSVseg_cropped_corrected": {"x": 0.8681, "y": 0.8681, "z": 0.8681},
+    "04_hoi_stem_examples_minusSVseg_cropped_corrected_rescaled_tomograms": {"x": 1.554, "y": 1.554, "z": 1.554},
+    "06_hoi_wt_stem750_fm_minusSVseg_cropped_corrected": {"x": 0.8681, "y": 0.8681, "z": 0.8681},
+    "06_hoi_wt_stem750_fm_minusSVseg_cropped_corrected_rescaled_tomograms": {"x": 1.554, "y": 1.554, "z": 1.554},
+    "12_chemical_fix_cryopreparation_minusSVseg_corrected": {"x": 1.554, "y": 1.554, "z": 1.554},
+    "wichmann_withAZ": {"x": 1.748, "y": 1.748, "z": 1.748},
+    "wichmann_withAZ_rescaled_tomograms": {"x": 1.554, "y": 1.554, "z": 1.554},
+}
+
+
+def predict_boundaries(model, path, output_path):
+    output_key = "predictions/boundaries"
+    if os.path.exists(output_path):
+        with h5py.File(output_path, "r") as f:
+            if output_key in f:
+                return
+
+    dataset = os.path.basename(os.path.split(path)[0])
+
+    with h5py.File(path, "r") as f:
+        data = f["raw"][:]
+    scale = compute_scale_from_voxel_size(RESOLUTIONS[dataset], "compartments")
+    _, pred = segment_compartments(data, model=model, scale=scale, verbose=False, return_predictions=True)
+    with h5py.File(output_path, "a") as f:
+        f.create_dataset(output_key, data=pred, compression="lzf")
+
+
+def predict_all_boundaries():
+    model = get_model("compartments")
+    files = sorted(glob(os.path.join(ROOT, "**/*.h5"), recursive=True))
+    for path in tqdm(files):
+        folder_name = os.path.basename(os.path.split(path)[0])
+        output_folder = os.path.join(OUTPUT_ROOT, folder_name)
+        os.makedirs(output_folder, exist_ok=True)
+        output_path = os.path.join(output_folder, os.path.basename(path))
+        predict_boundaries(model, path, output_path)
+
+
+def predict_vesicles(model, path, output_path):
+    output_key = "predictions/vesicle_seg"
+    if os.path.exists(output_path):
+        with h5py.File(output_path, "r") as f:
+            if output_key in f:
+                return
+
+    dataset = os.path.basename(os.path.split(path)[0])
+    if "rescaled" in dataset:
+        return
+
+    with h5py.File(path, "r") as f:
+        data = f["raw"][:]
+    scale = compute_scale_from_voxel_size(RESOLUTIONS[dataset], "vesicles_3d")
+    seg = segment_vesicles(data, model=model, scale=scale, verbose=False)
+    with h5py.File(output_path, "a") as f:
+        f.create_dataset(output_key, data=seg, compression="lzf")
+
+
+def predict_all_vesicles():
+    model = get_model("vesicles_3d")
+    files = sorted(glob(os.path.join(ROOT, "**/*.h5"), recursive=True))
+    for path in tqdm(files):
+        folder_name = os.path.basename(os.path.split(path)[0])
+        output_folder = os.path.join(OUTPUT_ROOT, folder_name)
+        os.makedirs(output_folder, exist_ok=True)
+        output_path = os.path.join(output_folder, os.path.basename(path))
+        predict_vesicles(model, path, output_path)
+
+
+def main():
+    # predict_all_boundaries()
+    predict_all_vesicles()
+
+
+if __name__ == "__main__":
+    main()