Refactor state precomputation

constantinpape · constantinpape · commit ed8865ee4ada · 2023-08-17T21:31:50.000+02:00
diff --git a/micro_sam/instance_segmentation.py b/micro_sam/instance_segmentation.py
@@ -1091,6 +1091,35 @@ def set_state(self, state: Dict[str, Any]) -> None:
         super().set_state(state)
 
 
+def get_amg(
+    predictor: SamPredictor,
+    is_tiled: bool,
+    embedding_based_amg: bool = False,
+    **kwargs,
+) -> AMGBase:
+    """Create the automatic mask generator for the requested configuration.
+
+    Args:
+        predictor: The segment anything predictor.
+        is_tiled: Whether tiled embeddings are used. Selects the tiled generator classes.
+        embedding_based_amg: Whether to use the embedding based mask generators.
+            This functionality is still experimental and triggers a warning.
+        kwargs: Keyword arguments that are forwarded to the mask generator class.
+
+    Returns:
+        The newly created automatic mask generator.
+    """
+    if embedding_based_amg:
+        warnings.warn("The embedding based instance segmentation functionality is experimental.")
+    # Choose the generator class first; both class families are constructed
+    # in the same way from the predictor and the forwarded keyword arguments.
+    if is_tiled:
+        amg_class = TiledEmbeddingMaskGenerator if embedding_based_amg else TiledAutomaticMaskGenerator
+    else:
+        amg_class = EmbeddingMaskGenerator if embedding_based_amg else AutomaticMaskGenerator
+    return amg_class(predictor, **kwargs)
+
+
 #
 # Experimental functionality
 #
diff --git a/micro_sam/precompute_state.py b/micro_sam/precompute_state.py
@@ -0,0 +1,157 @@
+import os
+import pickle
+
+from glob import glob
+from pathlib import Path
+from typing import Optional, Tuple, Union
+
+import numpy as np
+from segment_anything.predictor import SamPredictor
+from tqdm import tqdm
+
+from . import instance_segmentation, util
+
+
+def cache_amg_state(
+    predictor: SamPredictor,
+    raw: np.ndarray,
+    image_embeddings: util.ImageEmbeddings,
+    save_path: Union[str, os.PathLike],
+    verbose: bool = True,
+    **kwargs,
+) -> instance_segmentation.AMGBase:
+    """Return an automatic mask generator whose state is loaded from or written to a cache file.
+
+    Args:
+        predictor: The segment anything predictor.
+        raw: The image data. Only used if the state has to be computed.
+        image_embeddings: The image embeddings.
+        save_path: The embedding save path. The AMG state is cached in <save_path>/amg_state.pickle.
+        verbose: Whether to print progress messages and run the computation verbose.
+        kwargs: The keyword arguments for the amg class.
+
+    Returns:
+        The automatic mask generator with the loaded or freshly computed state.
+    """
+    tiled = image_embeddings["input_size"] is None
+    amg = instance_segmentation.get_amg(predictor, tiled, **kwargs)
+    state_file = os.path.join(save_path, "amg_state.pickle")
+
+    if os.path.exists(state_file):
+        # A cached state exists: restore it instead of recomputing.
+        # NOTE: unpickling can run arbitrary code; only use trusted state files.
+        if verbose:
+            print("Load the AMG state from", state_file)
+        with open(state_file, "rb") as f:
+            cached_state = pickle.load(f)
+        amg.set_state(cached_state)
+    else:
+        if verbose:
+            print("Precomputing the state for instance segmentation.")
+        amg.initialize(raw, image_embeddings=image_embeddings, verbose=verbose)
+        with open(state_file, "wb") as f:
+            pickle.dump(amg.get_state(), f)
+    return amg
+
+
+def _precompute_state_for_file(
+    predictor, input_path, output_path, key, ndim, tile_shape, halo, precompute_amg_state,
+):
+    image = util.load_image_data(input_path, key)
+    zarr_path = Path(output_path).with_suffix(".zarr")  # the output location always gets a .zarr suffix
+    image_embeddings = util.precompute_image_embeddings(
+        predictor, image, zarr_path, ndim=ndim, tile_shape=tile_shape, halo=halo,
+    )
+    if precompute_amg_state:  # optionally also cache the automatic mask generator state
+        cache_amg_state(predictor, image, image_embeddings, zarr_path, verbose=True)
+
+
+def _precompute_state_for_files(
+    predictor, input_files, output_path, ndim, tile_shape, halo, precompute_amg_state,
+):
+    """Precompute the state for each of the input files, saved under the file's name in `output_path`."""
+    os.makedirs(output_path, exist_ok=True)
+    shared_kwargs = dict(ndim=ndim, tile_shape=tile_shape, halo=halo, precompute_amg_state=precompute_amg_state)
+    for input_file in tqdm(input_files, desc="Precompute state for files."):
+        file_name = os.path.basename(input_file)
+        _precompute_state_for_file(
+            predictor, input_file, os.path.join(output_path, file_name), key=None, **shared_kwargs,
+        )
+
+
+def precompute_state(
+    input_path: Union[os.PathLike, str],
+    output_path: Union[os.PathLike, str],
+    model_type: str = util._DEFAULT_MODEL,
+    checkpoint_path: Optional[Union[os.PathLike, str]] = None,
+    key: Optional[str] = None,
+    ndim: Optional[int] = None,
+    tile_shape: Optional[Tuple[int, int]] = None,
+    halo: Optional[Tuple[int, int]] = None,
+    precompute_amg_state: bool = False,
+) -> None:
+    """Precompute the image embeddings and other optional state for the input image(s).
+
+    Args:
+        input_path: The input image file(s). Can either be a single image file (e.g. tif or png),
+            a container file (e.g. hdf5 or zarr) or a folder with image files.
+            In case of a container file the argument `key` must be given. In case of a folder
+            it can be given to provide a glob pattern to subselect files from the folder.
+        output_path: The output path where the embeddings and other state will be saved.
+        model_type: The SegmentAnything model to use. Defaults to `util._DEFAULT_MODEL`.
+        checkpoint_path: Path to a checkpoint for a custom model.
+        key: The key to the input file. This is needed for container files (e.g. hdf5 or zarr)
+            and can be used to provide a glob pattern if the input is a folder with image files.
+        ndim: The dimensionality of the data.
+        tile_shape: Shape of tiles for tiled prediction. By default prediction is run without tiling.
+        halo: Overlap of the tiles for tiled prediction.
+        precompute_amg_state: Whether to precompute the state for automatic instance segmentation
+            in addition to the image embeddings.
+    """
+    predictor = util.get_sam_model(model_type=model_type, checkpoint_path=checkpoint_path)
+    # A directory is treated as a folder with image files, unless it carries a .n5 or .zarr suffix.
+    if os.path.isdir(input_path) and Path(input_path).suffix not in (".n5", ".zarr"):
+        pattern = "*" if key is None else key
+        input_files = sorted(glob(os.path.join(input_path, pattern)))  # sorted for a reproducible order
+        _precompute_state_for_files(
+            predictor, input_files, output_path,
+            ndim=ndim, tile_shape=tile_shape, halo=halo,
+            precompute_amg_state=precompute_amg_state,
+        )
+    else:
+        _precompute_state_for_file(
+            predictor, input_path, output_path, key,
+            ndim=ndim, tile_shape=tile_shape, halo=halo,
+            precompute_amg_state=precompute_amg_state,
+        )
+
+
+def main():
+    """@private"""
+    # Command line interface for precomputing the embeddings and, optionally, the AMG state.
+    import argparse
+
+    parser = argparse.ArgumentParser(description="Compute the embeddings for an image.")
+    parser.add_argument("-i", "--input_path", required=True)
+    parser.add_argument("-o", "--output_path", required=True)
+    parser.add_argument("-m", "--model_type", default="vit_h")
+    parser.add_argument("-c", "--checkpoint_path", default=None)
+    parser.add_argument("-k", "--key")
+    parser.add_argument("--tile_shape", nargs="+", type=int, help="The tile shape for using tiled prediction")
+    parser.add_argument("--halo", nargs="+", type=int, help="The halo for using tiled prediction")
+    parser.add_argument("-n", "--ndim", type=int, help="The dimensionality of the data")  # int, not str
+    parser.add_argument(
+        "-p", "--precompute_amg_state", nargs="?", const=True, default=False,
+        type=lambda value: value.lower() not in ("", "0", "false", "no", "off"),  # "-p false" must be off
+        help="Also precompute the AMG state; use as a plain flag or pass an explicit true/false value",
+    )
+
+    args = parser.parse_args()
+    precompute_state(
+        args.input_path, args.output_path, args.model_type, args.checkpoint_path, key=args.key,
+        tile_shape=args.tile_shape, halo=args.halo, ndim=args.ndim, precompute_amg_state=args.precompute_amg_state,
+    )
+
+
+if __name__ == "__main__":
+    main()
diff --git a/micro_sam/sam_annotator/annotator_2d.py b/micro_sam/sam_annotator/annotator_2d.py
@@ -9,6 +9,7 @@
 from segment_anything import SamPredictor
 
 from .. import instance_segmentation, util
+from ..precompute_state import cache_amg_state
 from ..visualization import project_embeddings_for_visualization
 from . import util as vutil
 from .gui_utils import show_wrong_file_warning
@@ -57,7 +58,7 @@ def _autosegment_widget(
     global AMG
     is_tiled = IMAGE_EMBEDDINGS["input_size"] is None
     if AMG is None:
-        AMG = vutil.get_amg(PREDICTOR, is_tiled)
+        AMG = instance_segmentation.get_amg(PREDICTOR, is_tiled)
 
     if not AMG.is_initialized:
         AMG.initialize(v.layers["raw"].data, image_embeddings=IMAGE_EMBEDDINGS, verbose=True)
@@ -230,7 +231,7 @@ def annotator_2d(
         wrong_file_callback=show_wrong_file_warning
     )
     if precompute_amg_state and (embedding_path is not None):
-        AMG = vutil.cache_amg_state(PREDICTOR, raw, IMAGE_EMBEDDINGS, embedding_path)
+        AMG = cache_amg_state(PREDICTOR, raw, IMAGE_EMBEDDINGS, embedding_path)
 
     # we set the pre-computed image embeddings if we don't use tiling
     # (if we use tiling we cannot directly set it because the tile will be chosen dynamically)
diff --git a/micro_sam/sam_annotator/image_series_annotator.py b/micro_sam/sam_annotator/image_series_annotator.py
@@ -1,43 +1,19 @@
 import os
 import warnings
+
 from glob import glob
+from pathlib import Path
 from typing import List, Optional, Union
 
 import imageio.v3 as imageio
 import napari
 
 from magicgui import magicgui
-from napari.utils import progress as tqdm
 from segment_anything import SamPredictor
 
 from .. import util
+from ..precompute_state import _precompute_state_for_files
 from .annotator_2d import annotator_2d
-from .util import cache_amg_state
-
-
-def _precompute_embeddings_for_image_series(
-    predictor,
-    image_files,
-    embedding_root,
-    tile_shape,
-    halo,
-    precompute_amg_state,
-):
-    os.makedirs(embedding_root, exist_ok=True)
-    embedding_paths = []
-    for image_file in tqdm(image_files, desc="Precompute embeddings"):
-        fname = os.path.basename(image_file)
-        fname = os.path.splitext(fname)[0] + ".zarr"
-        embedding_path = os.path.join(embedding_root, fname)
-        image = imageio.imread(image_file)
-        embeddings = util.precompute_image_embeddings(
-            predictor, image, save_path=embedding_path, ndim=2,
-            tile_shape=tile_shape, halo=halo
-        )
-        if precompute_amg_state:
-            cache_amg_state(predictor, image, embeddings, embedding_path)
-        embedding_paths.append(embedding_path)
-    return embedding_paths
 
 
 def image_series_annotator(
@@ -73,12 +49,16 @@ def image_series_annotator(
     if embedding_path is None:
         embedding_paths = None
     else:
-        embedding_paths = _precompute_embeddings_for_image_series(
-            predictor, image_files, embedding_path,
+        _precompute_state_for_files(
+            predictor, image_files, embedding_path, ndim=2,
             tile_shape=kwargs.get("tile_shape", None),
             halo=kwargs.get("halo", None),
             precompute_amg_state=kwargs.get("precompute_amg_state", False),
         )
+        embedding_paths = [
+            os.path.join(embedding_path, f"{Path(path).stem}.zarr") for path in image_files
+        ]
+        assert all(os.path.exists(emb_path) for emb_path in embedding_paths)
 
     def _save_segmentation(image_path, segmentation):
         fname = os.path.basename(image_path)
@@ -151,7 +131,7 @@ def main():
     """@private"""
     import argparse
 
-    available_models = list(util._MODEL_URLS.keys())
+    available_models = list(util.get_model_names())
     available_models = ", ".join(available_models)
 
     parser = argparse.ArgumentParser(description="Annotate a series of images from a folder.")
diff --git a/micro_sam/sam_annotator/util.py b/micro_sam/sam_annotator/util.py
@@ -364,39 +364,9 @@ def toggle_label(prompts):
     prompts.refresh_colors()
 
 
-def get_amg(predictor, is_tiled):
-    """@private
-    """
-    if is_tiled:
-        amg = instance_segmentation.TiledAutomaticMaskGenerator(predictor)
-    else:
-        amg = instance_segmentation.AutomaticMaskGenerator(predictor)
-    return amg
-
-
-def cache_amg_state(predictor, raw, image_embeddings, save_path, verbose=True):
-    """@private"""
-    is_tiled = image_embeddings["input_size"] is None
-    amg = get_amg(predictor, is_tiled)
-
-    save_path_amg = os.path.join(save_path, "amg_state.pickle")
-    if os.path.exists(save_path_amg):
-        with open(save_path_amg, "rb") as f:
-            amg_state = pickle.load(f)
-        amg.set_state(amg_state)
-        return amg
-
-    print("Precomputing the state for instance segmentation.")
-    amg.initialize(raw, image_embeddings=image_embeddings, verbose=verbose)
-    with open(save_path_amg, "wb") as f:
-        pickle.dump(amg.get_state(), f)
-
-    return amg
-
-
 def _initialize_parser(description, with_segmentation_result=True, with_show_embeddings=True):
 
-    available_models = list(util._MODEL_URLS.keys())
+    available_models = list(util.get_model_names())
     available_models = ", ".join(available_models)
 
     parser = argparse.ArgumentParser(description=description)
diff --git a/micro_sam/util.py b/micro_sam/util.py
@@ -68,6 +68,11 @@
 """@private"""
 
 
+#
+# Functionality for model download and export
+#
+
+
 def _download(url, path, model_type):
     with requests.get(url, stream=True, verify=True) as r:
         if r.status_code != 200:
@@ -246,6 +251,11 @@ def get_model_names() -> Iterable:
     return _MODEL_URLS.keys()
 
 
+#
+# Functionality for precomputing embeddings and other state
+#
+
+
 def _to_image(input_):
     # we require the input to be uint8
     if input_.dtype != np.dtype("uint8"):
@@ -570,6 +580,11 @@ def set_precomputed(
     return predictor
 
 
+#
+# Misc functionality
+#
+
+
 def compute_iou(mask1: np.ndarray, mask2: np.ndarray) -> float:
     """Compute the intersection over union of two masks.
 
@@ -642,25 +657,3 @@ def load_image_data(
             if not lazy_loading:
                 image_data = image_data[:]
     return image_data
-
-
-def main():
-    """@private"""
-    import argparse
-
-    parser = argparse.ArgumentParser(description="Compute the embeddings for an image.")
-    parser.add_argument("-i", "--input_path", required=True)
-    parser.add_argument("-o", "--output_path", required=True)
-    parser.add_argument("-m", "--model_type", default="vit_h")
-    parser.add_argument("-c", "--checkpoint_path", default=None)
-    parser.add_argument("-k", "--key")
-    args = parser.parse_args()
-
-    predictor = get_sam_model(model_type=args.model_type, checkpoint_path=args.checkpoint_path)
-    with open_file(args.input_path, mode="r") as f:
-        data = f[args.key]
-        precompute_image_embeddings(predictor, data, save_path=args.output_path)
-
-
-if __name__ == "__main__":
-    main()
diff --git a/setup.py b/setup.py