computational-cell-analytics
diff --git a/‎.github/doc_env.yaml‎
Lines changed: 23 additions & 0 deletions b/‎.github/doc_env.yaml‎
Lines changed: 23 additions & 0 deletions
diff --git a/‎.github/workflows/build_docs.yaml‎
Lines changed: 73 additions & 0 deletions b/‎.github/workflows/build_docs.yaml‎
Lines changed: 73 additions & 0 deletions
diff --git a/‎build_doc.py‎
Lines changed: 46 additions & 0 deletions b/‎build_doc.py‎
Lines changed: 46 additions & 0 deletions
diff --git a/‎doc/start_page.md‎
Lines changed: 2 additions & 0 deletions b/‎doc/start_page.md‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎environment.yaml‎
Lines changed: 1 addition & 0 deletions b/‎environment.yaml‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎scripts/cooper/training/train_mitochondria.py‎
Lines changed: 196 additions & 0 deletions b/‎scripts/cooper/training/train_mitochondria.py‎
Lines changed: 196 additions & 0 deletions
@@ -0,0 +1,23 @@
+channels:
+    - conda-forge
+    - pytorch
+name:
+    synaptic-reconstruction
+dependencies:
+    - python=3.12
+    - python-elf
+    - torch_em
+    - napari
+    - pip
+    - pyqt
+    - magicgui
+    - pytorch
+    - bioimageio.core
+    - kornia
+    - tensorboard
+    - pdoc
+    - scikit-learn
+    - mrcfile
+    - trimesh
+    - pip:
+        - napari-skimage-regionprops
@@ -0,0 +1,73 @@
+name: Build and Deploy Docs
+
+on:
+  push:
+    paths:
+      - "doc/*.md"   # Trigger on changes to any markdown file
+      - "**/*.py"   # Optionally include changes in Python files
+    branches:
+      - main        # Run the workflow only on pushes to the main branch
+  workflow_dispatch:
+
+# security: restrict permissions for CI jobs.
+permissions:
+  contents: read
+
+jobs:
+  build:
+    name: Build Documentation
+    runs-on: ubuntu-latest
+
+    steps:
+    - name: Checkout Code
+      uses: actions/checkout@v4
+
+    - name: Set up Micromamba
+      uses: mamba-org/setup-micromamba@v2
+      with:
+        micromamba-version: "latest"       # Use the latest version of micromamba
+        environment-file: .github/doc_env.yaml  # Reference your environment.yml file
+        init-shell: bash
+        cache-environment: true
+        post-cleanup: 'all'
+        # cache: true                        # Cache the micromamba environment
+
+    - name: Install package
+      # shell: bash -l {0}
+      run: pip install -e .
+
+    - name: Generate Documentation
+      shell: bash -l {0} 
+      run: pdoc synaptic_reconstruction -o doc/
+
+    - name: Verify Documentation Output
+      run: ls -la doc/
+
+    - name: Upload Documentation Artifact
+      uses: actions/upload-pages-artifact@v3
+      with:
+        # name: documentation
+        path: doc/
+
+  deploy:
+    name: Deploy Documentation
+    needs: build
+    runs-on: ubuntu-latest
+    permissions:
+      pages: write
+      id-token: write
+    environment:
+      name: github-pages
+      url: ${{ steps.deployment.outputs.page_url }}
+    steps:
+      # - name: Download Documentation Artifact
+      #   uses: actions/download-artifact@v4
+      #   with:
+      #     name: documentation
+      #     path: .
+
+      - name: Deploy to GiHub Pages
+        uses: actions/deploy-pages@v4
+        # with: 
+        #   artifact_name: documentation
+
@@ -0,0 +1,46 @@
+import argparse
+import glob
+import os
+import warnings
+
+from subprocess import run
+
+
+def check_docs_completeness():
+    """@private
+    All markdown and RST documentation files **SHOULD** be included in the module
+    docstring at micro_sam/__init__.py
+    """
+    import micro_sam
+
+    # We don't search in subfolders anymore, to allow putting additional documentation
+    # (e.g. for bioimage.io mdoels) that should not be included in the main documentation here.
+    markdown_doc_files = glob.glob("doc/*.md", recursive=True)
+    rst_doc_files = glob.glob("doc/*.rst", recursive=True)
+    all_doc_files = markdown_doc_files + rst_doc_files
+    missing_from_docs = [f for f in all_doc_files if os.path.basename(f) not in micro_sam.__doc__]
+    if len(missing_from_docs) > 0:
+        warnings.warn(
+            "Documentation files missing! Please add include statements "
+            "to the docstring in micro_sam/__init__.py for every file, eg:"
+            "'.. include:: ../doc/filename.md'. "
+            "List of missing files: "
+            f"{missing_from_docs}"
+        )
+
+
+if __name__ == "__main__":
+    check_docs_completeness()
+
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--out", "-o", action="store_true")
+    args = parser.parse_args()
+
+    logo_url = "https://raw.githubusercontent.com/computational-cell-analytics/micro-sam/master/doc/logo/logo_and_text.png"
+    cmd = ["pdoc", "--docformat", "google", "--logo", logo_url]
+
+    if args.out:
+        cmd.extend(["--out", "tmp/"])
+    cmd.append("micro_sam")
+
+    run(cmd)
@@ -0,0 +1,2 @@
+# Synaptic Reconstruction
+lorem ipsum...
@@ -12,5 +12,6 @@ dependencies:
     - bioimageio.core
     - kornia
     - tensorboard
+    - trimesh
     - pip:
         - napari-skimage-regionprops
@@ -0,0 +1,196 @@
+import torch
+import os
+import argparse
+import time
+import torch_em
+
+from torch_em.data import MinInstanceSampler
+from torch_em.model import AnisotropicUNet
+# from torch_em.util.debug import check_loader, check_trainer
+
+# Import your util.py for data loading
+import util
+
+
+def main():
+    parser = argparse.ArgumentParser(description="3D UNet training for mitochondrial segmentation")
+    parser.add_argument(
+        "--data_dir", type=str, default="/scratch-grete/projects/nim00007/data/mitochondria/cooper/fidi_down_s2",
+        help="Path to the data directory"
+        )
+    parser.add_argument(
+        "--patch_shape", type=int, nargs=3, default=(32, 256, 256), help="Patch shape for data loading (3D tuple)"
+        )
+    parser.add_argument(
+        "--n_iterations", type=int, default=10000, help="Number of training iterations"
+        )
+    parser.add_argument(
+        "--learning_rate", type=float, default=1e-4, help="Learning rate"
+        )
+    parser.add_argument(
+        "--checkpoint_path", type=str, default="", help="Path to checkpoint used to load model's state_dict"
+        )
+    parser.add_argument(
+        "--experiment_name", type=str, default="default-mito-net",
+        help="Name that is used for the experiment and store the model's weights"
+        )
+    parser.add_argument(
+        "--batch_size", type=int, default=1, help="Batch size to be used"
+        )
+    parser.add_argument(
+        "--feature_size", type=int, default=32, help="Initial feature size of the 3D UNet"
+        )
+    parser.add_argument(
+        "--without_rois", type=bool, default=False, help="Train without Regions Of Interest (ROI)"
+        )
+    parser.add_argument(
+        "--early_stopping", type=int, default=10, help="Number of epochs without improvement before stopping training"
+        )
+    parser.add_argument(
+        "--save_dir", type=str, default="./", help="Path where the model checkpoints will be saved."
+        )
+
+    # Parse arguments
+    args = parser.parse_args()
+    checkpoint_path = args.checkpoint_path
+    n_iterations = args.n_iterations
+    learning_rate = args.learning_rate
+    data_dir = args.data_dir
+    save_dir = args.save_dir
+    experiment_name = args.experiment_name
+    batch_size = args.batch_size
+    patch_shape = args.patch_shape
+    initial_features = args.feature_size
+    with_rois = not args.without_rois
+    early_stopping = args.early_stopping
+
+    n_workers = 12 if torch.cuda.is_available() else 1
+    device = "cuda" if torch.cuda.is_available() else "cpu"
+    print(f"\n Experiment: {experiment_name}\n")
+    print(f"Using {device} with {n_workers} workers.")
+    label_transform = torch_em.transform.label.BoundaryTransform(add_binary_target=True)
+
+    loss_name = "dice"
+    metric_name = "dice"
+    ndim = 3
+
+    loss_function = util.get_loss_function(loss_name)
+    metric_function = util.get_loss_function(metric_name)
+    in_channels, out_channels = 1, 2
+    gain = 2
+
+    scale_factors = [
+        [1, 2, 2],
+        [1, 2, 2],
+        [2, 2, 2],
+        [2, 2, 2]
+    ]
+
+    final_activation = None
+    if final_activation is None and loss_name == "dice":
+        final_activation = "Sigmoid"
+
+    # load data paths etc.
+    start_time = time.time()
+    print(f"Start time {time.ctime()}")
+    print(f"Loading Data paths and ROIs if with_rois={with_rois}...")
+
+    if with_rois:
+        data_paths, rois_dict = util.get_data_paths_and_rois(
+            data_dir, min_shape=patch_shape, with_thresholds=True
+            )
+        data, rois_dict = util.split_data_paths_to_dict(
+            data_paths, rois_dict, train_ratio=.8, val_ratio=0.2, test_ratio=0
+            )
+    else:
+        data_paths = util.get_data_paths(data_dir)
+
+        for path in data_paths:
+            if "combined" in path:
+                data_paths.remove(path)
+        data_paths.sort(reverse=True)
+        data = util.split_data_paths_to_dict(
+            data_paths, rois_list=None, train_ratio=.8, val_ratio=0.15, test_ratio=0.05
+            )
+
+    end_time = time.time()
+    # Calculate execution time in seconds
+    execution_time = end_time - start_time
+    print(f"Data and ROI preprocessing execution time: {execution_time:.6f} seconds")
+
+    print("Creating 3d UNet with", in_channels, "input channels and", out_channels, "output channels.")
+    # UNet3d
+    model = AnisotropicUNet(
+        in_channels=in_channels, out_channels=out_channels, initial_features=initial_features,
+        final_activation=final_activation, gain=gain, scale_factors=scale_factors
+    )
+    print("Does a checkpoint exist at", os.path.join(save_dir, "checkpoints", experiment_name, "best.pt"), "?")
+    print(os.path.exists(os.path.join(save_dir, "checkpoints", experiment_name, "best.pt")))
+    if checkpoint_path or os.path.exists(os.path.join(save_dir, "checkpoints", experiment_name, "best.pt")):
+        if not checkpoint_path:
+            checkpoint_path = os.path.join(save_dir, "checkpoints", experiment_name)
+        model = torch_em.util.load_model(checkpoint=checkpoint_path, device=device)
+        print("loaded model from checkpoint:", os.path.join(save_dir, "checkpoints", experiment_name))
+        model.to(device)
+    print(model)
+    with_channels = False
+    with_label_channels = False
+    sampler = MinInstanceSampler(p_reject=0.95)
+
+    print("train", len(data["train"]), "val", len(data["val"]), "test", len(data["test"]))
+    print("data['test']", data["test"])
+
+    if with_rois:
+        train_loader = torch_em.default_segmentation_loader(
+            raw_paths=data["train"], raw_key="raw",
+            label_paths=data["train"], label_key="labels/mitochondria",
+            patch_shape=patch_shape, ndim=ndim, batch_size=batch_size,
+            label_transform=label_transform, num_workers=n_workers,
+            with_channels=with_channels, with_label_channels=with_label_channels,
+            rois=rois_dict["train"]
+        )
+        val_loader = torch_em.default_segmentation_loader(
+            raw_paths=data["val"], raw_key="raw",
+            label_paths=data["val"], label_key="labels/mitochondria",
+            patch_shape=patch_shape, ndim=ndim, batch_size=batch_size,
+            label_transform=label_transform, num_workers=n_workers,
+            with_channels=with_channels, with_label_channels=with_label_channels,
+            rois=rois_dict["val"]
+        )
+    else:
+        train_loader = torch_em.default_segmentation_loader(
+            raw_paths=data["train"], raw_key="raw",
+            label_paths=data["train"], label_key="labels/mitochondria",
+            patch_shape=patch_shape, ndim=ndim, batch_size=batch_size,
+            label_transform=label_transform, num_workers=n_workers,
+            with_channels=with_channels, with_label_channels=with_label_channels,
+            sampler=sampler
+        )
+        val_loader = torch_em.default_segmentation_loader(
+            raw_paths=data["val"], raw_key="raw",
+            label_paths=data["val"], label_key="labels/mitochondria",
+            patch_shape=patch_shape, ndim=ndim, batch_size=batch_size,
+            label_transform=label_transform, num_workers=n_workers,
+            with_channels=with_channels, with_label_channels=with_label_channels,
+            sampler=sampler
+        )
+
+    trainer = torch_em.default_segmentation_trainer(
+        name=experiment_name, model=model,
+        train_loader=train_loader, val_loader=val_loader,
+        loss=loss_function, metric=metric_function,
+        learning_rate=learning_rate,
+        mixed_precision=True,
+        log_image_interval=50,
+        device=device,
+        compile_model=False,
+        save_root=save_dir,
+        early_stopping=early_stopping,
+        # logger=None
+    )
+
+    trainer.fit(n_iterations)
+
+
+if __name__ == "__main__":
+    main()
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+# Synaptic Reconstruction`
	`2`	`+lorem ipsum...`