diff --git a/.github/workflows/mypy-type-check.yml b/.github/workflows/mypy-type-check.yml
index 7ec585482..cbde391cd 100644
--- a/.github/workflows/mypy-type-check.yml
+++ b/.github/workflows/mypy-type-check.yml
@@ -6,7 +6,7 @@
 on:
   push:
     branches: [ develop, pre-release, master, main ]
   pull_request:
-    branches: [ develop, pre-release, master, main ]
+    branches: [ develop, pre-release, master, main, dev-define-engines-abc ]
 
 jobs:
diff --git a/.github/workflows/python-package.yml b/.github/workflows/python-package.yml
index 9faabb796..9b89d4839 100644
--- a/.github/workflows/python-package.yml
+++ b/.github/workflows/python-package.yml
@@ -8,7 +8,7 @@ on:
     branches: [ develop, pre-release, master, main ]
     tags: v*
   pull_request:
-    branches: [ develop, pre-release, master, main ]
+    branches: [ develop, pre-release, master, main, dev-define-engines-abc ]
 
 jobs:
   build:
diff --git a/requirements/requirements.txt b/requirements/requirements.txt
index c0ace5cfc..045a4ce4e 100644
--- a/requirements/requirements.txt
+++ b/requirements/requirements.txt
@@ -4,6 +4,7 @@ aiohttp>=3.8.1
 albumentations>=1.3.0
 bokeh>=3.1.1, <3.6.0
 Click>=8.1.3, <8.2.0
+dask>=2025.10.0
 defusedxml>=0.7.1
 filelock>=3.9.0
 flask>=2.2.2
diff --git a/tests/conftest.py b/tests/conftest.py
index aab4b374c..75bd7087c 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -534,6 +534,7 @@ def sample_wsi_dict(remote_sample: Callable) -> dict:
         "wsi4_4k_4k_svs",
         "wsi3_20k_20k_pred",
         "wsi4_4k_4k_pred",
+        "wsi4_1k_1k_svs",
     ]
     return {name: remote_sample(name) for name in file_names}
diff --git a/tests/engines/__init__.py b/tests/engines/__init__.py
new file mode 100644
index 000000000..193a523c1
--- /dev/null
+++ b/tests/engines/__init__.py
@@ -0,0 +1 @@
+"""Unit test package for tiatoolbox engines."""
diff --git a/tests/engines/test_engine_abc.py b/tests/engines/test_engine_abc.py
new file mode 100644
index 000000000..3fb239dac
--- /dev/null
+++ b/tests/engines/test_engine_abc.py
@@ -0,0 +1,601 @@
+"""Test tiatoolbox.models.engine.engine_abc."""
+
+from __future__ import annotations
+
+import copy
+import logging
+import shutil
+from pathlib import Path
+from typing import NoReturn
+
+import numpy as np
+import pytest
+import torch
+import torchvision.models as torch_models
+from typing_extensions import Unpack
+
+from tiatoolbox.models.architecture import (
+    fetch_pretrained_weights,
+    get_pretrained_model,
+)
+from tiatoolbox.models.architecture.vanilla import CNNModel
+from tiatoolbox.models.dataset import PatchDataset, WSIPatchDataset
+from tiatoolbox.models.engine.engine_abc import (
+    EngineABC,
+    EngineABCRunParams,
+    prepare_engines_save_dir,
+)
+from tiatoolbox.models.engine.io_config import ModelIOConfigABC
+
+device = "cuda:0" if torch.cuda.is_available() else "cpu"
+
+
+class TestEngineABC(EngineABC):
+    """Test EngineABC."""
+
+    def __init__(
+        self: TestEngineABC,
+        model: str | torch.nn.Module,
+        weights: str | Path | None = None,
+        *,
+        verbose: bool | None = None,
+    ) -> NoReturn:
+        """Test EngineABC init."""
+        super().__init__(model=model, weights=weights, verbose=verbose)
+
+    def get_dataloader(
+        self: EngineABC,
+        images: Path,
+        masks: Path | None = None,
+        labels: list | None = None,
+        ioconfig: ModelIOConfigABC | None = None,
+        *,
+        patch_mode: bool = True,
+    ) -> torch.utils.data.DataLoader:
+        """Test the get_dataloader method."""
+        return super().get_dataloader(
+            images,
+            masks,
+            labels,
+            ioconfig,
+            patch_mode=patch_mode,
+        )
+
+    def post_process_wsi(
+        self: EngineABC,
+        raw_predictions: dict | Path,
+        **kwargs: Unpack[EngineABCRunParams],
+    ) -> dict | Path:
+        """Post process WSI output."""
+        return super().post_process_wsi(
+            raw_predictions=raw_predictions,
+            prediction_shape=(self.batch_size, 1),
+            prediction_dtype=int,
+            **kwargs,
+        )
+
+    def infer_wsi(
+        self: EngineABC,
+        dataloader: torch.utils.data.DataLoader,
+        save_path: Path,
+        **kwargs: dict,
+    ) -> dict | np.ndarray:
+        """Test infer_wsi."""
+        return super().infer_wsi(  # skipcq: PYL-E1121
+            dataloader,
+            save_path,
+            **kwargs,
+        )
+
+
+def test_engine_abc_incorrect_model_type() -> NoReturn:
+    """Test EngineABC initialization with incorrect model type."""
+    with pytest.raises(
+        TypeError,
+        match=r".*missing 1 required positional argument: 'model'",
+    ):
+        TestEngineABC()  # skipcq
+
+    with pytest.raises(
+        TypeError,
+        match=r"Input model must be a string or 'torch.nn.Module'.",
+    ):
+        TestEngineABC(model=1)
+
+
+def test_incorrect_ioconfig() -> NoReturn:
+    """Test EngineABC initialization with incorrect ioconfig."""
+    model = torch_models.resnet18()
+    engine = TestEngineABC(model=model)
+
+    with pytest.raises(
+        ValueError,
+        match=r".*Must provide.*`ioconfig`.*",
+    ):
+        engine.run(images=[], masks=[], ioconfig=None)
+
+
+def test_incorrect_output_type() -> NoReturn:
+    """Test EngineABC for incorrect output type."""
+    pretrained_model = "alexnet-kather100k"
+
+    # Test engine run without ioconfig
+    eng = TestEngineABC(model=pretrained_model)
+
+    with pytest.raises(
+        TypeError,
+        match=r".*output_type must be 'dict' or 'zarr' or 'annotationstore*",
+    ):
+        _ = eng.run(
+            images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+            on_gpu=False,
+            patch_mode=True,
+            ioconfig=None,
+            output_type="random",
+        )
+
+
+def test_pretrained_ioconfig() -> NoReturn:
+    """Test EngineABC initialization with pretrained model name in the toolbox."""
+    pretrained_model = "alexnet-kather100k"
+
+    # Test engine run without ioconfig
+    eng = TestEngineABC(model=pretrained_model)
+    out = eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        on_gpu=False,
+        patch_mode=True,
+        ioconfig=None,
+    )
+    assert "probabilities" in out
+    assert "labels" not in out
+
+
+def test_ioconfig() -> NoReturn:
+    """Test EngineABC initialization with valid ioconfig."""
+    ioconfig = ModelIOConfigABC(
+        input_resolutions=[
+            {"units": "baseline", "resolution": 1.0},
+        ],
+        patch_input_shape=(224, 224),
+    )
+
+    eng = TestEngineABC(model="alexnet-kather100k")
+    out = eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        ioconfig=ioconfig,
+    )
+
+    assert "probabilities" in out
+    assert "labels" not in out
+
+
+def test_prepare_engines_save_dir(
+    track_tmp_path: Path,
+    caplog: pytest.LogCaptureFixture,
+) -> NoReturn:
+    """Test prepare save directory for engines."""
+    out_dir = prepare_engines_save_dir(
+        save_dir=track_tmp_path / "patch_output",
+        patch_mode=True,
+        overwrite=False,
+    )
+
+    assert out_dir == track_tmp_path / "patch_output"
+    assert out_dir.exists()
+
+    out_dir = prepare_engines_save_dir(
+        save_dir=track_tmp_path / "patch_output",
+        patch_mode=True,
+        overwrite=True,
+    )
+
+    assert out_dir == track_tmp_path / "patch_output"
+    assert out_dir.exists()
+
+    out_dir = prepare_engines_save_dir(
+        save_dir=None,
+        patch_mode=True,
+        overwrite=False,
+    )
+    assert out_dir is None
+
+    with pytest.raises(
+        OSError,
+        match=r".*Input WSIs detected but no save directory provided.*",
+    ):
+        _ = prepare_engines_save_dir(
+            save_dir=None,
+            patch_mode=False,
+            overwrite=False,
+        )
+
+    out_dir = prepare_engines_save_dir(
+        save_dir=track_tmp_path / "wsi_single_output",
/ "wsi_single_output", + patch_mode=False, + overwrite=False, + ) + + assert out_dir == track_tmp_path / "wsi_single_output" + assert out_dir.exists() + assert r"When providing multiple whole-slide images / tiles" not in caplog.text + + out_dir = prepare_engines_save_dir( + save_dir=track_tmp_path / "wsi_multiple_output", + patch_mode=False, + overwrite=False, + ) + + assert out_dir == track_tmp_path / "wsi_multiple_output" + assert out_dir.exists() + assert r"When providing multiple whole slide images" in caplog.text + + # test for file overwrite with Path.mkdirs() method + out_path = prepare_engines_save_dir( + save_dir=track_tmp_path / "patch_output" / "output.zarr", + patch_mode=True, + overwrite=True, + ) + assert out_path.exists() + + out_path = prepare_engines_save_dir( + save_dir=track_tmp_path / "patch_output" / "output.zarr", + patch_mode=True, + overwrite=True, + ) + assert out_path.exists() + + with pytest.raises(FileExistsError): + out_path = prepare_engines_save_dir( + save_dir=track_tmp_path / "patch_output" / "output.zarr", + patch_mode=True, + overwrite=False, + ) + + +def test_engine_initalization() -> NoReturn: + """Test engine initialization.""" + with pytest.raises( + TypeError, + match=r"Input model must be a string or 'torch.nn.Module'.", + ): + _ = TestEngineABC(model=0) + + eng = TestEngineABC(model="alexnet-kather100k") + assert isinstance(eng, EngineABC) + model = CNNModel("alexnet", num_classes=1) + eng = TestEngineABC(model=model) + assert isinstance(eng, EngineABC) + + model = get_pretrained_model("alexnet-kather100k")[0] + weights_path = fetch_pretrained_weights("alexnet-kather100k") + eng = TestEngineABC(model=model, weights=weights_path) + assert isinstance(eng, EngineABC) + + +def test_engine_run() -> NoReturn: + """Test engine run.""" + eng = TestEngineABC(model="alexnet-kather100k") + assert isinstance(eng, EngineABC) + + eng = TestEngineABC(model="alexnet-kather100k") + with pytest.raises( + ValueError, + match=r".*The input numpy array should be four dimensional.*", + ): + eng.run(images=np.zeros((10, 10))) + + eng = TestEngineABC(model="alexnet-kather100k") + with pytest.raises( + TypeError, + match=r"Input must be a list of file paths or a numpy array.", + ): + eng.run(images=1) + + eng = TestEngineABC(model="alexnet-kather100k") + with pytest.raises( + ValueError, + match=r".*len\(labels\) is not equal to len(images)*", + ): + eng.run( + images=np.zeros((10, 224, 224, 3), dtype=np.uint8), + labels=list(range(1)), + on_gpu=False, + ) + + with pytest.raises( + ValueError, + match=r".*len\(masks\) is not equal to len(images)*", + ): + eng.run( + images=np.zeros((10, 224, 224, 3), dtype=np.uint8), + masks=np.zeros((1, 224, 224, 3)), + on_gpu=False, + ) + + with pytest.raises( + ValueError, + match=r".*The shape of the numpy array should be NHWC*", + ): + eng.run( + images=np.zeros((10, 224, 224, 3), dtype=np.uint8), + masks=np.zeros((10, 3)), + on_gpu=False, + ) + + eng = TestEngineABC(model="alexnet-kather100k") + out = eng.run( + images=np.zeros((10, 224, 224, 3), dtype=np.uint8), + on_gpu=False, + patch_mode=True, + ) + assert "probabilities" in out + assert "labels" not in out + + eng = TestEngineABC(model="alexnet-kather100k") + out = eng.run( + images=np.zeros((10, 224, 224, 3), dtype=np.uint8), + on_gpu=False, + verbose=False, + ) + assert "probabilities" in out + assert "labels" not in out + + eng = TestEngineABC(model="alexnet-kather100k") + out = eng.run( + images=np.zeros((10, 224, 224, 3), dtype=np.uint8), + labels=list(range(10)), + 
+        on_gpu=False,
+    )
+    assert "probabilities" in out
+    assert "labels" in out
+
+    pred = eng.post_process_wsi(
+        raw_predictions=Path("/path/to/raw_predictions.npy"),
+    )
+    assert str(pred) == "/path/to/raw_predictions.npy"
+
+
+def test_engine_run_with_verbose() -> NoReturn:
+    """Test engine run with verbose."""
+    # Run pytest with `-rP` option to view progress bar on the captured stderr call.
+
+    eng = TestEngineABC(model="alexnet-kather100k", verbose=True)
+    out = eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        labels=list(range(10)),
+        device=device,
+    )
+
+    assert "probabilities" in out
+    assert "labels" in out
+
+
+def test_patch_pred_zarr_store(track_tmp_path: Path) -> NoReturn:
+    """Test the engine run and patch pred store."""
+    save_dir = track_tmp_path / "patch_output"
+
+    eng = TestEngineABC(model="alexnet-kather100k")
+    out = eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        on_gpu=False,
+        save_dir=save_dir,
+        overwrite=True,
+    )
+    assert Path.exists(out), "Zarr output file does not exist"
+
+    eng = TestEngineABC(model="alexnet-kather100k")
+    out = eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        on_gpu=False,
+        verbose=False,
+        save_dir=save_dir,
+        overwrite=True,
+    )
+    assert Path.exists(out), "Zarr output file does not exist"
+
+    eng = TestEngineABC(model="alexnet-kather100k")
+    out = eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        labels=list(range(10)),
+        on_gpu=False,
+        save_dir=save_dir,
+        overwrite=True,
+    )
+    assert Path.exists(out), "Zarr output file does not exist"
+
+    # Test custom zarr output file name
+    eng = TestEngineABC(model="alexnet-kather100k")
+    out = eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        labels=list(range(10)),
+        on_gpu=False,
+        save_dir=save_dir,
+        overwrite=True,
+        output_file="patch_pred_output",
+    )
+    assert Path.exists(out), "Zarr output file does not exist"
+
+    eng = TestEngineABC(model="alexnet-kather100k")
+    with pytest.raises(
+        ValueError,
+        match=r".*Patch output must contain coordinates.",
+    ):
+        _ = eng.run(
+            images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+            labels=list(range(10)),
+            on_gpu=False,
+            save_dir=save_dir,
+            overwrite=True,
+            output_type="AnnotationStore",
+        )
+
+    with pytest.raises(
+        ValueError,
+        match=r".*Patch output must contain coordinates.",
+    ):
+        _ = eng.run(
+            images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+            labels=list(range(10)),
+            on_gpu=False,
+            save_dir=save_dir,
+            overwrite=True,
+            output_type="AnnotationStore",
+            class_dict={0: "class0", 1: "class1"},
+        )
+
+    with pytest.raises(
+        ValueError,
+        match=r".*Patch output must contain coordinates.",
+    ):
+        _ = eng.run(
+            images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+            labels=list(range(10)),
+            on_gpu=False,
+            save_dir=save_dir,
+            overwrite=True,
+            output_type="AnnotationStore",
+            scale_factor=(2.0, 2.0),
+        )
+
+
+def test_get_dataloader(sample_svs: Path) -> None:
+    """Test the get_dataloader function."""
+    eng = TestEngineABC(model="alexnet-kather100k")
+    ioconfig = ModelIOConfigABC(
+        input_resolutions=[
+            {"units": "baseline", "resolution": 1.0},
+        ],
+        patch_input_shape=(224, 224),
+    )
+    dataloader = eng.get_dataloader(
+        images=np.zeros(shape=(10, 224, 224, 3), dtype=np.uint8),
+        patch_mode=True,
+        ioconfig=ioconfig,
+    )
+
+    assert isinstance(dataloader.dataset, PatchDataset)
+
+    dataloader = eng.get_dataloader(
+        images=sample_svs,
+        patch_mode=False,
+        ioconfig=ioconfig,
+    )
+
+    assert isinstance(dataloader.dataset, WSIPatchDataset)
+
+
+def test_io_config_delegation(
+    track_tmp_path: Path, caplog: pytest.LogCaptureFixture
+) -> None:
+    """Test for delegating args to io config."""
+    # test not providing config / full input info for non-pretrained models
+    model = CNNModel("resnet50")
+    eng = TestEngineABC(model=model)
+
+    kwargs = {
+        "patch_input_shape": [224, 224],
+        "input_resolutions": [{"units": "mpp", "resolution": 1.75}],
+    }
+    with caplog.at_level(logging.WARNING):
+        eng.run(
+            np.zeros((10, 224, 224, 3)),
+            patch_mode=True,
+            save_dir=track_tmp_path / "dump",
+            patch_input_shape=kwargs["patch_input_shape"],
+            input_resolutions=kwargs["input_resolutions"],
+        )
+        assert "provide a valid ModelIOConfigABC" in caplog.text
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    # test providing config / full input info for non-pretrained models
+    ioconfig = ModelIOConfigABC(
+        patch_input_shape=(224, 224),
+        stride_shape=(256, 256),
+        input_resolutions=[{"resolution": 1.35, "units": "mpp"}],
+    )
+    eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        patch_mode=True,
+        save_dir=f"{track_tmp_path}/dump",
+        ioconfig=ioconfig,
+    )
+    assert eng._ioconfig.patch_input_shape == (224, 224)
+    assert eng._ioconfig.stride_shape == (256, 256)
+    assert eng._ioconfig.input_resolutions == [{"resolution": 1.35, "units": "mpp"}]
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    eng.run(
+        images=np.zeros((10, 224, 224, 3), dtype=np.uint8),
+        patch_mode=True,
+        save_dir=f"{track_tmp_path}/dump",
+        **kwargs,
+    )
+    assert eng._ioconfig.patch_input_shape == [224, 224]
+    assert eng._ioconfig.stride_shape == [224, 224]
+    assert eng._ioconfig.input_resolutions == [{"resolution": 1.75, "units": "mpp"}]
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    # test overwriting pretrained ioconfig
+    eng = TestEngineABC(model="alexnet-kather100k")
+    eng.run(
+        images=np.zeros((10, 300, 300, 3), dtype=np.uint8),
+        patch_input_shape=(300, 300),
+        stride_shape=(300, 300),
+        input_resolutions=[{"units": "baseline", "resolution": 1.99}],
+        patch_mode=True,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    assert eng._ioconfig.patch_input_shape == (300, 300)
+    assert eng._ioconfig.stride_shape == (300, 300)
+    assert eng._ioconfig.input_resolutions[0]["resolution"] == 1.99
+    assert eng._ioconfig.input_resolutions[0]["units"] == "baseline"
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    eng.run(
+        images=np.zeros((10, 300, 300, 3), dtype=np.uint8),
+        patch_input_shape=(300, 300),
+        stride_shape=(300, 300),
+        input_resolutions=None,
+        patch_mode=True,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    assert eng._ioconfig.patch_input_shape == (300, 300)
+    assert eng._ioconfig.stride_shape == (300, 300)
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    eng.ioconfig = None
+    _ioconfig = eng._update_ioconfig(
+        ioconfig=None,
+        patch_input_shape=(300, 300),
+        stride_shape=(300, 300),
+        input_resolutions=[{"units": "baseline", "resolution": 1.99}],
+    )
+
+    assert _ioconfig.patch_input_shape == (300, 300)
+    assert _ioconfig.stride_shape == (300, 300)
+    assert _ioconfig.input_resolutions[0]["resolution"] == 1.99
+    assert _ioconfig.input_resolutions[0]["units"] == "baseline"
+
+    for key in kwargs:
+        _kwargs = copy.deepcopy(kwargs)
+        _kwargs[key] = None
+        with pytest.raises(
+            ValueError,
+            match=r".*Must provide either `ioconfig` or "
+            r"`patch_input_shape` and `input_resolutions`*",
+        ):
+            eng._update_ioconfig(
+                ioconfig=None,
+                patch_input_shape=_kwargs["patch_input_shape"],
+                stride_shape=(1, 1),
+                input_resolutions=_kwargs["input_resolutions"],
+            )
+
+
+def test_save_predictions_incorrect_output_type() -> None:
+    """Engine should raise TypeError if an incorrect output type is requested."""
+    eng = TestEngineABC(model="alexnet-kather100k")
+
+    with pytest.raises(TypeError, match=r".*Unsupported output type.*"):
+        eng.save_predictions({"predictions": np.zeros((20, 9))}, output_type="random")
diff --git a/tests/engines/test_ioconfig.py b/tests/engines/test_ioconfig.py
new file mode 100644
index 000000000..41169298b
--- /dev/null
+++ b/tests/engines/test_ioconfig.py
@@ -0,0 +1,23 @@
+"""Tests for IOconfig."""
+
+import pytest
+
+from tiatoolbox.models import ModelIOConfigABC
+
+
+def test_validation_error_io_config() -> None:
+    """Test Validation Error for ModelIOConfigABC."""
+    with pytest.raises(ValueError, match=r".*Multiple resolution units found.*"):
+        ModelIOConfigABC(
+            input_resolutions=[
+                {"units": "baseline", "resolution": 1.0},
+                {"units": "mpp", "resolution": 0.25},
+            ],
+            patch_input_shape=(224, 224),
+        )
+
+    with pytest.raises(ValueError, match=r"Invalid resolution units.*"):
+        ModelIOConfigABC(
+            input_resolutions=[{"units": "level", "resolution": 1.0}],
+            patch_input_shape=(224, 224),
+        )
diff --git a/tests/engines/test_patch_predictor.py b/tests/engines/test_patch_predictor.py
new file mode 100644
index 000000000..21b7121de
--- /dev/null
+++ b/tests/engines/test_patch_predictor.py
@@ -0,0 +1,712 @@
+"""Test PatchPredictor."""
+
+from __future__ import annotations
+
+import copy
+import json
+import shutil
+import sqlite3
+from pathlib import Path
+from typing import TYPE_CHECKING
+
+import numpy as np
+import torch
+import yaml
+import zarr
+from click.testing import CliRunner
+
+from tests.conftest import timed
+from tiatoolbox import cli, logger, rcParam
+from tiatoolbox.models import IOPatchPredictorConfig
+from tiatoolbox.models.architecture import fetch_pretrained_weights
+from tiatoolbox.models.architecture.vanilla import CNNModel
+from tiatoolbox.models.engine.patch_predictor import PatchPredictor
+from tiatoolbox.utils import env_detection as toolbox_env
+from tiatoolbox.utils.misc import download_data, get_zarr_array, imwrite
+
+if TYPE_CHECKING:
+    from collections.abc import Callable
+
+    import pytest
+
+device = "cuda" if toolbox_env.has_gpu() else "cpu"
+
+
+def _test_predictor_output(
+    inputs: list,
+    model: str,
+    probabilities_check: list | None = None,
+    classification_check: list | None = None,
+    output_type: str = "dict",
+    track_tmp_path: Path | None = None,
+) -> None:
+    """Test the predictions of multiple models included in tiatoolbox."""
+    cache_mode = None if track_tmp_path is None else True
+    save_dir = None if track_tmp_path is None else track_tmp_path / "output"
+    predictor = PatchPredictor(
+        model=model,
+        batch_size=32,
+        verbose=False,
+    )
+    # don't run test on GPU
+    output = predictor.run(
+        inputs,
+        return_labels=False,
+        device=device,
+        cache_mode=cache_mode,
+        save_dir=save_dir,
+        output_type=output_type,
+        return_probabilities=True,
+    )
+
+    if track_tmp_path is not None:
+        output = zarr.open(output, mode="r")
+
+    probabilities = output["probabilities"]
+    classification = output["predictions"]
+    for idx, probabilities_ in enumerate(probabilities):
+        probabilities_max = max(probabilities_)
+        assert np.abs(probabilities_max - probabilities_check[idx]) <= 1e-3, (
+            model,
+            probabilities_max,
+            probabilities_check[idx],
+            probabilities_,
+            classification_check[idx],
+        )
+        assert classification[idx] == classification_check[idx], (
+            model,
+            probabilities_max,
+            probabilities_check[idx],
+            probabilities_,
+            classification_check[idx],
+        )
+    if save_dir:
+        shutil.rmtree(save_dir)
+
+
+def test_io_config_delegation(remote_sample: Callable, track_tmp_path: Path) -> None:
+    """Test for delegating args to io config."""
+    mini_wsi_svs = Path(remote_sample("wsi2_4k_4k_svs"))
+    model = CNNModel("resnet50")
+    predictor = PatchPredictor(model=model, weights=None)
+    kwargs = {
+        "patch_input_shape": [512, 512],
+        "input_resolutions": [{"units": "mpp", "resolution": 1.75}],
+    }
+
+    # test providing config / full input info for default models without weights
+    ioconfig = IOPatchPredictorConfig(
+        patch_input_shape=(512, 512),
+        stride_shape=(256, 256),
+        input_resolutions=[{"resolution": 1.35, "units": "mpp"}],
+    )
+    predictor.run(
+        images=[mini_wsi_svs],
+        ioconfig=ioconfig,
+        patch_mode=False,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    predictor.run(
+        images=[mini_wsi_svs],
+        patch_mode=False,
+        save_dir=f"{track_tmp_path}/dump",
+        **kwargs,
+    )
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    # test overwriting pretrained ioconfig
+    predictor = PatchPredictor(model="resnet18-kather100k", batch_size=1)
+    predictor.run(
+        images=[mini_wsi_svs],
+        patch_input_shape=(300, 300),
+        patch_mode=False,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    assert predictor._ioconfig.patch_input_shape == (300, 300)
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    predictor.run(
+        images=[mini_wsi_svs],
+        stride_shape=(300, 300),
+        patch_mode=False,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    assert predictor._ioconfig.stride_shape == (300, 300)
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    predictor.run(
+        images=[mini_wsi_svs],
+        input_resolutions=[{"units": "mpp", "resolution": 1.99}],
+        patch_mode=False,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    assert predictor._ioconfig.input_resolutions[0]["resolution"] == 1.99
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    predictor.run(
+        images=[mini_wsi_svs],
+        input_resolutions=[{"units": "baseline", "resolution": 1.0}],
+        patch_mode=False,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    assert predictor._ioconfig.input_resolutions[0]["units"] == "baseline"
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    predictor.run(
+        images=[mini_wsi_svs],
+        input_resolutions=[{"units": "level", "resolution": 0}],
+        patch_mode=False,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    assert predictor._ioconfig.input_resolutions[0]["units"] == "level"
+    assert predictor._ioconfig.input_resolutions[0]["resolution"] == 0
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+    predictor.run(
+        images=[mini_wsi_svs],
+        input_resolutions=[{"units": "power", "resolution": 20}],
+        patch_mode=False,
+        save_dir=f"{track_tmp_path}/dump",
+    )
+    assert predictor._ioconfig.input_resolutions[0]["units"] == "power"
+    assert predictor._ioconfig.input_resolutions[0]["resolution"] == 20
+    shutil.rmtree(track_tmp_path / "dump", ignore_errors=True)
+
+
+def test_patch_predictor_api(
+    sample_patch1: Path,
+    sample_patch2: Path,
+    track_tmp_path: Path,
+) -> None:
+    """Test PatchPredictor API."""
+    save_dir_path = track_tmp_path
+
+    # Test both Path and str
+    inputs = [Path(sample_patch1), str(sample_patch2)]
+    predictor = PatchPredictor(model="resnet18-kather100k", batch_size=1)
+    # don't run test on GPU
+    # Default run
+    output = predictor.run(
+        inputs,
+        device="cpu",
+        return_probabilities=True,
+    )
+    assert sorted(output.keys()) == ["predictions", "probabilities"]
+    assert len(output["probabilities"]) == 2
+    shutil.rmtree(save_dir_path, ignore_errors=True)
+
+    # whether to return labels
+    output = predictor.run(
+        inputs,
+        labels=["1", "a"],
+        return_labels=True,
+        return_probabilities=True,
+    )
+    assert sorted(output.keys()) == sorted(["labels", "predictions", "probabilities"])
+    assert len(output["probabilities"]) == len(output["labels"])
+    assert list(output["labels"]) == ["1", "a"]
+    shutil.rmtree(save_dir_path, ignore_errors=True)
+
+    # test loading user weight
+    pretrained_weights_url = (
+        "https://tiatoolbox.dcs.warwick.ac.uk/models/pc/resnet18-kather100k.pth"
+    )
+
+    # remove prev generated data
+    shutil.rmtree(save_dir_path, ignore_errors=True)
+    save_dir_path.mkdir(parents=True)
+    pretrained_weights = (
+        save_dir_path / "tmp_pretrained_weights" / "resnet18-kather100k.pth"
+    )
+
+    download_data(pretrained_weights_url, pretrained_weights)
+
+    predictor = PatchPredictor(
+        model="resnet18-kather100k",
+        weights=pretrained_weights,
+        batch_size=1,
+    )
+    ioconfig = predictor.ioconfig
+
+    # --- test using a different user-defined model
+    model = CNNModel(backbone="resnet18", num_classes=9)
+    # test prediction
+    predictor = PatchPredictor(model=model, batch_size=1, verbose=False)
+    output = predictor.run(
+        inputs,
+        labels=[1, 2],
+        return_labels=True,
+        ioconfig=ioconfig,
+        return_probabilities=True,
+        num_workers=1,
+    )
+    assert sorted(output.keys()) == sorted(["labels", "predictions", "probabilities"])
+    assert len(output["probabilities"]) == len(output["labels"])
+    assert list(output["labels"]) == [1, 2]
+
+
+def test_wsi_predictor_api(
+    sample_wsi_dict: dict,
+    track_tmp_path: Path,
+) -> None:
+    """Test normal run of wsi predictor."""
+    save_dir_path = track_tmp_path
+
+    # Test both Path and str input
+    mini_wsi_svs = Path(sample_wsi_dict["wsi2_4k_4k_svs"])
+    mini_wsi_jpg = sample_wsi_dict["wsi2_4k_4k_jpg"]
+    mini_wsi_msk = str(sample_wsi_dict["wsi2_4k_4k_msk"])
+
+    patch_size = np.array([224, 224])
+    predictor = PatchPredictor(model="resnet18-kather100k", batch_size=32)
+
+    save_dir = f"{save_dir_path}/model_wsi_output"
+
+    # wrapper to make this cleaner
+    kwargs = {
+        "patch_input_shape": patch_size,
+        "stride_shape": patch_size,
+        "input_resolutions": [{"units": "baseline", "resolution": 1.0}],
+        "save_dir": save_dir,
+    }
+    # ! add this test back once the read at `baseline` is fixed
+    # sanity check, both output should be the same with same resolution read args
+    # remove previously generated data
+
+    _kwargs = copy.deepcopy(kwargs)
+    # test reading of multiple whole-slide images
+    output = predictor.run(
+        images=[mini_wsi_svs, str(mini_wsi_jpg)],
+        masks=[mini_wsi_msk, mini_wsi_msk],
+        patch_mode=False,
+        return_probabilities=True,
+        **_kwargs,
+    )
+
+    wsi_out = zarr.open(str(output[mini_wsi_svs]), mode="r")
+    tile_out = zarr.open(str(output[mini_wsi_jpg]), mode="r")
+    diff = tile_out["probabilities"][:] == wsi_out["probabilities"][:]
+    accuracy = np.sum(diff) / np.size(wsi_out["probabilities"][:])
+    assert accuracy > 0.99, np.nonzero(~diff)
+
+    diff = tile_out["predictions"][:] == wsi_out["predictions"][:]
+    accuracy = np.sum(diff) / np.size(wsi_out["predictions"][:])
+    assert accuracy > 0.99, np.nonzero(~diff)
+
+    shutil.rmtree(_kwargs["save_dir"], ignore_errors=True)
+
+
+def test_patch_predictor_kather100k_output(
+    sample_patch1: Path,
+    sample_patch2: Path,
+    track_tmp_path: Path,
+) -> None:
+    """Test the output of patch classification models on Kather100K dataset."""
+    inputs = [Path(sample_patch1), Path(sample_patch2)]
+    pretrained_info = {
+        "alexnet-kather100k": [1.0, 0.9999735355377197],
+        "resnet18-kather100k": [1.0, 0.9999911785125732],
+        "resnet34-kather100k": [1.0, 0.9979840517044067],
+        "resnet50-kather100k": [1.0, 0.9999986886978149],
+        "resnet101-kather100k": [1.0, 0.9999932050704956],
+        "resnext50_32x4d-kather100k": [1.0, 0.9910059571266174],
+        "resnext101_32x8d-kather100k": [1.0, 0.9999971389770508],
+        "wide_resnet50_2-kather100k": [1.0, 0.9953408241271973],
+        "wide_resnet101_2-kather100k": [1.0, 0.9999831914901733],
+        "densenet121-kather100k": [1.0, 1.0],
+        "densenet161-kather100k": [1.0, 0.9999959468841553],
+        "densenet169-kather100k": [1.0, 0.9999934434890747],
+        "densenet201-kather100k": [1.0, 0.9999983310699463],
+        "mobilenet_v2-kather100k": [0.9999998807907104, 0.9999126195907593],
+        "mobilenet_v3_large-kather100k": [0.9999996423721313, 0.9999878406524658],
+        "mobilenet_v3_small-kather100k": [0.9999998807907104, 0.9999997615814209],
+        "googlenet-kather100k": [1.0, 0.9999639987945557],
+    }
+    for model, expected_prob in pretrained_info.items():
+        _test_predictor_output(
+            inputs,
+            model,
+            probabilities_check=expected_prob,
+            classification_check=[6, 3],
+        )
+
+    for model, expected_prob in pretrained_info.items():
+        _test_predictor_output(
+            inputs,
+            model,
+            probabilities_check=expected_prob,
+            classification_check=[6, 3],
+            track_tmp_path=track_tmp_path,
+        )
+
+
+def _extract_probabilities_from_annotation_store(dbfile: str) -> dict:
+    """Helper function to extract probabilities from Annotation Store."""
+    con = sqlite3.connect(dbfile)
+    cur = con.cursor()
+    annotations_properties = list(cur.execute("SELECT properties FROM annotations"))
+
+    output = {"probabilities": [], "predictions": []}
+
+    for item in annotations_properties:
+        for json_str in item:
+            probs_dict = json.loads(json_str)
+            if "prob_0" in probs_dict:
+                output["probabilities"].append(probs_dict.pop("prob_0"))
+            output["predictions"].append(probs_dict.pop("type"))
+
+    return output
+
+
+def _validate_probabilities(output: list | dict | zarr.group) -> bool:
+    """Helper function to test if the probabilities values are valid."""
+    probabilities = np.array([0.5])
+
+    if "probabilities" in output:
+        probabilities = output["probabilities"]
+
+    predictions = output["predictions"]
+    if isinstance(probabilities, dict):
+        return all(0 <= probability <= 1 for _, probability in probabilities.items())
+
+    predictions = np.array(get_zarr_array(predictions)).astype(int)
+    probabilities = get_zarr_array(probabilities)
+
+    if not np.all(np.array(probabilities) <= 1):
+        return False
+
+    if not np.all(np.array(probabilities) >= 0):
+        return False
+
+    return np.all(predictions[:][0:5] == [7, 3, 2, 3, 3])
+
+
+def test_wsi_predictor_zarr(
+    sample_wsi_dict: dict, track_tmp_path: Path, caplog: pytest.LogCaptureFixture
+) -> None:
+    """Test normal run of patch predictor for WSIs."""
+    mini_wsi_svs = Path(sample_wsi_dict["wsi2_4k_4k_svs"])
+
+    predictor = PatchPredictor(
+        model="alexnet-kather100k",
+        batch_size=32,
+        verbose=False,
+    )
+    # don't run test on GPU
+    output = predictor.run(
+        images=[mini_wsi_svs],
+        return_probabilities=True,
+        return_labels=False,
+        device=device,
+        patch_mode=False,
+        save_dir=track_tmp_path / "wsi_out_check",
+    )
+
+    assert output[mini_wsi_svs].exists()
+
+    output_ = zarr.open(output[mini_wsi_svs])
+
+    assert output_["probabilities"].shape == (70, 9)  # number of patches x classes
+    assert output_["probabilities"].ndim == 2
+    # number of patches x [start_x, start_y, end_x, end_y]
+    assert output_["coordinates"].shape == (70, 4)
+    assert output_["coordinates"].ndim == 2
+    # prediction for each patch
+    assert output_["predictions"].shape == (70,)
+    assert output_["predictions"].ndim == 1
+    assert _validate_probabilities(output=output_)
+    assert "Output file saved at " in caplog.text
+
+    output = predictor.run(
+        images=[mini_wsi_svs],
+        return_probabilities=False,
+        return_labels=False,
+        device=device,
+        patch_mode=False,
+        save_dir=track_tmp_path / "wsi_out_check_no_probabilities",
+    )
+
+    assert output[mini_wsi_svs].exists()
+
+    output_ = zarr.open(output[mini_wsi_svs])
+
+    assert "probabilities" not in output_
+    # number of patches x [start_x, start_y, end_x, end_y]
+    assert output_["coordinates"].shape == (70, 4)
+    assert output_["coordinates"].ndim == 2
+    # prediction for each patch
+    assert output_["predictions"].shape == (70,)
+    assert output_["predictions"].ndim == 1
+    assert _validate_probabilities(output=output_)
+    assert "Output file saved at " in caplog.text
+
+
+def test_patch_predictor_patch_mode_annotation_store(
+    sample_patch1: Path,
+    sample_patch2: Path,
+    track_tmp_path: Path,
+) -> None:
+    """Test the output of patch classification models on Kather100K dataset."""
+    inputs = [Path(sample_patch1), Path(sample_patch2)]
+
+    predictor = PatchPredictor(
+        model="alexnet-kather100k",
+        batch_size=32,
+        verbose=False,
+    )
+    # don't run test on GPU
+    output = predictor.run(
+        images=inputs,
+        return_probabilities=True,
+        return_labels=False,
+        device=device,
+        patch_mode=True,
+        save_dir=track_tmp_path / "patch_out_check",
+        output_type="annotationstore",
+    )
+
+    assert output.exists()
+    output = _extract_probabilities_from_annotation_store(output)
+    assert np.all(output["predictions"] == [6, 3])
+    assert np.all(np.array(output["probabilities"]) <= 1)
+    assert np.all(np.array(output["probabilities"]) >= 0)
+
+
+def test_patch_predictor_patch_mode_no_probabilities(
+    sample_patch1: Path,
+    sample_patch2: Path,
+    track_tmp_path: Path,
+) -> None:
+    """Test the output of patch classification models on Kather100K dataset."""
+    inputs = [Path(sample_patch1), Path(sample_patch2)]
+
+    predictor = PatchPredictor(
+        model="alexnet-kather100k",
+        batch_size=32,
+        verbose=False,
+    )
+
+    output = predictor.run(
+        images=inputs,
+        return_probabilities=False,
+        return_labels=False,
+        device=device,
+        patch_mode=True,
+    )
+
+    assert "probabilities" not in output
+
+    # don't run test on GPU
+    output = predictor.run(
+        images=inputs,
+        return_probabilities=False,
+        return_labels=False,
+        device=device,
+        patch_mode=True,
+        save_dir=track_tmp_path / "patch_out_check",
+        output_type="annotationstore",
+    )
+
+    assert output.exists()
+    output = _extract_probabilities_from_annotation_store(output)
+    assert np.all(output["predictions"] == [6, 3])
+    assert output["probabilities"] == []
+
+
+def test_engine_run_wsi_annotation_store(
+    sample_wsi_dict: dict,
+    track_tmp_path: Path,
+    caplog: pytest.LogCaptureFixture,
+) -> None:
+    """Test the engine run for Whole slide images."""
+    # convert to pathlib Path to prevent wsireader complaint
+    mini_wsi_svs = Path(sample_wsi_dict["wsi2_4k_4k_svs"])
+    mini_wsi_msk = Path(sample_wsi_dict["wsi2_4k_4k_msk"])
+
+    eng = PatchPredictor(model="alexnet-kather100k")
+
+    patch_size = np.array([224, 224])
+    save_dir = f"{track_tmp_path}/model_wsi_output"
+
+    kwargs = {
+        "patch_input_shape": patch_size,
+        "stride_shape": patch_size,
+        "resolution": 0.5,
+        "save_dir": save_dir,
+        "units": "mpp",
+        "scale_factor": (2.0, 2.0),
+    }
+
+    output = eng.run(
+        images=[mini_wsi_svs],
+        masks=[mini_wsi_msk],
+        patch_mode=False,
+        output_type="AnnotationStore",
+        batch_size=4,
+        **kwargs,
+    )
+
+    output_ = output[mini_wsi_svs]
+
+    assert output_.exists()
+    assert output_.suffix == ".db"
+    output_ = _extract_probabilities_from_annotation_store(output_)
+
+    # prediction for each patch
+    assert np.array(output_["predictions"]).shape == (69,)
+    assert _validate_probabilities(output_)
+
+    assert "Output file saved at " in caplog.text
+
+    shutil.rmtree(save_dir)
+
+
+# --------------------------------------------------------------------------------------
+# torch.compile
+# --------------------------------------------------------------------------------------
+def test_patch_predictor_torch_compile(
+    sample_patch1: Path,
+    sample_patch2: Path,
+    track_tmp_path: Path,
+) -> None:
+    """Test PatchPredictor with torch.compile functionality.
+
+    Args:
+        sample_patch1 (Path): Path to sample patch 1.
+        sample_patch2 (Path): Path to sample patch 2.
+        track_tmp_path (Path): Path to temporary directory.
+
+    """
+    torch_compile_mode = rcParam["torch_compile_mode"]
+    torch._dynamo.reset()
+    rcParam["torch_compile_mode"] = "default"
+    _, compile_time = timed(
+        test_patch_predictor_api,
+        sample_patch1,
+        sample_patch2,
+        track_tmp_path,
+    )
+    logger.info("torch.compile default mode: %s", compile_time)
+    torch._dynamo.reset()
+    rcParam["torch_compile_mode"] = "reduce-overhead"
+    _, compile_time = timed(
+        test_patch_predictor_api,
+        sample_patch1,
+        sample_patch2,
+        track_tmp_path,
+    )
+    logger.info("torch.compile reduce-overhead mode: %s", compile_time)
+    torch._dynamo.reset()
+    rcParam["torch_compile_mode"] = "max-autotune"
+    _, compile_time = timed(
+        test_patch_predictor_api,
+        sample_patch1,
+        sample_patch2,
+        track_tmp_path,
+    )
+    logger.info("torch.compile max-autotune mode: %s", compile_time)
+    torch._dynamo.reset()
+    rcParam["torch_compile_mode"] = torch_compile_mode
+
+
+# -------------------------------------------------------------------------------------
+# Command Line Interface
+# -------------------------------------------------------------------------------------
+
+
+def test_cli_model_single_file(sample_svs: Path, track_tmp_path: Path) -> None:
+    """Test for models CLI single file."""
+    runner = CliRunner()
+    models_wsi_result = runner.invoke(
+        cli.main,
+        [
+            "patch-predictor",
"--img-input", + str(dir_path), + "--patch-mode", + str(False), + "--masks", + str(dir_path_masks), + "--model", + model, + "--weights", + str(weights), + "--yaml-config-path", + track_tmp_path / "config.yaml", + "--output-path", + str(track_tmp_path / "output"), + "--output-type", + "zarr", + ], + ) + + assert models_tiles_result.exit_code == 0 + assert (track_tmp_path / "output" / ("1_" + mini_wsi_svs.stem + ".zarr")).exists() + assert (track_tmp_path / "output" / ("2_" + mini_wsi_svs.stem + ".zarr")).exists() + assert (track_tmp_path / "output" / ("3_" + mini_wsi_svs.stem + ".zarr")).exists() diff --git a/tests/engines/test_semantic_segmentor.py b/tests/engines/test_semantic_segmentor.py new file mode 100644 index 000000000..ae37a074a --- /dev/null +++ b/tests/engines/test_semantic_segmentor.py @@ -0,0 +1,517 @@ +"""Test SemanticSegmentor.""" + +from __future__ import annotations + +import json +import sqlite3 +import tempfile +from pathlib import Path +from typing import TYPE_CHECKING +from unittest import mock + +import dask.array as da +import numpy as np +import pytest +import torch +import zarr +from click.testing import CliRunner + +from tiatoolbox import cli +from tiatoolbox.annotation import SQLiteStore +from tiatoolbox.models.engine import semantic_segmentor +from tiatoolbox.models.engine.semantic_segmentor import ( + SemanticSegmentor, + merge_vertical_chunkwise, +) +from tiatoolbox.utils import env_detection as toolbox_env +from tiatoolbox.utils.misc import imread +from tiatoolbox.wsicore import WSIReader + +if TYPE_CHECKING: + from collections.abc import Callable + +device = "cuda" if toolbox_env.has_gpu() else "cpu" + + +def test_semantic_segmentor_init() -> None: + """Tests SemanticSegmentor initialization.""" + segmentor = SemanticSegmentor(model="fcn-tissue_mask", device=device) + + assert isinstance(segmentor, SemanticSegmentor) + assert isinstance(segmentor.model, torch.nn.Module) + + +def test_semantic_segmentor_patches( + remote_sample: Callable, track_tmp_path: Path +) -> None: + """Tests SemanticSegmentor on image patches.""" + segmentor = SemanticSegmentor( + model="fcn-tissue_mask", batch_size=32, verbose=False, device=device + ) + + sample_image = remote_sample("thumbnail-1k-1k") + + inputs = [sample_image, sample_image] + + assert not segmentor.patch_mode + + output = segmentor.run( + images=inputs, + return_probabilities=True, + return_labels=False, + device=device, + patch_mode=True, + ) + + assert 0.62 < np.mean(output["predictions"][:]) < 0.66 + assert 0.48 < np.mean(output["probabilities"][:]) < 0.52 + + assert ( + tuple(segmentor._ioconfig.patch_output_shape) + == output["probabilities"][0].shape[:-1] + ) + + assert ( + tuple(segmentor._ioconfig.patch_output_shape) == output["predictions"][0].shape + ) + + output = segmentor.run( + images=inputs, + return_probabilities=True, + return_labels=False, + device=device, + patch_mode=True, + save_dir=track_tmp_path / "output0", + ) + + assert output == track_tmp_path / "output0" / "output.zarr" + + output = zarr.open(output, mode="r") + assert 0.62 < np.mean(output["predictions"][:]) < 0.66 + assert 0.48 < np.mean(output["probabilities"][:]) < 0.52 + + output = segmentor.run( + images=inputs, + return_probabilities=False, + return_labels=False, + device=device, + patch_mode=True, + output_type="zarr", + save_dir=track_tmp_path / "output1", + ) + + assert output == track_tmp_path / "output1" / "output.zarr" + + output = zarr.open(output, mode="r") + assert 0.62 < np.mean(output["predictions"][:]) < 0.66 + assert 
"probabilities" not in output.keys() # noqa: SIM118 + + output = segmentor.run( + images=inputs, + return_probabilities=False, + return_labels=False, + device=device, + patch_mode=True, + save_dir=track_tmp_path / "output2", + output_type="zarr", + ) + + assert output == track_tmp_path / "output2" / "output.zarr" + + output = zarr.open(output, mode="r") + assert 0.62 < np.mean(output["predictions"][:]) < 0.66 + assert "probabilities" not in output + assert "predictions" in output + + +def _test_store_output_patch(output: Path) -> None: + """Helper method to test annotation store output for a patch.""" + store_ = SQLiteStore.open(output) + annotations_ = store_.values() + annotations_geometry_type = [ + str(annotation_.geometry_type) for annotation_ in annotations_ + ] + assert "Polygon" in annotations_geometry_type + + con = sqlite3.connect(output) + cur = con.cursor() + annotations_properties = list(cur.execute("SELECT properties FROM annotations")) + + out = [] + + for item in annotations_properties: + for json_str in item: + probs = json.loads(json_str) + if "type" in probs: + out.append(probs.pop("type")) + + assert "mask" in out + + assert annotations_properties is not None + + +def test_save_annotation_store(remote_sample: Callable, track_tmp_path: Path) -> None: + """Test for saving output as annotation store.""" + segmentor = SemanticSegmentor( + model="fcn-tissue_mask", batch_size=32, verbose=False, device=device + ) + + # Test str input + sample_image = remote_sample("thumbnail-1k-1k") + + inputs = [str(sample_image)] + + output = segmentor.run( + images=inputs, + return_probabilities=False, + return_labels=False, + device=device, + patch_mode=True, + save_dir=track_tmp_path / "output1", + output_type="annotationstore", + verbose=True, + ) + + assert output[0] == track_tmp_path / "output1" / (sample_image.stem + ".db") + assert len(output) == 1 + _test_store_output_patch(output[0]) + + +def test_save_annotation_store_nparray( + remote_sample: Callable, track_tmp_path: Path, caplog: pytest.LogCaptureFixture +) -> None: + """Test for saving output as annotation store using a numpy array.""" + segmentor = SemanticSegmentor( + model="fcn-tissue_mask", batch_size=32, verbose=False, device=device + ) + + sample_image = remote_sample("thumbnail-1k-1k") + + input_image = imread(sample_image) + inputs_list = np.array([input_image, input_image]) + + output = segmentor.run( + images=inputs_list, + return_probabilities=True, + return_labels=False, + device=device, + patch_mode=True, + save_dir=track_tmp_path / "output1", + output_type="annotationstore", + ) + + assert output[0] == track_tmp_path / "output1" / "0.db" + assert output[1] == track_tmp_path / "output1" / "1.db" + + assert (track_tmp_path / "output1" / "output.zarr").exists() + + zarr_group = zarr.open(str(track_tmp_path / "output1" / "output.zarr"), mode="r") + assert "probabilities" in zarr_group + + assert "Probability maps cannot be saved as AnnotationStore." 
+
+    _test_store_output_patch(output[0])
+    _test_store_output_patch(output[1])
+
+    output = segmentor.run(
+        images=inputs_list,
+        return_probabilities=False,
+        return_labels=False,
+        device=device,
+        patch_mode=True,
+        save_dir=track_tmp_path / "output2",
+        output_type="annotationstore",
+    )
+
+    assert output[0] == track_tmp_path / "output2" / "0.db"
+    assert output[1] == track_tmp_path / "output2" / "1.db"
+    assert not (track_tmp_path / "output2" / "output.zarr").exists()
+
+    assert len(output) == 2
+
+    _test_store_output_patch(output[0])
+    _test_store_output_patch(output[1])
+
+
+def test_non_overlapping_blocks() -> None:
+    """Test for non-overlapping merge to canvas."""
+    blocks = np.array([np.ones((2, 2, 1)), np.ones((2, 2, 1)) * 2])
+    output_locations = np.array([[0, 0, 2, 2], [2, 0, 4, 2]])
+    merged_shape = (2, 4, 1)
+    canvas, count = semantic_segmentor.merge_batch_to_canvas(
+        blocks, output_locations, merged_shape
+    )
+    assert np.array_equal(canvas[:, :2, :], np.ones((2, 2, 1)))
+    assert np.array_equal(canvas[:, 2:, :], np.ones((2, 2, 1)) * 2)
+    assert np.array_equal(count, np.ones((2, 4, 1)))
+
+
+def test_overlapping_blocks() -> None:
+    """Test for overlapping merge to canvas."""
+    blocks = np.array([np.ones((2, 2, 1)), np.ones((2, 2, 1)) * 3])
+    output_locations = np.array([[0, 0, 2, 2], [1, 0, 3, 2]])
+    merged_shape = (2, 3, 1)
+    canvas, count = semantic_segmentor.merge_batch_to_canvas(
+        blocks, output_locations, merged_shape
+    )
+    expected_canvas = np.array([[[1], [4], [3]], [[1], [4], [3]]])
+    expected_count = np.array([[[1], [2], [1]], [[1], [2], [1]]])
+    assert np.array_equal(canvas, expected_canvas)
+    assert np.array_equal(count, expected_count)
+
+
+def test_zero_block() -> None:
+    """Test for zero merge to canvas."""
+    blocks = np.array([np.zeros((2, 2, 1)), np.ones((2, 2, 1))])
+    output_locations = np.array([[0, 0, 2, 2], [2, 0, 4, 2]])
+    merged_shape = (2, 4, 1)
+    canvas, count = semantic_segmentor.merge_batch_to_canvas(
+        blocks, output_locations, merged_shape
+    )
+    assert np.array_equal(canvas[:, :2, :], np.zeros((2, 2, 1)))
+    assert np.array_equal(canvas[:, 2:, :], np.ones((2, 2, 1)))
+    assert np.array_equal(count[:, :2, :], np.zeros((2, 2, 1)))
+    assert np.array_equal(count[:, 2:, :], np.ones((2, 2, 1)))
+
+
+def test_empty_blocks() -> None:
+    """Test for empty merge to canvas."""
+    blocks = np.empty((0, 2, 2, 1))
+    output_locations = np.empty((0, 4))
+    merged_shape = (2, 2, 1)
+    canvas, count = semantic_segmentor.merge_batch_to_canvas(
+        blocks, output_locations, merged_shape
+    )
+    assert np.array_equal(canvas, np.zeros((2, 2, 1)))
+    assert np.array_equal(count, np.zeros((2, 2, 1), dtype=np.uint8))
+
+
+def test_merge_vertical_chunkwise_memory_threshold_triggered() -> None:
+    """Test merge vertical chunkwise for memory threshold."""
+    # Create dummy canvas and count arrays with 3 vertical chunks
+    data = np.ones((30, 10), dtype=np.uint8)
+    canvas = da.from_array(data, chunks=(10, 10))
+    count = da.from_array(data, chunks=(10, 10))
+
+    # Output locations to simulate overlaps
+    output_locs_y_ = np.array([[0, 10], [10, 20], [20, 30]])
+
+    # Temporary Zarr group
+    with tempfile.TemporaryDirectory() as tmpdir:
+        save_path = Path(tmpdir)
+
+        # Mock psutil to simulate low memory
+        with mock.patch(
+            "tiatoolbox.models.engine.semantic_segmentor.psutil.virtual_memory"
+        ) as mock_vm:
+            mock_vm.return_value.free = 1  # Very low free memory
+
+            result = merge_vertical_chunkwise(
+                canvas=canvas,
+                count=count,
+                output_locs_y_=output_locs_y_,
+                zarr_group=None,
zarr_group=None, + save_path=save_path, + memory_threshold=0.01, # Very low threshold to trigger the condition + ) + + # Assertions + assert isinstance(result, da.Array) + assert hasattr(result, "name") + assert result.name.startswith("from-zarr") + assert np.all(result.compute() == data) + + zarr_group = zarr.open(tmpdir, mode="r") + assert np.all(zarr_group["probabilities"][:] == data) + + +def test_raise_value_error_return_labels_wsi( + sample_svs: Path, + track_tmp_path: Path, +) -> None: + """Test for raises value error for return_labels in wsi mode.""" + segmentor = SemanticSegmentor( + model="fcn-tissue_mask", + batch_size=64, + verbose=False, + num_workers=1, + ) + with pytest.raises( + ValueError, + match=r".*return_labels` is not supported when `patch_mode` is False", + ): + _ = segmentor.run( + images=[sample_svs], + return_probabilities=False, + return_labels=True, + device=device, + patch_mode=False, + save_dir=track_tmp_path / "wsi_out_check", + batch_size=2, + output_type="zarr", + ) + + +def test_wsi_segmentor_zarr( + remote_sample: Callable, + sample_svs: Path, + track_tmp_path: Path, +) -> None: + """Test SemanticSegmentor for WSIs with zarr output.""" + wsi1_2k_2k_svs = Path(remote_sample("wsi1_2k_2k_svs")) + + segmentor = SemanticSegmentor( + model="fcn-tissue_mask", + batch_size=64, + verbose=False, + num_workers=1, + ) + # Return Probabilities is False + output = segmentor.run( + images=[sample_svs], + return_probabilities=False, + return_labels=False, + device=device, + patch_mode=False, + save_dir=track_tmp_path / "wsi_out_check", + batch_size=2, + output_type="zarr", + memory_threshold=1, + ) + + output_ = zarr.open(output[sample_svs], mode="r") + assert 0.17 < np.mean(output_["predictions"][:]) < 0.19 + assert "probabilities" not in output_ + assert "canvas" not in output_ + assert "count" not in output_ + + segmentor = SemanticSegmentor( + model="fcn-tissue_mask", + batch_size=64, + verbose=False, + num_workers=1, + ) + # Return Probabilities is True + # Testing with WSIReader + output = segmentor.run( + images=[WSIReader.open(sample_svs)], + return_probabilities=True, + return_labels=False, + device=device, + patch_mode=False, + save_dir=track_tmp_path / "task_length_cache", + batch_size=2, + output_type="zarr", + memory_threshold=1, + ) + + output_ = zarr.open(output[sample_svs], mode="r") + assert 0.17 < np.mean(output_["predictions"][:]) < 0.19 + assert "probabilities" in output_ + assert "canvas" not in output_ + assert "count" not in output_ + + # Return Probabilities is True + # Using small image for faster run + segmentor = SemanticSegmentor( + model="fcn-tissue_mask", + batch_size=32, + verbose=False, + num_workers=1, + ) + segmentor.drop_keys = [] + output = segmentor.run( + images=[sample_svs, wsi1_2k_2k_svs], + return_probabilities=True, + return_labels=False, + device=device, + patch_mode=False, + save_dir=track_tmp_path / "wsi_out_check_prob", + output_type="zarr", + ) + + output_ = zarr.open(output[sample_svs], mode="r") + assert 0.17 < np.mean(output_["predictions"][:]) < 0.19 + assert 0.52 < np.mean(output_["probabilities"][:]) < 0.56 + + output_ = zarr.open(output[wsi1_2k_2k_svs], mode="r") + assert 0.24 < np.mean(output_["predictions"][:]) < 0.25 + assert 0.48 < np.mean(output_["probabilities"][:]) < 0.52 + + +def test_wsi_segmentor_annotationstore( + sample_svs: Path, track_tmp_path: Path, caplog: pytest.CaptureFixture +) -> None: + """Test SemanticSegmentor for WSIs with AnnotationStore output.""" + segmentor = SemanticSegmentor( + 
model="fcn-tissue_mask", + batch_size=32, + verbose=False, + ) + # Return Probabilities is False + output = segmentor.run( + images=[sample_svs], + return_probabilities=False, + return_labels=False, + device=device, + patch_mode=False, + save_dir=track_tmp_path / "wsi_out_check", + verbose=True, + output_type="annotationstore", + ) + + assert output[sample_svs] == track_tmp_path / "wsi_out_check" / ( + sample_svs.stem + ".db" + ) + + # Return Probabilities + segmentor = SemanticSegmentor( + model="fcn-tissue_mask", + batch_size=32, + verbose=False, + ) + # Return Probabilities is False + output = segmentor.run( + images=[sample_svs], + return_probabilities=True, + return_labels=False, + device=device, + patch_mode=False, + save_dir=track_tmp_path / "wsi_prob_out_check", + verbose=True, + output_type="annotationstore", + ) + + assert output[sample_svs] == track_tmp_path / "wsi_prob_out_check" / ( + sample_svs.stem + ".db" + ) + assert output[sample_svs].with_suffix(".zarr").exists() + + zarr_group = zarr.open(output[sample_svs].with_suffix(".zarr"), mode="r") + assert "probabilities" in zarr_group + assert "Probability maps cannot be saved as AnnotationStore." in caplog.text + + +# ------------------------------------------------------------------------------------- +# Command Line Interface +# ------------------------------------------------------------------------------------- + + +def test_cli_model_single_file(sample_svs: Path, track_tmp_path: Path) -> None: + """Test for models CLI single file.""" + runner = CliRunner() + models_wsi_result = runner.invoke( + cli.main, + [ + "semantic-segmentor", + "--img-input", + str(sample_svs), + "--patch-mode", + "False", + "--output-path", + str(track_tmp_path / "output"), + ], + ) + + assert models_wsi_result.exit_code == 0 + assert (track_tmp_path / "output" / (sample_svs.stem + ".db")).exists() diff --git a/tests/models/test_arch_micronet.py b/tests/models/test_arch_micronet.py index 07064db1b..9cc64cc96 100644 --- a/tests/models/test_arch_micronet.py +++ b/tests/models/test_arch_micronet.py @@ -7,7 +7,7 @@ import pytest import torch -from tiatoolbox.models import MicroNet, SemanticSegmentor +from tiatoolbox.models import MicroNet, NucleusInstanceSegmentor from tiatoolbox.models.architecture import fetch_pretrained_weights from tiatoolbox.utils import env_detection as toolbox_env from tiatoolbox.utils.misc import select_device @@ -64,7 +64,7 @@ def test_micronet_output(remote_sample: Callable, track_tmp_path: Path) -> None: num_loader_workers = 0 num_postproc_workers = 0 - predictor = SemanticSegmentor( + predictor = NucleusInstanceSegmentor( pretrained_model=pretrained_model, batch_size=batch_size, num_loader_workers=num_loader_workers, diff --git a/tests/models/test_arch_vanilla.py b/tests/models/test_arch_vanilla.py index a87424dfd..b19fce924 100644 --- a/tests/models/test_arch_vanilla.py +++ b/tests/models/test_arch_vanilla.py @@ -33,7 +33,7 @@ def test_functional() -> None: "mobilenet_v3_large", "mobilenet_v3_small", ] - assert CNNModel.postproc([1, 2]) == 1 + assert CNNModel.postproc(np.array([1, 2])) == 1 b = 4 h = w = 512 @@ -60,7 +60,7 @@ def test_timm_functional() -> None: backbones = [ "efficientnet_b0", ] - assert TimmModel.postproc([1, 2]) == 1 + assert TimmModel.postproc(np.array([1, 2])) == 1 b = 4 h = w = 224 diff --git a/tests/models/test_dataset.py b/tests/models/test_dataset.py index f9fe541df..8d5b250e4 100644 --- a/tests/models/test_dataset.py +++ b/tests/models/test_dataset.py @@ -5,13 +5,25 @@ import shutil from pathlib 
import Path +import cv2 import numpy as np import pytest +import torch from tiatoolbox import rcParam -from tiatoolbox.models.dataset import DatasetInfoABC, KatherPatchDataset, PatchDataset -from tiatoolbox.utils import download_data, unzip_data +from tiatoolbox.models import PatchDataset, WSIPatchDataset +from tiatoolbox.models.dataset import ( + DatasetInfoABC, + KatherPatchDataset, + PatchDatasetABC, + predefined_preproc_func, +) +from tiatoolbox.utils import download_data, imread, imwrite, unzip_data from tiatoolbox.utils import env_detection as toolbox_env +from tiatoolbox.utils.exceptions import DimensionMismatchError +from tiatoolbox.wsicore import WSIReader + +RNG = np.random.default_rng() # Numpy Random Generator class Proto1(DatasetInfoABC): @@ -109,10 +121,424 @@ def test_kather_dataset(track_tmp_path: Path) -> None: assert len(dataset.inputs) == len(dataset.labels) # to actually get the image, we feed it to PatchDataset - actual_ds = PatchDataset(dataset.inputs, dataset.labels) + actual_ds = PatchDataset( + dataset.inputs, dataset.labels, patch_input_shape=(224, 224) + ) sample_patch = actual_ds[89] assert isinstance(sample_patch["image"], np.ndarray) assert sample_patch["label"] is not None # remove generated data shutil.rmtree(save_dir_path, ignore_errors=True) + + +def test_incorrect_input_shape() -> None: + """Incorrect input patch dimensions should raise DimensionMismatchError.""" + size = (5, 5, 3) + img = RNG.integers(low=0, high=255, size=size) + list_imgs = [img, img, img] + dataset = PatchDataset(list_imgs, patch_input_shape=(100, 100)) + with pytest.raises( + DimensionMismatchError, match=r".*\(100, 100\), but got \(5, 5\).*" + ): + _ = dataset[0] + + +def test_patch_dataset_path_imgs( + sample_patch1: str | Path, + sample_patch2: str | Path, +) -> None: + """Test for patch dataset with a list of file paths as input.""" + size = (224, 224, 3) + + dataset = PatchDataset( + [Path(sample_patch1), Path(sample_patch2)], patch_input_shape=size[:-1] + ) + + for _, sample_data in enumerate(dataset): + sampled_img_shape = sample_data["image"].shape + assert sampled_img_shape[0] == size[0] + assert sampled_img_shape[1] == size[1] + assert sampled_img_shape[2] == size[2] + + +def test_patch_dataset_list_imgs(track_tmp_path: Path) -> None: + """Test for patch dataset with a list of images as input.""" + save_dir_path = track_tmp_path + + size = (5, 5, 3) + img = RNG.integers(low=0, high=255, size=size) + list_imgs = [img, img, img] + dataset = PatchDataset(list_imgs, patch_input_shape=size[:-1]) + + dataset.preproc_func = lambda x: x + + for _, sample_data in enumerate(dataset): + sampled_img_shape = sample_data["image"].shape + assert sampled_img_shape[0] == size[0] + assert sampled_img_shape[1] == size[1] + assert sampled_img_shape[2] == size[2] + + # test for changing to another preproc + dataset.preproc_func = lambda x: x - 10 + item = dataset[0] + assert np.sum(item["image"] - (list_imgs[0] - 10)) == 0 + + # * test for loading npy + # remove previously generated data + if Path.exists(save_dir_path): + shutil.rmtree(save_dir_path, ignore_errors=True) + Path.mkdir(save_dir_path, parents=True) + np.save( + str(save_dir_path / "sample2.npy"), + RNG.integers(0, 255, (4, 4, 3)), + ) + imgs = [ + save_dir_path / "sample2.npy", + ] + _ = PatchDataset(imgs) + assert imgs[0] is not None + # test for path object + imgs = [ + save_dir_path / "sample2.npy", + ] + _ = PatchDataset(imgs) + + +def test_patch_datasetarray_imgs() -> None: + """Test for patch dataset with a numpy array of a 
list of images.""" + size = (5, 5, 3) + img = RNG.integers(0, 255, size=size) + list_imgs = [img, img, img] + labels = [1, 2, 3] + array_imgs = np.array(list_imgs) + + # test different setter for label + dataset = PatchDataset(array_imgs, labels=labels, patch_input_shape=(5, 5)) + an_item = dataset[2] + assert an_item["label"] == 3 + dataset = PatchDataset(array_imgs, labels=None, patch_input_shape=(5, 5)) + an_item = dataset[2] + assert "label" not in an_item + + dataset = PatchDataset(array_imgs, patch_input_shape=size[:-1]) + for _, sample_data in enumerate(dataset): + sampled_img_shape = sample_data["image"].shape + assert sampled_img_shape[0] == size[0] + assert sampled_img_shape[1] == size[1] + assert sampled_img_shape[2] == size[2] + + +def test_patch_dataset_crash(track_tmp_path: Path) -> None: + """Test to make sure patch dataset crashes with incorrect input.""" + # all below examples should fail when input to PatchDataset + save_dir_path = track_tmp_path + + # not supported input type + imgs = {"a": RNG.integers(0, 255, (4, 4, 4))} + with pytest.raises( + ValueError, + match=r".*Input must be either a list/array of images.*", + ): + _ = PatchDataset(imgs) + + # ndarray of mixed dtype + imgs = np.array( + # string array of the same shape + [ + RNG.integers(0, 255, (4, 5, 3)), + np.array( # skipcq: PYL-E1121 + ["PatchDataset should crash here" for _ in range(4 * 5 * 3)], + ).reshape( + 4, + 5, + 3, + ), + ], + dtype=object, + ) + with pytest.raises(ValueError, match=r"Provided input array is non-numerical."): + _ = PatchDataset(imgs) + + # ndarray(s) of NHW images + imgs = RNG.integers(0, 255, (4, 4, 4)) + with pytest.raises(ValueError, match=r".*array of the form HWC*"): + _ = PatchDataset(imgs) + + # list of ndarray(s) with different sizes + imgs = [ + RNG.integers(0, 255, (4, 4, 3)), + RNG.integers(0, 255, (4, 5, 3)), + ] + with pytest.raises(ValueError, match=r"Images must have the same dimensions."): + _ = PatchDataset(imgs) + + # list of ndarray(s) with HW and HWC mixed up + imgs = [ + RNG.integers(0, 255, (4, 4, 3)), + RNG.integers(0, 255, (4, 4)), + ] + with pytest.raises( + ValueError, + match=r"Each sample must be an array of the form HWC.", + ): + _ = PatchDataset(imgs) + + # list of mixed dtype + imgs = [RNG.integers(0, 255, (4, 4, 3)), "you_should_crash_here", 123, 456] + with pytest.raises( + ValueError, + match=r"Input must be either a list/array of images or a list of " + "valid image paths.", + ): + _ = PatchDataset(imgs) + + # list of mixed dtype + imgs = ["you_should_crash_here", 123, 456] + with pytest.raises( + ValueError, + match=r"Input must be either a list/array of images or a list of " + "valid image paths.", + ): + _ = PatchDataset(imgs) + + # list not exist paths + with pytest.raises( + ValueError, + match=r".*valid image paths.*", + ): + _ = PatchDataset(["img.npy"]) + + # ** test different extension parser + # save dummy data to temporary location + # remove prev generated data + shutil.rmtree(save_dir_path, ignore_errors=True) + save_dir_path.mkdir(parents=True) + + torch.save({"a": "a"}, save_dir_path / "sample1.tar") + np.save( + str(save_dir_path / "sample2.npy"), + RNG.integers(0, 255, (4, 4, 3)), + ) + + imgs = [ + save_dir_path / "sample1.tar", + save_dir_path / "sample2.npy", + ] + with pytest.raises( + TypeError, + match="Cannot load image data from", + ): + _ = PatchDataset(imgs) + + # preproc func for not defined dataset + with pytest.raises( + ValueError, + match=r".* preprocessing .* does not exist.", + ): + 
predefined_preproc_func("secret-dataset") + + +def test_wsi_patch_dataset( # noqa: PLR0915 + sample_wsi_dict: dict, + track_tmp_path: Path, +) -> None: + """A test for creation and bare output.""" + # convert to pathlib Path to prevent wsireader complaint + mini_wsi_svs = Path(sample_wsi_dict["wsi2_4k_4k_svs"]) + mini_wsi_msk = Path(sample_wsi_dict["wsi2_4k_4k_msk"]) + + def reuse_init(img_path: Path = mini_wsi_svs, **kwargs: dict) -> WSIPatchDataset: + """Testing function.""" + return WSIPatchDataset(input_img=img_path, **kwargs) + + def reuse_init_wsi(**kwargs: dict) -> WSIPatchDataset: + """Testing function.""" + return reuse_init(**kwargs) + + # test for ABC validate + # intentionally created to check error + # skipcq + class Proto(PatchDatasetABC): + def __init__(self: Proto) -> None: + super().__init__() + self.inputs = "CRASH" + self._check_input_integrity("wsi") + + # skipcq + def __getitem__(self: Proto, idx: int) -> object: + """Get an item from the dataset.""" + + with pytest.raises( + ValueError, + match=r".*`inputs` should be a list of patch coordinates.*", + ): + Proto() # skipcq + + # invalid path input + with pytest.raises(ValueError, match=r".*`input_img` must be a valid file path.*"): + WSIPatchDataset( + input_img="aaaa", + patch_input_shape=[512, 512], + stride_shape=[256, 256], + auto_get_mask=False, + ) + + # invalid mask path input + with pytest.raises(ValueError, match=r".*`mask_path` must be a valid file path.*"): + WSIPatchDataset( + input_img=mini_wsi_svs, + mask_path="aaaa", + patch_input_shape=[512, 512], + stride_shape=[256, 256], + resolution=1.0, + units="mpp", + auto_get_mask=False, + ) + + # invalid patch + with pytest.raises(ValueError, match=r"Invalid `patch_input_shape` value None."): + reuse_init() + with pytest.raises( + ValueError, + match=r"Invalid `patch_input_shape` value \[512 512 512\].", + ): + reuse_init_wsi(patch_input_shape=[512, 512, 512]) + with pytest.raises( + ValueError, + match=r"Invalid `patch_input_shape` value \['512' 'a'\].", + ): + reuse_init_wsi(patch_input_shape=[512, "a"]) + with pytest.raises(ValueError, match=r"Invalid `stride_shape` value None."): + reuse_init_wsi(patch_input_shape=512) + # invalid stride + with pytest.raises( + ValueError, + match=r"Invalid `stride_shape` value \['512' 'a'\].", + ): + reuse_init_wsi(patch_input_shape=[512, 512], stride_shape=[512, "a"]) + with pytest.raises( + ValueError, + match=r"Invalid `stride_shape` value \[512 512 512\].", + ): + reuse_init_wsi(patch_input_shape=[512, 512], stride_shape=[512, 512, 512]) + # negative + with pytest.raises( + ValueError, + match=r"Invalid `patch_input_shape` value \[ 512 -512\].", + ): + reuse_init_wsi(patch_input_shape=[512, -512], stride_shape=[512, 512]) + with pytest.raises( + ValueError, + match=r"Invalid `stride_shape` value \[ 512 -512\].", + ): + reuse_init_wsi(patch_input_shape=[512, 512], stride_shape=[512, -512]) + + # * for wsi + # dummy test for analysing the output + # stride and patch size should be as expected + patch_size = (512, 512) + stride_size = (256, 256) + ds = WSIPatchDataset( + input_img=WSIReader.open(mini_wsi_svs), + patch_input_shape=patch_size, + stride_shape=stride_size, + resolution=1.0, + units="mpp", + auto_get_mask=False, + ) + reader = WSIReader.open(mini_wsi_svs) + # tiling top to bottom, left to right + ds_roi = ds[2]["image"] + step_idx = 2 # manually calibrate + start = (step_idx * stride_size[1], 0) + end = (start[0] + patch_size[0], start[1] + patch_size[1]) + rd_roi = reader.read_bounds( + start + end, + 
resolution=1.0, + units="mpp", + coord_space="resolution", + ) + correlation = np.corrcoef( + cv2.cvtColor(ds_roi, cv2.COLOR_RGB2GRAY).flatten(), + cv2.cvtColor(rd_roi, cv2.COLOR_RGB2GRAY).flatten(), + ) + assert ds_roi.shape[0] == rd_roi.shape[0] + assert ds_roi.shape[1] == rd_roi.shape[1] + assert np.min(correlation) > 0.9, correlation + + # test creation with auto mask gen and input mask + ds = WSIPatchDataset( + input_img=mini_wsi_svs, + patch_input_shape=patch_size, + stride_shape=stride_size, + resolution=1.0, + units="mpp", + auto_get_mask=True, + ) + assert len(ds) > 0 + _ = WSIPatchDataset( + input_img=mini_wsi_svs, + mask_path=mini_wsi_msk, + patch_input_shape=(512, 512), + stride_shape=(256, 256), + auto_get_mask=False, + resolution=1.0, + units="mpp", + ) + negative_mask = imread(mini_wsi_msk) + negative_mask = np.zeros_like(negative_mask) + negative_mask_path = track_tmp_path / "negative_mask.png" + imwrite(negative_mask_path, negative_mask) + with pytest.raises(ValueError, match="No patch coordinates remain after filtering"): + _ = WSIPatchDataset( + input_img=mini_wsi_svs, + mask_path=negative_mask_path, + patch_input_shape=(512, 512), + stride_shape=(256, 256), + auto_get_mask=False, + resolution=1.0, + units="mpp", + ) + + +def test_patch_dataset_abc() -> None: + """Test for ABC methods. + + Test missing definition for abstract intentionally created to check error. + + """ + + # skipcq + class Proto(PatchDatasetABC): + # skipcq + def __init__(self: Proto) -> None: + super().__init__() + + # crash due to undefined __getitem__ + with pytest.raises(TypeError): + Proto() # skipcq + + # skipcq + class Proto(PatchDatasetABC): + # skipcq + def __init__(self: Proto) -> None: + super().__init__() + + # skipcq + def __getitem__(self: Proto, idx: int) -> None: + """Get an item from the dataset.""" + + ds = Proto() # skipcq + + # test setter and getter + assert ds.preproc_func(1) == 1 + ds.preproc_func = lambda x: x - 1 # skipcq: PYL-W0201 + assert ds.preproc_func(1) == 0 + assert ds.preproc(1) == 1, "Must be unchanged!" 
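+    # Assigning None falls back to the identity default, as asserted below.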
+ ds.preproc_func = None # skipcq: PYL-W0201 + assert ds.preproc_func(2) == 2 + + # test assign uncallable to preproc_func/postproc_func + with pytest.raises(ValueError, match=r".*callable*"): + ds.preproc_func = 1 # skipcq: PYL-W0201 diff --git a/tests/models/test_feature_extractor.py b/tests/models/test_feature_extractor.py deleted file mode 100644 index a5d7bb96b..000000000 --- a/tests/models/test_feature_extractor.py +++ /dev/null @@ -1,164 +0,0 @@ -"""Test for feature extractor.""" - -import shutil -from collections.abc import Callable -from pathlib import Path - -import numpy as np -import pytest -import torch - -from tiatoolbox.models.architecture.vanilla import CNNBackbone, TimmBackbone -from tiatoolbox.models.engine.semantic_segmentor import ( - DeepFeatureExtractor, - IOSegmentorConfig, -) -from tiatoolbox.utils import env_detection as toolbox_env -from tiatoolbox.utils.misc import select_device -from tiatoolbox.wsicore.wsireader import WSIReader - -ON_GPU = not toolbox_env.running_on_ci() and toolbox_env.has_gpu() - -# ------------------------------------------------------------------------------------- -# Engine -# ------------------------------------------------------------------------------------- - - -def test_engine(remote_sample: Callable, track_tmp_path: Path) -> None: - """Test feature extraction with DeepFeatureExtractor engine.""" - save_dir = track_tmp_path / "output" - # # convert to pathlib Path to prevent wsireader complaint - mini_wsi_svs = Path(remote_sample("wsi4_1k_1k_svs")) - - # * test providing pretrained from torch vs pretrained_model.yaml - shutil.rmtree(save_dir, ignore_errors=True) # default output dir test - extractor = DeepFeatureExtractor(batch_size=1, pretrained_model="fcn-tissue_mask") - output_list = extractor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - wsi_0_root_path = output_list[0][1] - positions = np.load(f"{wsi_0_root_path}.position.npy") - features = np.load(f"{wsi_0_root_path}.features.0.npy") - assert len(positions.shape) == 2 - assert len(features.shape) == 4 - - # * test same output between full infer and engine - # pre-emptive clean up - shutil.rmtree(save_dir, ignore_errors=True) # default output dir test - - -@pytest.mark.parametrize( - "model", [CNNBackbone("resnet50"), TimmBackbone("efficientnet_b0", pretrained=True)] -) -def test_full_inference( - remote_sample: Callable, track_tmp_path: Path, model: Callable -) -> None: - """Test full inference with CNNBackbone and TimmBackbone models.""" - save_dir = track_tmp_path / "output" - # pre-emptive clean up - shutil.rmtree(save_dir, ignore_errors=True) # default output dir test - - mini_wsi_svs = Path(remote_sample("wsi4_1k_1k_svs")) - - ioconfig = IOSegmentorConfig( - input_resolutions=[ - {"units": "mpp", "resolution": 0.25}, - ], - output_resolutions=[ - {"units": "mpp", "resolution": 0.25}, - ], - patch_input_shape=[512, 512], - patch_output_shape=[512, 512], - stride_shape=[256, 256], - save_resolution={"units": "mpp", "resolution": 8.0}, - ) - - extractor = DeepFeatureExtractor(batch_size=4, model=model) - # should still run because we skip exception - output_list = extractor.predict( - [mini_wsi_svs], - mode="wsi", - ioconfig=ioconfig, - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - wsi_0_root_path = output_list[0][1] - positions = np.load(f"{wsi_0_root_path}.position.npy") - features = np.load(f"{wsi_0_root_path}.features.0.npy") - - reader = 
WSIReader.open(mini_wsi_svs) - patches = [ - reader.read_bounds( - positions[patch_idx], - resolution=0.25, - units="mpp", - pad_constant_values=0, - coord_space="resolution", - ) - for patch_idx in range(4) - ] - patches = np.array(patches) - patches = torch.from_numpy(patches) # NHWC - patches = patches.permute(0, 3, 1, 2) # NCHW - patches = patches.type(torch.float32) - model = model.to("cpu") - # Inference mode - model.eval() - with torch.inference_mode(): - _features = model(patches).numpy() - # ! must maintain same batch size and likely same ordering - # ! else the output values will not exactly be the same (still < 1.0e-4 - # ! of epsilon though) - assert np.mean(np.abs(features[:4] - _features)) < 1.0e-1 - - -@pytest.mark.skipif( - toolbox_env.running_on_ci() or not ON_GPU, - reason="Local test on machine with GPU.", -) -def test_multi_gpu_feature_extraction( - remote_sample: Callable, track_tmp_path: Path -) -> None: - """Local functionality test for feature extraction using multiple GPUs.""" - save_dir = track_tmp_path / "output" - mini_wsi_svs = Path(remote_sample("wsi4_1k_1k_svs")) - shutil.rmtree(save_dir, ignore_errors=True) - - # Use multiple GPUs - device = select_device(on_gpu=ON_GPU) - - wsi_ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": 0.5}], - patch_input_shape=[224, 224], - output_resolutions=[{"units": "mpp", "resolution": 0.5}], - patch_output_shape=[224, 224], - stride_shape=[224, 224], - ) - - model = TimmBackbone(backbone="UNI", pretrained=True) - extractor = DeepFeatureExtractor( - model=model, - auto_generate_mask=True, - batch_size=32, - num_loader_workers=4, - num_postproc_workers=4, - ) - - output_list = extractor.predict( - [mini_wsi_svs], - mode="wsi", - device=device, - ioconfig=wsi_ioconfig, - crash_on_exception=True, - save_dir=save_dir, - ) - wsi_0_root_path = output_list[0][1] - positions = np.load(f"{wsi_0_root_path}.position.npy") - features = np.load(f"{wsi_0_root_path}.features.0.npy") - assert len(positions.shape) == 2 - assert len(features.shape) == 2 diff --git a/tests/models/test_abc.py b/tests/models/test_models_abc.py similarity index 91% rename from tests/models/test_abc.py rename to tests/models/test_models_abc.py index f7a60e34c..4ef3d5666 100644 --- a/tests/models/test_abc.py +++ b/tests/models/test_models_abc.py @@ -70,7 +70,6 @@ def forward(self: Proto) -> None: # skipcq def infer_batch() -> None: """Define infer batch.""" - pass # base class definition pass # noqa: PIE790 @pytest.mark.skipif( @@ -141,16 +140,16 @@ def test_model_abc() -> None: model.postproc_func = None # skipcq: PYL-W0201 assert model.postproc_func(2) == 0 - # Test on CPU - model = model.to(device="cpu") - assert isinstance(model, nn.Module) - assert model.dummy_param.device.type == "cpu" - # Test load_weights_from_file() method weights_path = fetch_pretrained_weights("alexnet-kather100k") with pytest.raises(RuntimeError, match=r".*loading state_dict*"): _ = model.load_weights_from_file(weights_path) + # Test on CPU + model = model.to(device="cpu") + assert isinstance(model, nn.Module) + assert model.dummy_param.device.type == "cpu" + def test_model_to() -> None: """Test for placing model on device.""" @@ -165,3 +164,15 @@ def test_model_to() -> None: model = torch_models.resnet18() model = model_to(device="cpu", model=model) assert isinstance(model, nn.Module) + + +def test_get_pretrained_model_not_str() -> None: + """Test TypeError is raised if input is not str.""" + with pytest.raises(TypeError, match=r"pretrained_model must be a 
string."): + _ = get_pretrained_model(1) + + +def test_get_pretrained_model_not_in_info() -> None: + """Test ValueError is raised if input is not in info.""" + with pytest.raises(ValueError, match=r"Pretrained model `alexnet` does not exist."): + _ = get_pretrained_model("alexnet") diff --git a/tests/models/test_multi_task_segmentor.py b/tests/models/test_multi_task_segmentor.py deleted file mode 100644 index 90f850d6f..000000000 --- a/tests/models/test_multi_task_segmentor.py +++ /dev/null @@ -1,422 +0,0 @@ -"""Unit test package for HoVerNet+.""" - -import copy - -# ! The garbage collector -import gc -import multiprocessing -import shutil -from collections.abc import Callable -from pathlib import Path - -import joblib -import numpy as np -import pytest - -from tiatoolbox.models import IOSegmentorConfig, MultiTaskSegmentor, SemanticSegmentor -from tiatoolbox.utils import env_detection as toolbox_env -from tiatoolbox.utils import imwrite -from tiatoolbox.utils.metrics import f1_detection -from tiatoolbox.utils.misc import select_device - -ON_GPU = toolbox_env.has_gpu() -BATCH_SIZE = 1 if not ON_GPU else 8 # 16 -try: - NUM_POSTPROC_WORKERS = multiprocessing.cpu_count() -except NotImplementedError: - NUM_POSTPROC_WORKERS = 2 - -# ---------------------------------------------------- - - -def _crash_func(_: object) -> None: - """Helper to induce crash.""" - msg = "Propagation Crash." - raise ValueError(msg) - - -def semantic_postproc_func(raw_output: np.ndarray) -> np.ndarray: - """Function to post process semantic segmentations. - - Post processes semantic segmentation to form one map output. - - """ - return np.argmax(raw_output, axis=-1) - - -@pytest.mark.skipif( - toolbox_env.running_on_ci() or not ON_GPU, - reason="Local test on machine with GPU.", -) -def test_functionality_local(remote_sample: Callable, track_tmp_path: Path) -> None: - """Local functionality test for multi task segmentor.""" - gc.collect() - root_save_dir = Path(track_tmp_path) - mini_wsi_svs = Path(remote_sample("svs-1-small")) - save_dir = root_save_dir / "multitask" - shutil.rmtree(save_dir, ignore_errors=True) - - # * generate full output w/o parallel post-processing worker first - multi_segmentor = MultiTaskSegmentor( - pretrained_model="hovernetplus-oed", - batch_size=BATCH_SIZE, - num_postproc_workers=0, - ) - output = multi_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - inst_dict_a = joblib.load(f"{output[0][1]}.0.dat") - - # * then test run when using workers, will then compare results - # * to ensure the predictions are the same - shutil.rmtree(save_dir, ignore_errors=True) - multi_segmentor = MultiTaskSegmentor( - pretrained_model="hovernetplus-oed", - batch_size=BATCH_SIZE, - num_postproc_workers=NUM_POSTPROC_WORKERS, - ) - assert multi_segmentor.num_postproc_workers == NUM_POSTPROC_WORKERS - output = multi_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - inst_dict_b = joblib.load(f"{output[0][1]}.0.dat") - layer_map_b = np.load(f"{output[0][1]}.1.npy") - assert len(inst_dict_b) > 0, "Must have some nuclei" - assert layer_map_b is not None, "Must have some layers." 
- - inst_coords_a = np.array([v["centroid"] for v in inst_dict_a.values()]) - inst_coords_b = np.array([v["centroid"] for v in inst_dict_b.values()]) - score = f1_detection(inst_coords_b, inst_coords_a, radius=1.0) - assert score > 0.95, "Heavy loss of precision!" - - -def test_functionality_hovernetplus( - remote_sample: Callable, track_tmp_path: Path -) -> None: - """Functionality test for multitask segmentor.""" - root_save_dir = Path(track_tmp_path) - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - required_dims = (258, 258) - # above image is 512 x 512 at 0.252 mpp resolution. This is 258 x 258 at 0.500 mpp. - - save_dir = f"{root_save_dir}/multi/" - shutil.rmtree(save_dir, ignore_errors=True) - - multi_segmentor = MultiTaskSegmentor( - pretrained_model="hovernetplus-oed", - batch_size=BATCH_SIZE, - num_postproc_workers=NUM_POSTPROC_WORKERS, - ) - output = multi_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - inst_dict = joblib.load(f"{output[0][1]}.0.dat") - layer_map = np.load(f"{output[0][1]}.1.npy") - - assert len(inst_dict) > 0, "Must have some nuclei." - assert layer_map is not None, "Must have some layers." - assert layer_map.shape == required_dims, ( - "Output layer map dimensions must be same as the expected output shape" - ) - - -def test_functionality_hovernet(remote_sample: Callable, track_tmp_path: Path) -> None: - """Functionality test for multitask segmentor.""" - root_save_dir = Path(track_tmp_path) - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - - save_dir = root_save_dir / "multi" - shutil.rmtree(save_dir, ignore_errors=True) - - multi_segmentor = MultiTaskSegmentor( - pretrained_model="hovernet_fast-pannuke", - batch_size=BATCH_SIZE, - num_postproc_workers=NUM_POSTPROC_WORKERS, - ) - output = multi_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - inst_dict = joblib.load(f"{output[0][1]}.0.dat") - - assert len(inst_dict) > 0, "Must have some nuclei." 
- - -def test_masked_segmentor(remote_sample: Callable, track_tmp_path: Path) -> None: - """Test segmentor when image is masked.""" - root_save_dir = Path(track_tmp_path) - sample_wsi_svs = Path(remote_sample("svs-1-small")) - sample_wsi_msk = remote_sample("small_svs_tissue_mask") - sample_wsi_msk = np.load(sample_wsi_msk).astype(np.uint8) - imwrite(f"{track_tmp_path}/small_svs_tissue_mask.jpg", sample_wsi_msk) - sample_wsi_msk = track_tmp_path.joinpath("small_svs_tissue_mask.jpg") - - save_dir = root_save_dir / "instance" - - # resolution for travis testing, not the correct ones - resolution = 4.0 - ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": resolution}], - output_resolutions=[ - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - ], - margin=128, - tile_shape=[512, 512], - patch_input_shape=[256, 256], - patch_output_shape=[164, 164], - stride_shape=[164, 164], - ) - multi_segmentor = MultiTaskSegmentor( - batch_size=BATCH_SIZE, - num_postproc_workers=2, - pretrained_model="hovernet_fast-pannuke", - ) - - output = multi_segmentor.predict( - [sample_wsi_svs], - masks=[sample_wsi_msk], - mode="wsi", - ioconfig=ioconfig, - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - inst_dict = joblib.load(f"{output[0][1]}.0.dat") - - assert len(inst_dict) > 0, "Must have some nuclei." - - -def test_functionality_process_instance_predictions( - remote_sample: Callable, - track_tmp_path: Path, -) -> None: - """Test the functionality of instance predictions processing.""" - root_save_dir = Path(track_tmp_path) - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - - save_dir = root_save_dir / "semantic" - shutil.rmtree(save_dir, ignore_errors=True) - - semantic_segmentor = SemanticSegmentor( - pretrained_model="hovernetplus-oed", - batch_size=BATCH_SIZE, - num_postproc_workers=0, - ) - multi_segmentor = MultiTaskSegmentor( - pretrained_model="hovernetplus-oed", - batch_size=BATCH_SIZE, - num_postproc_workers=0, - ) - - output = semantic_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - raw_maps = [np.load(f"{output[0][1]}.raw.{head_idx}.npy") for head_idx in range(4)] - - dummy_reference = [{i: {"box": np.array([0, 0, 32, 32])} for i in range(1000)}] - - dummy_tiles = [np.zeros((512, 512))] - dummy_bounds = np.array([0, 0, 512, 512]) - - multi_segmentor.wsi_layers = [np.zeros_like(raw_maps[0][..., 0])] - multi_segmentor._wsi_inst_info = copy.deepcopy(dummy_reference) - multi_segmentor._futures = [ - [dummy_reference, [dummy_reference[0].keys()], dummy_tiles, dummy_bounds], - ] - multi_segmentor._merge_post_process_results() - assert len(multi_segmentor._wsi_inst_info[0]) == 0 - - -def test_empty_image(track_tmp_path: Path) -> None: - """Test MultiTaskSegmentor for an empty image.""" - root_save_dir = Path(track_tmp_path) - sample_patch = np.ones((256, 256, 3), dtype="uint8") * 255 - sample_patch_path = root_save_dir / "sample_tile.png" - imwrite(sample_patch_path, sample_patch) - - save_dir = root_save_dir / "hovernetplus" - - multi_segmentor = MultiTaskSegmentor( - pretrained_model="hovernetplus-oed", - batch_size=BATCH_SIZE, - num_postproc_workers=0, - ) - - _ = multi_segmentor.predict( - [sample_patch_path], - mode="tile", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - save_dir = 
root_save_dir / "hovernet" - - multi_segmentor = MultiTaskSegmentor( - pretrained_model="hovernet_fast-pannuke", - batch_size=BATCH_SIZE, - num_postproc_workers=0, - ) - - _ = multi_segmentor.predict( - [sample_patch_path], - mode="tile", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - save_dir = root_save_dir / "semantic" - - multi_segmentor = MultiTaskSegmentor( - pretrained_model="fcn_resnet50_unet-bcss", - batch_size=BATCH_SIZE, - num_postproc_workers=0, - output_types=["semantic"], - ) - - bcc_wsi_ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": 0.25}], - output_resolutions=[{"units": "mpp", "resolution": 0.25}], - tile_shape=2048, - patch_input_shape=[1024, 1024], - patch_output_shape=[512, 512], - stride_shape=[512, 512], - margin=128, - save_resolution={"units": "mpp", "resolution": 2}, - ) - - _ = multi_segmentor.predict( - [sample_patch_path], - mode="tile", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ioconfig=bcc_wsi_ioconfig, - ) - - -def test_functionality_semantic(remote_sample: Callable, track_tmp_path: Path) -> None: - """Functionality test for multitask segmentor.""" - root_save_dir = Path(track_tmp_path) - - save_dir = root_save_dir / "multi" - shutil.rmtree(save_dir, ignore_errors=True) - with pytest.raises( - ValueError, - match=r"Output type must be specified for instance or semantic segmentation.", - ): - MultiTaskSegmentor( - pretrained_model="fcn_resnet50_unet-bcss", - batch_size=BATCH_SIZE, - num_postproc_workers=NUM_POSTPROC_WORKERS, - ) - - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - save_dir = f"{root_save_dir}/multi/" - - multi_segmentor = MultiTaskSegmentor( - pretrained_model="fcn_resnet50_unet-bcss", - batch_size=BATCH_SIZE, - num_postproc_workers=NUM_POSTPROC_WORKERS, - output_types=["semantic"], - ) - - bcc_wsi_ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": 0.25}], - output_resolutions=[{"units": "mpp", "resolution": 0.25}], - tile_shape=2048, - patch_input_shape=[1024, 1024], - patch_output_shape=[512, 512], - stride_shape=[512, 512], - margin=128, - save_resolution={"units": "mpp", "resolution": 2}, - ) - - multi_segmentor.model.postproc_func = semantic_postproc_func - - output = multi_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ioconfig=bcc_wsi_ioconfig, - ) - - layer_map = np.load(f"{output[0][1]}.0.npy") - - assert layer_map is not None, "Must have some segmentations." 
- - -def test_crash_segmentor(remote_sample: Callable, track_tmp_path: Path) -> None: - """Test engine crash when given malformed input.""" - root_save_dir = Path(track_tmp_path) - sample_wsi_svs = Path(remote_sample("svs-1-small")) - sample_wsi_msk = remote_sample("small_svs_tissue_mask") - sample_wsi_msk = np.load(sample_wsi_msk).astype(np.uint8) - imwrite(f"{track_tmp_path}/small_svs_tissue_mask.jpg", sample_wsi_msk) - sample_wsi_msk = track_tmp_path.joinpath("small_svs_tissue_mask.jpg") - - save_dir = f"{root_save_dir}/multi/" - - # resolution for travis testing, not the correct ones - resolution = 4.0 - ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": resolution}], - output_resolutions=[ - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - ], - margin=128, - tile_shape=[512, 512], - patch_input_shape=[256, 256], - patch_output_shape=[164, 164], - stride_shape=[164, 164], - ) - multi_segmentor = MultiTaskSegmentor( - batch_size=BATCH_SIZE, - num_postproc_workers=2, - pretrained_model="hovernetplus-oed", - ) - - # * Test crash propagation when parallelize post-processing - shutil.rmtree(save_dir, ignore_errors=True) - multi_segmentor.model.postproc_func = _crash_func - with pytest.raises(ValueError, match=r"Crash."): - multi_segmentor.predict( - [sample_wsi_svs], - masks=[sample_wsi_msk], - mode="wsi", - ioconfig=ioconfig, - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) diff --git a/tests/models/test_nucleus_instance_segmentor.py b/tests/models/test_nucleus_instance_segmentor.py deleted file mode 100644 index 11f848f3c..000000000 --- a/tests/models/test_nucleus_instance_segmentor.py +++ /dev/null @@ -1,605 +0,0 @@ -"""Test for Nucleus Instance Segmentor.""" - -import copy - -# ! The garbage collector -import gc -import shutil -from collections.abc import Callable -from pathlib import Path - -import joblib -import numpy as np -import pytest -import torch -import yaml -from click.testing import CliRunner - -from tiatoolbox import cli, rcParam -from tiatoolbox.models import ( - IOSegmentorConfig, - NucleusInstanceSegmentor, - SemanticSegmentor, -) -from tiatoolbox.models.architecture import fetch_pretrained_weights -from tiatoolbox.models.engine.nucleus_instance_segmentor import ( - _process_tile_predictions, -) -from tiatoolbox.utils import env_detection as toolbox_env -from tiatoolbox.utils import imwrite -from tiatoolbox.utils.metrics import f1_detection -from tiatoolbox.utils.misc import select_device -from tiatoolbox.wsicore.wsireader import WSIReader - -ON_GPU = toolbox_env.has_gpu() -# The value is based on 2 TitanXP each with 12GB -BATCH_SIZE = 1 if not ON_GPU else 16 - -# ---------------------------------------------------- - - -def _crash_func(_x: object) -> None: - """Helper to induce crash.""" - msg = "Propagation Crash." - raise ValueError(msg) - - -def helper_tile_info() -> list: - """Helper function for tile information.""" - torch._dynamo.reset() - current_torch_compile_mode = rcParam["torch_compile_mode"] - rcParam["torch_compile_mode"] = "disable" - predictor = NucleusInstanceSegmentor(model="A") - torch._dynamo.reset() - rcParam["torch_compile_mode"] = current_torch_compile_mode - # ! assuming the tiles organized as follows (coming out from - # ! PatchExtractor). If this is broken, need to check back - # ! 
PatchExtractor output ordering first - # left to right, top to bottom - # --------------------- - # | 0 | 1 | 2 | 3 | - # --------------------- - # | 4 | 5 | 6 | 7 | - # --------------------- - # | 8 | 9 | 10 | 11 | - # --------------------- - # | 12 | 13 | 14 | 15 | - # --------------------- - # ! assume flag index ordering: left right top bottom - ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": 0.25}], - output_resolutions=[ - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.25}, - ], - margin=1, - tile_shape=[4, 4], - stride_shape=[4, 4], - patch_input_shape=[4, 4], - patch_output_shape=[4, 4], - ) - - return predictor._get_tile_info([16, 16], ioconfig) - - -# ---------------------------------------------------- - - -def test_get_tile_info() -> None: - """Test for getting tile info.""" - info = helper_tile_info() - _, flag = info[0] # index 0 should be full grid, removal - # removal flag at top edges - assert ( - np.sum( - np.nonzero(flag[:, 0]) - != np.array([4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]), - ) - == 0 - ), "Fail Top" - # removal flag at bottom edges - assert ( - np.sum( - np.nonzero(flag[:, 1]) != np.array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11]), - ) - == 0 - ), "Fail Bottom" - # removal flag at left edges - assert ( - np.sum( - np.nonzero(flag[:, 2]) - != np.array([1, 2, 3, 5, 6, 7, 9, 10, 11, 13, 14, 15]), - ) - == 0 - ), "Fail Left" - # removal flag at right edges - assert ( - np.sum( - np.nonzero(flag[:, 3]) - != np.array([0, 1, 2, 4, 5, 6, 8, 9, 10, 12, 13, 14]), - ) - == 0 - ), "Fail Right" - - -def test_vertical_boundary_boxes() -> None: - """Test for vertical boundary boxes.""" - info = helper_tile_info() - _boxes = np.array( - [ - [3, 0, 5, 4], - [7, 0, 9, 4], - [11, 0, 13, 4], - [3, 4, 5, 8], - [7, 4, 9, 8], - [11, 4, 13, 8], - [3, 8, 5, 12], - [7, 8, 9, 12], - [11, 8, 13, 12], - [3, 12, 5, 16], - [7, 12, 9, 16], - [11, 12, 13, 16], - ], - ) - _flag = np.array( - [ - [0, 1, 0, 0], - [0, 1, 0, 0], - [0, 1, 0, 0], - [1, 1, 0, 0], - [1, 1, 0, 0], - [1, 1, 0, 0], - [1, 1, 0, 0], - [1, 1, 0, 0], - [1, 1, 0, 0], - [1, 0, 0, 0], - [1, 0, 0, 0], - [1, 0, 0, 0], - ], - ) - boxes, flag = info[1] - assert np.sum(_boxes - boxes) == 0, "Wrong Vertical Bounds" - assert np.sum(flag - _flag) == 0, "Fail Vertical Flag" - - -def test_horizontal_boundary_boxes() -> None: - """Test for horizontal boundary boxes.""" - info = helper_tile_info() - _boxes = np.array( - [ - [0, 3, 4, 5], - [4, 3, 8, 5], - [8, 3, 12, 5], - [12, 3, 16, 5], - [0, 7, 4, 9], - [4, 7, 8, 9], - [8, 7, 12, 9], - [12, 7, 16, 9], - [0, 11, 4, 13], - [4, 11, 8, 13], - [8, 11, 12, 13], - [12, 11, 16, 13], - ], - ) - _flag = np.array( - [ - [0, 0, 0, 1], - [0, 0, 1, 1], - [0, 0, 1, 1], - [0, 0, 1, 0], - [0, 0, 0, 1], - [0, 0, 1, 1], - [0, 0, 1, 1], - [0, 0, 1, 0], - [0, 0, 0, 1], - [0, 0, 1, 1], - [0, 0, 1, 1], - [0, 0, 1, 0], - ], - ) - boxes, flag = info[2] - assert np.sum(_boxes - boxes) == 0, "Wrong Horizontal Bounds" - assert np.sum(flag - _flag) == 0, "Fail Horizontal Flag" - - -def test_cross_section_boundary_boxes() -> None: - """Test for cross-section boundary boxes.""" - info = helper_tile_info() - _boxes = np.array( - [ - [2, 2, 6, 6], - [6, 2, 10, 6], - [10, 2, 14, 6], - [2, 6, 6, 10], - [6, 6, 10, 10], - [10, 6, 14, 10], - [2, 10, 6, 14], - [6, 10, 10, 14], - [10, 10, 14, 14], - ], - ) - _flag = np.array( - [ - [1, 1, 1, 1], - [1, 1, 1, 1], - [1, 1, 1, 1], - [1, 1, 1, 1], - [1, 1, 1, 1], - [1, 1, 1, 1], - [1, 
1, 1, 1], - [1, 1, 1, 1], - [1, 1, 1, 1], - ], - ) - boxes, flag = info[3] - assert np.sum(boxes - _boxes) == 0, "Wrong Cross Section Bounds" - assert np.sum(flag - _flag) == 0, "Fail Cross Section Flag" - - -def test_crash_segmentor(remote_sample: Callable, track_tmp_path: Path) -> None: - """Test engine crash when given malformed input.""" - root_save_dir = Path(track_tmp_path) - sample_wsi_svs = Path(remote_sample("svs-1-small")) - sample_wsi_msk = remote_sample("small_svs_tissue_mask") - sample_wsi_msk = np.load(sample_wsi_msk).astype(np.uint8) - imwrite(f"{track_tmp_path}/small_svs_tissue_mask.jpg", sample_wsi_msk) - sample_wsi_msk = track_tmp_path.joinpath("small_svs_tissue_mask.jpg") - - save_dir = f"{root_save_dir}/instance/" - - # resolution for travis testing, not the correct ones - resolution = 4.0 - ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": resolution}], - output_resolutions=[ - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - ], - margin=128, - tile_shape=[512, 512], - patch_input_shape=[256, 256], - patch_output_shape=[164, 164], - stride_shape=[164, 164], - ) - instance_segmentor = NucleusInstanceSegmentor( - batch_size=BATCH_SIZE, - num_postproc_workers=2, - pretrained_model="hovernet_fast-pannuke", - ) - - # * Test crash propagation when parallelize post-processing - shutil.rmtree("output", ignore_errors=True) - shutil.rmtree(save_dir, ignore_errors=True) - instance_segmentor.model.postproc_func = _crash_func - with pytest.raises(ValueError, match=r"Propagation Crash."): - instance_segmentor.predict( - [sample_wsi_svs], - masks=[sample_wsi_msk], - mode="wsi", - ioconfig=ioconfig, - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - -def test_functionality_ci(remote_sample: Callable, track_tmp_path: Path) -> None: - """Functionality test for nuclei instance segmentor.""" - gc.collect() - root_save_dir = Path(track_tmp_path) - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - - resolution = 2.0 - - reader = WSIReader.open(mini_wsi_svs) - thumb = reader.slide_thumbnail(resolution=resolution, units="mpp") - mini_wsi_jpg = f"{track_tmp_path}/mini_svs.jpg" - imwrite(mini_wsi_jpg, thumb) - - save_dir = f"{root_save_dir}/instance/" - - # * test run on wsi, test run with worker - # resolution for travis testing, not the correct ones - ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": resolution}], - output_resolutions=[ - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - ], - margin=128, - tile_shape=[1024, 1024], - patch_input_shape=[256, 256], - patch_output_shape=[164, 164], - stride_shape=[164, 164], - ) - - shutil.rmtree(save_dir, ignore_errors=True) - - inst_segmentor = NucleusInstanceSegmentor( - batch_size=1, - num_loader_workers=0, - num_postproc_workers=0, - pretrained_model="hovernet_fast-pannuke", - ) - inst_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - ioconfig=ioconfig, - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - - -def test_functionality_merge_tile_predictions_ci( - remote_sample: Callable, - track_tmp_path: Path, -) -> None: - """Functional tests for merging tile predictions.""" - gc.collect() # Force clean up everything on hold - save_dir = Path(f"{track_tmp_path}/output") - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - - resolution = 0.5 - ioconfig = 
IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": resolution}], - output_resolutions=[ - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - ], - margin=128, - tile_shape=[512, 512], - patch_input_shape=[256, 256], - patch_output_shape=[164, 164], - stride_shape=[164, 164], - ) - - # mainly to hook the merge prediction function - inst_segmentor = NucleusInstanceSegmentor( - batch_size=BATCH_SIZE, - num_postproc_workers=0, - pretrained_model="hovernet_fast-pannuke", - ) - - shutil.rmtree(save_dir, ignore_errors=True) - semantic_segmentor = SemanticSegmentor( - pretrained_model="hovernet_fast-pannuke", - batch_size=BATCH_SIZE, - num_postproc_workers=0, - ) - - output = semantic_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - ioconfig=ioconfig, - crash_on_exception=True, - save_dir=save_dir, - ) - raw_maps = [np.load(f"{output[0][1]}.raw.{head_idx}.npy") for head_idx in range(3)] - raw_maps = [[v] for v in raw_maps] # mask it as patch output - - dummy_reference = {i: {"box": np.array([0, 0, 32, 32])} for i in range(1000)} - dummy_flag_mode_list = [ - [[1, 1, 0, 0], 1], - [[0, 0, 1, 1], 2], - [[1, 1, 1, 1], 3], - [[0, 0, 0, 0], 0], - ] - - inst_segmentor._wsi_inst_info = copy.deepcopy(dummy_reference) - inst_segmentor._futures = [[dummy_reference, dummy_reference.keys()]] - inst_segmentor._merge_post_process_results() - assert len(inst_segmentor._wsi_inst_info) == 0 - - blank_raw_maps = [np.zeros_like(v) for v in raw_maps] - _process_tile_predictions( - ioconfig=ioconfig, - tile_bounds=np.array([0, 0, 512, 512]), - tile_flag=dummy_flag_mode_list[0][0], - tile_mode=dummy_flag_mode_list[0][1], - tile_output=[[np.array([0, 0, 512, 512]), blank_raw_maps]], - ref_inst_dict=dummy_reference, - postproc=semantic_segmentor.model.postproc_func, - merge_predictions=semantic_segmentor.merge_prediction, - ) - - for tile_flag, tile_mode in dummy_flag_mode_list: - _process_tile_predictions( - ioconfig=ioconfig, - tile_bounds=np.array([0, 0, 512, 512]), - tile_flag=tile_flag, - tile_mode=tile_mode, - tile_output=[[np.array([0, 0, 512, 512]), raw_maps]], - ref_inst_dict=dummy_reference, - postproc=semantic_segmentor.model.postproc_func, - merge_predictions=semantic_segmentor.merge_prediction, - ) - - # test exception flag - tile_flag = [0, 0, 0, 0] - with pytest.raises(ValueError, match=r".*Unknown tile mode.*"): - _process_tile_predictions( - ioconfig=ioconfig, - tile_bounds=np.array([0, 0, 512, 512]), - tile_flag=tile_flag, - tile_mode=-1, - tile_output=[[np.array([0, 0, 512, 512]), raw_maps]], - ref_inst_dict=dummy_reference, - postproc=semantic_segmentor.model.postproc_func, - merge_predictions=semantic_segmentor.merge_prediction, - ) - - -@pytest.mark.skipif( - toolbox_env.running_on_ci() or not ON_GPU, - reason="Local test on machine with GPU.", -) -def test_functionality_local(remote_sample: Callable, track_tmp_path: Path) -> None: - """Local functionality test for nuclei instance segmentor.""" - root_save_dir = Path(track_tmp_path) - save_dir = Path(f"{track_tmp_path}/output") - mini_wsi_svs = Path(remote_sample("wsi4_1k_1k_svs")) - - # * generate full output w/o parallel post-processing worker first - shutil.rmtree(save_dir, ignore_errors=True) - inst_segmentor = NucleusInstanceSegmentor( - batch_size=8, - num_postproc_workers=0, - pretrained_model="hovernet_fast-pannuke", - ) - output = inst_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - 
device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - inst_dict_a = joblib.load(f"{output[0][1]}.dat") - - # * then test run when using workers, will then compare results - # * to ensure the predictions are the same - shutil.rmtree(save_dir, ignore_errors=True) - inst_segmentor = NucleusInstanceSegmentor( - pretrained_model="hovernet_fast-pannuke", - batch_size=BATCH_SIZE, - num_postproc_workers=2, - ) - assert inst_segmentor.num_postproc_workers == 2 - output = inst_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - inst_dict_b = joblib.load(f"{output[0][1]}.dat") - inst_coords_a = np.array([v["centroid"] for v in inst_dict_a.values()]) - inst_coords_b = np.array([v["centroid"] for v in inst_dict_b.values()]) - score = f1_detection(inst_coords_b, inst_coords_a, radius=1.0) - assert score > 0.95, "Heavy loss of precision!" - - # ** - # To evaluate the precision of doing post-processing on tile - # then re-assemble without using full image prediction maps, - # we compare its output with the output when doing - # post-processing on the entire images. - save_dir = root_save_dir / "semantic" - shutil.rmtree(save_dir, ignore_errors=True) - semantic_segmentor = SemanticSegmentor( - pretrained_model="hovernet_fast-pannuke", - batch_size=BATCH_SIZE, - num_postproc_workers=2, - ) - output = semantic_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir, - ) - raw_maps = [np.load(f"{output[0][1]}.raw.{head_idx}.npy") for head_idx in range(3)] - _, inst_dict_b = semantic_segmentor.model.postproc(raw_maps) - - inst_coords_a = np.array([v["centroid"] for v in inst_dict_a.values()]) - inst_coords_b = np.array([v["centroid"] for v in inst_dict_b.values()]) - score = f1_detection(inst_coords_b, inst_coords_a, radius=1.0) - assert score > 0.9, "Heavy loss of precision!" 
- - -def test_cli_nucleus_instance_segment_ioconfig( - remote_sample: Callable, - track_tmp_path: Path, -) -> None: - """Test for nucleus segmentation with IOConfig.""" - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - output_path = track_tmp_path / "output" - - resolution = 2.0 - - reader = WSIReader.open(mini_wsi_svs) - thumb = reader.slide_thumbnail(resolution=resolution, units="mpp") - mini_wsi_jpg = f"{track_tmp_path}/mini_svs.jpg" - imwrite(mini_wsi_jpg, thumb) - - pretrained_weights = fetch_pretrained_weights("hovernet_fast-pannuke") - - # resolution for travis testing, not the correct ones - config = { - "input_resolutions": [{"units": "mpp", "resolution": resolution}], - "output_resolutions": [ - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - {"units": "mpp", "resolution": resolution}, - ], - "margin": 128, - "tile_shape": [512, 512], - "patch_input_shape": [256, 256], - "patch_output_shape": [164, 164], - "stride_shape": [164, 164], - "save_resolution": {"units": "mpp", "resolution": 8.0}, - } - - with Path.open(track_tmp_path / "config.yaml", "w") as fptr: - yaml.dump(config, fptr) - - runner = CliRunner() - nucleus_instance_segment_result = runner.invoke( - cli.main, - [ - "nucleus-instance-segment", - "--img-input", - str(mini_wsi_jpg), - "--pretrained-weights", - str(pretrained_weights), - "--num-loader-workers", - str(0), - "--num-postproc-workers", - str(0), - "--mode", - "tile", - "--output-path", - str(output_path), - "--yaml-config-path", - str(track_tmp_path.joinpath("config.yaml")), - ], - ) - - assert nucleus_instance_segment_result.exit_code == 0 - assert output_path.joinpath("0.dat").exists() - assert output_path.joinpath("file_map.dat").exists() - assert output_path.joinpath("results.json").exists() - - -def test_cli_nucleus_instance_segment( - remote_sample: Callable, track_tmp_path: Path -) -> None: - """Test for nucleus segmentation.""" - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - output_path = track_tmp_path / "output" - - runner = CliRunner() - nucleus_instance_segment_result = runner.invoke( - cli.main, - [ - "nucleus-instance-segment", - "--img-input", - str(mini_wsi_svs), - "--mode", - "wsi", - "--num-loader-workers", - str(0), - "--num-postproc-workers", - str(0), - "--output-path", - str(output_path), - ], - ) - - assert nucleus_instance_segment_result.exit_code == 0 - assert output_path.joinpath("0.dat").exists() - assert output_path.joinpath("file_map.dat").exists() - assert output_path.joinpath("results.json").exists() diff --git a/tests/models/test_patch_predictor.py b/tests/models/test_patch_predictor.py deleted file mode 100644 index 535a841db..000000000 --- a/tests/models/test_patch_predictor.py +++ /dev/null @@ -1,1292 +0,0 @@ -"""Test for Patch Predictor.""" - -from __future__ import annotations - -import copy -import shutil -from pathlib import Path -from typing import TYPE_CHECKING - -import cv2 -import numpy as np -import pytest -import torch -from click.testing import CliRunner - -from tests.conftest import timed -from tiatoolbox import cli, logger, rcParam -from tiatoolbox.models import IOPatchPredictorConfig, PatchPredictor -from tiatoolbox.models.architecture.vanilla import CNNModel -from tiatoolbox.models.dataset import ( - PatchDataset, - PatchDatasetABC, - WSIPatchDataset, - predefined_preproc_func, -) -from tiatoolbox.utils import download_data, imread, imwrite -from tiatoolbox.utils import env_detection as toolbox_env -from tiatoolbox.utils.misc import select_device 
-from tiatoolbox.wsicore.wsireader import WSIReader - -if TYPE_CHECKING: - from collections.abc import Callable - -ON_GPU = toolbox_env.has_gpu() -RNG = np.random.default_rng() # Numpy Random Generator - -# ------------------------------------------------------------------------------------- -# Dataloader -# ------------------------------------------------------------------------------------- - - -def test_patch_dataset_path_imgs( - sample_patch1: str | Path, - sample_patch2: str | Path, -) -> None: - """Test for patch dataset with a list of file paths as input.""" - size = (224, 224, 3) - - dataset = PatchDataset([Path(sample_patch1), Path(sample_patch2)]) - - for _, sample_data in enumerate(dataset): - sampled_img_shape = sample_data["image"].shape - assert sampled_img_shape[0] == size[0] - assert sampled_img_shape[1] == size[1] - assert sampled_img_shape[2] == size[2] - - -def test_patch_dataset_list_imgs(track_tmp_path: Path) -> None: - """Test for patch dataset with a list of images as input.""" - save_dir_path = track_tmp_path - - size = (5, 5, 3) - img = RNG.integers(low=0, high=255, size=size) - list_imgs = [img, img, img] - dataset = PatchDataset(list_imgs) - - dataset.preproc_func = lambda x: x - - for _, sample_data in enumerate(dataset): - sampled_img_shape = sample_data["image"].shape - assert sampled_img_shape[0] == size[0] - assert sampled_img_shape[1] == size[1] - assert sampled_img_shape[2] == size[2] - - # test for changing to another preproc - dataset.preproc_func = lambda x: x - 10 - item = dataset[0] - assert np.sum(item["image"] - (list_imgs[0] - 10)) == 0 - - # * test for loading npy - # remove previously generated data - if Path.exists(save_dir_path): - shutil.rmtree(save_dir_path, ignore_errors=True) - Path.mkdir(save_dir_path, parents=True) - np.save( - str(save_dir_path / "sample2.npy"), - RNG.integers(0, 255, (4, 4, 3)), - ) - imgs = [ - save_dir_path / "sample2.npy", - ] - _ = PatchDataset(imgs) - assert imgs[0] is not None - # test for path object - imgs = [ - save_dir_path / "sample2.npy", - ] - _ = PatchDataset(imgs) - - -def test_patch_datasetarray_imgs() -> None: - """Test for patch dataset with a numpy array of a list of images.""" - size = (5, 5, 3) - img = RNG.integers(0, 255, size=size) - list_imgs = [img, img, img] - labels = [1, 2, 3] - array_imgs = np.array(list_imgs) - - # test different setter for label - dataset = PatchDataset(array_imgs, labels=labels) - an_item = dataset[2] - assert an_item["label"] == 3 - dataset = PatchDataset(array_imgs, labels=None) - an_item = dataset[2] - assert "label" not in an_item - - dataset = PatchDataset(array_imgs) - for _, sample_data in enumerate(dataset): - sampled_img_shape = sample_data["image"].shape - assert sampled_img_shape[0] == size[0] - assert sampled_img_shape[1] == size[1] - assert sampled_img_shape[2] == size[2] - - -def test_patch_dataset_crash(track_tmp_path: Path) -> None: - """Test to make sure patch dataset crashes with incorrect input.""" - # all below examples should fail when input to PatchDataset - save_dir_path = track_tmp_path - - # not supported input type - imgs = {"a": RNG.integers(0, 255, (4, 4, 4))} - with pytest.raises( - ValueError, - match=r".*Input must be either a list/array of images.*", - ): - _ = PatchDataset(imgs) - - # ndarray of mixed dtype - imgs = np.array( - # string array of the same shape - [ - RNG.integers(0, 255, (4, 5, 3)), - np.array( # skipcq: PYL-E1121 - ["you_should_crash_here" for _ in range(4 * 5 * 3)], - ).reshape( - 4, - 5, - 3, - ), - ], - dtype=object, - 
) - with pytest.raises(ValueError, match=r"Provided input array is non-numerical."): - _ = PatchDataset(imgs) - - # ndarray(s) of NHW images - imgs = RNG.integers(0, 255, (4, 4, 4)) - with pytest.raises(ValueError, match=r".*array of the form HWC*"): - _ = PatchDataset(imgs) - - # list of ndarray(s) with different sizes - imgs = [ - RNG.integers(0, 255, (4, 4, 3)), - RNG.integers(0, 255, (4, 5, 3)), - ] - with pytest.raises(ValueError, match=r"Images must have the same dimensions."): - _ = PatchDataset(imgs) - - # list of ndarray(s) with HW and HWC mixed up - imgs = [ - RNG.integers(0, 255, (4, 4, 3)), - RNG.integers(0, 255, (4, 4)), - ] - with pytest.raises( - ValueError, - match=r"Each sample must be an array of the form HWC.", - ): - _ = PatchDataset(imgs) - - # list of mixed dtype - imgs = [RNG.integers(0, 255, (4, 4, 3)), "you_should_crash_here", 123, 456] - with pytest.raises( - ValueError, - match=r"Input must be either a list/array of images or a list of " - "valid image paths.", - ): - _ = PatchDataset(imgs) - - # list of mixed dtype - imgs = ["you_should_crash_here", 123, 456] - with pytest.raises( - ValueError, - match=r"Input must be either a list/array of images or a list of " - "valid image paths.", - ): - _ = PatchDataset(imgs) - - # list not exist paths - with pytest.raises( - ValueError, - match=r".*valid image paths.*", - ): - _ = PatchDataset(["img.npy"]) - - # ** test different extension parser - # save dummy data to temporary location - # remove prev generated data - shutil.rmtree(save_dir_path, ignore_errors=True) - save_dir_path.mkdir(parents=True) - - torch.save({"a": "a"}, save_dir_path / "sample1.tar") - np.save( - str(save_dir_path / "sample2.npy"), - RNG.integers(0, 255, (4, 4, 3)), - ) - - imgs = [ - save_dir_path / "sample1.tar", - save_dir_path / "sample2.npy", - ] - with pytest.raises( - ValueError, - match="Cannot load image data from", - ): - _ = PatchDataset(imgs) - - # preproc func for not defined dataset - with pytest.raises( - ValueError, - match=r".* preprocessing .* does not exist.", - ): - predefined_preproc_func("secret-dataset") - - -def test_wsi_patch_dataset( # noqa: PLR0915 - sample_wsi_dict: dict, - track_tmp_path: Path, -) -> None: - """A test for creation and bare output.""" - # convert to pathlib Path to prevent wsireader complaint - mini_wsi_svs = Path(sample_wsi_dict["wsi2_4k_4k_svs"]) - mini_wsi_jpg = Path(sample_wsi_dict["wsi2_4k_4k_jpg"]) - mini_wsi_msk = Path(sample_wsi_dict["wsi2_4k_4k_msk"]) - - def reuse_init(img_path: Path = mini_wsi_svs, **kwargs: dict) -> WSIPatchDataset: - """Testing function.""" - return WSIPatchDataset(img_path=img_path, **kwargs) - - def reuse_init_wsi(**kwargs: dict) -> WSIPatchDataset: - """Testing function.""" - return reuse_init(mode="wsi", **kwargs) - - # test for ABC validate - # intentionally created to check error - # skipcq - class Proto(PatchDatasetABC): - def __init__(self: Proto) -> None: - super().__init__() - self.inputs = "CRASH" - self._check_input_integrity("wsi") - - # skipcq - def __getitem__(self: Proto, idx: int) -> object: - """Get an item from the dataset.""" - - with pytest.raises( - ValueError, - match=r".*`inputs` should be a list of patch coordinates.*", - ): - Proto() # skipcq - - # invalid path input - with pytest.raises(ValueError, match=r".*`img_path` must be a valid file path.*"): - WSIPatchDataset( - img_path="aaaa", - mode="wsi", - patch_input_shape=[512, 512], - stride_shape=[256, 256], - auto_get_mask=False, - ) - - # invalid mask path input - with 
pytest.raises(ValueError, match=r".*`mask_path` must be a valid file path.*"): - WSIPatchDataset( - img_path=mini_wsi_svs, - mask_path="aaaa", - mode="wsi", - patch_input_shape=[512, 512], - stride_shape=[256, 256], - resolution=1.0, - units="mpp", - auto_get_mask=False, - ) - - # invalid mode - with pytest.raises(ValueError, match=r"`X` is not supported."): - reuse_init(mode="X") - - # invalid patch - with pytest.raises(ValueError, match=r"Invalid `patch_input_shape` value None."): - reuse_init() - with pytest.raises( - ValueError, - match=r"Invalid `patch_input_shape` value \[512 512 512\].", - ): - reuse_init_wsi(patch_input_shape=[512, 512, 512]) - with pytest.raises( - ValueError, - match=r"Invalid `patch_input_shape` value \['512' 'a'\].", - ): - reuse_init_wsi(patch_input_shape=[512, "a"]) - with pytest.raises(ValueError, match=r"Invalid `stride_shape` value None."): - reuse_init_wsi(patch_input_shape=512) - # invalid stride - with pytest.raises( - ValueError, - match=r"Invalid `stride_shape` value \['512' 'a'\].", - ): - reuse_init_wsi(patch_input_shape=[512, 512], stride_shape=[512, "a"]) - with pytest.raises( - ValueError, - match=r"Invalid `stride_shape` value \[512 512 512\].", - ): - reuse_init_wsi(patch_input_shape=[512, 512], stride_shape=[512, 512, 512]) - # negative - with pytest.raises( - ValueError, - match=r"Invalid `patch_input_shape` value \[ 512 -512\].", - ): - reuse_init_wsi(patch_input_shape=[512, -512], stride_shape=[512, 512]) - with pytest.raises( - ValueError, - match=r"Invalid `stride_shape` value \[ 512 -512\].", - ): - reuse_init_wsi(patch_input_shape=[512, 512], stride_shape=[512, -512]) - - # * for wsi - # dummy test for analysing the output - # stride and patch size should be as expected - patch_size = [512, 512] - stride_size = [256, 256] - ds = reuse_init_wsi( - patch_input_shape=patch_size, - stride_shape=stride_size, - resolution=1.0, - units="mpp", - auto_get_mask=False, - ) - reader = WSIReader.open(mini_wsi_svs) - # tiling top to bottom, left to right - ds_roi = ds[2]["image"] - step_idx = 2 # manually calibrate - start = (step_idx * stride_size[1], 0) - end = (start[0] + patch_size[0], start[1] + patch_size[1]) - rd_roi = reader.read_bounds( - start + end, - resolution=1.0, - units="mpp", - coord_space="resolution", - ) - correlation = np.corrcoef( - cv2.cvtColor(ds_roi, cv2.COLOR_RGB2GRAY).flatten(), - cv2.cvtColor(rd_roi, cv2.COLOR_RGB2GRAY).flatten(), - ) - assert ds_roi.shape[0] == rd_roi.shape[0] - assert ds_roi.shape[1] == rd_roi.shape[1] - assert np.min(correlation) > 0.9, correlation - - # test creation with auto mask gen and input mask - ds = reuse_init_wsi( - patch_input_shape=patch_size, - stride_shape=stride_size, - resolution=1.0, - units="mpp", - auto_get_mask=True, - ) - assert len(ds) > 0 - ds = WSIPatchDataset( - img_path=mini_wsi_svs, - mask_path=mini_wsi_msk, - mode="wsi", - patch_input_shape=[512, 512], - stride_shape=[256, 256], - auto_get_mask=False, - resolution=1.0, - units="mpp", - ) - negative_mask = imread(mini_wsi_msk) - negative_mask = np.zeros_like(negative_mask) - negative_mask_path = track_tmp_path / "negative_mask.png" - imwrite(negative_mask_path, negative_mask) - with pytest.raises(ValueError, match="No patch coordinates remain after filtering"): - ds = WSIPatchDataset( - img_path=mini_wsi_svs, - mask_path=negative_mask_path, - mode="wsi", - patch_input_shape=[512, 512], - stride_shape=[256, 256], - auto_get_mask=False, - resolution=1.0, - units="mpp", - ) - - # * for tile - reader = WSIReader.open(mini_wsi_jpg) 
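# The correlation assertions in this test reduce each pair of patches to
# grayscale and compare them with np.corrcoef, which returns a 2x2 Pearson
# matrix whose off-diagonal entry is the similarity score. A minimal,
# self-contained sketch of the same check (illustrative arrays only, not
# part of the toolbox API):
#
#     import cv2
#     import numpy as np
#
#     rng = np.random.default_rng(0)
#     patch_a = rng.integers(0, 255, (224, 224, 3)).astype(np.uint8)
#     noise = rng.integers(-2, 3, patch_a.shape)
#     patch_b = np.clip(patch_a.astype(np.int16) + noise, 0, 255).astype(np.uint8)
#     correlation = np.corrcoef(
#         cv2.cvtColor(patch_a, cv2.COLOR_RGB2GRAY).flatten(),
#         cv2.cvtColor(patch_b, cv2.COLOR_RGB2GRAY).flatten(),
#     )
#     # Diagonal entries are 1.0; min() picks out the cross-correlation term,
#     # which stays close to 1.0 for near-identical patches.
#     assert correlation.min() > 0.9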
- tile_ds = WSIPatchDataset( - img_path=mini_wsi_jpg, - mode="tile", - patch_input_shape=patch_size, - stride_shape=stride_size, - auto_get_mask=False, - ) - step_idx = 3 # manually calibrate - start = (step_idx * stride_size[1], 0) - end = (start[0] + patch_size[0], start[1] + patch_size[1]) - roi2 = reader.read_bounds( - start + end, - resolution=1.0, - units="baseline", - coord_space="resolution", - ) - roi1 = tile_ds[3]["image"] # match with step_index - correlation = np.corrcoef( - cv2.cvtColor(roi1, cv2.COLOR_RGB2GRAY).flatten(), - cv2.cvtColor(roi2, cv2.COLOR_RGB2GRAY).flatten(), - ) - assert roi1.shape[0] == roi2.shape[0] - assert roi1.shape[1] == roi2.shape[1] - assert np.min(correlation) > 0.9, correlation - - -def test_patch_dataset_abc() -> None: - """Test for ABC methods. - - Test missing definition for abstract intentionally created to check error. - - """ - - # skipcq - class Proto(PatchDatasetABC): - # skipcq - def __init__(self: Proto) -> None: - super().__init__() - - # crash due to undefined __getitem__ - with pytest.raises(TypeError): - Proto() # skipcq - - # skipcq - class Proto(PatchDatasetABC): - # skipcq - def __init__(self: Proto) -> None: - super().__init__() - - # skipcq - def __getitem__(self: Proto, idx: int) -> None: - """Get an item from the dataset.""" - - ds = Proto() # skipcq - - # test setter and getter - assert ds.preproc_func(1) == 1 - ds.preproc_func = lambda x: x - 1 # skipcq: PYL-W0201 - assert ds.preproc_func(1) == 0 - assert ds.preproc(1) == 1, "Must be unchanged!" - ds.preproc_func = None # skipcq: PYL-W0201 - assert ds.preproc_func(2) == 2 - - # test assign uncallable to preproc_func/postproc_func - with pytest.raises(ValueError, match=r".*callable*"): - ds.preproc_func = 1 # skipcq: PYL-W0201 - - -# ------------------------------------------------------------------------------------- -# Dataloader -# ------------------------------------------------------------------------------------- - - -def test_io_patch_predictor_config() -> None: - """Test for IOConfig.""" - # test for creating - cfg = IOPatchPredictorConfig( - patch_input_shape=[224, 224], - stride_shape=[224, 224], - input_resolutions=[{"resolution": 0.5, "units": "mpp"}], - # test adding random kwarg and they should be accessible as kwargs - crop_from_source=True, - ) - assert cfg.crop_from_source - - -# ------------------------------------------------------------------------------------- -# Engine -# ------------------------------------------------------------------------------------- - - -def test_predictor_crash(track_tmp_path: Path) -> None: - """Test for crash when making predictor.""" - # without providing any model - with pytest.raises(ValueError, match=r"Must provide.*"): - PatchPredictor() - - # provide wrong unknown pretrained model - with pytest.raises(ValueError, match=r"Pretrained .* does not exist"): - PatchPredictor(pretrained_model="secret_model-kather100k") - - # provide wrong model of unknown type, deprecated later with type hint - with pytest.raises(TypeError, match=r".*must be a string.*"): - PatchPredictor(pretrained_model=123) - - # test predict crash - predictor = PatchPredictor(pretrained_model="resnet18-kather100k", batch_size=32) - - with pytest.raises(ValueError, match=r".*not a valid mode.*"): - predictor.predict("aaa", mode="random", save_dir=track_tmp_path) - # remove previously generated data - shutil.rmtree(track_tmp_path / "output", ignore_errors=True) - with pytest.raises(TypeError, match=r".*must be a list of file paths.*"): - predictor.predict("aaa", 
mode="wsi", save_dir=track_tmp_path) - # remove previously generated data - shutil.rmtree(track_tmp_path / "output", ignore_errors=True) - with pytest.raises(ValueError, match=r".*masks.*!=.*imgs.*"): - predictor.predict([1, 2, 3], masks=[1, 2], mode="wsi", save_dir=track_tmp_path) - with pytest.raises(ValueError, match=r".*labels.*!=.*imgs.*"): - predictor.predict( - [1, 2, 3], labels=[1, 2], mode="patch", save_dir=track_tmp_path - ) - # remove previously generated data - shutil.rmtree(track_tmp_path / "output", ignore_errors=True) - - -def test_io_config_delegation(remote_sample: Callable, track_tmp_path: Path) -> None: - """Test for delegating args to io config.""" - mini_wsi_svs = Path(remote_sample("wsi2_4k_4k_svs")) - - # test not providing config / full input info for not pretrained models - model = CNNModel("resnet50") - predictor = PatchPredictor(model=model) - with pytest.raises(ValueError, match=r".*Must provide.*`ioconfig`.*"): - predictor.predict([mini_wsi_svs], mode="wsi", save_dir=track_tmp_path / "dump") - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - kwargs = { - "patch_input_shape": [512, 512], - "resolution": 1.75, - "units": "mpp", - } - for key in kwargs: - _kwargs = copy.deepcopy(kwargs) - _kwargs.pop(key) - with pytest.raises(ValueError, match=r".*Must provide.*`ioconfig`.*"): - predictor.predict( - [mini_wsi_svs], - mode="wsi", - save_dir=f"{track_tmp_path}/dump", - device=select_device(on_gpu=ON_GPU), - **_kwargs, - ) - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - # test providing config / full input info for not pretrained models - ioconfig = IOPatchPredictorConfig( - patch_input_shape=(512, 512), - stride_shape=(256, 256), - input_resolutions=[{"resolution": 1.35, "units": "mpp"}], - ) - predictor.predict( - [mini_wsi_svs], - ioconfig=ioconfig, - mode="wsi", - save_dir=f"{track_tmp_path}/dump", - device=select_device(on_gpu=ON_GPU), - ) - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - predictor.predict( - [mini_wsi_svs], - mode="wsi", - save_dir=f"{track_tmp_path}/dump", - device=select_device(on_gpu=ON_GPU), - **kwargs, - ) - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - # test overwriting pretrained ioconfig - predictor = PatchPredictor(pretrained_model="resnet18-kather100k", batch_size=1) - predictor.predict( - [mini_wsi_svs], - patch_input_shape=(300, 300), - mode="wsi", - device=select_device(on_gpu=ON_GPU), - save_dir=f"{track_tmp_path}/dump", - ) - assert predictor._ioconfig.patch_input_shape == (300, 300) - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - predictor.predict( - [mini_wsi_svs], - stride_shape=(300, 300), - mode="wsi", - device=select_device(on_gpu=ON_GPU), - save_dir=f"{track_tmp_path}/dump", - ) - assert predictor._ioconfig.stride_shape == (300, 300) - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - predictor.predict( - [mini_wsi_svs], - resolution=1.99, - mode="wsi", - device=select_device(on_gpu=ON_GPU), - save_dir=f"{track_tmp_path}/dump", - ) - assert predictor._ioconfig.input_resolutions[0]["resolution"] == 1.99 - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - predictor.predict( - [mini_wsi_svs], - units="baseline", - mode="wsi", - device=select_device(on_gpu=ON_GPU), - save_dir=f"{track_tmp_path}/dump", - ) - assert predictor._ioconfig.input_resolutions[0]["units"] == "baseline" - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - predictor = PatchPredictor(pretrained_model="resnet18-kather100k") - 
predictor.predict( - [mini_wsi_svs], - mode="wsi", - merge_predictions=True, - save_dir=f"{track_tmp_path}/dump", - device=select_device(on_gpu=ON_GPU), - ) - shutil.rmtree(track_tmp_path / "dump", ignore_errors=True) - - -def test_patch_predictor_api( - sample_patch1: Path, - sample_patch2: Path, - track_tmp_path: Path, -) -> None: - """Helper function to get the model output using API 1.""" - save_dir_path = track_tmp_path - - # convert to pathlib Path to prevent reader complaint - inputs = [Path(sample_patch1), Path(sample_patch2)] - predictor = PatchPredictor(pretrained_model="resnet18-kather100k", batch_size=1) - # don't run test on GPU - output = predictor.predict( - inputs, - device=select_device(on_gpu=ON_GPU), - save_dir=save_dir_path, - ) - assert sorted(output.keys()) == ["predictions"] - assert len(output["predictions"]) == 2 - shutil.rmtree(save_dir_path, ignore_errors=True) - - output = predictor.predict( - inputs, - labels=[1, "a"], - return_labels=True, - device=select_device(on_gpu=ON_GPU), - save_dir=save_dir_path, - ) - assert sorted(output.keys()) == sorted(["labels", "predictions"]) - assert len(output["predictions"]) == len(output["labels"]) - assert output["labels"] == [1, "a"] - shutil.rmtree(save_dir_path, ignore_errors=True) - - output = predictor.predict( - inputs, - return_probabilities=True, - device=select_device(on_gpu=ON_GPU), - save_dir=save_dir_path, - ) - assert sorted(output.keys()) == sorted(["predictions", "probabilities"]) - assert len(output["predictions"]) == len(output["probabilities"]) - shutil.rmtree(save_dir_path, ignore_errors=True) - - output = predictor.predict( - inputs, - return_probabilities=True, - labels=[1, "a"], - return_labels=True, - device=select_device(on_gpu=ON_GPU), - save_dir=save_dir_path, - ) - assert sorted(output.keys()) == sorted(["labels", "predictions", "probabilities"]) - assert len(output["predictions"]) == len(output["labels"]) - assert len(output["predictions"]) == len(output["probabilities"]) - - # test saving output, should have no effect - _ = predictor.predict( - inputs, - device=select_device(on_gpu=ON_GPU), - save_dir="special_dir_not_exist", - ) - assert not Path.is_dir(Path("special_dir_not_exist")) - - # test loading user weight - pretrained_weights_url = ( - "https://tiatoolbox.dcs.warwick.ac.uk/models/pc/resnet18-kather100k.pth" - ) - - # remove prev generated data - shutil.rmtree(save_dir_path, ignore_errors=True) - save_dir_path.mkdir(parents=True) - pretrained_weights = ( - save_dir_path / "tmp_pretrained_weigths" / "resnet18-kather100k.pth" - ) - - download_data(pretrained_weights_url, pretrained_weights) - - _ = PatchPredictor( - pretrained_model="resnet18-kather100k", - pretrained_weights=pretrained_weights, - batch_size=1, - ) - - # --- test different using user model - model = CNNModel(backbone="resnet18", num_classes=9) - # test prediction - predictor = PatchPredictor(model=model, batch_size=1, verbose=False) - output = predictor.predict( - inputs, - return_probabilities=True, - labels=[1, "a"], - return_labels=True, - device=select_device(on_gpu=ON_GPU), - save_dir=save_dir_path, - ) - assert sorted(output.keys()) == sorted(["labels", "predictions", "probabilities"]) - assert len(output["predictions"]) == len(output["labels"]) - assert len(output["predictions"]) == len(output["probabilities"]) - - -def test_wsi_predictor_api( - sample_wsi_dict: dict, - track_tmp_path: Path, - chdir: Callable, -) -> None: - """Test normal run of wsi predictor.""" - save_dir_path = track_tmp_path - - # convert to 
pathlib Path to prevent wsireader complaint - mini_wsi_svs = Path(sample_wsi_dict["wsi2_4k_4k_svs"]) - mini_wsi_jpg = Path(sample_wsi_dict["wsi2_4k_4k_jpg"]) - mini_wsi_msk = Path(sample_wsi_dict["wsi2_4k_4k_msk"]) - - patch_size = np.array([224, 224]) - predictor = PatchPredictor(pretrained_model="resnet18-kather100k", batch_size=32) - - save_dir = f"{save_dir_path}/model_wsi_output" - - # wrapper to make this more clean - kwargs = { - "return_probabilities": True, - "return_labels": True, - "device": select_device(on_gpu=ON_GPU), - "patch_input_shape": patch_size, - "stride_shape": patch_size, - "resolution": 1.0, - "units": "baseline", - "save_dir": save_dir, - } - # ! add this test back once the read at `baseline` is fixed - # sanity check, both output should be the same with same resolution read args - wsi_output = predictor.predict( - [mini_wsi_svs], - masks=[mini_wsi_msk], - mode="wsi", - **kwargs, - ) - - shutil.rmtree(save_dir, ignore_errors=True) - - tile_output = predictor.predict( - [mini_wsi_jpg], - masks=[mini_wsi_msk], - mode="tile", - **kwargs, - ) - - wpred = np.array(wsi_output[0]["predictions"]) - tpred = np.array(tile_output[0]["predictions"]) - diff = tpred == wpred - accuracy = np.sum(diff) / np.size(wpred) - assert accuracy > 0.9, np.nonzero(~diff) - - # remove previously generated data - shutil.rmtree(save_dir, ignore_errors=True) - - kwargs = { - "return_probabilities": True, - "return_labels": True, - "device": select_device(on_gpu=ON_GPU), - "patch_input_shape": patch_size, - "stride_shape": patch_size, - "resolution": 0.5, - "save_dir": save_dir, - "merge_predictions": True, # to test the api coverage - "units": "mpp", - } - - _kwargs = copy.deepcopy(kwargs) - _kwargs["merge_predictions"] = False - # test reading of multiple whole-slide images - output = predictor.predict( - [mini_wsi_svs, mini_wsi_svs], - masks=[mini_wsi_msk, mini_wsi_msk], - mode="wsi", - **_kwargs, - ) - for output_info in output.values(): - assert Path(output_info["raw"]).exists() - assert "merged" not in output_info - shutil.rmtree(_kwargs["save_dir"], ignore_errors=True) - - # coverage test - _kwargs = copy.deepcopy(kwargs) - _kwargs["merge_predictions"] = True - # test reading of multiple whole-slide images - predictor.predict( - [mini_wsi_svs, mini_wsi_svs], - masks=[mini_wsi_msk, mini_wsi_msk], - mode="wsi", - **_kwargs, - ) - _kwargs = copy.deepcopy(kwargs) - with pytest.raises(FileExistsError): - predictor.predict( - [mini_wsi_svs, mini_wsi_svs], - masks=[mini_wsi_msk, mini_wsi_msk], - mode="wsi", - **_kwargs, - ) - # remove previously generated data - shutil.rmtree(_kwargs["save_dir"], ignore_errors=True) - - with chdir(save_dir_path): - # test reading of multiple whole-slide images - _kwargs = copy.deepcopy(kwargs) - _kwargs["save_dir"] = None # default coverage - _kwargs["return_probabilities"] = False - output = predictor.predict( - [mini_wsi_svs, mini_wsi_svs], - masks=[mini_wsi_msk, mini_wsi_msk], - mode="wsi", - **_kwargs, - ) - assert Path.exists(Path("output")) - for output_info in output.values(): - assert Path(output_info["raw"]).exists() - assert "merged" in output_info - assert Path(output_info["merged"]).exists() - - # remove previously generated data - shutil.rmtree("output", ignore_errors=True) - - -def test_wsi_predictor_merge_predictions(sample_wsi_dict: dict) -> None: - """Test normal run of wsi predictor with merge predictions option.""" - # convert to pathlib Path to prevent reader complaint - mini_wsi_svs = Path(sample_wsi_dict["wsi2_4k_4k_svs"]) - mini_wsi_jpg = 
Path(sample_wsi_dict["wsi2_4k_4k_jpg"]) - mini_wsi_msk = Path(sample_wsi_dict["wsi2_4k_4k_msk"]) - - # blind test - # pseudo output dict from model with 2 patches - output = { - "resolution": 1.0, - "units": "baseline", - "probabilities": [[0.45, 0.55], [0.90, 0.10]], - "predictions": [1, 0], - "coordinates": [[0, 0, 2, 2], [2, 2, 4, 4]], - } - merged = PatchPredictor.merge_predictions( - np.zeros([4, 4]), - output, - resolution=1.0, - units="baseline", - ) - _merged = np.array([[2, 2, 0, 0], [2, 2, 0, 0], [0, 0, 1, 1], [0, 0, 1, 1]]) - assert np.sum(merged - _merged) == 0 - - # blind test for merging probabilities - merged = PatchPredictor.merge_predictions( - np.zeros([4, 4]), - output, - resolution=1.0, - units="baseline", - return_raw=True, - ) - _merged = np.array( - [ - [0.45, 0.45, 0, 0], - [0.45, 0.45, 0, 0], - [0, 0, 0.90, 0.90], - [0, 0, 0.90, 0.90], - ], - ) - assert merged.shape == (4, 4, 2) - assert np.mean(np.abs(merged[..., 0] - _merged)) < 1.0e-6 - - # integration test - predictor = PatchPredictor(pretrained_model="resnet18-kather100k", batch_size=1) - - kwargs = { - "return_probabilities": True, - "return_labels": True, - "device": select_device(on_gpu=ON_GPU), - "patch_input_shape": np.array([224, 224]), - "stride_shape": np.array([224, 224]), - "resolution": 1.0, - "units": "baseline", - "merge_predictions": True, - } - # sanity check, both output should be the same with same resolution read args - wsi_output = predictor.predict( - [mini_wsi_svs], - masks=[mini_wsi_msk], - mode="wsi", - **kwargs, - ) - - # mock up to change the preproc func and - # force to use the default in merge function - # still should have the same results - kwargs["merge_predictions"] = False - tile_output = predictor.predict( - [mini_wsi_jpg], - masks=[mini_wsi_msk], - mode="tile", - **kwargs, - ) - merged_tile_output = predictor.merge_predictions( - mini_wsi_jpg, - tile_output[0], - resolution=kwargs["resolution"], - units=kwargs["units"], - ) - tile_output.append(merged_tile_output) - - # first make sure nothing breaks with predictions - wpred = np.array(wsi_output[0]["predictions"]) - tpred = np.array(tile_output[0]["predictions"]) - diff = tpred == wpred - accuracy = np.sum(diff) / np.size(wpred) - assert accuracy > 0.9, np.nonzero(~diff) - - merged_wsi = wsi_output[1] - merged_tile = tile_output[1] - # ensure shape of merged predictions of tile and wsi input are the same - assert merged_wsi.shape == merged_tile.shape - # ensure consistent predictions between tile and wsi mode - diff = merged_tile == merged_wsi - accuracy = np.sum(diff) / np.size(merged_wsi) - assert accuracy > 0.9, np.nonzero(~diff) - - -def _test_predictor_output( - inputs: list, - pretrained_model: str, - probabilities_check: list | None = None, - predictions_check: list | None = None, - device: str = select_device(on_gpu=ON_GPU), -) -> None: - """Test the predictions of multiple models included in tiatoolbox.""" - predictor = PatchPredictor( - pretrained_model=pretrained_model, - batch_size=32, - verbose=False, - ) - # don't run test on GPU - output = predictor.predict( - inputs, - return_probabilities=True, - return_labels=False, - device=device, - ) - predictions = output["predictions"] - probabilities = output["probabilities"] - for idx, probabilities_ in enumerate(probabilities): - probabilities_max = max(probabilities_) - assert np.abs(probabilities_max - probabilities_check[idx]) <= 1e-3, ( - pretrained_model, - probabilities_max, - probabilities_check[idx], - predictions[idx], - predictions_check[idx], - ) - assert 
predictions[idx] == predictions_check[idx], ( - pretrained_model, - probabilities_max, - probabilities_check[idx], - predictions[idx], - predictions_check[idx], - ) - - -def test_patch_predictor_kather100k_output( - sample_patch1: Path, - sample_patch2: Path, -) -> None: - """Test the output of patch prediction models on Kather100K dataset.""" - inputs = [Path(sample_patch1), Path(sample_patch2)] - pretrained_info = { - "alexnet-kather100k": [1.0, 0.9999735355377197], - "resnet18-kather100k": [1.0, 0.9999911785125732], - "resnet34-kather100k": [1.0, 0.9979840517044067], - "resnet50-kather100k": [1.0, 0.9999986886978149], - "resnet101-kather100k": [1.0, 0.9999932050704956], - "resnext50_32x4d-kather100k": [1.0, 0.9910059571266174], - "resnext101_32x8d-kather100k": [1.0, 0.9999971389770508], - "wide_resnet50_2-kather100k": [1.0, 0.9953408241271973], - "wide_resnet101_2-kather100k": [1.0, 0.9999831914901733], - "densenet121-kather100k": [1.0, 1.0], - "densenet161-kather100k": [1.0, 0.9999959468841553], - "densenet169-kather100k": [1.0, 0.9999934434890747], - "densenet201-kather100k": [1.0, 0.9999983310699463], - "mobilenet_v2-kather100k": [0.9999998807907104, 0.9999126195907593], - "mobilenet_v3_large-kather100k": [0.9999996423721313, 0.9999878406524658], - "mobilenet_v3_small-kather100k": [0.9999998807907104, 0.9999997615814209], - "googlenet-kather100k": [1.0, 0.9999639987945557], - } - for pretrained_model, expected_prob in pretrained_info.items(): - _test_predictor_output( - inputs, - pretrained_model, - probabilities_check=expected_prob, - predictions_check=[6, 3], - device=select_device(on_gpu=ON_GPU), - ) - # only test 1 on travis to limit runtime - if toolbox_env.running_on_ci(): - break - - -def test_patch_predictor_pcam_output(sample_patch3: Path, sample_patch4: Path) -> None: - """Test the output of patch prediction models on PCam dataset.""" - inputs = [Path(sample_patch3), Path(sample_patch4)] - pretrained_info = { - "alexnet-pcam": [0.999980092048645, 0.9769067168235779], - "resnet18-pcam": [0.999992847442627, 0.9466130137443542], - "resnet34-pcam": [1.0, 0.9976525902748108], - "resnet50-pcam": [0.9999270439147949, 0.9999996423721313], - "resnet101-pcam": [1.0, 0.9997289776802063], - "resnext50_32x4d-pcam": [0.9999996423721313, 0.9984435439109802], - "resnext101_32x8d-pcam": [0.9997072815895081, 0.9969086050987244], - "wide_resnet50_2-pcam": [0.9999837875366211, 0.9959040284156799], - "wide_resnet101_2-pcam": [1.0, 0.9945427179336548], - "densenet121-pcam": [0.9999251365661621, 0.9997479319572449], - "densenet161-pcam": [0.9999969005584717, 0.9662821292877197], - "densenet169-pcam": [0.9999998807907104, 0.9993504881858826], - "densenet201-pcam": [0.9999942779541016, 0.9950824975967407], - "mobilenet_v2-pcam": [0.9999876022338867, 0.9942564368247986], - "mobilenet_v3_large-pcam": [0.9999922513961792, 0.9719613790512085], - "mobilenet_v3_small-pcam": [0.9999963045120239, 0.9747149348258972], - "googlenet-pcam": [0.9999929666519165, 0.8701475858688354], - } - for pretrained_model, expected_prob in pretrained_info.items(): - _test_predictor_output( - inputs, - pretrained_model, - probabilities_check=expected_prob, - predictions_check=[1, 0], - device=select_device(on_gpu=ON_GPU), - ) - # only test 1 on travis to limit runtime - if toolbox_env.running_on_ci(): - break - - -# ------------------------------------------------------------------------------------- -# Command Line Interface -# ------------------------------------------------------------------------------------- - - -def 
test_command_line_models_file_not_found( - sample_svs: Path, track_tmp_path: Path -) -> None: - """Test for models CLI file not found error.""" - runner = CliRunner() - model_file_not_found_result = runner.invoke( - cli.main, - [ - "patch-predictor", - "--img-input", - str(sample_svs)[:-1], - "--file-types", - '"*.ndpi, *.svs"', - "--output-path", - str(track_tmp_path.joinpath("output")), - ], - ) - - assert model_file_not_found_result.output == "" - assert model_file_not_found_result.exit_code == 1 - assert isinstance(model_file_not_found_result.exception, FileNotFoundError) - - -def test_command_line_models_incorrect_mode( - sample_svs: Path, track_tmp_path: Path -) -> None: - """Test for models CLI mode not in wsi, tile.""" - runner = CliRunner() - mode_not_in_wsi_tile_result = runner.invoke( - cli.main, - [ - "patch-predictor", - "--img-input", - str(sample_svs), - "--file-types", - '"*.ndpi, *.svs"', - "--mode", - '"patch"', - "--output-path", - str(track_tmp_path.joinpath("output")), - ], - ) - - assert "Invalid value for '--mode'" in mode_not_in_wsi_tile_result.output - assert mode_not_in_wsi_tile_result.exit_code != 0 - assert isinstance(mode_not_in_wsi_tile_result.exception, SystemExit) - - -def test_cli_model_single_file(sample_svs: Path, track_tmp_path: Path) -> None: - """Test for models CLI single file.""" - runner = CliRunner() - models_wsi_result = runner.invoke( - cli.main, - [ - "patch-predictor", - "--img-input", - str(sample_svs), - "--mode", - "wsi", - "--output-path", - str(track_tmp_path.joinpath("output")), - ], - ) - - assert models_wsi_result.exit_code == 0 - assert track_tmp_path.joinpath("output/0.merged.npy").exists() - assert track_tmp_path.joinpath("output/0.raw.json").exists() - assert track_tmp_path.joinpath("output/results.json").exists() - - -def test_cli_model_single_file_mask( - remote_sample: Callable, track_tmp_path: Path -) -> None: - """Test for models CLI single file with mask.""" - mini_wsi_svs = Path(remote_sample("svs-1-small")) - sample_wsi_msk = remote_sample("small_svs_tissue_mask") - sample_wsi_msk = np.load(sample_wsi_msk).astype(np.uint8) - imwrite(f"{track_tmp_path}/small_svs_tissue_mask.jpg", sample_wsi_msk) - sample_wsi_msk = f"{track_tmp_path}/small_svs_tissue_mask.jpg" - - runner = CliRunner() - models_tiles_result = runner.invoke( - cli.main, - [ - "patch-predictor", - "--img-input", - str(mini_wsi_svs), - "--mode", - "wsi", - "--masks", - str(sample_wsi_msk), - "--output-path", - str(track_tmp_path.joinpath("output")), - ], - ) - - assert models_tiles_result.exit_code == 0 - assert track_tmp_path.joinpath("output/0.merged.npy").exists() - assert track_tmp_path.joinpath("output/0.raw.json").exists() - assert track_tmp_path.joinpath("output/results.json").exists() - - -def test_cli_model_multiple_file_mask( - remote_sample: Callable, track_tmp_path: Path -) -> None: - """Test for models CLI multiple file with mask.""" - mini_wsi_svs = Path(remote_sample("svs-1-small")) - sample_wsi_msk = remote_sample("small_svs_tissue_mask") - sample_wsi_msk = np.load(sample_wsi_msk).astype(np.uint8) - imwrite(f"{track_tmp_path}/small_svs_tissue_mask.jpg", sample_wsi_msk) - mini_wsi_msk = track_tmp_path.joinpath("small_svs_tissue_mask.jpg") - - # Make multiple copies for test - dir_path = track_tmp_path.joinpath("new_copies") - dir_path.mkdir() - - dir_path_masks = track_tmp_path.joinpath("new_copies_masks") - dir_path_masks.mkdir() - - try: - dir_path.joinpath("1_" + mini_wsi_svs.name).symlink_to(mini_wsi_svs) - dir_path.joinpath("2_" + 
mini_wsi_svs.name).symlink_to(mini_wsi_svs)
-        dir_path.joinpath("3_" + mini_wsi_svs.name).symlink_to(mini_wsi_svs)
-    except OSError:
-        shutil.copy(mini_wsi_svs, dir_path.joinpath("1_" + mini_wsi_svs.name))
-        shutil.copy(mini_wsi_svs, dir_path.joinpath("2_" + mini_wsi_svs.name))
-        shutil.copy(mini_wsi_svs, dir_path.joinpath("3_" + mini_wsi_svs.name))
-
-    try:
-        dir_path_masks.joinpath("1_" + mini_wsi_msk.name).symlink_to(mini_wsi_msk)
-        dir_path_masks.joinpath("2_" + mini_wsi_msk.name).symlink_to(mini_wsi_msk)
-        dir_path_masks.joinpath("3_" + mini_wsi_msk.name).symlink_to(mini_wsi_msk)
-    except OSError:
-        shutil.copy(mini_wsi_msk, dir_path_masks.joinpath("1_" + mini_wsi_msk.name))
-        shutil.copy(mini_wsi_msk, dir_path_masks.joinpath("2_" + mini_wsi_msk.name))
-        shutil.copy(mini_wsi_msk, dir_path_masks.joinpath("3_" + mini_wsi_msk.name))
-
-    track_tmp_path = track_tmp_path.joinpath("output")
-
-    runner = CliRunner()
-    models_tiles_result = runner.invoke(
-        cli.main,
-        [
-            "patch-predictor",
-            "--img-input",
-            str(dir_path),
-            "--mode",
-            "wsi",
-            "--masks",
-            str(dir_path_masks),
-            "--output-path",
-            str(track_tmp_path),
-        ],
-    )
-
-    assert models_tiles_result.exit_code == 0
-    assert track_tmp_path.joinpath("0.merged.npy").exists()
-    assert track_tmp_path.joinpath("0.raw.json").exists()
-    assert track_tmp_path.joinpath("1.merged.npy").exists()
-    assert track_tmp_path.joinpath("1.raw.json").exists()
-    assert track_tmp_path.joinpath("2.merged.npy").exists()
-    assert track_tmp_path.joinpath("2.raw.json").exists()
-    assert track_tmp_path.joinpath("results.json").exists()
-
-
-# -------------------------------------------------------------------------------------
-# torch.compile
-# -------------------------------------------------------------------------------------
-
-
-def test_patch_predictor_torch_compile(
-    sample_patch1: Path,
-    sample_patch2: Path,
-    track_tmp_path: Path,
-) -> None:
-    """Test PatchPredictor with torch.compile functionality.
-
-    Args:
-        sample_patch1 (Path): Path to sample patch 1.
-        sample_patch2 (Path): Path to sample patch 2.
-        track_tmp_path (Path): Path to temporary directory.
-
-    """
-    torch_compile_mode = rcParam["torch_compile_mode"]
-    torch._dynamo.reset()
-    rcParam["torch_compile_mode"] = "default"
-    _, compile_time = timed(
-        test_patch_predictor_api,
-        sample_patch1,
-        sample_patch2,
-        track_tmp_path,
-    )
-    logger.info("torch.compile default mode: %s", compile_time)
-    torch._dynamo.reset()
-    rcParam["torch_compile_mode"] = "reduce-overhead"
-    _, compile_time = timed(
-        test_patch_predictor_api,
-        sample_patch1,
-        sample_patch2,
-        track_tmp_path,
-    )
-    logger.info("torch.compile reduce-overhead mode: %s", compile_time)
-    torch._dynamo.reset()
-    rcParam["torch_compile_mode"] = "max-autotune"
-    _, compile_time = timed(
-        test_patch_predictor_api,
-        sample_patch1,
-        sample_patch2,
-        track_tmp_path,
-    )
-    logger.info("torch.compile max-autotune mode: %s", compile_time)
-    torch._dynamo.reset()
-    rcParam["torch_compile_mode"] = torch_compile_mode
diff --git a/tests/models/test_semantic_segmentation.py b/tests/models/test_semantic_segmentation.py
deleted file mode 100644
index c7ac9c2aa..000000000
--- a/tests/models/test_semantic_segmentation.py
+++ /dev/null
@@ -1,950 +0,0 @@
-"""Test for Semantic Segmentor."""
-
-from __future__ import annotations
-
-import copy
-
-# !
The garbage collector -import gc -import multiprocessing -import shutil -from pathlib import Path -from typing import TYPE_CHECKING - -import numpy as np -import pytest -import torch -import torch.multiprocessing as torch_mp -import torch.nn.functional as F # noqa: N812 -import yaml -from click.testing import CliRunner -from torch import nn - -from tests.conftest import timed -from tiatoolbox import cli, logger, rcParam -from tiatoolbox.models import SemanticSegmentor -from tiatoolbox.models.architecture import fetch_pretrained_weights -from tiatoolbox.models.architecture.utils import centre_crop -from tiatoolbox.models.engine.semantic_segmentor import ( - IOSegmentorConfig, - WSIStreamDataset, -) -from tiatoolbox.models.models_abc import ModelABC -from tiatoolbox.utils import env_detection as toolbox_env -from tiatoolbox.utils import imread, imwrite -from tiatoolbox.utils.misc import select_device -from tiatoolbox.wsicore.wsireader import WSIReader - -if TYPE_CHECKING: - from collections.abc import Callable - -ON_GPU = toolbox_env.has_gpu() -# The value is based on 2 TitanXP each with 12GB -BATCH_SIZE = 1 if not ON_GPU else 16 -try: - NUM_POSTPROC_WORKERS = multiprocessing.cpu_count() -except NotImplementedError: - NUM_POSTPROC_WORKERS = 2 - -# ---------------------------------------------------- - - -def _crash_func(_x: object) -> None: - """Helper to induce crash.""" - msg = "Propagation Crash." - raise ValueError(msg) - - -class _CNNTo1(ModelABC): - """Contains a convolution. - - Simple model to test functionality, this contains a single - convolution layer which has weight=0 and bias=1. - - """ - - def __init__(self: _CNNTo1) -> None: - super().__init__() - self.conv = nn.Conv2d(3, 1, 3, padding=1) - self.conv.weight.data.fill_(0) - self.conv.bias.data.fill_(1) - - def forward(self: _CNNTo1, img: np.ndarray) -> torch.Tensor: - """Define how to use layer.""" - return self.conv(img) - - @staticmethod - def infer_batch(model: nn.Module, batch_data: torch.Tensor, device: str) -> list: - """Run inference on an input batch. - - Contains logic for forward operation as well as i/o - aggregation for a single data batch. - - Args: - model (nn.Module): PyTorch defined model. - batch_data (torch.Tensor): A batch of data generated by - torch.utils.data.DataLoader. - device (str): - :class:`torch.device` to run the model. - Select the device to run the model. Please see - https://pytorch.org/docs/stable/tensor_attributes.html#torch.device - for more details on input parameters for device. Default value is "cpu". 
- - """ - device = "cuda" if ON_GPU else "cpu" - #### - model.eval() # infer mode - - #### - img_list = batch_data - - img_list = img_list.to(device).type(torch.float32) - img_list = img_list.permute(0, 3, 1, 2) # to NCHW - - hw = np.array(img_list.shape[2:]) - with torch.inference_mode(): # do not compute gradient - logit_list = model(img_list) - logit_list = centre_crop(logit_list, hw // 2) - logit_list = logit_list.permute(0, 2, 3, 1) # to NHWC - prob_list = F.relu(logit_list) - - prob_list = prob_list.cpu().numpy() - return [prob_list] - - -# ------------------------------------------------------------------------------------- -# IOConfig -# ------------------------------------------------------------------------------------- - - -def test_segmentor_ioconfig() -> None: - """Test for IOConfig.""" - default_config = { - "input_resolutions": [ - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.50}, - {"units": "mpp", "resolution": 0.75}, - ], - "output_resolutions": [ - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.50}, - ], - "patch_input_shape": [2048, 2048], - "patch_output_shape": [1024, 1024], - "stride_shape": [512, 512], - } - - # error when uniform resolution units are not uniform - xconfig = copy.deepcopy(default_config) - xconfig["input_resolutions"] = [ - {"units": "mpp", "resolution": 0.25}, - {"units": "power", "resolution": 0.50}, - ] - with pytest.raises(ValueError, match=r".*Invalid resolution units.*"): - _ = IOSegmentorConfig(**xconfig) - - # error when uniform resolution units are not supported - xconfig = copy.deepcopy(default_config) - xconfig["input_resolutions"] = [ - {"units": "alpha", "resolution": 0.25}, - {"units": "alpha", "resolution": 0.50}, - ] - with pytest.raises(ValueError, match=r".*Invalid resolution units.*"): - _ = IOSegmentorConfig(**xconfig) - - ioconfig = IOSegmentorConfig( - input_resolutions=[ - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.50}, - {"units": "mpp", "resolution": 0.75}, - ], - output_resolutions=[ - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.50}, - ], - patch_input_shape=[2048, 2048], - patch_output_shape=[1024, 1024], - stride_shape=[512, 512], - ) - assert ioconfig.highest_input_resolution == {"units": "mpp", "resolution": 0.25} - ioconfig = ioconfig.to_baseline() - assert ioconfig.input_resolutions[0]["resolution"] == 1.0 - assert ioconfig.input_resolutions[1]["resolution"] == 0.5 - assert ioconfig.input_resolutions[2]["resolution"] == 1 / 3 - - ioconfig = IOSegmentorConfig( - input_resolutions=[ - {"units": "power", "resolution": 20}, - {"units": "power", "resolution": 40}, - ], - output_resolutions=[ - {"units": "power", "resolution": 20}, - {"units": "power", "resolution": 40}, - ], - patch_input_shape=[2048, 2048], - patch_output_shape=[1024, 1024], - stride_shape=[512, 512], - save_resolution={"units": "power", "resolution": 8.0}, - ) - assert ioconfig.highest_input_resolution == {"units": "power", "resolution": 40} - ioconfig = ioconfig.to_baseline() - assert ioconfig.input_resolutions[0]["resolution"] == 0.5 - assert ioconfig.input_resolutions[1]["resolution"] == 1.0 - assert ioconfig.save_resolution["resolution"] == 8.0 / 40.0 - - resolutions = [ - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.50}, - {"units": "mpp", "resolution": 0.75}, - ] - with pytest.raises(ValueError, match=r".*Unknown units.*"): - ioconfig.scale_to_highest(resolutions, "axx") - - -# 
------------------------------------------------------------------------------------- -# Dataset -# ------------------------------------------------------------------------------------- - - -def test_functional_wsi_stream_dataset(remote_sample: Callable) -> None: - """Functional test for WSIStreamDataset.""" - gc.collect() # Force clean up everything on hold - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - - ioconfig = IOSegmentorConfig( - input_resolutions=[ - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.50}, - {"units": "mpp", "resolution": 0.75}, - ], - output_resolutions=[ - {"units": "mpp", "resolution": 0.25}, - {"units": "mpp", "resolution": 0.50}, - ], - patch_input_shape=[2048, 2048], - patch_output_shape=[1024, 1024], - stride_shape=[512, 512], - ) - mp_manager = torch_mp.Manager() - mp_shared_space = mp_manager.Namespace() - - sds = WSIStreamDataset(ioconfig, [mini_wsi_svs], mp_shared_space) - # test for collate - out = sds.collate_fn([None, 1, 2, 3]) - assert np.sum(out.numpy() != np.array([1, 2, 3])) == 0 - - # artificial data injection - mp_shared_space.wsi_idx = torch.tensor(0) # a scalar - mp_shared_space.patch_inputs = torch.from_numpy( - np.array( - [ - [0, 0, 256, 256], - [256, 256, 512, 512], - ], - ), - ) - mp_shared_space.patch_outputs = torch.from_numpy( - np.array( - [ - [0, 0, 256, 256], - [256, 256, 512, 512], - ], - ), - ) - # test read - for _, sample in enumerate(sds): - patch_data, _ = sample - (patch_resolution1, patch_resolution2, patch_resolution3) = patch_data - assert np.round(patch_resolution1.shape[0] / patch_resolution2.shape[0]) == 2 - assert np.round(patch_resolution1.shape[0] / patch_resolution3.shape[0]) == 3 - - -# ------------------------------------------------------------------------------------- -# Engine -# ------------------------------------------------------------------------------------- - - -def test_crash_segmentor(remote_sample: Callable, track_tmp_path: Path) -> None: - """Functional crash tests for segmentor.""" - # # convert to pathlib Path to prevent wsireader complaint - mini_wsi_svs = Path(remote_sample("wsi2_4k_4k_svs")) - mini_wsi_jpg = Path(remote_sample("wsi2_4k_4k_jpg")) - mini_wsi_msk = Path(remote_sample("wsi2_4k_4k_msk")) - - model = _CNNTo1() - - save_dir = track_tmp_path / "test_crash_segmentor" - semantic_segmentor = SemanticSegmentor(batch_size=BATCH_SIZE, model=model) - - # fake injection to trigger Segmentor to create parallel - # post processing workers because baseline Semantic Segmentor does not support - # post processing out of the box. 
It only contains the condition to create it
-    # for any subclass
-    semantic_segmentor.num_postproc_workers = 1
-
-    # * test basic crash
-    with pytest.raises(TypeError, match=r".*`mask_reader`.*"):
-        semantic_segmentor.filter_coordinates(mini_wsi_msk, np.array(["a", "b", "c"]))
-    with pytest.raises(ValueError, match=r".*ndarray.*integer.*"):
-        semantic_segmentor.filter_coordinates(
-            WSIReader.open(mini_wsi_msk),
-            np.array([1.0, 2.0]),
-        )
-    semantic_segmentor.get_reader(mini_wsi_svs, None, "wsi", auto_get_mask=True)
-    with pytest.raises(ValueError, match=r".*must be a valid file path.*"):
-        semantic_segmentor.get_reader(
-            mini_wsi_msk,
-            "not_exist",
-            "wsi",
-            auto_get_mask=True,
-        )
-
-    shutil.rmtree(save_dir, ignore_errors=True)  # default output dir test
-    with pytest.raises(ValueError, match=r".*provide.*"):
-        SemanticSegmentor()
-    with pytest.raises(ValueError, match=r".*valid mode.*"):
-        semantic_segmentor.predict([], mode="abc")
-
-    # * test not providing any io_config info when not using pretrained model
-    with pytest.raises(ValueError, match=r".*provide either `ioconfig`.*"):
-        semantic_segmentor.predict(
-            [mini_wsi_jpg],
-            mode="tile",
-            device=select_device(on_gpu=ON_GPU),
-            crash_on_exception=True,
-            save_dir=save_dir,
-        )
-    with pytest.raises(ValueError, match=r".*already exists.*"):
-        semantic_segmentor.predict(
-            [],
-            mode="tile",
-            patch_input_shape=(2048, 2048),
-            save_dir=save_dir,
-        )
-    shutil.rmtree(save_dir, ignore_errors=True)
-
-    # * test not providing any io_config info when not using pretrained model
-    with pytest.raises(ValueError, match=r".*provide either `ioconfig`.*"):
-        semantic_segmentor.predict(
-            [mini_wsi_jpg],
-            mode="tile",
-            device=select_device(on_gpu=ON_GPU),
-            crash_on_exception=True,
-            save_dir=save_dir,
-        )
-    shutil.rmtree(save_dir, ignore_errors=True)
-
-    # * Test crash propagation when parallelizing post-processing
-    semantic_segmentor.num_postproc_workers = 2
-    semantic_segmentor.model.forward = _crash_func
-    with pytest.raises(ValueError, match=r"Propagation Crash."):
-        semantic_segmentor.predict(
-            [mini_wsi_svs],
-            patch_input_shape=(2048, 2048),
-            mode="wsi",
-            device=select_device(on_gpu=ON_GPU),
-            crash_on_exception=True,
-            save_dir=save_dir,
-        )
-    shutil.rmtree(save_dir, ignore_errors=True)
-
-    # test ignore crash
-    semantic_segmentor.predict(
-        [mini_wsi_svs],
-        patch_input_shape=(2048, 2048),
-        mode="wsi",
-        device=select_device(on_gpu=ON_GPU),
-        crash_on_exception=False,
-        save_dir=save_dir,
-    )
-
-
-def test_functional_segmentor_merging(track_tmp_path: Path) -> None:
-    """Functional test for assembling output."""
-    save_dir = Path(track_tmp_path)
-
-    model = _CNNTo1()
-    semantic_segmentor = SemanticSegmentor(batch_size=BATCH_SIZE, model=model)
-
-    shutil.rmtree(save_dir, ignore_errors=True)
-    save_dir.mkdir()
-    # predictions with HW
-    _output = np.array(
-        [
-            [1, 1, 0, 0],
-            [1, 1, 0, 0],
-            [0, 0, 2, 2],
-            [0, 0, 2, 2],
-        ],
-    )
-    canvas = semantic_segmentor.merge_prediction(
-        [4, 4],
-        [np.full((2, 2), 1), np.full((2, 2), 2)],
-        [[0, 0, 2, 2], [2, 2, 4, 4]],
-        save_path=f"{save_dir}/raw.py",
-        cache_count_path=f"{save_dir}/count.py",
-    )
-    assert np.sum(canvas - _output) < 1.0e-8
-    # a second rerun to test overlapping count,
-    # should still maintain same result
-    canvas = semantic_segmentor.merge_prediction(
-        [4, 4],
-        [np.full((2, 2), 1), np.full((2, 2), 2)],
-        [[0, 0, 2, 2], [2, 2, 4, 4]],
-        save_path=f"{save_dir}/raw.py",
-        cache_count_path=f"{save_dir}/count.py",
-    )
-    assert np.sum(canvas - _output) < 1.0e-8
-    # else will
leave hanging file pointer - # and hence cant remove its folder later - del canvas # skipcq - - # * predictions with HWC - shutil.rmtree(save_dir, ignore_errors=True) - save_dir.mkdir() - _ = semantic_segmentor.merge_prediction( - [4, 4], - [np.full((2, 2, 1), 1), np.full((2, 2, 1), 2)], - [[0, 0, 2, 2], [2, 2, 4, 4]], - save_path=f"{save_dir}/raw.py", - cache_count_path=f"{save_dir}/count.py", - ) - del _ # skipcq - - # * test crashing when switch to image having larger - # * shape but still provide old links - semantic_segmentor.merge_prediction( - [8, 8], - [np.full((2, 2, 1), 1), np.full((2, 2, 1), 2)], - [[0, 0, 2, 2], [2, 2, 4, 4]], - save_path=f"{save_dir}/raw.1.py", - cache_count_path=f"{save_dir}/count.1.py", - ) - with pytest.raises(ValueError, match=r".*`save_path` does not match.*"): - semantic_segmentor.merge_prediction( - [4, 4], - [np.full((2, 2, 1), 1), np.full((2, 2, 1), 2)], - [[0, 0, 2, 2], [2, 2, 4, 4]], - save_path=f"{save_dir}/raw.1.py", - cache_count_path=f"{save_dir}/count.py", - ) - - with pytest.raises(ValueError, match=r".*`cache_count_path` does not match.*"): - semantic_segmentor.merge_prediction( - [4, 4], - [np.full((2, 2, 1), 1), np.full((2, 2, 1), 2)], - [[0, 0, 2, 2], [2, 2, 4, 4]], - save_path=f"{save_dir}/raw.py", - cache_count_path=f"{save_dir}/count.1.py", - ) - # * test non HW predictions - with pytest.raises(ValueError, match=r".*Prediction is no HW or HWC.*"): - semantic_segmentor.merge_prediction( - [4, 4], - [np.full((2,), 1), np.full((2,), 2)], - [[0, 0, 2, 2], [2, 2, 4, 4]], - save_path=f"{save_dir}/raw.py", - cache_count_path=f"{save_dir}/count.1.py", - ) - - shutil.rmtree(save_dir, ignore_errors=True) - save_dir.mkdir() - - # * with an out of bound location - canvas = semantic_segmentor.merge_prediction( - [4, 4], - [ - np.full((2, 2), 1), - np.full((2, 2), 2), - np.full((2, 2), 3), - np.full((2, 2), 4), - ], - [[0, 0, 2, 2], [2, 2, 4, 4], [0, 4, 2, 6], [4, 0, 6, 2]], - save_path=None, - ) - assert np.sum(canvas - _output) < 1.0e-8 - del canvas # skipcq - - -def test_functional_segmentor( - remote_sample: Callable, - track_tmp_path: Path, - chdir: Callable, -) -> None: - """Functional test for segmentor.""" - save_dir = track_tmp_path / "dump" - # # convert to pathlib Path to prevent wsireader complaint - resolution = 2.0 - mini_wsi_svs = Path(remote_sample("wsi4_1k_1k_svs")) - reader = WSIReader.open(mini_wsi_svs) - thumb = reader.slide_thumbnail(resolution=resolution, units="baseline") - mini_wsi_jpg = f"{track_tmp_path}/mini_svs.jpg" - imwrite(mini_wsi_jpg, thumb) - mini_wsi_msk = f"{track_tmp_path}/mini_mask.jpg" - imwrite(mini_wsi_msk, (thumb > 0).astype(np.uint8)) - - # preemptive clean up - shutil.rmtree(save_dir, ignore_errors=True) - model = _CNNTo1() - semantic_segmentor = SemanticSegmentor(batch_size=BATCH_SIZE, model=model) - # fake injection to trigger Segmentor to create parallel - # post-processing workers because baseline Semantic Segmentor does not support - # post-processing out of the box. 
It only contains condition to create it - # for any subclass - semantic_segmentor.num_postproc_workers = 1 - - # should still run because we skip exception - semantic_segmentor.predict( - [mini_wsi_jpg], - mode="tile", - device=select_device(on_gpu=ON_GPU), - patch_input_shape=(512, 512), - resolution=resolution, - units="mpp", - crash_on_exception=False, - save_dir=save_dir, - ) - - shutil.rmtree(save_dir, ignore_errors=True) - semantic_segmentor.predict( - [mini_wsi_jpg], - mode="tile", - device=select_device(on_gpu=ON_GPU), - patch_input_shape=(512, 512), - resolution=1 / resolution, - units="baseline", - crash_on_exception=True, - save_dir=save_dir, - ) - shutil.rmtree(save_dir, ignore_errors=True) - - with chdir(track_tmp_path): - # * check exception bypass in the log - # there should be no exception, but how to check the log? - semantic_segmentor.predict( - [mini_wsi_jpg], - mode="tile", - device=select_device(on_gpu=ON_GPU), - patch_input_shape=(512, 512), - patch_output_shape=(512, 512), - stride_shape=(512, 512), - resolution=1 / resolution, - units="baseline", - crash_on_exception=False, - ) - shutil.rmtree( - track_tmp_path / "output", - ignore_errors=True, - ) # default output dir test - - # * test basic running and merging prediction - # * should dumping all 1 in the output - ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "baseline", "resolution": 1.0}], - output_resolutions=[{"units": "baseline", "resolution": 1.0}], - patch_input_shape=[512, 512], - patch_output_shape=[512, 512], - stride_shape=[512, 512], - ) - - shutil.rmtree(save_dir, ignore_errors=True) - file_list = [ - mini_wsi_jpg, - mini_wsi_jpg, - ] - output_list = semantic_segmentor.predict( - file_list, - mode="tile", - device=select_device(on_gpu=ON_GPU), - ioconfig=ioconfig, - crash_on_exception=True, - save_dir=f"{save_dir}/raw/", - ) - pred_1 = np.load(output_list[0][1] + ".raw.0.npy") - pred_2 = np.load(output_list[1][1] + ".raw.0.npy") - assert len(output_list) == 2 - assert np.sum(pred_1 - pred_2) == 0 - # due to overlapping merge and division, will not be - # exactly 1, but should be approximately so - assert np.sum((pred_1 - 1) > 1.0e-6) == 0 - shutil.rmtree(save_dir, ignore_errors=True) - - # * test running with mask and svs - # * also test merging prediction at designated resolution - ioconfig = IOSegmentorConfig( - input_resolutions=[{"units": "mpp", "resolution": resolution}], - output_resolutions=[{"units": "mpp", "resolution": resolution}], - save_resolution={"units": "mpp", "resolution": resolution}, - patch_input_shape=[512, 512], - patch_output_shape=[256, 256], - stride_shape=[512, 512], - ) - shutil.rmtree(save_dir, ignore_errors=True) - output_list = semantic_segmentor.predict( - [mini_wsi_svs], - masks=[mini_wsi_msk], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - ioconfig=ioconfig, - crash_on_exception=True, - save_dir=f"{save_dir}/raw/", - ) - reader = WSIReader.open(mini_wsi_svs) - expected_shape = reader.slide_dimensions(**ioconfig.save_resolution) - expected_shape = np.array(expected_shape)[::-1] # to YX - pred_1 = np.load(output_list[0][1] + ".raw.0.npy") - saved_shape = np.array(pred_1.shape[:2]) - assert np.sum(expected_shape - saved_shape) == 0 - assert np.sum((pred_1 - 1) > 1.0e-6) == 0 - shutil.rmtree(save_dir, ignore_errors=True) - - # check normal run with auto get mask - semantic_segmentor = SemanticSegmentor( - batch_size=BATCH_SIZE, - model=model, - auto_generate_mask=True, - ) - _ = semantic_segmentor.predict( - [mini_wsi_svs], - masks=[mini_wsi_msk], - 
mode="wsi", - device=select_device(on_gpu=ON_GPU), - ioconfig=ioconfig, - crash_on_exception=True, - save_dir=f"{save_dir}/raw/", - ) - - -def test_subclass(remote_sample: Callable, track_tmp_path: Path) -> None: - """Create subclass and test parallel processing setup.""" - save_dir = Path(track_tmp_path) - mini_wsi_jpg = Path(remote_sample("wsi2_4k_4k_jpg")) - - model = _CNNTo1() - - class XSegmentor(SemanticSegmentor): - """Dummy class to test subclassing.""" - - def __init__(self: XSegmentor) -> None: - super().__init__(model=model) - self.num_postproc_worker = 2 - - semantic_segmentor = XSegmentor() - shutil.rmtree(save_dir, ignore_errors=True) # default output dir test - semantic_segmentor.predict( - [mini_wsi_jpg], - mode="tile", - device=select_device(on_gpu=ON_GPU), - patch_input_shape=(1024, 1024), - patch_output_shape=(512, 512), - stride_shape=(256, 256), - resolution=1.0, - units="baseline", - crash_on_exception=False, - save_dir=save_dir / "raw", - ) - - -# specifically designed for travis -def test_functional_pretrained(remote_sample: Callable, track_tmp_path: Path) -> None: - """Test for load up pretrained and over-writing tile mode ioconfig.""" - save_dir = Path(f"{track_tmp_path}/output") - mini_wsi_svs = Path(remote_sample("wsi4_512_512_svs")) - reader = WSIReader.open(mini_wsi_svs) - thumb = reader.slide_thumbnail(resolution=1.0, units="baseline") - mini_wsi_jpg = f"{track_tmp_path}/mini_svs.jpg" - imwrite(mini_wsi_jpg, thumb) - - semantic_segmentor = SemanticSegmentor( - batch_size=BATCH_SIZE, - pretrained_model="fcn-tissue_mask", - ) - - shutil.rmtree(save_dir, ignore_errors=True) - semantic_segmentor.predict( - [mini_wsi_svs], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=f"{save_dir}/raw/", - ) - - shutil.rmtree(save_dir, ignore_errors=True) - - # mainly to test prediction on tile - semantic_segmentor.predict( - [mini_wsi_jpg], - mode="tile", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=f"{save_dir}/raw/", - ) - - assert save_dir.joinpath("raw/0.raw.0.npy").exists() - assert save_dir.joinpath("raw/file_map.dat").exists() - - -@pytest.mark.skipif( - toolbox_env.running_on_ci() or not ON_GPU, - reason="Local test on machine with GPU.", -) -def test_behavior_tissue_mask_local( - remote_sample: Callable, track_tmp_path: Path -) -> None: - """Contain test for behavior of the segmentor and pretrained models.""" - save_dir = track_tmp_path - wsi_with_artifacts = Path(remote_sample("wsi3_20k_20k_svs")) - mini_wsi_jpg = Path(remote_sample("wsi2_4k_4k_jpg")) - - semantic_segmentor = SemanticSegmentor( - batch_size=BATCH_SIZE, - pretrained_model="fcn-tissue_mask", - ) - shutil.rmtree(save_dir, ignore_errors=True) - semantic_segmentor.predict( - [wsi_with_artifacts], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir / "raw", - ) - # load up the raw prediction and perform precision check - _cache_pred = imread(Path(remote_sample("wsi3_20k_20k_pred"))) - _test_pred = np.load(str(save_dir / "raw" / "0.raw.0.npy")) - _test_pred = (_test_pred[..., 1] > 0.75) * 255 - # divide 255 to binarize - assert np.mean(_cache_pred[..., 0] == _test_pred) > 0.99 - - shutil.rmtree(save_dir, ignore_errors=True) - # mainly to test prediction on tile - semantic_segmentor.predict( - [mini_wsi_jpg], - mode="tile", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=f"{save_dir}/raw/", - ) - - -@pytest.mark.skipif( - toolbox_env.running_on_ci() or not 
ON_GPU, - reason="Local test on machine with GPU.", -) -def test_behavior_bcss_local(remote_sample: Callable, track_tmp_path: Path) -> None: - """Contain test for behavior of the segmentor and pretrained models.""" - save_dir = track_tmp_path - - wsi_breast = Path(remote_sample("wsi4_4k_4k_svs")) - semantic_segmentor = SemanticSegmentor( - num_loader_workers=4, - batch_size=BATCH_SIZE, - pretrained_model="fcn_resnet50_unet-bcss", - ) - semantic_segmentor.predict( - [wsi_breast], - mode="wsi", - device=select_device(on_gpu=ON_GPU), - crash_on_exception=True, - save_dir=save_dir / "raw", - ) - # load up the raw prediction and perform precision check - _cache_pred = np.load(Path(remote_sample("wsi4_4k_4k_pred"))) - _test_pred = np.load(f"{save_dir}/raw/0.raw.0.npy") - _test_pred = np.argmax(_test_pred, axis=-1) - assert np.mean(np.abs(_cache_pred - _test_pred)) < 1.0e-2 - - -# ------------------------------------------------------------------------------------- -# Command Line Interface -# ------------------------------------------------------------------------------------- - - -def test_cli_semantic_segment_out_exists_error( - remote_sample: Callable, - track_tmp_path: Path, -) -> None: - """Test for semantic segmentation if output path exists.""" - mini_wsi_svs = Path(remote_sample("svs-1-small")) - sample_wsi_msk = remote_sample("small_svs_tissue_mask") - sample_wsi_msk = np.load(sample_wsi_msk).astype(np.uint8) - imwrite(f"{track_tmp_path}/small_svs_tissue_mask.jpg", sample_wsi_msk) - sample_wsi_msk = f"{track_tmp_path}/small_svs_tissue_mask.jpg" - runner = CliRunner() - semantic_segment_result = runner.invoke( - cli.main, - [ - "semantic-segment", - "--img-input", - str(mini_wsi_svs), - "--mode", - "wsi", - "--masks", - str(sample_wsi_msk), - "--output-path", - track_tmp_path, - ], - ) - - assert semantic_segment_result.output == "" - assert semantic_segment_result.exit_code == 1 - assert isinstance(semantic_segment_result.exception, FileExistsError) - - -def test_cli_semantic_segmentation_ioconfig( - remote_sample: Callable, - track_tmp_path: Path, -) -> None: - """Test for semantic segmentation single file custom ioconfig.""" - mini_wsi_svs = Path(remote_sample("svs-1-small")) - sample_wsi_msk = remote_sample("small_svs_tissue_mask") - sample_wsi_msk = np.load(sample_wsi_msk).astype(np.uint8) - imwrite(f"{track_tmp_path}/small_svs_tissue_mask.jpg", sample_wsi_msk) - sample_wsi_msk = f"{track_tmp_path}/small_svs_tissue_mask.jpg" - - pretrained_weights = fetch_pretrained_weights("fcn-tissue_mask") - - config = { - "input_resolutions": [{"units": "mpp", "resolution": 2.0}], - "output_resolutions": [{"units": "mpp", "resolution": 2.0}], - "patch_input_shape": [1024, 1024], - "patch_output_shape": [512, 512], - "stride_shape": [256, 256], - "save_resolution": {"units": "mpp", "resolution": 8.0}, - } - with Path.open(track_tmp_path.joinpath("config.yaml"), "w") as fptr: - yaml.dump(config, fptr) - - runner = CliRunner() - - semantic_segment_result = runner.invoke( - cli.main, - [ - "semantic-segment", - "--img-input", - str(mini_wsi_svs), - "--pretrained-weights", - str(pretrained_weights), - "--mode", - "wsi", - "--masks", - str(sample_wsi_msk), - "--output-path", - track_tmp_path.joinpath("output"), - "--yaml-config-path", - track_tmp_path.joinpath("config.yaml"), - ], - ) - - assert semantic_segment_result.exit_code == 0 - assert track_tmp_path.joinpath("output/0.raw.0.npy").exists() - assert track_tmp_path.joinpath("output/file_map.dat").exists() - assert 
-    assert track_tmp_path.joinpath("output/results.json").exists()
-
-
-def test_cli_semantic_segmentation_multi_file(
-    remote_sample: Callable,
-    track_tmp_path: Path,
-) -> None:
-    """Test for models CLI multiple file with mask."""
-    mini_wsi_svs = Path(remote_sample("svs-1-small"))
-    sample_wsi_msk = remote_sample("small_svs_tissue_mask")
-    sample_wsi_msk = np.load(sample_wsi_msk).astype(np.uint8)
-    imwrite(f"{track_tmp_path}/small_svs_tissue_mask.jpg", sample_wsi_msk)
-    sample_wsi_msk = track_tmp_path / "small_svs_tissue_mask.jpg"
-
-    # Make multiple copies for test
-    dir_path = track_tmp_path / "new_copies"
-    dir_path.mkdir()
-
-    dir_path_masks = track_tmp_path / "new_copies_masks"
-    dir_path_masks.mkdir()
-
-    try:
-        dir_path.joinpath("1_" + mini_wsi_svs.name).symlink_to(mini_wsi_svs)
-        dir_path.joinpath("2_" + mini_wsi_svs.name).symlink_to(mini_wsi_svs)
-    except OSError:
-        shutil.copy(mini_wsi_svs, dir_path.joinpath("1_" + mini_wsi_svs.name))
-        shutil.copy(mini_wsi_svs, dir_path.joinpath("2_" + mini_wsi_svs.name))
-
-    try:
-        dir_path_masks.joinpath("1_" + sample_wsi_msk.name).symlink_to(sample_wsi_msk)
-        dir_path_masks.joinpath("2_" + sample_wsi_msk.name).symlink_to(sample_wsi_msk)
-    except OSError:
-        shutil.copy(sample_wsi_msk, dir_path_masks.joinpath("1_" + sample_wsi_msk.name))
-        shutil.copy(sample_wsi_msk, dir_path_masks.joinpath("2_" + sample_wsi_msk.name))
-
-    track_tmp_path = track_tmp_path / "output"
-
-    runner = CliRunner()
-    semantic_segment_result = runner.invoke(
-        cli.main,
-        [
-            "semantic-segment",
-            "--img-input",
-            str(dir_path),
-            "--mode",
-            "wsi",
-            "--masks",
-            str(dir_path_masks),
-            "--output-path",
-            str(track_tmp_path),
-        ],
-    )
-
-    assert semantic_segment_result.exit_code == 0
-    assert track_tmp_path.joinpath("0.raw.0.npy").exists()
-    assert track_tmp_path.joinpath("1.raw.0.npy").exists()
-    assert track_tmp_path.joinpath("file_map.dat").exists()
-    assert track_tmp_path.joinpath("results.json").exists()
-
-    # load up the raw prediction and perform precision check
-    _cache_pred = imread(Path(remote_sample("small_svs_tissue_mask")))
-    _test_pred = np.load(str(track_tmp_path.joinpath("0.raw.0.npy")))
-    _test_pred = (_test_pred[..., 1] > 0.50) * 255
-
-    assert np.mean(np.abs(_cache_pred - _test_pred) / 255) < 1e-3
-
-
-# -------------------------------------------------------------------------------------
-# torch.compile
-# -------------------------------------------------------------------------------------
-
-
-def test_semantic_segmentor_torch_compile(
-    remote_sample: Callable,
-    track_tmp_path: Path,
-) -> None:
-    """Test SemanticSegmentor using pretrained model with torch.compile functionality.
-
-    Args:
-        remote_sample (Callable): Callable object used to extract remote sample.
-        track_tmp_path (Path): Path to temporary directory.
-
-    """
-    torch_compile_mode = rcParam["torch_compile_mode"]
-    torch._dynamo.reset()
-    rcParam["torch_compile_mode"] = "default"
-    _, compile_time = timed(
-        test_functional_pretrained,
-        remote_sample,
-        track_tmp_path,
-    )
-    logger.info("torch.compile default mode: %s", compile_time)
-    torch._dynamo.reset()
-    rcParam["torch_compile_mode"] = "reduce-overhead"
-    _, compile_time = timed(
-        test_functional_pretrained,
-        remote_sample,
-        track_tmp_path,
-    )
-    logger.info("torch.compile reduce-overhead mode: %s", compile_time)
-    torch._dynamo.reset()
-    rcParam["torch_compile_mode"] = "max-autotune"
-    _, compile_time = timed(
-        test_functional_pretrained,
-        remote_sample,
-        track_tmp_path,
-    )
-    logger.info("torch.compile max-autotune mode: %s", compile_time)
-    torch._dynamo.reset()
-    rcParam["torch_compile_mode"] = torch_compile_mode
diff --git a/tests/test_app_bokeh.py b/tests/test_app_bokeh.py
index ce97fb2fd..ae66926a9 100644
--- a/tests/test_app_bokeh.py
+++ b/tests/test_app_bokeh.py
@@ -18,7 +18,7 @@
 import requests
 from bokeh.application import Application
 from bokeh.application.handlers import FunctionHandler
-from bokeh.events import ButtonClick, DoubleTap, MenuItemClick
+from bokeh.events import DoubleTap, MenuItemClick
 from flask_cors import CORS
 from matplotlib import colormaps
 from PIL import Image
@@ -462,54 +462,7 @@ def test_load_img_overlay(doc: Document, data_path: pytest.TempPathFactory) -> N
     assert full_name in main.UI["vstate"].layer_dict
 
 
-def test_hovernet_on_box(doc: Document, data_path: pytest.TempPathFactory) -> None:
-    """Test running hovernet on a box."""
-    slide_select = doc.get_model_by_name("slide_select0")
-    slide_select.value = [data_path["slide2"].name]
-    run_button = doc.get_model_by_name("to_model0")
-    assert len(main.UI["color_column"].children) == 0
-    slide_select.value = [data_path["slide1"].name]
-    # set up a box selection
-    main.UI["box_source"].data = {
-        "x": [1200],
-        "y": [-2000],
-        "width": [400],
-        "height": [400],
-    }
-
-    # select hovernet model and run it on box
-    model_select = doc.get_model_by_name("model_drop0")
-    model_select.value = "hovernet"
-
-    click = ButtonClick(run_button)
-    run_button._trigger_event(click)
-    im = get_tile("overlay", 4, 8, 4, show=False)
-    _, num = label(np.any(im[:, :, :3], axis=2))
-    # check there are multiple cells being detected
-    assert len(main.UI["color_column"].children) > 3
-    assert num > 10
-
-    # test save functionality
-    save_button = doc.get_model_by_name("save_button0")
-    click = ButtonClick(save_button)
-    save_button._trigger_event(click)
-    saved_path = (
-        data_path["base_path"]
-        / "overlays"
-        / (data_path["slide1"].stem + "_saved_anns.db")
-    )
-    assert saved_path.exists()
-
-    # load an overlay with different types
-    cprop_select = doc.get_model_by_name("cprop0")
-    cprop_select.value = ["prob"]
-    layer_drop = doc.get_model_by_name("layer_drop0")
-    click = MenuItemClick(layer_drop, str(data_path["dat_anns"]))
-    layer_drop._trigger_event(click)
-    assert main.UI["vstate"].types == ["annotation"]
-    # check the per-type ui controls have been updated
-    assert len(main.UI["color_column"].children) == 1
-    assert len(main.UI["type_column"].children) == 1
+# test_hovernet_on_box should be fixed before merge to develop.
 
 
 def test_alpha_sliders(doc: Document) -> None:
diff --git a/tests/test_utils.py b/tests/test_utils.py
index 9ee896365..26725dc36 100644
--- a/tests/test_utils.py
+++ b/tests/test_utils.py
@@ -9,6 +9,7 @@
 from typing import TYPE_CHECKING, NoReturn
 
 import cv2
+import dask.array as da
 import joblib
 import numpy as np
 import pandas as pd
@@ -34,6 +35,7 @@
 )
 from tiatoolbox.utils import misc
 from tiatoolbox.utils.exceptions import FileNotSupportedError
+from tiatoolbox.utils.misc import cast_to_min_dtype
 from tiatoolbox.utils.transforms import locsize2bounds
 
 if TYPE_CHECKING:
@@ -1679,12 +1681,13 @@ def test_patch_pred_store() -> None:
     """Test patch_pred_store."""
     # Define a mock patch_output
     patch_output = {
+        "probabilities": [(0.99, 0.01), (0.01, 0.99), (0.99, 0.01)],
         "predictions": [1, 0, 1],
         "coordinates": [(0, 0, 1, 1), (1, 1, 2, 2), (2, 2, 3, 3)],
         "other": "other",
     }
 
-    store = misc.dict_to_store(patch_output, (1.0, 1.0))
+    store = misc.dict_to_store_patch_predictions(patch_output, (1.0, 1.0))
 
     # Check that it is an SQLiteStore containing the expected annotations
     assert isinstance(store, SQLiteStore)
@@ -1697,7 +1700,18 @@ def test_patch_pred_store() -> None:
     patch_output.pop("coordinates")
     # check correct error is raised if coordinates are missing
     with pytest.raises(ValueError, match="coordinates"):
-        misc.dict_to_store(patch_output, (1.0, 1.0))
+        misc.dict_to_store_patch_predictions(patch_output, (1.0, 1.0))
+
+    patch_output = {
+        "predictions": [1, 0, 1],
+        "coordinates": [(0, 0, 1, 1), (1, 1, 2, 2), (2, 2, 3, 3)],
+        "other": "other",
+    }
+
+    store = misc.dict_to_store_patch_predictions(patch_output, (1.0, 1.0))
+
+    # Check that it is an SQLiteStore containing the expected annotations
+    assert isinstance(store, SQLiteStore)
 
 
 def test_patch_pred_store_cdict() -> None:
@@ -1711,7 +1725,9 @@ def test_patch_pred_store_cdict() -> None:
         "other": "other",
     }
     class_dict = {0: "class0", 1: "class1"}
-    store = misc.dict_to_store(patch_output, (1.0, 1.0), class_dict=class_dict)
+    store = misc.dict_to_store_patch_predictions(
+        patch_output, (1.0, 1.0), class_dict=class_dict
+    )
 
     # Check that it is an SQLiteStore containing the expected annotations
     assert isinstance(store, SQLiteStore)
@@ -1732,7 +1748,7 @@ def test_patch_pred_store_sf() -> None:
         "probabilities": [[0.1, 0.9], [0.9, 0.1], [0.4, 0.6]],
         "labels": [1, 0, 1],
     }
-    store = misc.dict_to_store(patch_output, (2.0, 2.0))
+    store = misc.dict_to_store_patch_predictions(patch_output, (2.0, 2.0))
 
     # Check that its an SQLiteStore containing the expected annotations
     assert isinstance(store, SQLiteStore)
@@ -1741,43 +1757,6 @@ def test_patch_pred_store_sf() -> None:
     assert annotation.geometry.area == 4
 
 
-def test_patch_pred_store_zarr(track_tmp_path: pytest.TempPathFactory) -> None:
-    """Test patch_pred_store_zarr."""
-    # Define a mock patch_output
-    patch_output = {
-        "predictions": [1, 0, 1],
-        "coordinates": [(0, 0, 1, 1), (1, 1, 2, 2), (2, 2, 3, 3)],
-        "probabilities": [[0.1, 0.9], [0.9, 0.1], [0.4, 0.6]],
-        "labels": [1, 0, 1],
-    }
-
-    save_path = track_tmp_path / "patch_output" / "output.zarr"
-
-    store_path = misc.dict_to_zarr(patch_output, save_path=save_path)
-
-    print("Zarr path: ", store_path)
-    assert Path.exists(store_path), "Zarr output file does not exist"
-
-
-def test_patch_pred_store_zarr_ext(track_tmp_path: pytest.TempPathFactory) -> None:
-    """Test patch_pred_store_zarr and ensures the output file extension is `.zarr`."""
-    # Define a mock patch_output
-    patch_output = {
-        "predictions": [1, 0, 1],
-        "coordinates": [(0, 0, 1, 1), (1, 1, 2, 2), (2, 2, 3, 3)],
-        "probabilities": [[0.1, 0.9], [0.9, 0.1], [0.4, 0.6]],
-        "labels": [1, 0, 1],
-    }
-
-    # sends the path of a jpeg source image, expects .zarr file in the same directory
-    save_path = track_tmp_path / "patch_output" / "patch.jpeg"
-
-    store_path = misc.dict_to_zarr(patch_output, save_path=save_path)
-
-    print("Zarr path: ", store_path)
-    assert Path.exists(store_path), "Zarr output file does not exist"
-
-
 def test_patch_pred_store_persist(track_tmp_path: pytest.TempPathFactory) -> None:
     """Test patch_pred_store. and persists store output to a .db file."""
     # Define a mock patch_output
@@ -1789,7 +1768,9 @@ def test_patch_pred_store_persist(track_tmp_path: pytest.TempPathFactory) -> Non
     }
     save_path = track_tmp_path / "patch_output" / "output.db"
 
-    store_path = misc.dict_to_store(patch_output, (1.0, 1.0), save_path=save_path)
+    store_path = misc.dict_to_store_patch_predictions(
+        patch_output, (1.0, 1.0), save_path=save_path
+    )
 
     print("Annotation store path: ", store_path)
     assert Path.exists(store_path), "Annotation Store output file does not exist"
@@ -1807,7 +1788,7 @@ def test_patch_pred_store_persist(track_tmp_path: pytest.TempPathFactory) -> Non
     patch_output.pop("coordinates")
     # check correct error is raised if coordinates are missing
     with pytest.raises(ValueError, match="coordinates"):
-        misc.dict_to_store(patch_output, (1.0, 1.0))
+        misc.dict_to_store_patch_predictions(patch_output, (1.0, 1.0))
 
 
 def test_patch_pred_store_persist_ext(track_tmp_path: pytest.TempPathFactory) -> None:
@@ -1823,7 +1804,9 @@ def test_patch_pred_store_persist_ext(track_tmp_path: pytest.TempPathFactory) ->
     # sends the path of a jpeg source image, expects .db file in the same directory
     save_path = track_tmp_path / "patch_output" / "output.jpeg"
 
-    store_path = misc.dict_to_store(patch_output, (1.0, 1.0), save_path=save_path)
+    store_path = misc.dict_to_store_patch_predictions(
+        patch_output, (1.0, 1.0), save_path=save_path
+    )
 
     print("Annotation store path: ", store_path)
     assert Path.exists(store_path), "Annotation Store output file does not exist"
@@ -1841,7 +1824,7 @@ def test_patch_pred_store_persist_ext(track_tmp_path: pytest.TempPathFactory) ->
     patch_output.pop("coordinates")
     # check correct error is raised if coordinates are missing
     with pytest.raises(ValueError, match="coordinates"):
-        misc.dict_to_store(patch_output, (1.0, 1.0))
+        misc.dict_to_store_patch_predictions(patch_output, (1.0, 1.0))
 
 
 def test_torch_compile_already_compiled() -> None:
@@ -2211,3 +2194,45 @@ def test_save_zarr_array_probability_ome_tiff(
     assert_ome_metadata_value(ome_xml, "PhysicalSizeY", "0.25")
     assert_ome_metadata_value(ome_xml, "PhysicalSizeXUnit", "µm")
     assert_ome_metadata_value(ome_xml, "PhysicalSizeYUnit", "µm")
+
+
+@pytest.mark.parametrize(
+    ("input_array", "expected_dtype"),
+    [
+        (np.array([0, 1]), np.bool_),  # Should cast to bool
+        (np.array([0, 255]), np.uint8),  # Should cast to uint8
+        (np.array([0, 256]), np.uint16),  # Should cast to uint16
+        (np.array([0, 70000]), np.uint32),  # Should cast to uint32
+        (np.array([0, 2**32]), np.uint64),  # Should cast to uint64
+    ],
+)
+def test_cast_to_min_dtype_numpy(input_array: np.ndarray, expected_dtype: type) -> None:
+    """Check expected np array dtype cast_to_min_dtype."""
+    result = cast_to_min_dtype(input_array)
+    assert isinstance(result, np.ndarray)
+    assert result.dtype == expected_dtype
+
+
+@pytest.mark.parametrize(
+    ("input_array", "expected_dtype"),
+    [
+        (da.from_array(np.array([0, 1])), np.bool_),  # Should cast to bool
+        (da.from_array(np.array([0, 255])), np.uint8),  # Should cast to uint8
+        (da.from_array(np.array([0, 256])), np.uint16),  # Should cast to uint16
+        (da.from_array(np.array([0, 70000])), np.uint32),  # Should cast to uint32
+        (da.from_array(np.array([0, 2**32])), np.uint64),  # Should cast to uint64
+    ],
+)
+def test_cast_to_min_dtype_dask(input_array: da.Array, expected_dtype: type) -> None:
+    """Check expected dask array dtype cast_to_min_dtype."""
+    result = cast_to_min_dtype(input_array)
+    assert isinstance(result, da.Array)
+    assert result.dtype == expected_dtype
+
+
+def test_cast_to_min_dtype_numpy_large_value() -> None:
+    """Check if return type is changed for large value."""
+    large_value = np.array([np.iinfo(np.uint64).max + 1], dtype=object)
+    result = cast_to_min_dtype(large_value)
+    assert result == large_value
+    assert result.dtype == object
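Note: the implementation of `cast_to_min_dtype` itself is not part of this diff; only its tests are. A minimal sketch that would satisfy the parametrized cases above (the real helper in `tiatoolbox.utils.misc` may differ in detail) could look like:

```python
from __future__ import annotations

import dask.array as da
import numpy as np


def cast_to_min_dtype(arr: np.ndarray | da.Array) -> np.ndarray | da.Array:
    """Sketch: cast to the smallest dtype that can hold the array's maximum.

    Values in {0, 1} become bool; otherwise the smallest sufficient unsigned
    integer type is used. Arrays whose maximum exceeds uint64 (e.g. held in
    an object-dtype array) pass through unchanged.
    """
    max_value = int(arr.max())  # for dask arrays this triggers a tiny compute
    if max_value <= 1:
        return arr.astype(np.bool_)
    for dtype in (np.uint8, np.uint16, np.uint32, np.uint64):
        if max_value <= np.iinfo(dtype).max:
            return arr.astype(dtype)
    return arr  # too large even for uint64; leave the dtype as-is
```

Because `astype` is defined on both NumPy and Dask arrays, the same code path preserves the input container type, which is what the two parametrized tests assert.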
" "default=0 0 2000 2000", @@ -220,7 +254,7 @@ def cli_pretrained_model( ) -> Callable: """Enables --pretrained-model option for cli.""" return click.option( - "--pretrained-model", + "--model", help=add_default_to_usage_help(usage_help, default=default), default=default, ) @@ -239,6 +273,39 @@ def cli_pretrained_weights( ) +def cli_model( + usage_help: str = "Name of the predefined model used to process the data. " + "The format is _. For example, " + "`resnet18-kather100K` is a resnet18 model trained on the Kather dataset. " + "Please see " + "https://tia-toolbox.readthedocs.io/en/latest/usage.html#deep-learning-models " + "for a detailed list of available pretrained models." + "By default, the corresponding pretrained weights will also be" + "downloaded. However, you can override with your own set of weights" + "via the `pretrained_weights` argument. Argument is case insensitive.", + default: str = "resnet18-kather100k", +) -> Callable: + """Enables --pretrained-model option for cli.""" + return click.option( + "--model", + help=add_default_to_usage_help(usage_help, default=default), + default=default, + ) + + +def cli_weights( + usage_help: str = "Path to the model weight file. If not supplied, the default " + "pretrained weight will be used.", + default: str | None = None, +) -> Callable: + """Enables --pretrained-weights option for cli.""" + return click.option( + "--weights", + help=add_default_to_usage_help(usage_help, default=default), + default=default, + ) + + def cli_device( usage_help: str = "Select the device (cpu/cuda/mps) to use for inference.", default: str = "cpu", @@ -282,7 +349,7 @@ def cli_merge_predictions( def cli_return_labels( usage_help: str = "Whether to return raw model output as labels.", *, - default: bool = True, + default: bool = False, ) -> Callable: """Enables --return-labels option for cli.""" return click.option( @@ -322,14 +389,28 @@ def cli_masks( ) -def cli_auto_generate_mask( +def cli_memory_threshold( + usage_help: str = ( + "Memory usage threshold (in percentage) to trigger caching behavior." + ), + default: int = 80, +) -> Callable: + """Enables --batch-size option for cli.""" + return click.option( + "--memory-threshold", + help=add_default_to_usage_help(usage_help, default=default), + default=default, + ) + + +def cli_auto_get_mask( usage_help: str = "Automatically generate tile/WSI tissue mask.", *, default: bool = False, ) -> Callable: """Enables --auto-generate-mask option for cli.""" return click.option( - "--auto-generate-mask", + "--auto-get-mask", help=add_default_to_usage_help(usage_help, default=default), type=bool, default=default, @@ -350,27 +431,14 @@ def cli_yaml_config_path( ) -def cli_num_loader_workers( +def cli_num_workers( usage_help: str = "Number of workers to load the data. 
Please note that they will " "also perform preprocessing.", default: int = 0, ) -> Callable: """Enables --num-loader-workers option for cli.""" return click.option( - "--num-loader-workers", - help=add_default_to_usage_help(usage_help, default=default), - type=int, - default=default, - ) - - -def cli_num_postproc_workers( - usage_help: str = "Number of workers to post-process the network output.", - default: int = 0, -) -> Callable: - """Enables --num-postproc-workers option for cli.""" - return click.option( - "--num-postproc-workers", + "--num-workers", help=add_default_to_usage_help(usage_help, default=default), type=int, default=default, @@ -563,17 +631,17 @@ def prepare_model_cli( tiatoolbox_cli = TIAToolboxCLI() -def prepare_ioconfig_seg( - segment_config_class: type[IOConfigABC], +def prepare_ioconfig( + config_class: type[ModelIOConfigABC], pretrained_weights: str | Path | None, yaml_config_path: str | Path, -) -> IOConfigABC | None: - """Prepare ioconfig for segmentation.""" +) -> ModelIOConfigABC | None: + """Prepare ioconfig for CLI.""" import yaml # noqa: PLC0415 if pretrained_weights is not None: with Path(yaml_config_path).open() as registry_handle: ioconfig = yaml.safe_load(registry_handle) - return segment_config_class(**ioconfig) + return config_class(**ioconfig) return None diff --git a/tiatoolbox/cli/nucleus_instance_segment.py b/tiatoolbox/cli/nucleus_instance_segment.py index ab5ad8548..707e71f5b 100644 --- a/tiatoolbox/cli/nucleus_instance_segment.py +++ b/tiatoolbox/cli/nucleus_instance_segment.py @@ -5,21 +5,20 @@ import click from tiatoolbox.cli.common import ( - cli_auto_generate_mask, + cli_auto_get_mask, cli_batch_size, cli_device, cli_file_type, cli_img_input, cli_masks, cli_mode, - cli_num_loader_workers, - cli_num_postproc_workers, + cli_num_workers, cli_output_path, cli_pretrained_model, cli_pretrained_weights, cli_verbose, cli_yaml_config_path, - prepare_ioconfig_seg, + prepare_ioconfig, prepare_model_cli, tiatoolbox_cli, ) @@ -45,10 +44,9 @@ @cli_batch_size() @cli_masks(default=None) @cli_yaml_config_path(default=None) -@cli_num_loader_workers() +@cli_num_workers() @cli_verbose(default=True) -@cli_num_postproc_workers(default=0) -@cli_auto_generate_mask(default=False) +@cli_auto_get_mask(default=False) def nucleus_instance_segment( pretrained_model: str, pretrained_weights: str, @@ -60,7 +58,6 @@ def nucleus_instance_segment( batch_size: int, yaml_config_path: str, num_loader_workers: int, - num_postproc_workers: int, device: str, *, auto_generate_mask: bool, @@ -68,7 +65,7 @@ def nucleus_instance_segment( ) -> None: """Process an image/directory of input images with a patch classification CNN.""" from tiatoolbox.models import ( # noqa: PLC0415 - IOSegmentorConfig, + IOInstanceSegmentorConfig, NucleusInstanceSegmentor, ) from tiatoolbox.utils import save_as_json # noqa: PLC0415 @@ -80,8 +77,8 @@ def nucleus_instance_segment( file_types=file_types, ) - ioconfig = prepare_ioconfig_seg( - IOSegmentorConfig, + ioconfig = prepare_ioconfig( + IOInstanceSegmentorConfig, pretrained_weights, yaml_config_path, ) @@ -91,7 +88,6 @@ def nucleus_instance_segment( pretrained_weights=pretrained_weights, batch_size=batch_size, num_loader_workers=num_loader_workers, - num_postproc_workers=num_postproc_workers, auto_generate_mask=auto_generate_mask, verbose=verbose, ) diff --git a/tiatoolbox/cli/patch_predictor.py b/tiatoolbox/cli/patch_predictor.py index fdb85e3ea..17ed9ebf9 100644 --- a/tiatoolbox/cli/patch_predictor.py +++ b/tiatoolbox/cli/patch_predictor.py @@ -2,25 
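All of these `cli_*` helpers follow the same factory pattern: each returns a configured `click.option` decorator, so every engine command declares its shared flags identically. A self-contained toy example of the pattern (the flag name below is illustrative only, not part of this diff):

```python
import click


def cli_example_flag(
    usage_help: str = "An illustrative shared flag.",
    default: int = 1,
):
    """Return a reusable click.option decorator, mirroring the cli_* pattern."""
    return click.option(
        "--example-flag",
        help=f"{usage_help} default={default}",
        type=int,
        default=default,
    )


@click.command()
@cli_example_flag(default=4)
def demo(example_flag: int) -> None:
    """Echo the resolved option value."""
    click.echo(f"example_flag={example_flag}")


if __name__ == "__main__":
    demo()
```

Centralising the defaults in the factory is what lets this diff change, for example, `--return-labels` from `True` to `False` in one place for every command that uses it.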
diff --git a/tiatoolbox/cli/nucleus_instance_segment.py b/tiatoolbox/cli/nucleus_instance_segment.py
index ab5ad8548..707e71f5b 100644
--- a/tiatoolbox/cli/nucleus_instance_segment.py
+++ b/tiatoolbox/cli/nucleus_instance_segment.py
@@ -5,21 +5,20 @@
 import click
 
 from tiatoolbox.cli.common import (
-    cli_auto_generate_mask,
+    cli_auto_get_mask,
     cli_batch_size,
     cli_device,
     cli_file_type,
     cli_img_input,
     cli_masks,
     cli_mode,
-    cli_num_loader_workers,
-    cli_num_postproc_workers,
+    cli_num_workers,
     cli_output_path,
     cli_pretrained_model,
     cli_pretrained_weights,
     cli_verbose,
     cli_yaml_config_path,
-    prepare_ioconfig_seg,
+    prepare_ioconfig,
     prepare_model_cli,
     tiatoolbox_cli,
 )
@@ -45,10 +44,9 @@
 @cli_batch_size()
 @cli_masks(default=None)
 @cli_yaml_config_path(default=None)
-@cli_num_loader_workers()
+@cli_num_workers()
 @cli_verbose(default=True)
-@cli_num_postproc_workers(default=0)
-@cli_auto_generate_mask(default=False)
+@cli_auto_get_mask(default=False)
 def nucleus_instance_segment(
     pretrained_model: str,
     pretrained_weights: str,
@@ -60,7 +58,6 @@
     batch_size: int,
     yaml_config_path: str,
     num_loader_workers: int,
-    num_postproc_workers: int,
     device: str,
     *,
     auto_generate_mask: bool,
@@ -68,7 +65,7 @@
 ) -> None:
     """Process an image/directory of input images with a patch classification CNN."""
     from tiatoolbox.models import (  # noqa: PLC0415
-        IOSegmentorConfig,
+        IOInstanceSegmentorConfig,
         NucleusInstanceSegmentor,
     )
     from tiatoolbox.utils import save_as_json  # noqa: PLC0415
@@ -80,8 +77,8 @@
         file_types=file_types,
     )
 
-    ioconfig = prepare_ioconfig_seg(
-        IOSegmentorConfig,
+    ioconfig = prepare_ioconfig(
+        IOInstanceSegmentorConfig,
         pretrained_weights,
         yaml_config_path,
     )
@@ -91,7 +88,6 @@
         pretrained_weights=pretrained_weights,
         batch_size=batch_size,
         num_loader_workers=num_loader_workers,
-        num_postproc_workers=num_postproc_workers,
         auto_generate_mask=auto_generate_mask,
         verbose=verbose,
     )
diff --git a/tiatoolbox/cli/patch_predictor.py b/tiatoolbox/cli/patch_predictor.py
index fdb85e3ea..17ed9ebf9 100644
--- a/tiatoolbox/cli/patch_predictor.py
+++ b/tiatoolbox/cli/patch_predictor.py
@@ -2,25 +2,25 @@
 
 from __future__ import annotations
 
-import click
-
 from tiatoolbox.cli.common import (
+    cli_auto_get_mask,
     cli_batch_size,
     cli_device,
     cli_file_type,
     cli_img_input,
     cli_masks,
-    cli_merge_predictions,
-    cli_mode,
-    cli_num_loader_workers,
+    cli_memory_threshold,
+    cli_model,
+    cli_num_workers,
     cli_output_path,
-    cli_pretrained_model,
-    cli_pretrained_weights,
-    cli_resolution,
+    cli_output_type,
+    cli_patch_mode,
     cli_return_labels,
     cli_return_probabilities,
-    cli_units,
     cli_verbose,
+    cli_weights,
+    cli_yaml_config_path,
+    prepare_ioconfig,
     prepare_model_cli,
     tiatoolbox_cli,
 )
@@ -35,45 +35,47 @@
 @cli_file_type(
     default="*.png, *.jpg, *.jpeg, *.tif, *.tiff, *.svs, *.ndpi, *.jp2, *.mrxs",
 )
-@cli_mode(
-    usage_help="Type of input file to process.",
-    default="wsi",
-    input_type=click.Choice(["patch", "wsi", "tile"], case_sensitive=False),
-)
-@cli_pretrained_model(default="resnet18-kather100k")
-@cli_pretrained_weights()
-@cli_return_probabilities(default=False)
-@cli_merge_predictions(default=True)
-@cli_return_labels(default=True)
+@cli_model(default="resnet18-kather100k")
+@cli_weights()
 @cli_device(default="cpu")
 @cli_batch_size(default=1)
-@cli_resolution(default=0.5)
-@cli_units(default="mpp")
+@cli_yaml_config_path()
 @cli_masks(default=None)
-@cli_num_loader_workers(default=0)
+@cli_num_workers(default=0)
+@cli_output_type(
+    default="AnnotationStore",
+)
+@cli_memory_threshold(default=80)
+@cli_patch_mode(default=False)
+@cli_return_probabilities(default=True)
+@cli_return_labels(default=False)
+@cli_auto_get_mask(default=True)
 @cli_verbose(default=True)
 def patch_predictor(
-    pretrained_model: str,
-    pretrained_weights: str,
+    model: str,
+    weights: str,
     img_input: str,
     file_types: str,
     masks: str | None,
-    mode: str,
     output_path: str,
     batch_size: int,
-    resolution: float,
-    units: str,
-    num_loader_workers: int,
+    yaml_config_path: str,
+    num_workers: int,
     device: str,
+    output_type: str,
+    memory_threshold: int,
     *,
+    patch_mode: bool,
     return_probabilities: bool,
     return_labels: bool,
-    merge_predictions: bool,
+    auto_get_mask: bool,
     verbose: bool,
 ) -> None:
-    """Process an image/directory of input images with a patch classification CNN."""
-    from tiatoolbox.models import PatchPredictor  # noqa: PLC0415
-    from tiatoolbox.utils import save_as_json  # noqa: PLC0415
+    """Process an image/directory of input images with a patch classification engine."""
+    from tiatoolbox.models.engine.io_config import (  # noqa: PLC0415
+        IOPatchPredictorConfig,
+    )
+    from tiatoolbox.models.engine.patch_predictor import PatchPredictor  # noqa: PLC0415
 
     files_all, masks_all, output_path = prepare_model_cli(
         img_input=img_input,
@@ -83,26 +85,29 @@
     )
 
     predictor = PatchPredictor(
-        pretrained_model=pretrained_model,
-        pretrained_weights=pretrained_weights,
+        model=model,
+        weights=weights,
         batch_size=batch_size,
-        num_loader_workers=num_loader_workers,
+        num_workers=num_workers,
         verbose=verbose,
     )
 
-    output = predictor.predict(
-        imgs=files_all,
+    ioconfig = prepare_ioconfig(
+        IOPatchPredictorConfig,
+        pretrained_weights=weights,
+        yaml_config_path=yaml_config_path,
+    )
+
+    _ = predictor.run(
+        images=files_all,
         masks=masks_all,
-        mode=mode,
-        return_probabilities=return_probabilities,
-        merge_predictions=merge_predictions,
-        labels=None,
-        return_labels=return_labels,
-        resolution=resolution,
-        units=units,
+        patch_mode=patch_mode,
+        ioconfig=ioconfig,
         device=device,
         save_dir=output_path,
-        save_output=True,
+        output_type=output_type,
+        return_probabilities=return_probabilities,
+        return_labels=return_labels,
+        auto_get_mask=auto_get_mask,
+        memory_threshold=memory_threshold,
     )
-
-    save_as_json(output, str(output_path.joinpath("results.json")))
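The command above now drives the engine through `run()` instead of `predict()`. A rough Python equivalent of what the CLI does, based only on the parameters visible in this diff (`wsi.svs` is a placeholder input path, not a file from this PR):

```python
from tiatoolbox.models.engine.patch_predictor import PatchPredictor

predictor = PatchPredictor(
    model="resnet18-kather100k",  # the CLI's default pretrained model
    batch_size=1,
    num_workers=0,
    verbose=True,
)

# run() replaces predict(); the keyword names mirror the new CLI flags.
_ = predictor.run(
    images=["wsi.svs"],           # placeholder slide path
    patch_mode=False,             # WSI mode, matching the CLI default
    device="cpu",
    save_dir="patch_predictor_output",
    output_type="AnnotationStore",
    return_probabilities=True,
    return_labels=False,
)
```

Note that `ioconfig` may be omitted here because `prepare_ioconfig` only builds one when custom weights plus a YAML config are supplied; otherwise the pretrained registry entry provides it.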
default="semantic_segmentation", +) +@cli_file_type( + default="*.png, *.jpg, *.jpeg, *.tif, *.tiff, *.svs, *.ndpi, *.jp2, *.mrxs", +) +@cli_model(default="fcn-tissue_mask") +@cli_weights() +@cli_device(default="cpu") +@cli_batch_size(default=1) +@cli_yaml_config_path() +@cli_masks(default=None) +@cli_num_workers(default=0) +@cli_output_type( + default="AnnotationStore", +) +@cli_memory_threshold(default=80) +@cli_patch_mode(default=False) +@cli_return_probabilities(default=True) +@cli_return_labels(default=False) +@cli_auto_get_mask(default=True) +@cli_verbose(default=True) +def semantic_segmentor( + model: str, + weights: str, + img_input: str, + file_types: str, + masks: str | None, + output_path: str, + batch_size: int, + yaml_config_path: str, + num_workers: int, + device: str, + output_type: str, + memory_threshold: int, + *, + patch_mode: bool, + return_probabilities: bool, + return_labels: bool, + auto_get_mask: bool, + verbose: bool, +) -> None: + """Process a set of input images with a semantic segmentation engine.""" + from tiatoolbox.models import IOSegmentorConfig, SemanticSegmentor # noqa: PLC0415 + + files_all, masks_all, output_path = prepare_model_cli( + img_input=img_input, + output_path=output_path, + masks=masks, + file_types=file_types, + ) + + ioconfig = prepare_ioconfig( + IOSegmentorConfig, + pretrained_weights=weights, + yaml_config_path=yaml_config_path, + ) + + segmentor = SemanticSegmentor( + model=model, + weights=weights, + batch_size=batch_size, + num_workers=num_workers, + verbose=verbose, + ) + + _ = segmentor.run( + images=files_all, + masks=masks_all, + patch_mode=patch_mode, + ioconfig=ioconfig, + device=device, + save_dir=output_path, + output_type=output_type, + return_probabilities=return_probabilities, + return_labels=return_labels, + auto_get_mask=auto_get_mask, + memory_threshold=memory_threshold, + ) diff --git a/tiatoolbox/data/pretrained_model.yaml b/tiatoolbox/data/pretrained_model.yaml index 19ce8f45d..880c623fe 100644 --- a/tiatoolbox/data/pretrained_model.yaml +++ b/tiatoolbox/data/pretrained_model.yaml @@ -6,7 +6,7 @@ alexnet-kather100k: backbone: alexnet num_classes: 9 ioconfig: - class: patch_predictor.IOPatchPredictorConfig + class: io_config.IOPatchPredictorConfig kwargs: patch_input_shape: [224, 224] stride_shape: [224, 224] @@ -20,7 +20,7 @@ resnet18-kather100k: backbone: resnet18 num_classes: 9 ioconfig: - class: patch_predictor.IOPatchPredictorConfig + class: io_config.IOPatchPredictorConfig kwargs: patch_input_shape: [224, 224] stride_shape: [224, 224] @@ -34,7 +34,7 @@ resnet34-kather100k: backbone: resnet34 num_classes: 9 ioconfig: - class: patch_predictor.IOPatchPredictorConfig + class: io_config.IOPatchPredictorConfig kwargs: patch_input_shape: [224, 224] stride_shape: [224, 224] @@ -48,7 +48,7 @@ resnet50-kather100k: backbone: resnet50 num_classes: 9 ioconfig: - class: patch_predictor.IOPatchPredictorConfig + class: io_config.IOPatchPredictorConfig kwargs: patch_input_shape: [224, 224] stride_shape: [224, 224] @@ -62,7 +62,7 @@ resnet101-kather100k: backbone: resnet101 num_classes: 9 ioconfig: - class: patch_predictor.IOPatchPredictorConfig + class: io_config.IOPatchPredictorConfig kwargs: patch_input_shape: [224, 224] stride_shape: [224, 224] @@ -76,7 +76,7 @@ resnext50_32x4d-kather100k: backbone: resnext50_32x4d num_classes: 9 ioconfig: - class: patch_predictor.IOPatchPredictorConfig + class: io_config.IOPatchPredictorConfig kwargs: patch_input_shape: [224, 224] stride_shape: [224, 224] @@ -90,7 +90,7 @@ 
diff --git a/tiatoolbox/data/pretrained_model.yaml b/tiatoolbox/data/pretrained_model.yaml
index 19ce8f45d..880c623fe 100644
--- a/tiatoolbox/data/pretrained_model.yaml
+++ b/tiatoolbox/data/pretrained_model.yaml
@@ -6,7 +6,7 @@ alexnet-kather100k:
   backbone: alexnet
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -20,7 +20,7 @@ resnet18-kather100k:
   backbone: resnet18
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -34,7 +34,7 @@ resnet34-kather100k:
   backbone: resnet34
   num_classes: 9
  ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -48,7 +48,7 @@ resnet50-kather100k:
   backbone: resnet50
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -62,7 +62,7 @@ resnet101-kather100k:
   backbone: resnet101
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -76,7 +76,7 @@ resnext50_32x4d-kather100k:
   backbone: resnext50_32x4d
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -90,7 +90,7 @@ resnext101_32x8d-kather100k:
   backbone: resnext101_32x8d
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -104,7 +104,7 @@ wide_resnet50_2-kather100k:
   backbone: wide_resnet50_2
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -118,7 +118,7 @@ wide_resnet101_2-kather100k:
   backbone: wide_resnet101_2
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -132,7 +132,7 @@ densenet121-kather100k:
   backbone: densenet121
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -146,7 +146,7 @@ densenet161-kather100k:
   backbone: densenet161
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -160,7 +160,7 @@ densenet169-kather100k:
   backbone: densenet169
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -174,7 +174,7 @@ densenet201-kather100k:
   backbone: densenet201
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -188,7 +188,7 @@ mobilenet_v2-kather100k:
   backbone: mobilenet_v2
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -202,7 +202,7 @@ mobilenet_v3_large-kather100k:
   backbone: mobilenet_v3_large
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -216,7 +216,7 @@ mobilenet_v3_small-kather100k:
   backbone: mobilenet_v3_small
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -230,7 +230,7 @@ googlenet-kather100k:
   backbone: googlenet
   num_classes: 9
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -245,7 +245,7 @@ alexnet-pcam:
   backbone: alexnet
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -259,7 +259,7 @@ resnet18-pcam:
   backbone: resnet18
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -273,7 +273,7 @@ resnet34-pcam:
   backbone: resnet34
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -287,7 +287,7 @@ resnet50-pcam:
   backbone: resnet50
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -301,7 +301,7 @@ resnet101-pcam:
   backbone: resnet101
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -315,7 +315,7 @@ resnext50_32x4d-pcam:
   backbone: resnext50_32x4d
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -329,7 +329,7 @@ resnext101_32x8d-pcam:
   backbone: resnext101_32x8d
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -343,7 +343,7 @@ wide_resnet50_2-pcam:
   backbone: wide_resnet50_2
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -357,7 +357,7 @@ wide_resnet101_2-pcam:
   backbone: wide_resnet101_2
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -371,7 +371,7 @@ densenet121-pcam:
   backbone: densenet121
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -385,7 +385,7 @@ densenet161-pcam:
   backbone: densenet161
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -399,7 +399,7 @@ densenet169-pcam:
   backbone: densenet169
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -413,7 +413,7 @@ densenet201-pcam:
   backbone: densenet201
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -427,7 +427,7 @@ mobilenet_v2-pcam:
   backbone: mobilenet_v2
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -441,7 +441,7 @@ mobilenet_v3_large-pcam:
   backbone: mobilenet_v3_large
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -455,7 +455,7 @@ mobilenet_v3_small-pcam:
   backbone: mobilenet_v3_small
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -469,7 +469,7 @@ googlenet-pcam:
   backbone: googlenet
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [96, 96]
       stride_shape: [96, 96]
@@ -484,7 +484,7 @@ resnet18-idars-tumour:
   backbone: resnet18
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [512, 512]
       stride_shape: [512, 512]
@@ -497,7 +497,7 @@ resnet34-idars-msi:
   backbone: resnet34
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -510,7 +510,7 @@ resnet34-idars-braf:
   backbone: resnet34
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -523,7 +523,7 @@ resnet34-idars-cimp:
   backbone: resnet34
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -536,7 +536,7 @@ resnet34-idars-cin:
   backbone: resnet34
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -549,7 +549,7 @@ resnet34-idars-tp53:
   backbone: resnet34
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -562,7 +562,7 @@ resnet34-idars-hm:
   backbone: resnet34
   num_classes: 2
   ioconfig:
-    class: patch_predictor.IOPatchPredictorConfig
+    class: io_config.IOPatchPredictorConfig
     kwargs:
       patch_input_shape: [224, 224]
       stride_shape: [224, 224]
@@ -579,7 +579,7 @@ fcn-tissue_mask:
   encoder: "resnet50"
   decoder_block: [3]
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOSegmentorConfig
     kwargs:
       input_resolutions:
        - {'units': 'mpp', 'resolution': 2.0}
@@ -587,7 +587,7 @@ fcn-tissue_mask:
        - {'units': 'mpp', 'resolution': 2.0}
      patch_input_shape: [1024, 1024]
      patch_output_shape: [512, 512]
-      stride_shape: [256, 256]
+      stride_shape: [450, 450]
      save_resolution: {'units': 'mpp', 'resolution': 8.0}
@@ -600,7 +600,7 @@ fcn_resnet50_unet-bcss:
   encoder: "resnet50"
   decoder_block: [3, 3]
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOSegmentorConfig
     kwargs:
       input_resolutions:
        - {'units': 'mpp', 'resolution': 0.25}
@@ -608,7 +608,7 @@ fcn_resnet50_unet-bcss:
        - {'units': 'mpp', 'resolution': 0.25}
      patch_input_shape: [1024, 1024]
      patch_output_shape: [512, 512]
-      stride_shape: [256, 256]
+      stride_shape: [450, 450]
      save_resolution: {'units': 'mpp', 'resolution': 0.25}
@@ -625,7 +625,7 @@ unet_tissue_mask_tsef:
   encoder: "resnet50"
   decoder_block: [3, 3]
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOSegmentorConfig
     kwargs:
       input_resolutions:
        - {'units': 'baseline', 'resolution': 1.0}
@@ -652,7 +652,7 @@ hovernet_fast-pannuke:
       5: "Non-Neoplastic Epithelial",
     }
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOInstanceSegmentorConfig
     kwargs:
       input_resolutions:
        - {"units": "mpp", "resolution": 0.25}
@@ -682,7 +682,7 @@ hovernet_fast-monusac:
       4: "Neutrophil",
     }
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOInstanceSegmentorConfig
     kwargs:
       input_resolutions:
        - {"units": "mpp", "resolution": 0.25}
@@ -712,7 +712,7 @@ hovernet_original-consep:
       4: "Miscellaneous",
     }
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOInstanceSegmentorConfig
     kwargs:
       input_resolutions:
        - {"units": "mpp", "resolution": 0.25}
@@ -735,7 +735,7 @@ hovernet_original-kumar:
   num_types: null # None in python ?, only do instance segmentation
   mode: "original"
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOInstanceSegmentorConfig
     kwargs:
       input_resolutions:
        - {"units": "mpp", "resolution": 0.25}
@@ -769,7 +769,7 @@ hovernetplus-oed:
       4: "Keratin",
     }
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOInstanceSegmentorConfig
     kwargs:
       input_resolutions:
        - {"units": "mpp", "resolution": 0.50}
@@ -793,7 +793,7 @@ micronet-consep:
   num_input_channels: 3
   num_output_channels: 2
   ioconfig:
-    class: semantic_segmentor.IOSegmentorConfig
+    class: io_config.IOSegmentorConfig
     kwargs:
       input_resolutions:
        - {"units": "mpp", "resolution": 0.25}
diff --git a/tiatoolbox/data/remote_samples.yaml b/tiatoolbox/data/remote_samples.yaml
index 1b7bf2bf1..44e7d3492 100644
--- a/tiatoolbox/data/remote_samples.yaml
+++ b/tiatoolbox/data/remote_samples.yaml
@@ -21,6 +21,8 @@ files:
     extract: True
   svs-1-small:
     url: [*wsis, "CMU-1-Small-Region.svs"]
+  thumbnail-1k-1k:
+    url: [*wsis, "CMU-2_1k_1k-thumbnail.png"]
   tiled-tiff-1-small-jpeg:
     url: [*wsis, "CMU-1-Small-Region.jpeg.tiff"]
   tiled-tiff-1-small-jp2k:
diff --git a/tiatoolbox/models/__init__.py b/tiatoolbox/models/__init__.py
index 39d1441ce..5de543aad 100644
--- a/tiatoolbox/models/__init__.py
+++ b/tiatoolbox/models/__init__.py
@@ -1,7 +1,8 @@
 """Models package for the models implemented in tiatoolbox."""
 
-from tiatoolbox.models import architecture, dataset, engine, models_abc
+from __future__ import annotations
 
+from . import architecture, dataset, engine, models_abc
 from .architecture.hovernet import HoVerNet
 from .architecture.hovernetplus import HoVerNetPlus
 from .architecture.idars import IDaRS
@@ -9,31 +10,39 @@
 from .architecture.micronet import MicroNet
 from .architecture.nuclick import NuClick
 from .architecture.sccnn import SCCNN
-from .engine.multi_task_segmentor import MultiTaskSegmentor
-from .engine.nucleus_instance_segmentor import NucleusInstanceSegmentor
-from .engine.patch_predictor import (
+from .dataset import PatchDataset, WSIPatchDataset, WSIStreamDataset
+from .engine.io_config import (
+    IOInstanceSegmentorConfig,
     IOPatchPredictorConfig,
-    PatchDataset,
-    PatchPredictor,
-    WSIPatchDataset,
-)
-from .engine.semantic_segmentor import (
-    DeepFeatureExtractor,
     IOSegmentorConfig,
-    SemanticSegmentor,
-    WSIStreamDataset,
+    ModelIOConfigABC,
 )
+from .engine.multi_task_segmentor import MultiTaskSegmentor
+from .engine.nucleus_instance_segmentor import NucleusInstanceSegmentor
+from .engine.patch_predictor import PatchPredictor
+from .engine.semantic_segmentor import SemanticSegmentor
 
 __all__ = [
     "SCCNN",
     "HoVerNet",
     "HoVerNetPlus",
     "IDaRS",
+    "IOInstanceSegmentorConfig",
+    "IOPatchPredictorConfig",
+    "IOSegmentorConfig",
     "MapDe",
     "MicroNet",
+    "ModelIOConfigABC",
     "MultiTaskSegmentor",
     "NuClick",
     "NucleusInstanceSegmentor",
+    "PatchDataset",
     "PatchPredictor",
     "SemanticSegmentor",
+    "WSIPatchDataset",
+    "WSIStreamDataset",
+    "architecture",
+    "dataset",
+    "engine",
+    "models_abc",
 ]
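With the reworked `__init__`, the IO configs and dataset classes listed in the new `__all__` resolve directly from the package root. A quick smoke check, assuming the package is installed with these changes applied:

```python
from tiatoolbox.models import (
    IOInstanceSegmentorConfig,
    IOPatchPredictorConfig,
    IOSegmentorConfig,
    ModelIOConfigABC,
    PatchDataset,
    PatchPredictor,
    SemanticSegmentor,
    WSIPatchDataset,
)

# Each name comes straight from the new __all__; printing the defining
# module confirms the flat import surface without instantiating a model.
for obj in (
    IOInstanceSegmentorConfig,
    IOPatchPredictorConfig,
    IOSegmentorConfig,
    ModelIOConfigABC,
    PatchDataset,
    PatchPredictor,
    SemanticSegmentor,
    WSIPatchDataset,
):
    print(obj.__module__, obj.__name__)
```

This also explains the registry change above: the `ioconfig.class` entries now point at `io_config.*` because the config classes were consolidated into `tiatoolbox.models.engine.io_config`.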
diff --git a/tiatoolbox/models/architecture/__init__.py b/tiatoolbox/models/architecture/__init__.py
index da8e9ed4a..97111bb9f 100644
--- a/tiatoolbox/models/architecture/__init__.py
+++ b/tiatoolbox/models/architecture/__init__.py
@@ -6,15 +6,16 @@
 from pydoc import locate
 from typing import TYPE_CHECKING
 
-import torch
 from huggingface_hub import hf_hub_download
 
 from tiatoolbox import rcParam
 from tiatoolbox.models.dataset.classification import predefined_preproc_func
+from tiatoolbox.models.models_abc import load_torch_model
 
 if TYPE_CHECKING:  # pragma: no cover
-    from tiatoolbox.models.models_abc import IOConfigABC
+    import torch
 
+    from tiatoolbox.models.engine.io_config import ModelIOConfigABC
 
 __all__ = ["fetch_pretrained_weights", "get_pretrained_model"]
 PRETRAINED_INFO = rcParam["pretrained_model_info"]
@@ -68,7 +69,7 @@ def get_pretrained_model(
     pretrained_weights: str | Path | None = None,
     *,
     overwrite: bool = False,
-) -> tuple[torch.nn.Module, IOConfigABC]:
+) -> tuple[torch.nn.Module, ModelIOConfigABC]:
     """Load a predefined PyTorch model with the appropriate pretrained weights.
 
     Args:
@@ -154,12 +155,7 @@ def get_pretrained_model(
         overwrite=overwrite,
     )
 
-    # ! assume to be saved in single GPU mode
-    # always load on to the CPU
-    saved_state_dict = torch.load(pretrained_weights, map_location="cpu")
-    model.load_state_dict(saved_state_dict, strict=True)
-
-    # !
+    model = load_torch_model(model=model, weights=pretrained_weights)
 
     io_info = info["ioconfig"]
     io_class_info = io_info["class"]
@@ -169,5 +165,5 @@ def get_pretrained_model(
     engine_module = locate(f"tiatoolbox.models.engine.{io_module_name}")
     engine_class = getattr(engine_module, io_class_name)
 
-    iostate = engine_class(**io_info["kwargs"])
-    return model, iostate
+    ioconfig = engine_class(**io_info["kwargs"])
+    return model, ioconfig
diff --git a/tiatoolbox/models/architecture/hovernet.py b/tiatoolbox/models/architecture/hovernet.py
index c0be9ad47..19d02e7a5 100644
--- a/tiatoolbox/models/architecture/hovernet.py
+++ b/tiatoolbox/models/architecture/hovernet.py
@@ -784,7 +784,7 @@ def postproc(raw_maps: list[np.ndarray]) -> tuple[np.ndarray, dict]:
 
     @staticmethod
     def infer_batch(  # skipcq: PYL-W0221
-        model: nn.Module, batch_data: np.ndarray, *, device: str
+        model: nn.Module, batch_data: np.ndarray, device: str
     ) -> tuple:
         """Run inference on an input batch.
diff --git a/tiatoolbox/models/architecture/unet.py b/tiatoolbox/models/architecture/unet.py
index 6385e7587..8d38eb7fc 100644
--- a/tiatoolbox/models/architecture/unet.py
+++ b/tiatoolbox/models/architecture/unet.py
@@ -2,7 +2,7 @@
 
 from __future__ import annotations
 
-from typing import Any
+from typing import TYPE_CHECKING, Any
 
 import torch
 import torch.nn.functional as F  # noqa: N812
@@ -10,9 +10,16 @@
 from torchvision.models.resnet import Bottleneck as ResNetBottleneck
 from torchvision.models.resnet import ResNet
 
-from tiatoolbox.models.architecture.utils import UpSample2x, centre_crop
+from tiatoolbox.models.architecture.utils import (
+    UpSample2x,
+    argmax_last_axis,
+    centre_crop,
+)
 from tiatoolbox.models.models_abc import ModelABC
 
+if TYPE_CHECKING:  # pragma: no cover
+    import numpy as np
+
 
 class ResNetEncoder(ResNet):
     """A subclass of ResNet defined in torch.
@@ -416,7 +423,7 @@ def infer_batch(
         batch_data: torch.Tensor,
         *,
         device: str,
-    ) -> list:
+    ) -> np.ndarray:
         """Run inference on an input batch.
 
         This contains logic for forward operation as well as i/o
@@ -432,9 +439,8 @@ def infer_batch(
             Transfers model to the specified device. Default is "cpu".
 
         Returns:
-            list:
-                List of network output head, each output is an
-                :class:`numpy.ndarray`.
+            np.ndarray:
+                The model predictions as a :class:`numpy.ndarray`.
 
         """
         model.eval()
@@ -457,7 +463,14 @@ def infer_batch(
             align_corners=False,
         )
         probs = centre_crop(probs, crop_shape)
-        probs = probs.permute(0, 2, 3, 1)  # to NHWC
+        output = probs.permute(0, 2, 3, 1)  # to NHWC
+
+        return output.cpu().numpy()
 
-        probs = probs.cpu().numpy()
-        return [probs]
+    def postproc(self: UNetModel, image: np.ndarray) -> np.ndarray:
+        """Define post-processing of this class of model.
+
+        This simply applies argmax along last axis of the input.
+
+        """
+        return argmax_last_axis(image=image)
diff --git a/tiatoolbox/models/architecture/utils.py b/tiatoolbox/models/architecture/utils.py
index 8f8f2bb22..9b60cc7a9 100644
--- a/tiatoolbox/models/architecture/utils.py
+++ b/tiatoolbox/models/architecture/utils.py
@@ -3,7 +3,7 @@
 from __future__ import annotations
 
 import sys
-from typing import cast
+from typing import TYPE_CHECKING, cast
 
 import numpy as np
 import torch
@@ -11,6 +11,9 @@
 
 from tiatoolbox import logger
 
+if TYPE_CHECKING:  # pragma: no cover
+    from tiatoolbox.models.models_abc import ModelABC
+
 
 def is_torch_compile_compatible() -> bool:
     """Check if the current GPU is compatible with torch-compile.
@@ -46,10 +49,10 @@ def is_torch_compile_compatible() -> bool:
 
 
 def compile_model(
-    model: nn.Module,
+    model: nn.Module | ModelABC | None = None,
     *,
     mode: str = "default",
-) -> nn.Module:
+) -> torch.nn.Module | ModelABC:
     """A decorator to compile a model using torch-compile.
 
     Args:
@@ -68,7 +71,7 @@ def compile_model(
             CUDA graphs
 
     Returns:
-        torch.nn.Module:
+        torch.nn.Module or ModelABC:
             Compiled model.
 
     """
@@ -231,3 +234,20 @@ def forward(self: UpSample2x, x: torch.Tensor) -> torch.Tensor:
     ret = torch.tensordot(x, mat, dims=1)  # bxcxhxwxshxsw
     ret = ret.permute(0, 1, 2, 4, 3, 5)
     return ret.reshape((-1, input_shape[1], input_shape[2] * 2, input_shape[3] * 2))
+
+
+def argmax_last_axis(image: np.ndarray) -> np.ndarray:
+    """Define the post-processing of this class of model.
+
+    This simply applies argmax along last axis of the input.
+
+    Args:
+        image (np.ndarray):
+            The input image array.
+
+    Returns:
+        np.ndarray:
+            The post-processed image array.
+
+    """
+    return image.argmax(axis=-1)
""" - return _postproc(image=image) + return argmax_last_axis(image=image) @staticmethod def infer_batch( model: nn.Module, batch_data: torch.Tensor, device: str, - ) -> dict[str, np.ndarray]: + ) -> np.ndarray: """Run inference on an input batch. Contains logic for forward operation as well as i/o aggregation. @@ -485,10 +469,10 @@ def infer_batch( A batch of data generated by `torch.utils.data.DataLoader`. device (str): - Transfers model to the specified device. Default is "cpu". + Transfers model to the specified device. Returns: - dict[str, np.ndarray]: + np.ndarray: The model predictions as a NumPy array. Example: @@ -577,7 +561,7 @@ def infer_batch( model: nn.Module, batch_data: torch.Tensor, device: str, - ) -> list[dict[str, np.ndarray]]: + ) -> list[np.ndarray]: """Run inference on an input batch. Contains logic for forward operation as well as i/o aggregation. @@ -592,7 +576,7 @@ def infer_batch( Transfers model to the specified device. Default is "cpu". Returns: - list[dict[str, np.ndarray]]: + list[np.ndarray]: list of dictionary values with numpy arrays. Example: @@ -669,7 +653,7 @@ def infer_batch( model: nn.Module, batch_data: torch.Tensor, device: str, - ) -> list[dict[str, np.ndarray]]: + ) -> list[np.ndarray]: """Run inference on an input batch. Contains logic for forward operation as well as i/o aggregation. @@ -684,7 +668,7 @@ def infer_batch( Transfers model to the specified device. Default is "cpu". Returns: - list[dict[str, np.ndarray]]: + list[np.ndarray]: list of dictionary values with numpy arrays. Example: diff --git a/tiatoolbox/models/dataset/__init__.py b/tiatoolbox/models/dataset/__init__.py index 9c09991fa..16c80fd18 100644 --- a/tiatoolbox/models/dataset/__init__.py +++ b/tiatoolbox/models/dataset/__init__.py @@ -1,9 +1,21 @@ """Contains dataset functionality for use with models in tiatoolbox.""" -from tiatoolbox.models.dataset.classification import ( +from tiatoolbox.models.dataset.classification import predefined_preproc_func + +from .dataset_abc import ( PatchDataset, + PatchDatasetABC, WSIPatchDataset, - predefined_preproc_func, + WSIStreamDataset, ) -from tiatoolbox.models.dataset.dataset_abc import PatchDatasetABC -from tiatoolbox.models.dataset.info import DatasetInfoABC, KatherPatchDataset +from .info import DatasetInfoABC, KatherPatchDataset + +__all__ = [ + "DatasetInfoABC", + "KatherPatchDataset", + "PatchDataset", + "PatchDatasetABC", + "WSIPatchDataset", + "WSIStreamDataset", + "predefined_preproc_func", +] diff --git a/tiatoolbox/models/dataset/classification.py b/tiatoolbox/models/dataset/classification.py index 359d8c52a..c1bf8fa8c 100644 --- a/tiatoolbox/models/dataset/classification.py +++ b/tiatoolbox/models/dataset/classification.py @@ -2,27 +2,14 @@ from __future__ import annotations -from pathlib import Path from typing import TYPE_CHECKING -import cv2 -import numpy as np from torchvision import transforms -from tiatoolbox import logger -from tiatoolbox.models.dataset import dataset_abc -from tiatoolbox.tools.patchextraction import PatchExtractor -from tiatoolbox.utils import imread -from tiatoolbox.wsicore.wsimeta import WSIMeta -from tiatoolbox.wsicore.wsireader import VirtualWSIReader, WSIReader - if TYPE_CHECKING: # pragma: no cover - from collections.abc import Callable - + import numpy as np import torch - from PIL.Image import Image - - from tiatoolbox.type_hints import IntPair, Resolution, Units + from PIL import Image class _TorchPreprocCaller: @@ -74,302 +61,3 @@ def predefined_preproc_func(dataset_name: str) -> 
_TorchPreprocCaller: preprocs = preproc_dict[dataset_name] return _TorchPreprocCaller(preprocs) - - -class PatchDataset(dataset_abc.PatchDatasetABC): - """Define PatchDataset for torch inference. - - Define a simple patch dataset, which inherits from the - `torch.utils.data.Dataset` class. - - Attributes: - inputs (list or np.ndarray): - Either a list of patches, where each patch is a ndarray or a - list of valid path with its extension be (".jpg", ".jpeg", - ".tif", ".tiff", ".png") pointing to an image. - labels (list): - List of labels for sample at the same index in `inputs`. - Default is `None`. - - Examples: - >>> # A user defined preproc func and expected behavior - >>> preproc_func = lambda img: img/2 # reduce intensity by half - >>> transformed_img = preproc_func(img) - >>> # create a dataset to get patches preprocessed by the above function - >>> ds = PatchDataset( - ... inputs=['/A/B/C/img1.png', '/A/B/C/img2.png'], - ... labels=["labels1", "labels2"], - ... ) - - """ - - def __init__( - self: PatchDataset, - inputs: np.ndarray | list, - labels: list | None = None, - ) -> None: - """Initialize :class:`PatchDataset`.""" - super().__init__() - - self.data_is_npy_alike = False - - self.inputs = inputs - self.labels = labels - - # perform check on the input - self._check_input_integrity(mode="patch") - - def __getitem__(self: PatchDataset, idx: int) -> dict: - """Get an item from the dataset.""" - patch = self.inputs[idx] - - # Mode 0 is list of paths - if not self.data_is_npy_alike: - patch = self.load_img(patch) - - # Apply preprocessing to selected patch - patch = self._preproc(patch) - - data = { - "image": patch, - } - if self.labels is not None: - data["label"] = self.labels[idx] - return data - - return data - - -class WSIPatchDataset(dataset_abc.PatchDatasetABC): - """Define a WSI-level patch dataset. - - Attributes: - reader (:class:`.WSIReader`): - A WSI Reader or Virtual Reader for reading pyramidal image - or large tile in pyramidal way. - inputs: - List of coordinates to read from the `reader`, each - coordinate is of the form `[start_x, start_y, end_x, - end_y]`. - patch_input_shape: - A tuple (int, int) or ndarray of shape (2,). Expected size to - read from `reader` at requested `resolution` and `units`. - Expected to be `(height, width)`. - resolution: - See (:class:`.WSIReader`) for details. - units: - See (:class:`.WSIReader`) for details. - preproc_func: - Preprocessing function used to transform the input data. It will - be called on each patch before returning it. - - """ - - def __init__( # skipcq: PY-R1000 - self: WSIPatchDataset, - img_path: str | Path, - mode: str = "wsi", - mask_path: str | Path | None = None, - patch_input_shape: IntPair = None, - stride_shape: IntPair = None, - resolution: Resolution = None, - units: Units = None, - min_mask_ratio: float = 0, - preproc_func: Callable | None = None, - *, - auto_get_mask: bool = True, - ) -> None: - """Create a WSI-level patch dataset. - - Args: - mode (str): - Can be either `wsi` or `tile` to denote the image to - read is either a whole-slide image or a large image - tile. - img_path (str or Path): - Valid to pyramidal whole-slide image or large tile to - read. - mask_path (str or Path): - Valid mask image. - patch_input_shape: - A tuple (int, int) or ndarray of shape (2,). Expected - shape to read from `reader` at requested `resolution` - and `units`. Expected to be positive and of (height, - width). Note, this is not at `resolution` coordinate - space. 
-            stride_shape:
-                A tuple (int, int) or ndarray of shape (2,). Expected
-                stride shape to read at requested `resolution` and
-                `units`. Expected to be positive and of (height, width).
-                Note, this is not at level 0.
-            resolution (Resolution):
-                Check (:class:`.WSIReader`) for details. When
-                `mode='tile'`, value is fixed to be `resolution=1.0` and
-                `units='baseline'` units: check (:class:`.WSIReader`) for
-                details.
-            units (Units):
-                Units in which `resolution` is defined.
-            auto_get_mask (bool):
-                If `True`, then automatically get simple threshold mask using
-                WSIReader.tissue_mask() function.
-            min_mask_ratio (float):
-                Only patches with positive area percentage above this value are
-                included. Defaults to 0.
-            preproc_func (Callable):
-                Preprocessing function used to transform the input data. If
-                supplied, the function will be called on each patch before
-                returning it.
-
-        Examples:
-            >>> # A user defined preproc func and expected behavior
-            >>> preproc_func = lambda img: img/2  # reduce intensity by half
-            >>> transformed_img = preproc_func(img)
-            >>> # Create a dataset to get patches from WSI with above
-            >>> # preprocessing function
-            >>> ds = WSIPatchDataset(
-            ...     img_path='/A/B/C/wsi.svs',
-            ...     mode="wsi",
-            ...     patch_input_shape=[512, 512],
-            ...     stride_shape=[256, 256],
-            ...     auto_get_mask=False,
-            ...     preproc_func=preproc_func
-            ... )
-
-        """
-        super().__init__()
-
-        # Is there a generic func for path test in toolbox?
-        if not Path.is_file(Path(img_path)):
-            msg = "`img_path` must be a valid file path."
-            raise ValueError(msg)
-        if mode not in ["wsi", "tile"]:
-            msg = f"`{mode}` is not supported."
-            raise ValueError(msg)
-        patch_input_shape = np.array(patch_input_shape)
-        stride_shape = np.array(stride_shape)
-
-        if (
-            not np.issubdtype(patch_input_shape.dtype, np.integer)
-            or np.size(patch_input_shape) > 2  # noqa: PLR2004
-            or np.any(patch_input_shape < 0)
-        ):
-            msg = f"Invalid `patch_input_shape` value {patch_input_shape}."
-            raise ValueError(msg)
-        if (
-            not np.issubdtype(stride_shape.dtype, np.integer)
-            or np.size(stride_shape) > 2  # noqa: PLR2004
-            or np.any(stride_shape < 0)
-        ):
-            msg = f"Invalid `stride_shape` value {stride_shape}."
-            raise ValueError(msg)
-
-        self.preproc_func = preproc_func
-        self.img_path = Path(img_path)
-        self.mode = mode
-        self.reader = None
-        reader = self._get_reader(self.img_path)
-        if mode != "wsi":
-            units = "mpp"
-            resolution = 1.0
-
-        # may decouple into misc ?
-        # the scaling factor will scale base level to requested read resolution/units
-        wsi_shape = reader.slide_dimensions(resolution=resolution, units=units)
-
-        # use all patches, as long as it overlaps source image
-        self.inputs = PatchExtractor.get_coordinates(
-            image_shape=wsi_shape,
-            patch_input_shape=patch_input_shape[::-1],
-            stride_shape=stride_shape[::-1],
-            input_within_bound=False,
-        )
-
-        mask_reader = None
-        if mask_path is not None:
-            mask_path = Path(mask_path)
-            if not Path.is_file(mask_path):
-                msg = "`mask_path` must be a valid file path."
-                raise ValueError(msg)
-            mask = imread(mask_path)  # assume to be gray
-            mask = cv2.cvtColor(mask, cv2.COLOR_RGB2GRAY)
-            mask = np.array(mask > 0, dtype=np.uint8)
-
-            mask_reader = VirtualWSIReader(mask)
-            mask_reader.info = reader.info
-        elif auto_get_mask and mode == "wsi" and mask_path is None:
-            # if no mask provided and `wsi` mode, generate basic tissue
-            # mask on the fly
-            mask_reader = reader.tissue_mask(resolution=1.25, units="power")
-            # ? will this mess up ?
-            mask_reader.info = reader.info
-
-        if mask_reader is not None:
-            selected = PatchExtractor.filter_coordinates(
-                mask_reader,  # must be at the same resolution
-                self.inputs,  # must already be at requested resolution
-                wsi_shape=wsi_shape,
-                min_mask_ratio=min_mask_ratio,
-            )
-            self.inputs = self.inputs[selected]
-
-        if len(self.inputs) == 0:
-            msg = "No patch coordinates remain after filtering."
-            raise ValueError(msg)
-
-        self.patch_input_shape = patch_input_shape
-        self.resolution = resolution
-        self.units = units
-
-        # Perform check on the input
-        self._check_input_integrity(mode="wsi")
-
-    def _get_reader(self: WSIPatchDataset, img_path: str | Path) -> WSIReader:
-        """Get a reader for the image."""
-        if self.mode == "wsi":
-            reader = WSIReader.open(img_path)
-        else:
-            logger.warning(
-                "WSIPatchDataset only reads image tile at "
-                '`units="baseline"` and `resolution=1.0`.',
-                stacklevel=2,
-            )
-            img = imread(img_path)
-            axes = "YXS"[: len(img.shape)]
-            # initialise metadata for VirtualWSIReader.
-            # here, we simulate a whole-slide image, but with a single level.
-            # ! should we expose this so that use can provide their metadata ?
-            metadata = WSIMeta(
-                mpp=np.array([1.0, 1.0]),
-                axes=axes,
-                objective_power=10,
-                slide_dimensions=np.array(img.shape[:2][::-1]),
-                level_downsamples=[1.0],
-                level_dimensions=[np.array(img.shape[:2][::-1])],
-            )
-            # infer value such that read if mask provided is through
-            # 'mpp' or 'power' as varying 'baseline' is locked atm
-            reader = VirtualWSIReader(
-                img,
-                info=metadata,
-            )
-        return reader
-
-    def __getitem__(self: WSIPatchDataset, idx: int) -> dict:
-        """Get an item from the dataset."""
-        coords = self.inputs[idx]
-        # Read image patch from the whole-slide image
-        if self.reader is None:
-            # only set the reader on first call so that it is initially picklable
-            self.reader = self._get_reader(self.img_path)
-        patch = self.reader.read_bounds(
-            coords,
-            resolution=self.resolution,
-            units=self.units,
-            pad_constant_values=255,
-            coord_space="resolution",
-        )
-
-        # Apply preprocessing to selected patch
-        patch = self._preproc(patch)
-
-        return {"image": patch, "coords": np.array(coords)}
diff --git a/tiatoolbox/models/dataset/dataset_abc.py b/tiatoolbox/models/dataset/dataset_abc.py
index 7d7160e48..f81312827 100644
--- a/tiatoolbox/models/dataset/dataset_abc.py
+++ b/tiatoolbox/models/dataset/dataset_abc.py
@@ -2,23 +2,30 @@
 
 from __future__ import annotations
 
+import copy
+import os
 from abc import ABC, abstractmethod
 from pathlib import Path
 from typing import TYPE_CHECKING
 
-if TYPE_CHECKING:  # pragma: no cover
-    from collections.abc import Callable, Iterable
-
-    try:
-        from typing import TypeGuard
-    except ImportError:
-        from typing import TypeGuard  # to support python <3.10
-
-
+import cv2
 import numpy as np
 import torch
+import torch.utils.data as torch_data
 
+from tiatoolbox import logger
+from tiatoolbox.tools.patchextraction import PatchExtractor
 from tiatoolbox.utils import imread
+from tiatoolbox.utils.exceptions import DimensionMismatchError
+from tiatoolbox.wsicore.wsireader import VirtualWSIReader, WSIMeta, WSIReader
+
+if TYPE_CHECKING:  # pragma: no cover
+    from collections.abc import Callable, Iterable
+    from multiprocessing.managers import Namespace
+    from typing import TypeGuard
+
+    from tiatoolbox.models.engine.io_config import IOSegmentorConfig
+    from tiatoolbox.type_hints import IntPair, Resolution, Units
 
 input_type = list[str | Path | np.ndarray] | np.ndarray
 
@@ -136,7 +143,7 @@ def load_img(path: str | Path) -> np.ndarray:
 
         if path.suffix not in (".npy", ".jpg", ".jpeg", ".tif", ".tiff", ".png"):
             msg = f"Cannot load image data from `{path.suffix}` files."
-            raise ValueError(msg)
+            raise TypeError(msg)
 
         return imread(path, as_uint8=False)
 
@@ -182,3 +189,489 @@ def __len__(self: PatchDatasetABC) -> int:
     def __getitem__(self: PatchDatasetABC, idx: int) -> None:
         """Get an item from the dataset."""
         ...  # pragma: no cover
+
+
+class WSIStreamDataset(torch_data.Dataset):
+    """Read a WSI in parallel mode with persistent workers.
+
+    This dataset is designed to speed up the inference process for multiple
+    WSIs. The `torch.utils.data.DataLoader` is set to run in persistent mode.
+    Normally, this will prevent workers from altering their initial
+    states (such as provided input etc.). To sidestep this, we use a
+    shared parallel workspace context manager to send data and signal
+    from the main thread, thus allowing each worker to load a new WSI as
+    well as corresponding patch information.
+
+    Args:
+        mp_shared_space (:class:`Namespace`):
+            A shared multiprocessing space, must be from
+            `torch.multiprocessing`.
+        ioconfig (:class:`IOSegmentorConfig`):
+            An object which contains I/O placement for patches.
+        wsi_paths (list): List of paths pointing to a WSI or tiles.
+        preproc (Callable):
+            Pre-processing function to be applied to a patch.
+        mode (str):
+            Either `"wsi"` or `"tile"` to indicate the format of images
+            in `wsi_paths`.
+
+    Examples:
+        >>> ioconfig = IOSegmentorConfig(
+        ...     input_resolutions=[{"units": "baseline", "resolution": 1.0}],
+        ...     output_resolutions=[{"units": "baseline", "resolution": 1.0}],
+        ...     patch_input_shape=[2048, 2048],
+        ...     patch_output_shape=[1024, 1024],
+        ...     stride_shape=[512, 512],
+        ... )
+        >>> mp_manager = torch_mp.Manager()
+        >>> mp_shared_space = mp_manager.Namespace()
+        >>> mp_shared_space.signal = 1  # adding variable to the shared space
+        >>> wsi_paths = ['A.svs', 'B.svs']
+        >>> wsi_dataset = WSIStreamDataset(ioconfig, wsi_paths, mp_shared_space)
+
+    """
+
+    def __init__(
+        self: WSIStreamDataset,
+        ioconfig: IOSegmentorConfig,
+        wsi_paths: list[str | Path],
+        mp_shared_space: Namespace,
+        preproc: Callable[[np.ndarray], np.ndarray] | None = None,
+        mode: str = "wsi",
+    ) -> None:
+        """Initialize :class:`WSIStreamDataset`."""
+        super().__init__()
+        self.mode = mode
+        self.preproc = preproc
+        self.ioconfig = copy.deepcopy(ioconfig)
+
+        if mode == "tile":
+            logger.warning(
+                "WSIStreamDataset only reads image tiles at "
+                '`units="baseline"`. Resolutions will be converted '
+                "to baseline value.",
+                stacklevel=2,
+            )
+            self.ioconfig = self.ioconfig.to_baseline()
+
+        self.mp_shared_space = mp_shared_space
+        self.wsi_paths = wsi_paths
+        self.wsi_idx = None  # to be received externally via thread communication
+        self.reader = None
+
+    def _get_reader(self: WSIStreamDataset, img_path: str | Path) -> WSIReader:
+        """Get appropriate reader for input path."""
+        img_path = Path(img_path)
+        if self.mode == "wsi":
+            return WSIReader.open(img_path)
+        img = imread(img_path)
+        # initialise metadata for VirtualWSIReader.
+        # here, we simulate a whole-slide image, but with a single level.
+        metadata = WSIMeta(
+            mpp=np.array([1.0, 1.0]),
+            objective_power=10,
+            axes="YXS",
+            slide_dimensions=np.array(img.shape[:2][::-1]),
+            level_downsamples=[1.0],
+            level_dimensions=[np.array(img.shape[:2][::-1])],
+        )
+        return VirtualWSIReader(
+            img,
+            info=metadata,
+        )
+
+    def __len__(self: WSIStreamDataset) -> int:
+        """Return the length of the instance attributes."""
+        return len(self.mp_shared_space.patch_inputs)
+
+    @staticmethod
+    def collate_fn(batch: list | np.ndarray) -> torch.Tensor:
+        """Prototype to handle reading exceptions.
+
+        This will exclude any sample with `None` from the batch. As
+        such, wrapping `__getitem__` with try-catch and returning `None`
+        upon exceptions will prevent crashing the entire program. But as
+        a side effect, the batch may not have the size as defined.
+
+        """
+        batch = [v for v in batch if v is not None]
+        return torch.utils.data.dataloader.default_collate(batch)
+
+    def __getitem__(self: WSIStreamDataset, idx: int) -> tuple:
+        """Get an item from the dataset."""
+        # ! no need to lock as we do not modify source value in shared space
+        if self.wsi_idx != self.mp_shared_space.wsi_idx:
+            self.wsi_idx = int(self.mp_shared_space.wsi_idx.item())
+            self.reader = self._get_reader(self.wsi_paths[self.wsi_idx])
+
+        # this is in XY and at requested resolution (not baseline)
+        bounds = self.mp_shared_space.patch_inputs[idx]
+        bounds = bounds.numpy()  # expected to be a torch.Tensor
+
+        # patch size should be the same as bounds br - tl, unless bounds are float
+        patch_data_ = []
+        scale_factors = self.ioconfig.scale_to_highest(
+            self.ioconfig.input_resolutions,
+            self.ioconfig.resolution_unit,
+        )
+        for idy, resolution in enumerate(self.ioconfig.input_resolutions):
+            resolution_bounds = np.round(bounds * scale_factors[idy])
+            patch_data = self.reader.read_bounds(
+                resolution_bounds.astype(np.int32),
+                coord_space="resolution",
+                pad_constant_values=0,  # expose this ?
+                **resolution,
+            )
+
+            if self.preproc is not None:
+                patch_data = patch_data.copy()
+                patch_data = self.preproc(patch_data)
+            patch_data_.append(patch_data)
+        if len(patch_data_) == 1:
+            patch_data_ = patch_data_[0]
+
+        bound = self.mp_shared_space.patch_outputs[idx]
+        return patch_data_, bound
+
+
+class WSIPatchDataset(PatchDatasetABC):
+    """Define a WSI-level patch dataset.
+
+    Attributes:
+        reader (:class:`.WSIReader`):
+            A WSI Reader or Virtual Reader for reading pyramidal image
+            or large tile in pyramidal way.
+        inputs:
+            List of coordinates to read from the `reader`, each
+            coordinate is of the form `[start_x, start_y, end_x,
+            end_y]`.
+        patch_input_shape:
+            A tuple (int, int) or ndarray of shape (2,). Expected size to
+            read from `reader` at requested `resolution` and `units`.
+            Expected to be `(height, width)`.
+        resolution:
+            See (:class:`.WSIReader`) for details.
+        units:
+            See (:class:`.WSIReader`) for details.
+        preproc_func:
+            Preprocessing function used to transform the input data. It will
+            be called on each patch before returning it.
+
+    """
+
+    def __init__(  # skipcq: PY-R1000
+        self: WSIPatchDataset,
+        input_img: str | Path | WSIReader,
+        mask_path: str | Path | None = None,
+        patch_input_shape: IntPair = None,
+        patch_output_shape: IntPair = None,
+        stride_shape: IntPair = None,
+        resolution: Resolution = None,
+        units: Units = None,
+        min_mask_ratio: float = 0,
+        preproc_func: Callable | None = None,
+        *,
+        auto_get_mask: bool = True,
+    ) -> None:
+        """Create a WSI-level patch dataset.
+
+        Args:
+            input_img (str or Path or WSIReader):
+                Valid path to a whole-slide image or a :class:`WSIReader`
+                instance.
+            mask_path (str or Path):
+                Valid mask image.
+            patch_input_shape:
+                A tuple (int, int) or ndarray of shape (2,). Expected
+                shape to read from `reader` at requested `resolution`
+                and `units`. Expected to be positive and of (height,
+                width). Note, this is not at `resolution` coordinate
+                space.
+            patch_output_shape:
+                A tuple (int, int) or ndarray of shape (2,). Expected
+                output shape from the model at requested `resolution`
+                and `units`. Expected to be positive and of (height,
+                width). Note, this is not at `resolution` coordinate
+                space.
+            stride_shape:
+                A tuple (int, int) or ndarray of shape (2,). Expected
+                stride shape to read at requested `resolution` and
+                `units`. Expected to be positive and of (height, width).
+                Note, this is not at level 0.
+            resolution (Resolution):
+                Requested resolution corresponding to units. Check
+                (:class:`WSIReader`) for details.
+            units (Units):
+                Units in which `resolution` is defined.
+            auto_get_mask (bool):
+                If `True`, then automatically get simple threshold mask using
+                WSIReader.tissue_mask() function.
+            min_mask_ratio (float):
+                Only patches with positive area percentage above this value are
+                included. Defaults to 0.
+            preproc_func (Callable):
+                Preprocessing function used to transform the input data. If
+                supplied, the function will be called on each patch before
+                returning it.
+
+        Examples:
+            >>> # A user defined preproc func and expected behavior
+            >>> preproc_func = lambda img: img/2  # reduce intensity by half
+            >>> transformed_img = preproc_func(img)
+            >>> # Create a dataset to get patches from WSI with above
+            >>> # preprocessing function
+            >>> ds = WSIPatchDataset(
+            ...     input_img='/A/B/C/wsi.svs',
+            ...     patch_input_shape=[512, 512],
+            ...     stride_shape=[256, 256],
+            ...     auto_get_mask=False,
+            ...     preproc_func=preproc_func
+            ... )
+
+        """
+        super().__init__()
+
+        valid_path = bool(
+            isinstance(input_img, (str, Path)) and Path(input_img).is_file()
+        )
+        # Is there a generic func for path test in toolbox?
+        if not valid_path and not isinstance(input_img, WSIReader):
+            msg = "`input_img` must be a valid file path or a `WSIReader` instance."
+            raise ValueError(msg)
+        patch_input_shape = np.array(patch_input_shape)
+        stride_shape = np.array(stride_shape)
+
+        _validate_patch_stride_shape(patch_input_shape, stride_shape)
+
+        self.preproc_func = preproc_func
+        img_path = (
+            input_img if not isinstance(input_img, WSIReader) else input_img.input_path
+        )
+        self.img_path = Path(img_path)
+        reader = (
+            input_img
+            if isinstance(input_img, WSIReader)
+            else WSIReader.open(self.img_path)
+        )
+        # To support multi-threading on Windows
+        # Helps pickle using Path
+        self.reader = None if os.name == "nt" else reader
+        # may decouple into misc ?
+        # the scaling factor will scale base level to requested read resolution/units
+        wsi_shape = reader.slide_dimensions(resolution=resolution, units=units)
+        self.reader_info = reader.info
+
+        # use all patches, as long as it overlaps source image
+        if patch_output_shape is not None:
+            self.inputs, self.outputs = PatchExtractor.get_coordinates(
+                image_shape=wsi_shape,
+                patch_input_shape=patch_input_shape[::-1],
+                stride_shape=stride_shape[::-1],
+                patch_output_shape=patch_output_shape,
+            )
+            self.full_outputs = self.outputs
+        else:
+            self.inputs = PatchExtractor.get_coordinates(
+                image_shape=wsi_shape,
+                patch_input_shape=patch_input_shape[::-1],
+                stride_shape=stride_shape[::-1],
+            )
+
+        mask_reader = None
+        if mask_path is not None:
+            mask_path = Path(mask_path)
+            if not Path.is_file(mask_path):
+                msg = "`mask_path` must be a valid file path."
+                raise ValueError(msg)
+            mask = imread(mask_path)  # assume to be gray
+            mask = cv2.cvtColor(mask, cv2.COLOR_RGB2GRAY)
+            mask = np.array(mask > 0, dtype=np.uint8)
+
+            mask_reader = VirtualWSIReader(mask)
+            mask_reader.info = self.reader_info
+        elif auto_get_mask and mask_path is None:
+            # if no mask is provided, generate a basic tissue mask on the fly
+            mask_reader = reader.tissue_mask(resolution=1.25, units="power")
+            # ? will this mess up ?
+            mask_reader.info = self.reader_info
+
+        if mask_reader is not None:
+            selected = PatchExtractor.filter_coordinates(
+                mask_reader,  # must be at the same resolution
+                self.inputs,  # must already be at requested resolution
+                wsi_shape=wsi_shape,
+                min_mask_ratio=min_mask_ratio,
+            )
+            self.inputs = self.inputs[selected]
+            if hasattr(self, "outputs"):
+                self.full_outputs = self.outputs  # Full list of outputs
+                self.outputs = self.outputs[selected]
+
+        self._check_inputs()
+
+        self.patch_input_shape = patch_input_shape
+        self.resolution = resolution
+        self.units = units
+
+        # Perform check on the input
+        self._check_input_integrity(mode="wsi")
+
+    def _check_inputs(self: WSIPatchDataset) -> None:
+        """Check if input length is valid after filtering."""
+        if len(self.inputs) == 0:
+            msg = "No patch coordinates remain after filtering."
+            raise ValueError(msg)
+
+    def _get_reader(self: WSIPatchDataset, img_path: str | Path) -> WSIReader:
+        """Get a reader for the image."""
+        # To avoid ruff errors and compatibility with base class.
+        return self.reader if self.reader else WSIReader.open(img_path)
+
+    def __getitem__(self: WSIPatchDataset, idx: int) -> dict:
+        """Get an item from the dataset."""
+        coords = self.inputs[idx]
+        output_locs = None
+        if hasattr(self, "outputs"):
+            output_locs = self.outputs[idx]
+
+        # Read image patch from the whole-slide image
+        self.reader = self._get_reader(self.img_path)
+        patch = self.reader.read_bounds(
+            coords,
+            resolution=self.resolution,
+            units=self.units,
+            pad_constant_values=255,
+            coord_space="resolution",
+        )
+
+        # Apply preprocessing to selected patch
+        patch = self._preproc(patch)
+
+        if output_locs is not None:
+            return {
+                "image": patch,
+                "coords": np.array(coords),
+                "output_locs": output_locs,
+            }
+
+        return {"image": patch, "coords": np.array(coords)}
+
+
+class PatchDataset(PatchDatasetABC):
+    """Define PatchDataset for torch inference.
+
+    Define a simple patch dataset, which inherits from the
+    `torch.utils.data.Dataset` class.
+
+    Attributes:
+        inputs (list or np.ndarray):
+            Either a list of patches, where each patch is a ndarray, or a
+            list of valid paths with extension (".jpg", ".jpeg",
+            ".tif", ".tiff", ".png") pointing to an image.
+        labels (list):
+            List of labels for sample at the same index in `inputs`.
+            Default is `None`.
+        patch_input_shape (tuple):
+            Size of patches input to the model. Patches are at
+            requested read resolution, not with respect to level 0,
+            and must be positive.
+
+    Examples:
+        >>> # A user defined preproc func and expected behavior
+        >>> preproc_func = lambda img: img/2  # reduce intensity by half
+        >>> transformed_img = preproc_func(img)
+        >>> # create a dataset to get patches preprocessed by the above function
+        >>> ds = PatchDataset(
+        ...     inputs=['/A/B/C/img1.png', '/A/B/C/img2.png'],
+        ...     labels=["labels1", "labels2"],
+        ...     patch_input_shape=(224, 224),
+        ... )
+
+    """
+
+    def __init__(
+        self: PatchDataset,
+        inputs: np.ndarray | list,
+        labels: list | None = None,
+        patch_input_shape: IntPair | None = None,
+    ) -> None:
+        """Initialize :class:`PatchDataset`."""
+        super().__init__()
+
+        self.data_is_npy_alike = False
+
+        self.inputs = inputs
+        self.labels = labels
+        self.patch_input_shape = patch_input_shape
+
+        # perform check on the input
+        self._check_input_integrity(mode="patch")
+
+    def __getitem__(self: PatchDataset, idx: int) -> dict:
+        """Get an item from the dataset."""
+        patch = self.inputs[idx]
+
+        # Mode 0 is list of paths
+        if not self.data_is_npy_alike:
+            patch = self.load_img(patch)
+
+        # Only check the shape when a `patch_input_shape` has been provided.
+        if (
+            self.patch_input_shape is not None
+            and patch.shape[:-1] != tuple(self.patch_input_shape)
+        ):
+            msg = (
+                f"Patch size is not compatible with the model. "
+                f"Expected dimensions {tuple(self.patch_input_shape)}, but got "
+                f"{patch.shape[:-1]}."
+            )
+            logger.error(msg=msg)
+            raise DimensionMismatchError(
+                expected_dims=tuple(self.patch_input_shape),
+                actual_dims=patch.shape[:-1],
+            )
+
+        # Apply preprocessing to selected patch
+        patch = self._preproc(patch)
+
+        data = {
+            "image": patch,
+        }
+        if self.labels is not None:
+            data["label"] = self.labels[idx]
+
+        return data
+
+
+def _validate_patch_stride_shape(
+    patch_input_shape: np.ndarray, stride_shape: np.ndarray
+) -> None:
+    """Validate patch and stride shape inputs for patch extraction.
+
+    Checks that both `patch_input_shape` and `stride_shape` are integer arrays of
+    length ≤ 2 and contain non-negative values. Raises a ValueError if any
+    condition fails.
+
+    Args:
+        patch_input_shape (np.ndarray):
+            Shape of the input patch (e.g., height, width).
+        stride_shape (np.ndarray):
+            Stride dimensions used for patch extraction.
+
+    Raises:
+        ValueError:
+            If either input is not a valid integer array of appropriate
+            shape and values.
+
+    """
+    if (
+        not np.issubdtype(patch_input_shape.dtype, np.integer)
+        or np.size(patch_input_shape) > 2  # noqa: PLR2004
+        or np.any(patch_input_shape < 0)
+    ):
+        msg = f"Invalid `patch_input_shape` value {patch_input_shape}."
+        raise ValueError(msg)
+    if (
+        not np.issubdtype(stride_shape.dtype, np.integer)
+        or np.size(stride_shape) > 2  # noqa: PLR2004
+        or np.any(stride_shape < 0)
+    ):
+        msg = f"Invalid `stride_shape` value {stride_shape}."
+        raise ValueError(msg)
diff --git a/tiatoolbox/models/engine/__init__.py b/tiatoolbox/models/engine/__init__.py
index 4293fae0c..9c00ac4a2 100644
--- a/tiatoolbox/models/engine/__init__.py
+++ b/tiatoolbox/models/engine/__init__.py
@@ -1,7 +1,15 @@
 """Engines to run models implemented in tiatoolbox."""
 
-from tiatoolbox.models.engine import (
+from . import (
+    engine_abc,
     nucleus_instance_segmentor,
     patch_predictor,
     semantic_segmentor,
 )
+
+__all__ = [
+    "engine_abc",
+    "nucleus_instance_segmentor",
+    "patch_predictor",
+    "semantic_segmentor",
+]
diff --git a/tiatoolbox/models/engine/engine_abc.py b/tiatoolbox/models/engine/engine_abc.py
new file mode 100644
index 000000000..73b4ca1c1
--- /dev/null
+++ b/tiatoolbox/models/engine/engine_abc.py
@@ -0,0 +1,1440 @@
+"""Abstract Base Class for TIAToolbox Deep Learning Engines.
+
+This module defines the `EngineABC` class, which serves as a base for implementing
+deep learning inference workflows in TIAToolbox. It supports both patch-based and
+whole slide image (WSI) processing, and provides a unified interface for model
+initialization, data loading, inference, post-processing, and output saving.
+
+Classes:
+    - EngineABC: Abstract base class for deep learning engines.
+    - EngineABCRunParams: TypedDict for runtime configuration parameters.
+
+Functions:
+    - prepare_engines_save_dir: Utility to create or validate output directories.
+
+Features:
+    - Supports patch and WSI modes.
+    - Handles caching and memory-efficient inference using Dask.
+    - Integrates with TIAToolbox models and IO configurations.
+    - Outputs predictions in multiple formats including dict, zarr, and
+      AnnotationStore.
+
+Intended Usage:
+    Subclass `EngineABC` to implement specific inference logic by overriding
+    abstract methods such as preprocessing, postprocessing, and model-specific
+    behavior.
+
+Example:
+    >>> class MyEngine(EngineABC):
+    ...     def __init__(self, model, weights, verbose):
+    ...         super().__init__(model=model, weights=weights, verbose=verbose)
+    >>> # Implement base class functions and then call.
+    >>> engine = MyEngine(model="resnet18-kather100k")
+    >>> output = engine.run(images, patch_mode=True)
+
+"""
+
+from __future__ import annotations
+
+import copy
+from abc import ABC
+from pathlib import Path
+from typing import TYPE_CHECKING, TypedDict
+
+import dask
+import dask.array as da
+import numpy as np
+import torch
+import zarr
+from dask import compute
+from dask.diagnostics import ProgressBar
+from torch import nn
+from typing_extensions import Unpack
+
+from tiatoolbox import DuplicateFilter, logger, rcParam
+from tiatoolbox.models.architecture import get_pretrained_model
+from tiatoolbox.models.architecture.utils import compile_model
+from tiatoolbox.models.dataset.dataset_abc import PatchDataset, WSIPatchDataset
+from tiatoolbox.models.models_abc import load_torch_model
+from tiatoolbox.utils.misc import (
+    dict_to_store_patch_predictions,
+    get_tqdm,
+)
+from tiatoolbox.wsicore.wsireader import WSIReader, is_zarr
+
+from .io_config import ModelIOConfigABC
+
+if TYPE_CHECKING:  # pragma: no cover
+    import os
+
+    from torch.utils.data import DataLoader
+
+    from tiatoolbox.annotation import AnnotationStore
+    from tiatoolbox.models.models_abc import ModelABC
+    from tiatoolbox.type_hints import IntPair, Resolution, Units
+
+
+class EngineABCRunParams(TypedDict, total=False):
+    """Parameters for configuring the :func:`EngineABC.run()` method.
+
+    Optional Keys:
+        auto_get_mask (bool):
+            Whether to automatically generate segmentation masks using
+            `wsireader.tissue_mask()` during processing.
+        batch_size (int):
+            Number of image patches per forward pass.
+        class_dict (dict):
+            Mapping of classification outputs to class names.
+        device (str):
+            Device to run the model on (e.g., "cpu", "cuda").
+            See https://pytorch.org/docs/stable/tensor_attributes.html#torch.device
+            for more details.
+        input_resolutions (list[dict[Units, Resolution]]):
+            Resolution settings for input heads. Supported units are `level`,
+            `power`, and `mpp`. Keys should be "units" and "resolution", e.g.,
+            [{"units": "mpp", "resolution": 0.25}]. See :class:`WSIReader` for
+            details.
+        ioconfig (ModelIOConfigABC):
+            IO configuration (:class:`ModelIOConfigABC`) for model input/output.
+        memory_threshold (int):
+            Memory usage threshold (in percentage) to trigger caching behavior.
+        num_workers (int):
+            Number of workers for DataLoader and post-processing.
+        output_file (str):
+            Filename for saving output (e.g., "zarr" or "annotationstore").
+        patch_input_shape (IntPair):
+            Shape of input patches (height, width), requested at read resolution.
+            Must be positive.
+        return_labels (bool):
+            Whether to return labels with predictions.
+        scale_factor (tuple[float, float]):
+            Scale factor for annotations (model_mpp / slide_mpp).
+            Used to convert coordinates from non-baseline to baseline resolution.
+        stride_shape (IntPair):
+            Stride used during WSI processing, at requested read resolution.
+            Must be positive. Defaults to `patch_input_shape` if not provided.
+        verbose (bool):
+            Whether to enable verbose logging.
+
+    """
+
+    auto_get_mask: bool
+    batch_size: int
+    class_dict: dict
+    device: str
+    input_resolutions: list[dict[Units, Resolution]]
+    ioconfig: ModelIOConfigABC
+    memory_threshold: int
+    num_workers: int
+    output_file: str
+    patch_input_shape: IntPair
+    return_labels: bool
+    scale_factor: tuple[float, float]
+    stride_shape: IntPair
+    verbose: bool
+
+
+class EngineABC(ABC):  # noqa: B024
+    """Abstract base class for TIAToolbox deep learning engines to run CNN models.
+
+    This class provides a unified interface for running inference on image patches
+    or whole slide images (WSIs), handling preprocessing, batching, postprocessing,
+    and saving predictions.
+
+    Args:
+        model (str | ModelABC):
+            Model name from TIAToolbox or a PyTorch model instance.
+            The user can request pretrained models from the toolbox model zoo using
+            the list of pretrained models available at this `link
+            <https://tia-toolbox.readthedocs.io/en/latest/pretrained.html>`_.
+            By default, the corresponding pretrained weights will also
+            be downloaded. However, you can override with your own set
+            of weights using the `weights` parameter.
+        batch_size (int):
+            Number of patches per forward pass. Default is 8.
+        num_workers (int):
+            Number of workers for data loading. Default is 0.
+        weights (str | Path | None):
+            Path to model weights. If None, default weights are used.
+
+            >>> engine = EngineABC(
+            ...    model="pretrained-model",
+            ...    weights="/path/to/pretrained-local-weights.pth"
+            ... )
+
+        device (str):
+            Device to run the model on (e.g., "cpu", "cuda"). Please see
+            https://pytorch.org/docs/stable/tensor_attributes.html#torch.device
+            for more details on input parameters for device. Default is "cpu".
+        verbose (bool):
+            Enable verbose logging. Default is False.
+
+    Attributes:
+        images (list[str | Path] | np.ndarray):
+            Input images or patches.
+            A list of image patches in NHWC format as a numpy array
+            or a list of str/paths to WSIs.
+        masks (list[str | Path] | np.ndarray):
+            Optional masks for WSIs.
+            A list of tissue masks or binary masks corresponding to processing
+            area of input images. These can be a list of numpy arrays or paths to
+            the saved image masks. These are only utilized when patch_mode is
+            False. Patches are only generated within a masked area.
+            If not provided, then a tissue mask will be automatically
+            generated for whole slide images, if auto_get_mask is True.
+        patch_mode (bool):
+            Whether input is treated as patches. TIAToolbox defines
+            an image as a patch if the HWC of the input image matches the HWC
+            expected by the model. If it does not match, then `patch_mode` must
+            be set to False, which allows the engine to extract patches from
+            the input image. In this case, when `patch_mode` is False, the
+            input images are treated as WSIs. Default value is True.
+        model (ModelABC):
+            Loaded PyTorch model. For a full list of pretrained models,
+            refer to the `docs
+            <https://tia-toolbox.readthedocs.io/en/latest/pretrained.html>`_.
+            By default, the corresponding pretrained weights will also
+            be downloaded. However, you can override with your own set
+            of weights via the `weights` argument. Argument
+            is case-insensitive.
+        ioconfig (ModelIOConfigABC):
+            IO configuration (:class:`ModelIOConfigABC`) for model input/output.
+        dataloader (DataLoader | None):
+            Torch DataLoader for inference.
+        return_labels (bool):
+            Whether to return labels with probabilities and predictions.
+        input_resolutions (list[dict[Units, Resolution]]):
+            Resolution settings for input heads. Supported
+            units are `level`, `power` and `mpp`. Keys should be "units" and
+            "resolution" e.g., [{"units": "mpp", "resolution": 0.25}]. Please see
+            :class:`WSIReader` for details.
+        patch_input_shape (IntPair):
+            Shape of input patches. Patches are at
+            requested read resolution, not with respect to level 0,
+            and must be positive.
+        stride_shape (IntPair):
+            Stride used during WSI processing. Stride is
+            at requested read resolution, not with respect to
+            level 0, and must be positive. If not provided,
+            `stride_shape=patch_input_shape`.
+        batch_size (int):
+            Number of patches per forward pass.
+        labels (list | None):
+            Optional labels for input images. Only a single label per image is
+            supported.
+        num_workers (int):
+            Number of workers for data loading.
+        drop_keys (list):
+            Keys to exclude from model output.
+        output_type (Any):
+            Format of output ("dict", "zarr", "AnnotationStore").
+        verbose (bool):
+            Whether to enable verbose logging.
+
+    Example:
+        >>> # Inherit from EngineABC and define all the abstract methods
+        >>> class MyEngine(EngineABC):
+        ...     def __init__(self, model, weights, verbose):
+        ...         super().__init__(model=model, weights=weights, verbose=verbose)
+        >>> engine = MyEngine(model="resnet18-kather100k")
+        >>> output = engine.run(images, patch_mode=True)
+
+        >>> # array of 2 image patches as input
+        >>> data = np.array([np.ndarray, np.ndarray])
+        >>> engine = TestEngineABC(model="resnet18-kather100k")
+        >>> output = engine.run(data, patch_mode=True)
+
+        >>> # list of 2 image files as input
+        >>> image = ['path/image1.png', 'path/image2.png']
+        >>> engine = TestEngineABC(model="resnet18-kather100k")
+        >>> output = engine.run(image, patch_mode=False)
+
+        >>> # list of 2 wsi files as input
+        >>> wsi_file = ['path/wsi1.svs', 'path/wsi2.svs']
+        >>> engine = TestEngineABC(model="resnet18-kather100k")
+        >>> output = engine.run(wsi_file, patch_mode=False)
+
+    """
+
+    def __init__(
+        self: EngineABC,
+        model: str | ModelABC,
+        batch_size: int = 8,
+        num_workers: int = 0,
+        weights: str | Path | None = None,
+        *,
+        device: str = "cpu",
+        verbose: bool = False,
+    ) -> None:
+        """Initialize the EngineABC instance.
+
+        Args:
+            model (str | ModelABC):
+                Model name from TIAToolbox or a PyTorch model instance.
+            batch_size (int):
+                Number of patches per forward pass. Default is 8.
+            num_workers (int):
+                Number of workers for data loading. Default is 0.
+            weights (str | Path | None):
+                Path to model weights. If None, default weights are used.
+            device (str):
+                Device to run the model on (e.g., "cpu", "cuda"). Default is "cpu".
+            verbose (bool):
+                Enable verbose logging. Default is False.
+
+        """
+        self.images = None
+        self.masks = None
+        self.patch_mode = None
+        self.device = device
+
+        # Initialize model with specified weights and ioconfig.
+        self.model, self.ioconfig = self._initialize_model_ioconfig(
+            model=model, weights=weights
+        )
+        self.model.to(device=self.device)
+        self.model = (
+            compile_model(  # for runtime, such as after wrapping with nn.DataParallel
+                self.model,
+                mode=rcParam["torch_compile_mode"],
+            )
+        )
+        self._ioconfig = self.ioconfig  # runtime ioconfig
+        self.batch_size = batch_size
+        self.labels: list | None = None
+        self.num_workers = num_workers
+        self.patch_input_shape: IntPair | None = None
+        self.input_resolutions: list[dict[Units, Resolution]] | None = None
+        self.return_labels: bool = False
+        self.stride_shape: IntPair | None = None
+        self.verbose: bool = verbose
+        self.dataloader: DataLoader | None = None
+        self.drop_keys: list = []
+        self.output_type = None
+
+    @staticmethod
+    def _initialize_model_ioconfig(
+        model: str | ModelABC,
+        weights: str | Path | None,
+    ) -> tuple[nn.Module, ModelIOConfigABC | None]:
+        """Helper function to initialize model and IO configuration.
+
+        If a pretrained model from TIAToolbox is specified by name, this function
+        loads the model and its associated IO configuration. If a custom model is
+        provided, it loads the weights if specified and returns None for IO config.
+
+        Args:
+            model (str | ModelABC):
+                A model name from TIAToolbox or a PyTorch model instance.
+                The user can request pretrained models from the toolbox model zoo
+                using the list of pretrained models available at this `link
+                <https://tia-toolbox.readthedocs.io/en/latest/pretrained.html>`_.
+                By default, the corresponding pretrained weights will also
+                be downloaded. However, you can override with your own set
+                of weights using the `weights` parameter.
+
+            weights (str | Path | None):
+                Path to pretrained weights. If None and a TIAToolbox model is used,
+                default weights are automatically downloaded.
+
+        Returns:
+            tuple[nn.Module, ModelIOConfigABC | None]:
+                A tuple containing the loaded PyTorch model and its IO
+                configuration. If the model is not from TIAToolbox, IO config
+                will be None.
+
+        Raises:
+            TypeError:
+                If the model is neither a string (TIAToolbox model)
+                nor a torch.nn.Module.
+
+        """
+        if not isinstance(model, (str, nn.Module)):
+            msg = "Input model must be a string or 'torch.nn.Module'."
+            raise TypeError(msg)
+
+        if isinstance(model, str):
+            # ioconfig is retrieved from the pretrained model in the toolbox.
+            # list of pretrained models in the TIA Toolbox is available here:
+            # https://tia-toolbox.readthedocs.io/en/latest/pretrained.html
+            # no need to provide ioconfig in EngineABC.run() in this case.
+            return get_pretrained_model(model, weights)
+
+        if weights is not None:
+            model = load_torch_model(model=model, weights=weights)
+
+        return model, None
+
+    def get_dataloader(
+        self: EngineABC,
+        images: str | Path | list[str | Path] | np.ndarray,
+        masks: Path | None = None,
+        labels: list | None = None,
+        ioconfig: ModelIOConfigABC | None = None,
+        *,
+        patch_mode: bool = True,
+        auto_get_mask: bool = True,
+    ) -> torch.utils.data.DataLoader:
+        """Pre-process images and masks and return a DataLoader for inference.
+
+        Args:
+            images (list[str | Path] | np.ndarray):
+                A list of image patches in NHWC format as a numpy array,
+                or a list of file paths to WSIs. When `patch_mode` is False,
+                expects file paths to WSIs.
+            masks (Path | None):
+                Optional list of masks used when `patch_mode` is False.
+                Patches are generated only within masked areas. If not provided,
+                tissue masks are automatically generated.
+            labels (list | None):
+                Optional list of labels. Only one label per image is supported.
+            ioconfig (ModelIOConfigABC | None):
+                IO configuration object specifying patch size, stride, and
+                resolution.
+            patch_mode (bool):
+                Whether to treat input as patches (`True`) or WSIs (`False`).
+            auto_get_mask (bool):
+                Whether to automatically generate a tissue mask using
+                `wsireader.tissue_mask()` when `patch_mode` is False.
+                If `True`, only tissue regions are processed. If `False`,
+                all patches are processed. Default is `True`.
+
+        Returns:
+            torch.utils.data.DataLoader:
+                A PyTorch DataLoader configured for inference.
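+
+        Example:
+            A minimal sketch (illustrative only; ``TestEngineABC`` is the
+            hypothetical concrete subclass used in the tests, and the model
+            name is assumed to be available in the model zoo):
+
+            >>> import numpy as np
+            >>> eng = TestEngineABC(model="alexnet-kather100k")
+            >>> loader = eng.get_dataloader(
+            ...     images=np.zeros((4, 224, 224, 3), dtype=np.uint8),
+            ...     ioconfig=eng.ioconfig,
+            ...     patch_mode=True,
+            ... )
+            >>> batch = next(iter(loader))  # dict with an "image" batch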
+ + """ + if labels: + # if a labels is provided, then return with the prediction + self.return_labels = bool(labels) + + if not patch_mode: + dataset = WSIPatchDataset( + input_img=images, + mask_path=masks, + patch_input_shape=ioconfig.patch_input_shape, + stride_shape=ioconfig.stride_shape, + resolution=ioconfig.input_resolutions[0]["resolution"], + units=ioconfig.input_resolutions[0]["units"], + auto_get_mask=auto_get_mask, + ) + + dataset.preproc_func = self.model.preproc_func + + # preprocessing must be defined with the dataset + return torch.utils.data.DataLoader( + dataset, + num_workers=self.num_workers, + batch_size=self.batch_size, + drop_last=False, + shuffle=False, + persistent_workers=self.num_workers > 0, + ) + + dataset = PatchDataset( + inputs=images, labels=labels, patch_input_shape=ioconfig.patch_input_shape + ) + + dataset.preproc_func = self.model.preproc_func + + # preprocessing must be defined with the dataset + return torch.utils.data.DataLoader( + dataset, + num_workers=self.num_workers, + batch_size=self.batch_size, + drop_last=False, + shuffle=False, + ) + + def _get_coordinates(self: EngineABC, batch_data: dict) -> np.ndarray: + """Extract coordinates for each image patch in a batch. + + This method returns coordinates for each patch, either based on + the patch dimensions (if in patch mode) or from precomputed values + (if in WSI mode). + + Args: + batch_data (dict): + Dictionary containing batch data, including image and + optional coordinates. + + Returns: + np.ndarray: + Array of coordinates for each patch in the batch. + Shape is (N, 4), where N is the number of patches. + + """ + if self.patch_mode: + coordinates = [0, 0, *batch_data["image"].shape[1:3]] + return np.tile(coordinates, reps=(batch_data["image"].shape[0], 1)) + return np.array(batch_data["coords"]) + + def infer_patches( + self: EngineABC, + dataloader: DataLoader, + *, + return_coordinates: bool = False, + ) -> dict[str, da.Array]: + """Run model inference on image patches and return predictions. + + This method performs batched inference using a PyTorch DataLoader, + and accumulates predictions in Dask arrays. It supports optional inclusion + of coordinates and labels in the output. + + Args: + dataloader (DataLoader): + PyTorch DataLoader containing image patches for inference. + return_coordinates (bool): + Whether to include coordinates in the output. Required when + called by `infer_wsi` and `patch_mode` is False. + + Returns: + dict[str, dask.array.Array]: + Dictionary containing prediction results as Dask arrays. + Keys include: + - "probabilities": Model output probabilities. + - "labels": Ground truth labels (if `return_labels` is True). + - "coordinates": Patch coordinates (if `return_coordinates` is + True). 
+ + """ + keys = ["probabilities"] + probabilities, labels, coordinates = [], [], [] + + if self.return_labels: + keys.append("labels") + labels = [] + + if return_coordinates: + keys.append("coordinates") + coordinates = [] + + # Main output dictionary + raw_predictions = dict(zip(keys, [[]] * len(keys), strict=False)) + + # Inference loop + tqdm = get_tqdm() + tqdm_loop = ( + tqdm(dataloader, leave=False, desc="Inferring patches") + if self.verbose + else self.dataloader + ) + + for batch_data in tqdm_loop: + batch_output = self.model.infer_batch( + self.model, + batch_data["image"], + device=self.device, + ) + + probabilities.append( + da.from_array( + batch_output, # probabilities + ) + ) + + if return_coordinates: + coordinates.append( + da.from_array( + self._get_coordinates(batch_data), + ) + ) + + if self.return_labels: + labels.append(da.from_array(np.array(batch_data["label"]))) + + raw_predictions["probabilities"] = da.concatenate(probabilities, axis=0) + + if return_coordinates: + raw_predictions["coordinates"] = da.concatenate(coordinates, axis=0) + + if self.return_labels: + labels = [label.reshape(-1) for label in labels] + raw_predictions["labels"] = da.concatenate(labels, axis=0) + + return raw_predictions + + def post_process_patches( # skipcq: PYL-R0201 + self: EngineABC, + raw_predictions: da.Array, + prediction_shape: tuple[int, ...], # noqa: ARG002 + prediction_dtype: type, # noqa: ARG002 + **kwargs: Unpack[EngineABCRunParams], # noqa: ARG002 + ) -> dask.array.Array: + """Post-process raw patch predictions from inference. + + This method applies a post-processing function (e.g., smoothing, filtering) + to the raw model predictions. It supports delayed execution using Dask + and returns a Dask array for efficient computation. + + Args: + raw_predictions (dask.array.Array): + Raw model predictions as a dask array. + prediction_shape (tuple[int, ...]): + Shape of the prediction output. + prediction_dtype (type): + Data type of the prediction output. + **kwargs (EngineABCRunParams): + Additional runtime parameters used for post-processing. + + Returns: + dask.array.Array: + Post-processed predictions as a Dask array. + + """ + return raw_predictions + + def save_predictions( + self: EngineABC, + processed_predictions: dict, + output_type: str, + save_path: Path | None = None, + **kwargs: Unpack[EngineABCRunParams], + ) -> dict | AnnotationStore | Path: + """Save model predictions to disk or return them in memory. + + Depending on the output type, this method saves predictions as a zarr group, + an AnnotationStore (SQLite database), or returns them as a dictionary. + + Args: + processed_predictions (dict): + Dictionary containing processed model predictions. + output_type (str): + Desired output format. + Supported values are "dict", "zarr", and "annotationstore". + save_path (Path | None): + Path to save the output file. + Required for "zarr" and "annotationstore" formats. + **kwargs (EngineABCRunParams): + Additional runtime parameters including: + - output_file: Name of the output file. + - scale_factor: Scaling factor for annotations. + - class_dict: Mapping of class indices to names. + + Returns: + dict | AnnotationStore | Path: + - If output_type is "dict": returns predictions as a dictionary. + - If output_type is "zarr": returns path to saved zarr file. + - If output_type is "annotationstore": returns an AnnotationStore + or path to .db file. + + Raises: + TypeError: + If an unsupported output_type is provided. 
+ + """ + keys_to_compute = [k for k in processed_predictions if k not in self.drop_keys] + + if output_type.lower() == "zarr": + if is_zarr(save_path): + zarr_group = zarr.open(save_path, mode="r") + keys_to_compute = [k for k in keys_to_compute if k not in zarr_group] + write_tasks = [] + for key in keys_to_compute: + dask_array = processed_predictions[key].rechunk("auto") + task = dask_array.to_zarr( + url=save_path, + component=key, + compute=False, + ) + write_tasks.append(task) + msg = f"Saving output to {save_path}." + logger.info(msg=msg) + with ProgressBar(): + compute(*write_tasks) + + zarr_group = zarr.open(save_path, mode="r+") + for key in self.drop_keys: + if key in zarr_group: + del zarr_group[key] + + return save_path + + values_to_compute = [processed_predictions[k] for k in keys_to_compute] + + # Compute all at once + computed_values = compute(*values_to_compute) + + # Assign computed values + processed_predictions = dict( + zip(keys_to_compute, computed_values, strict=False) + ) + + if output_type.lower() == "dict": + return processed_predictions + + if output_type.lower() == "annotationstore": + save_path = Path(kwargs.get("output_file", save_path.parent / "output.db")) + + # scale_factor set from kwargs + scale_factor = kwargs.get("scale_factor", (1.0, 1.0)) + # class_dict set from kwargs + class_dict = kwargs.get("class_dict") + + return dict_to_store_patch_predictions( + processed_predictions, + scale_factor, + class_dict, + save_path, + ) + + msg = f"Unsupported output type: {output_type}" + raise TypeError(msg) + + def infer_wsi( + self: EngineABC, + dataloader: DataLoader, + save_path: Path, + **kwargs: Unpack[EngineABCRunParams], + ) -> dict: + """Run model inference on a whole slide image (WSI). + + This method performs inference on a WSI using the provided DataLoader, + and accumulates predictions in Dask arrays. Optionally includes + coordinates and labels in the output. + + Args: + dataloader (DataLoader): + PyTorch DataLoader configured for WSI processing. + save_path (Path): + Path to save the intermediate output. The intermediate output is saved + in a zarr file. + **kwargs (EngineABCRunParams): + Additional runtime parameters used during inference. + + Returns: + dict: + Dictionary containing prediction results as Dask arrays. + + """ + _ = kwargs.get("patch_mode", False) + _ = save_path + return self.infer_patches( + dataloader=dataloader, + return_coordinates=True, + ) + + # This is not a static model for child classes. + def post_process_wsi( # skipcq: PYL-R0201 + self: EngineABC, + raw_predictions: da.Array, + prediction_shape: tuple[int, ...], # noqa: ARG002 + prediction_dtype: type, # noqa: ARG002 + **kwargs: Unpack[EngineABCRunParams], # noqa: ARG002 + ) -> dask.array.Array: + """Post-process predictions from whole slide image (WSI) inference. + + This method applies a post-processing function (e.g., smoothing, filtering) + to the raw model predictions. It supports delayed execution using Dask + and returns a Dask array for efficient computation. + + Args: + raw_predictions (dask.array.Array): + Raw model predictions as a Dask array. + prediction_shape (tuple[int, ...]): + Shape of the prediction output. + prediction_dtype (type): + Data type of the prediction output. + **kwargs (EngineABCRunParams): + Additional runtime parameters used for post-processing. + + Returns: + dask.array.Array: + Post-processed predictions as a Dask array. 
+ + """ + return raw_predictions + + def _load_ioconfig(self: EngineABC, ioconfig: ModelIOConfigABC) -> ModelIOConfigABC: + """Load or validate the IO configuration for the engine. + + If the model is from TIAToolbox and no IO configuration is provided, + this method attempts to use the default configuration. Otherwise, + it validates and sets the provided configuration. + + Args: + ioconfig (ModelIOConfigABC): + IO configuration to use for model inference. + + Returns: + ModelIOConfigABC: + The IO configuration to be used during inference. + + Raises: + ValueError: + If no IO configuration is provided and none is available from the model. + + """ + if self.ioconfig is None and ioconfig is None: + msg = ( + "Please provide a valid ModelIOConfigABC. " + "No default ModelIOConfigABC found." + ) + logger.warning(msg) + + if ioconfig and isinstance(ioconfig, ModelIOConfigABC): + self.ioconfig = ioconfig + + return self.ioconfig + + def _update_ioconfig( + self: EngineABC, + ioconfig: ModelIOConfigABC, + patch_input_shape: IntPair, + stride_shape: IntPair, + input_resolutions: list[dict[Units, Resolution]], + ) -> ModelIOConfigABC: + """Update the IO configuration used for patch-based inference. + + This method updates the patch input shape, stride, and input resolutions + in the IO configuration. If no configuration is provided, it creates a new one. + + Args: + ioconfig (ModelIOConfigABC): + Existing IO configuration to update. If None, a new one is created. + patch_input_shape (IntPair): + Size of patches input to the model (height, width). Patches are at + requested read resolution, not with respect to level 0, + and must be positive. + stride_shape (IntPair): + Stride used during patch extraction. + If None, defaults to patch_input_shape. + Stride is at requested read resolution, not with respect to + level 0, and must be positive. If not provided, + `stride_shape=patch_input_shape`. + input_resolutions (list[dict[Units, Resolution]]): + List of dictionaries specifying resolution and units + for each input head. Supported units are `level`, `power` and `mpp`. + Keys should be "units" and "resolution" + e.g., [{"units": "mpp", "resolution": 0.25}]. Please see + :class:`WSIReader` for details. + + Returns: + ModelIOConfigABC: + Updated IO configuration for patch-based inference. + + Raises: + ValueError: + If neither an IO configuration nor patch/resolution parameters + are provided. + + """ + config_flag = ( + patch_input_shape is None, + input_resolutions is None, + ) + if isinstance(ioconfig, ModelIOConfigABC): + return ioconfig + + if self.ioconfig is None and any(config_flag): + msg = ( + "Must provide either " + "`ioconfig` or `patch_input_shape` and `input_resolutions`." + ) + raise ValueError( + msg, + ) + + if stride_shape is None: + stride_shape = patch_input_shape + + if self.ioconfig: + ioconfig = copy.deepcopy(self.ioconfig) + # ! not sure if there is a nicer way to set this + if patch_input_shape is not None: + ioconfig.patch_input_shape = patch_input_shape + if stride_shape is not None: + ioconfig.stride_shape = stride_shape + if input_resolutions is not None: + ioconfig.input_resolutions = input_resolutions + + return ioconfig + + return ModelIOConfigABC( + input_resolutions=input_resolutions, + patch_input_shape=patch_input_shape, + stride_shape=stride_shape, + output_resolutions=[], + ) + + @staticmethod + def _validate_images_masks(images: list | np.ndarray) -> list | np.ndarray: + """Validate the format and shape of input images or masks. 
+ + Ensures that the input is either a list of file paths or a 4D NumPy array + in NHWC format. + + Args: + images (list | np.ndarray): + List of image paths or a NumPy array of image patches. + + Returns: + list | np.ndarray: + The validated input images or masks. + + Raises: + TypeError: + If the input is neither a list nor a NumPy array. + ValueError: + If the input is a NumPy array but not 4D (NHWC). + + """ + if not isinstance(images, (list, np.ndarray)): + msg = "Input must be a list of file paths or a numpy array." + raise TypeError( + msg, + ) + + if isinstance(images, np.ndarray) and images.ndim != 4: # noqa: PLR2004 + msg = ( + "The input numpy array should be four dimensional." + "The shape of the numpy array should be NHWC." + ) + raise ValueError(msg) + + return [Path(image) if isinstance(image, str) else image for image in images] + + @staticmethod + def _validate_input_numbers( + images: list | np.ndarray, + masks: list[os.PathLike] | np.ndarray | None = None, + labels: list | None = None, + ) -> None: + """Validate that the number of images, masks, and labels match. + + Ensures that the lengths of masks and labels (if provided) match + the number of input images. + + Args: + images (list | np.ndarray): + List of input images or a NumPy array. + masks (list[PathLike] | np.ndarray | None): + Optional list of masks corresponding to the input images. + labels (list | None): + Optional list of labels corresponding to the input images. + + Returns: + None + + Raises: + ValueError: + If the number of masks or labels does not match the number of images. + + """ + if masks is None and labels is None: + return + + len_images = len(images) + + if masks is not None and len_images != len(masks): + msg = ( + f"len(masks) is not equal to len(images) " + f": {len(masks)} != {len(images)}" + ) + raise ValueError( + msg, + ) + + if labels is not None and len_images != len(labels): + msg = ( + f"len(labels) is not equal to len(images) " + f": {len(labels)} != {len(images)}" + ) + raise ValueError( + msg, + ) + return + + def _update_run_params( + self: EngineABC, + images: list[os.PathLike | Path | WSIReader] | np.ndarray, + masks: list[os.PathLike | Path] | np.ndarray | None = None, + labels: list | None = None, + save_dir: os.PathLike | Path | None = None, + ioconfig: ModelIOConfigABC | None = None, + output_type: str = "dict", + *, + overwrite: bool = False, + patch_mode: bool, + **kwargs: Unpack[EngineABCRunParams], + ) -> Path | None: + """Update runtime parameters for the engine before running inference. + + This method sets internal attributes such as caching, batch size, + IO configuration, and output format based on user input and keyword arguments. + + Args: + images (list[PathLike | Path | WSIReader] | np.ndarray): + List of input images or a NumPy array of patches. + masks (list[PathLike | Path] | np.ndarray | None): + Optional list of masks for WSI processing. + labels (list | None): + Optional list of labels for input images. + save_dir (PathLike | Path | None): + Directory to save output files. Required for WSI mode. + ioconfig (ModelIOConfigABC | None): + IO configuration for patch extraction and resolution settings. + output_type (str): + Desired output format: "dict", "zarr", or "annotationstore". + overwrite (bool): + Whether to overwrite existing output files. Default is False. + patch_mode (bool): + Whether to treat input as patches (`True`) or WSIs (`False`). + **kwargs (EngineABCRunParams): + Additional runtime parameters to update engine attributes. 
+
+        Returns:
+            Path | None:
+                Path to the save directory if applicable, otherwise None.
+
+        Raises:
+            TypeError:
+                If an unsupported output_type is provided.
+            ValueError:
+                If required configuration or input parameters are missing.
+
+        """
+        for key in kwargs:
+            setattr(self, key, kwargs.get(key))
+
+        if self.num_workers > 0:
+            dask.config.set(scheduler="threads", num_workers=self.num_workers)
+        else:
+            dask.config.set(scheduler="threads")
+
+        if not self.return_labels:
+            self.drop_keys.append("label")
+
+        self.patch_mode = patch_mode
+
+        self._validate_input_numbers(images=images, masks=masks, labels=labels)
+        if output_type.lower() not in ["dict", "zarr", "annotationstore"]:
+            msg = "output_type must be 'dict' or 'zarr' or 'annotationstore'."
+            raise TypeError(msg)
+
+        self.output_type = output_type
+
+        if save_dir is not None and output_type.lower() not in [
+            "zarr",
+            "annotationstore",
+        ]:
+            self.output_type = "zarr"
+            msg = (
+                f"output_type has been updated to 'zarr' "
+                f"for saving the file to {save_dir}. "
+                f"Remove `save_dir` input to return the output as a `dict`."
+            )
+            logger.info(msg)
+
+        self.images = self._validate_images_masks(images=images)
+
+        if masks is not None:
+            self.masks = self._validate_images_masks(images=masks)
+
+        self.labels = labels
+
+        # If necessary, move model parameters to "cpu" or "gpu" and update ioconfig.
+        self._ioconfig = self._load_ioconfig(ioconfig=ioconfig)
+        self.model = self.model.to(device=self.device)
+        self._ioconfig = self._update_ioconfig(
+            ioconfig,
+            self.patch_input_shape,
+            self.stride_shape,
+            self.input_resolutions,
+        )
+
+        return prepare_engines_save_dir(
+            save_dir=save_dir,
+            patch_mode=patch_mode,
+            overwrite=overwrite,
+        )
+
+    def _run_patch_mode(
+        self: EngineABC,
+        output_type: str,
+        save_dir: Path,
+        **kwargs: Unpack[EngineABCRunParams],
+    ) -> dict | AnnotationStore | Path:
+        """Run the engine in patch mode.
+
+        This method performs inference on image patches, post-processes the
+        predictions, and saves the output in the specified format.
+
+        Args:
+            output_type (str):
+                Desired output format. Supported values are "dict", "zarr",
+                and "annotationstore".
+            save_dir (Path):
+                Directory to save the output files.
+            **kwargs (EngineABCRunParams):
+                Additional runtime parameters including:
+                - output_file: Name of the output file.
+                - scale_factor: Scaling factor for annotations.
+                - class_dict: Mapping of class indices to names.
+
+        Returns:
+            dict | AnnotationStore | Path:
+                - If output_type is "dict": returns predictions as a dictionary.
+                - If output_type is "zarr": returns path to saved zarr file.
+                - If output_type is "annotationstore": returns an AnnotationStore
+                  or path to .db file.
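+
+        Example:
+            >>> # Minimal sketch: ``engine`` is assumed to be a concrete
+            >>> # EngineABC subclass whose inputs have already been set via
+            >>> # ``_update_run_params``.
+            >>> out = engine._run_patch_mode(output_type="zarr", save_dir=save_dir)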
+
+        """
+        save_path = None
+        if save_dir:
+            output_file = Path(kwargs.get("output_file", "output.zarr"))
+            save_path = save_dir / (str(output_file.stem) + ".zarr")
+
+        duplicate_filter = DuplicateFilter()
+        logger.addFilter(duplicate_filter)
+
+        self.dataloader = self.get_dataloader(
+            images=self.images,
+            masks=self.masks,
+            labels=self.labels,
+            patch_mode=True,
+            ioconfig=self._ioconfig,
+        )
+        raw_predictions = self.infer_patches(
+            dataloader=self.dataloader,
+            return_coordinates=output_type.lower() == "annotationstore",
+        )
+
+        raw_predictions["predictions"] = self.post_process_patches(
+            raw_predictions=raw_predictions["probabilities"],
+            prediction_shape=raw_predictions["probabilities"].shape[:-1],
+            prediction_dtype=raw_predictions["probabilities"].dtype,
+            **kwargs,
+        )
+
+        logger.removeFilter(duplicate_filter)
+
+        out = self.save_predictions(
+            processed_predictions=raw_predictions,
+            output_type=output_type,
+            save_path=save_path,
+            **kwargs,
+        )
+
+        if save_dir:
+            msg = f"Output file saved at {out}."
+            logger.info(msg=msg)
+        return out
+
+    @staticmethod
+    def _calculate_scale_factor(dataloader: DataLoader) -> float | tuple[float, float]:
+        """Calculate the scale factor for final output based on dataloader resolution.
+
+        This method compares the resolution used during reading with the slide's
+        baseline resolution to compute a scale factor for coordinate transformation.
+
+        Args:
+            dataloader (DataLoader):
+                PyTorch DataLoader used for WSI inference. Must contain resolution
+                and unit metadata in its dataset.
+
+        Returns:
+            float | tuple[float, float]:
+                Scale factor for converting coordinates to baseline resolution.
+                - If units are "mpp": returns (model_mpp / slide_mpp).
+                - If units are "level": returns downsample ratio.
+                - If units are "power": returns objective_power / model_power.
+                - If units are "baseline": returns the resolution directly.
+
+        """
+        # Get units and resolution from the dataloader.
+        dataloader_units = dataloader.dataset.units
+        dataloader_resolution = dataloader.dataset.resolution
+
+        # If dataloader units are "baseline", the slide resolution is 1.0,
+        # so dataloader resolution / slide resolution equals the
+        # dataloader resolution.
+
+        if dataloader_units in ["mpp", "level", "power"]:
+            wsimeta_dict = dataloader.dataset.reader_info.as_dict()
+
+            if dataloader_units == "mpp":
+                slide_resolution = wsimeta_dict[dataloader_units]
+                scale_factor = np.divide(dataloader_resolution, slide_resolution)
+                return scale_factor[0], scale_factor[1]
+
+            if dataloader_units == "level":
+                downsample_ratio = wsimeta_dict["level_downsamples"][
+                    dataloader_resolution
+                ]
+                return downsample_ratio, downsample_ratio
+
+            if dataloader_units == "power":
+                slide_objective_power = wsimeta_dict["objective_power"]
+                return (
+                    slide_objective_power / dataloader_resolution,
+                    slide_objective_power / dataloader_resolution,
+                )
+
+        return dataloader_resolution
+
+    def _run_wsi_mode(
+        self: EngineABC,
+        output_type: str,
+        save_dir: Path,
+        **kwargs: Unpack[EngineABCRunParams],
+    ) -> dict | AnnotationStore | Path:
+        """Run the engine in WSI mode (patch_mode = False).
+
+        This method performs inference on each whole slide image (WSI),
+        post-processes the predictions, and saves the output in the specified format.
+
+        Args:
+            output_type (str):
+                Desired output format. Supported values are "dict", "zarr",
+                and "annotationstore".
+            save_dir (Path):
+                Directory to save the output files.
+            **kwargs (EngineABCRunParams):
+                Additional runtime parameters including:
+                - output_file: Name of the output file.
+                - scale_factor: Scaling factor for annotations.
+                - class_dict: Mapping of class indices to names.
+
+        Returns:
+            dict | AnnotationStore | Path:
+                Dictionary mapping each input WSI to its corresponding output path.
+                Output may be a zarr file, SQLite database, or in-memory dictionary.
+
+        """
+        progress_bar = None
+        tqdm = get_tqdm()
+
+        if self.verbose:
+            progress_bar = tqdm(
+                total=len(self.images),
+                desc="Processing WSIs",
+            )
+        suffix = ".zarr"
+        if output_type.lower() == "annotationstore":
+            suffix = ".db"
+
+        def get_path(image: Path | WSIReader) -> Path:
+            """Return path to output file."""
+            return image.input_path if isinstance(image, WSIReader) else image
+
+        out = {
+            get_path(image): save_dir / (get_path(image).stem + suffix)
+            for image in self.images
+        }
+
+        save_path = {
+            get_path(image): save_dir / (get_path(image).stem + ".zarr")
+            for image in self.images
+        }
+
+        for image_num, image in enumerate(self.images):
+            duplicate_filter = DuplicateFilter()
+            logger.addFilter(duplicate_filter)
+            mask = self.masks[image_num] if self.masks is not None else None
+            self.dataloader = self.get_dataloader(
+                images=image,
+                masks=mask,
+                patch_mode=False,
+                ioconfig=self._ioconfig,
+                auto_get_mask=kwargs.get("auto_get_mask", True),
+            )
+
+            scale_factor = self._calculate_scale_factor(dataloader=self.dataloader)
+
+            raw_predictions = self.infer_wsi(
+                dataloader=self.dataloader,
+                save_path=save_path[get_path(image)],
+                **kwargs,
+            )
+
+            raw_predictions["predictions"] = self.post_process_wsi(
+                raw_predictions=raw_predictions["probabilities"],
+                prediction_shape=raw_predictions["probabilities"].shape[:-1],
+                prediction_dtype=raw_predictions["probabilities"].dtype,
+                **kwargs,
+            )
+
+            kwargs["output_file"] = out[get_path(image)]
+            kwargs["scale_factor"] = scale_factor
+            out[get_path(image)] = self.save_predictions(
+                processed_predictions=raw_predictions,
+                output_type=output_type,
+                save_path=save_path[get_path(image)],
+                **kwargs,
+            )
+            logger.removeFilter(duplicate_filter)
+            msg = f"Output file saved at {out[get_path(image)]}."
+            logger.info(msg=msg)
+
+            if progress_bar:
+                progress_bar.update()
+
+        if progress_bar:
+            progress_bar.close()
+
+        return out
+
+    def run(
+        self: EngineABC,
+        images: list[os.PathLike | Path | WSIReader] | np.ndarray,
+        masks: list[os.PathLike | Path] | np.ndarray | None = None,
+        labels: list | None = None,
+        ioconfig: ModelIOConfigABC | None = None,
+        *,
+        patch_mode: bool = True,
+        save_dir: os.PathLike | Path | None = None,
+        overwrite: bool = False,
+        output_type: str = "dict",
+        **kwargs: Unpack[EngineABCRunParams],
+    ) -> AnnotationStore | Path | str | dict:
+        """Run the engine on input images.
+
+        This method orchestrates the full inference pipeline, including preprocessing,
+        model inference, post-processing, and saving results. It supports both patch
+        and WSI modes.
+
+        Args:
+            images (list[PathLike | Path | WSIReader] | np.ndarray):
+                List of input images or a NumPy array of patches.
+            masks (list[PathLike | Path] | np.ndarray | None):
+                Optional list of masks for WSI processing.
+                Only utilised when patch_mode is False.
+                Patches are only generated within a masked area.
+                If not provided, then a tissue mask will be automatically
+                generated for whole slide images.
+            labels (list | None):
+                Optional list of labels for input images.
+            ioconfig (ModelIOConfigABC | None):
+                IO configuration for patch extraction and resolution settings.
+            patch_mode (bool):
+                Whether to treat input as patches (`True`) or WSIs (`False`).
+                Default is True.
+            save_dir (PathLike | Path | None):
+                Directory to save output files. Required for WSI mode.
+            overwrite (bool):
+                Whether to overwrite existing output files. Default is False.
+            output_type (str):
+                Desired output format: "dict", "zarr", or "annotationstore".
+            **kwargs (EngineABCRunParams):
+                Additional runtime parameters to update engine attributes.
+
+        Returns:
+            AnnotationStore | Path | str | dict:
+                - If patch_mode is True: returns predictions or path to saved output.
+                - If patch_mode is False: returns a dictionary mapping each WSI to
+                  its output path.
+
+        Examples:
+            >>> wsis = ['wsi1.svs', 'wsi2.svs']
+            >>> class PatchPredictor(EngineABC):
+            ...     # Define all abstract methods.
+            ...     ...
+            >>> predictor = PatchPredictor(model="resnet18-kather100k")
+            >>> output = predictor.run(image_patches, patch_mode=True)
+            >>> output
+            ... {'probabilities': ..., 'predictions': ...}
+            >>> output = predictor.run(
+            ...     image_patches,
+            ...     patch_mode=True,
+            ...     save_dir="/path/to",
+            ...     output_type="zarr")
+            >>> output
+            ... "/path/to/output.zarr"
+            >>> output = predictor.run(
+            ...     wsis,
+            ...     patch_mode=False,
+            ...     save_dir="/path/to",
+            ...     output_type="annotationstore")
+            >>> output.keys()
+            ... ['wsi1.svs', 'wsi2.svs']
+            >>> output['wsi1.svs']
+            ... '/path/to/wsi1.db'
+
+        """
+        save_dir = self._update_run_params(
+            images=images,
+            masks=masks,
+            labels=labels,
+            save_dir=save_dir,
+            ioconfig=ioconfig,
+            overwrite=overwrite,
+            patch_mode=patch_mode,
+            output_type=output_type,
+            **kwargs,
+        )
+
+        if patch_mode:
+            return self._run_patch_mode(
+                output_type=self.output_type,
+                save_dir=save_dir,
+                **kwargs,
+            )
+
+        # Inherited classes receive scale_factors and highest_input_resolution
+        # here, and implement their own dataloader, pre-processing,
+        # post-processing and save_output for WSIs.
+        return self._run_wsi_mode(
+            output_type=self.output_type,
+            save_dir=save_dir,
+            **kwargs,
+        )
+
+
+def prepare_engines_save_dir(
+    save_dir: str | Path | None,
+    *,
+    patch_mode: bool,
+    overwrite: bool = False,
+) -> Path | None:
+    """Create or validate the save directory for engine outputs.
+
+    Args:
+        save_dir (str | Path | None):
+            Path to the output directory.
+        patch_mode (bool):
+            Whether the input is treated as patches.
+        overwrite (bool):
+            Whether to overwrite existing directory. Default is False.
+
+    Returns:
+        Path | None:
+            Path to the output directory if created or validated, else None.
+
+    Raises:
+        OSError:
+            If patch_mode is False and save_dir is not provided.
+
+    """
+    if patch_mode:
+        if save_dir is not None:
+            save_dir = Path(save_dir)
+            save_dir.mkdir(parents=True, exist_ok=overwrite)
+            return save_dir
+        return None
+
+    if save_dir is None:
+        msg = (
+            "Input WSIs detected but no save directory provided. "
+            "Please provide a 'save_dir'."
+        )
+        raise OSError(msg)
+
+    logger.info(
+        "When providing multiple whole slide images, "
+        "the outputs will be saved and the locations of outputs "
+        "will be returned to the calling function when `run()` "
+        "finishes successfully."
+ ) + + save_dir = Path(save_dir) + save_dir.mkdir(parents=True, exist_ok=overwrite) + + return save_dir diff --git a/tiatoolbox/models/engine/io_config.py b/tiatoolbox/models/engine/io_config.py new file mode 100644 index 000000000..e8d8b2399 --- /dev/null +++ b/tiatoolbox/models/engine/io_config.py @@ -0,0 +1,455 @@ +"""Defines IOConfig for Model Engines.""" + +from __future__ import annotations + +from dataclasses import dataclass, field, replace +from typing import TYPE_CHECKING + +import numpy as np + +if TYPE_CHECKING: # pragma: no cover + from tiatoolbox.type_hints import Resolution, Units + + +@dataclass +class ModelIOConfigABC: + """Defines a data class for holding a deep learning model's I/O information. + + Enforcing such that following attributes must always be defined by + the subclass. + + Args: + input_resolutions (list(dict)): + Resolution of each input head of model inference, must be in + the same order as `target model.forward()`. + patch_input_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)): + Shape of the largest input in (height, width). + stride_shape (:class:`numpy.ndarray`, list(int), tuple(int)): + Stride in (x, y) direction for patch extraction. + output_resolutions (list(dict)): + Resolution of each output head from model inference, must be + in the same order as target model.infer_batch(). + + Attributes: + input_resolutions (list(dict)): + Resolution of each input head of model inference, must be in + the same order as `target model.forward()`. + patch_input_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)): + Shape of the largest input in (height, width). + stride_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)): + Stride in (x, y) direction for patch extraction. + output_resolutions (list(dict)): + Resolution of each output head from model inference, must be + in the same order as target model.infer_batch(). + highest_input_resolution (dict): + Highest resolution to process the image based on input and + output resolutions. This helps to read the image at the optimal + resolution and improves performance. + + Examples: + >>> # Defining io for a base network and converting to baseline. + >>> ioconfig = ModelIOConfigABC( + ... input_resolutions=[{"units": "mpp", "resolution": 0.5}], + ... output_resolutions=[{"units": "mpp", "resolution": 1.0}], + ... patch_input_shape=(224, 224), + ... stride_shape=(224, 224), + ... ) + >>> ioconfig = ioconfig.to_baseline() + + """ + + input_resolutions: list[dict] + patch_input_shape: list[int] | np.ndarray | tuple[int, int] + stride_shape: list[int] | np.ndarray | tuple[int, int] = None + output_resolutions: list[dict] = field(default_factory=list) + + def __post_init__(self: ModelIOConfigABC) -> None: + """Perform post initialization tasks.""" + if self.stride_shape is None: + self.stride_shape = self.patch_input_shape + + self.resolution_unit = self.input_resolutions[0]["units"] + self.highest_input_resolution = self.input_resolutions[0]["resolution"] + + if self.resolution_unit == "mpp": + self.highest_input_resolution = min( + self.input_resolutions, + key=lambda x: x["resolution"], + ) + else: + self.highest_input_resolution = max( + self.input_resolutions, + key=lambda x: x["resolution"], + ) + + self._validate() + + def _validate(self: ModelIOConfigABC) -> None: + """Validate the data format.""" + resolutions = self.input_resolutions + self.output_resolutions + units = {v["units"] for v in resolutions} + + if len(units) != 1: + msg = ( + f"Multiple resolution units found: `{units}`. 
" + f"Mixing resolution units is not allowed." + ) + raise ValueError( + msg, + ) + + if units.pop() not in [ + "power", + "baseline", + "mpp", + ]: + msg = f"Invalid resolution units `{units}`." + raise ValueError(msg) + + @staticmethod + def scale_to_highest( + resolutions: list[dict[Units, Resolution]], units: Units + ) -> np.array: + """Get the scaling factor from input resolutions. + + This will convert resolutions to a scaling factor with respect to + the highest resolution found in the input resolutions list. If a model + requires images at multiple resolutions. This helps to read the image a + single resolution. The image will be read at the highest required resolution + and will be scaled for low resolution requirements using interpolation. + + Args: + resolutions (list(dict(Units, Resolution))): + A list of resolutions where one is defined as + `{'resolution': value, 'unit': value}` + units (Units): + Resolution units. + + Returns: + :class:`numpy.ndarray`: + A 1D array of scaling factors having the same length as + `resolutions`. + + Examples: + >>> # Defining io for a base network and converting to baseline. + >>> ioconfig = ModelIOConfigABC( + ... input_resolutions=[ + ... {"units": "mpp", "resolution": 0.25}, + ... {"units": "mpp", "resolution": 0.5}, + ... ], + ... output_resolutions=[{"units": "mpp", "resolution": 1.0}], + ... patch_input_shape=(224, 224), + ... stride_shape=(224, 224), + ... ) + >>> ioconfig = ioconfig.scale_to_highest() + ... array([1. , 0.5]) # output + >>> + >>> # Defining io for a base network and converting to baseline. + >>> ioconfig = ModelIOConfigABC( + ... input_resolutions=[ + ... {"units": "mpp", "resolution": 0.5}, + ... {"units": "mpp", "resolution": 0.25}, + ... ], + ... output_resolutions=[{"units": "mpp", "resolution": 1.0}], + ... patch_input_shape=(224, 224), + ... stride_shape=(224, 224), + ... ) + >>> ioconfig = ioconfig.scale_to_highest() + ... array([0.5 , 1.]) # output + + """ + old_vals = [v["resolution"] for v in resolutions] + if units not in {"baseline", "mpp", "power"}: + msg = ( + f"Unknown units `{units}`. " + f"Units should be one of 'baseline', 'mpp' or 'power'." + ) + raise ValueError( + msg, + ) + if units == "baseline": + return old_vals + if units == "mpp": + return np.min(old_vals) / np.array(old_vals) + return np.array(old_vals) / np.max(old_vals) + + def to_baseline(self: ModelIOConfigABC) -> ModelIOConfigABC: + """Returns a new config object converted to baseline form. + + This will return a new :class:`ModelIOConfigABC` where + resolutions have been converted to baseline format with the + highest possible resolution found in both input and output as + reference. 
+
+        """
+        resolutions = self.input_resolutions + self.output_resolutions
+        save_resolution = getattr(self, "save_resolution", None)
+        if save_resolution is not None:
+            resolutions.append(save_resolution)
+
+        scale_factors = self.scale_to_highest(resolutions, self.resolution_unit)
+
+        num_input_resolutions = len(self.input_resolutions)
+        num_output_resolutions = len(self.output_resolutions)
+
+        end_idx = num_input_resolutions
+        input_resolutions = [
+            {"units": "baseline", "resolution": v} for v in scale_factors[:end_idx]
+        ]
+
+        end_idx = num_input_resolutions + num_output_resolutions
+        output_resolutions = [
+            {"units": "baseline", "resolution": v}
+            for v in scale_factors[num_input_resolutions:end_idx]
+        ]
+
+        return replace(
+            self,
+            input_resolutions=input_resolutions,
+            output_resolutions=output_resolutions,
+        )
+
+
+@dataclass
+class IOSegmentorConfig(ModelIOConfigABC):
+    """Contains semantic segmentor input and output information.
+
+    Args:
+        input_resolutions (list(dict)):
+            Resolution of each input head of model inference, must be in
+            the same order as `target model.forward()`.
+        patch_input_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Shape of the largest input in (height, width).
+        stride_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Stride in (x, y) direction for patch extraction.
+        output_resolutions (list(dict)):
+            Resolution of each output head from model inference, must be
+            in the same order as target model.infer_batch().
+        patch_output_shape (:class:`numpy.ndarray`, list(int)):
+            Shape of the largest output in (height, width).
+        save_resolution (dict):
+            Resolution to save all output.
+
+    Attributes:
+        input_resolutions (list(dict)):
+            Resolution of each input head of model inference, must be in
+            the same order as `target model.forward()`.
+        patch_input_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Shape of the largest input in (height, width).
+        stride_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Stride in (x, y) direction for patch extraction.
+        output_resolutions (list(dict)):
+            Resolution of each output head from model inference, must be
+            in the same order as target model.infer_batch().
+        patch_output_shape (:class:`numpy.ndarray`, list(int)):
+            Shape of the largest output in (height, width).
+        save_resolution (dict):
+            Resolution to save all output.
+        highest_input_resolution (dict):
+            Highest resolution to process the image based on input and
+            output resolutions. This helps to read the image at the optimal
+            resolution and improves performance.
+
+    Examples:
+        >>> # Defining io for a network having 1 input and 1 output at the
+        >>> # same resolution
+        >>> ioconfig = IOSegmentorConfig(
+        ...     input_resolutions=[{"units": "baseline", "resolution": 1.0}],
+        ...     output_resolutions=[{"units": "baseline", "resolution": 1.0}],
+        ...     patch_input_shape=(2048, 2048),
+        ...     patch_output_shape=(1024, 1024),
+        ...     stride_shape=(512, 512),
+        ... )
+        ...
+        >>> # Defining io for a network having 3 inputs and 2 outputs
+        >>> # at the same resolution; the output is then merged at a
+        >>> # different resolution.
+        >>> ioconfig = IOSegmentorConfig(
+        ...     input_resolutions=[
+        ...         {"units": "mpp", "resolution": 0.25},
+        ...         {"units": "mpp", "resolution": 0.50},
+        ...         {"units": "mpp", "resolution": 0.75},
+        ...     ],
+        ...     output_resolutions=[
+        ...         {"units": "mpp", "resolution": 0.25},
+        ...         {"units": "mpp", "resolution": 0.50},
+        ...     ],
+        ...     patch_input_shape=(2048, 2048),
+        ...     patch_output_shape=(1024, 1024),
+        ...     stride_shape=(512, 512),
+        ...     save_resolution={"units": "mpp", "resolution": 4.0},
+        ... )
+
+    """
+
+    patch_output_shape: list[int] | np.ndarray | tuple[int, int] | None = None
+    save_resolution: dict | None = None
+
+    def to_baseline(self: IOSegmentorConfig) -> IOSegmentorConfig:
+        """Returns a new config object converted to baseline form.
+
+        This will return a new :class:`IOSegmentorConfig` where
+        resolutions have been converted to baseline format with the
+        highest possible resolution found in both input and output as
+        reference.
+
+        """
+        new_config = super().to_baseline()
+        resolutions = self.input_resolutions + self.output_resolutions
+        if self.save_resolution is not None:
+            resolutions.append(self.save_resolution)
+
+        scale_factors = self.scale_to_highest(resolutions, self.resolution_unit)
+
+        save_resolution = None
+        if self.save_resolution is not None:
+            save_resolution = {"units": "baseline", "resolution": scale_factors[-1]}
+
+        return replace(
+            self,
+            input_resolutions=new_config.input_resolutions,
+            output_resolutions=new_config.output_resolutions,
+            save_resolution=save_resolution,
+        )
+
+
+class IOPatchPredictorConfig(ModelIOConfigABC):
+    """Contains patch predictor input and output information.
+
+    Args:
+        input_resolutions (list(dict)):
+            Resolution of each input head of model inference, must be in
+            the same order as `target model.forward()`.
+        patch_input_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Shape of the largest input in (height, width).
+        stride_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Stride in (x, y) direction for patch extraction.
+        output_resolutions (list(dict)):
+            Resolution of each output head from model inference, must be
+            in the same order as target model.infer_batch().
+
+    Attributes:
+        input_resolutions (list(dict)):
+            Resolution of each input head of model inference, must be in
+            the same order as `target model.forward()`.
+        patch_input_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Shape of the largest input in (height, width).
+        stride_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Stride in (x, y) direction for patch extraction.
+        output_resolutions (list(dict)):
+            Resolution of each output head from model inference, must be
+            in the same order as target model.infer_batch().
+        highest_input_resolution (dict):
+            Highest resolution to process the image based on input and
+            output resolutions. This helps to read the image at the optimal
+            resolution and improves performance.
+
+    Examples:
+        >>> # Defining io for a patch predictor network
+        >>> ioconfig = IOPatchPredictorConfig(
+        ...     input_resolutions=[{"units": "mpp", "resolution": 0.5}],
+        ...     output_resolutions=[{"units": "mpp", "resolution": 0.5}],
+        ...     patch_input_shape=(224, 224),
+        ...     stride_shape=(224, 224),
+        ... )
+
+    """
+
+
+@dataclass
+class IOInstanceSegmentorConfig(IOSegmentorConfig):
+    """Contains instance segmentor input and output information.
+
+    Args:
+        input_resolutions (list(dict)):
+            Resolution of each input head of model inference, must be in
+            the same order as `target model.forward()`.
+        patch_input_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Shape of the largest input in (height, width).
+        stride_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Stride in (x, y) direction for patch extraction.
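+            If not provided, defaults to ``patch_input_shape``.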
+        output_resolutions (list(dict)):
+            Resolution of each output head from model inference, must be
+            in the same order as target model.infer_batch().
+        patch_output_shape (:class:`numpy.ndarray`, list(int)):
+            Shape of the largest output in (height, width).
+        save_resolution (dict):
+            Resolution to save all output.
+        margin (int):
+            Tile margin to accumulate the output.
+        tile_shape (tuple(int, int)):
+            Tile shape to process the WSI.
+
+    Attributes:
+        input_resolutions (list(dict)):
+            Resolution of each input head of model inference, must be in
+            the same order as `target model.forward()`.
+        patch_input_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Shape of the largest input in (height, width).
+        stride_shape (:class:`numpy.ndarray`, list(int), tuple(int, int)):
+            Stride in (x, y) direction for patch extraction.
+        output_resolutions (list(dict)):
+            Resolution of each output head from model inference, must be
+            in the same order as target model.infer_batch().
+        patch_output_shape (:class:`numpy.ndarray`, list(int)):
+            Shape of the largest output in (height, width).
+        save_resolution (dict):
+            Resolution to save all output.
+        highest_input_resolution (dict):
+            Highest resolution to process the image based on input and
+            output resolutions. This helps to read the image at the optimal
+            resolution and improves performance.
+        margin (int):
+            Tile margin to accumulate the output.
+        tile_shape (tuple(int, int)):
+            Tile shape to process the WSI.
+
+    Examples:
+        >>> # Defining io for a network having 1 input and 1 output at the
+        >>> # same resolution
+        >>> ioconfig = IOInstanceSegmentorConfig(
+        ...     input_resolutions=[{"units": "baseline", "resolution": 1.0}],
+        ...     output_resolutions=[{"units": "baseline", "resolution": 1.0}],
+        ...     patch_input_shape=(2048, 2048),
+        ...     patch_output_shape=(1024, 1024),
+        ...     stride_shape=(512, 512),
+        ...     margin=128,
+        ...     tile_shape=(1024, 1024),
+        ... )
+        >>> # Defining io for a network having 3 inputs and 2 outputs
+        >>> # at the same resolution; the output is then merged at a
+        >>> # different resolution.
+        >>> ioconfig = IOInstanceSegmentorConfig(
+        ...     input_resolutions=[
+        ...         {"units": "mpp", "resolution": 0.25},
+        ...         {"units": "mpp", "resolution": 0.50},
+        ...         {"units": "mpp", "resolution": 0.75},
+        ...     ],
+        ...     output_resolutions=[
+        ...         {"units": "mpp", "resolution": 0.25},
+        ...         {"units": "mpp", "resolution": 0.50},
+        ...     ],
+        ...     patch_input_shape=(2048, 2048),
+        ...     patch_output_shape=(1024, 1024),
+        ...     stride_shape=(512, 512),
+        ...     save_resolution={"units": "mpp", "resolution": 4.0},
+        ...     margin=128,
+        ...     tile_shape=(1024, 1024),
+        ... )
+
+    """
+
+    margin: int | None = None
+    tile_shape: tuple[int, int] | None = None
+
+    def to_baseline(self: IOInstanceSegmentorConfig) -> IOInstanceSegmentorConfig:
+        """Returns a new config object converted to baseline form.
+
+        This will return a new :class:`IOInstanceSegmentorConfig` where
+        resolutions have been converted to baseline format with the
+        highest possible resolution found in both input and output as
+        reference.
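+
+        Example:
+            >>> # Minimal sketch: ``margin`` and ``tile_shape`` are carried
+            >>> # over unchanged while resolutions are rescaled to baseline.
+            >>> ioconfig = IOInstanceSegmentorConfig(
+            ...     input_resolutions=[{"units": "mpp", "resolution": 0.25}],
+            ...     patch_input_shape=(2048, 2048),
+            ...     margin=128,
+            ...     tile_shape=(1024, 1024),
+            ... )
+            >>> baseline_ioconfig = ioconfig.to_baseline()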
+ + """ + return super().to_baseline() diff --git a/tiatoolbox/models/engine/multi_task_segmentor.py b/tiatoolbox/models/engine/multi_task_segmentor.py index 55fd1a2d8..7293e78cc 100644 --- a/tiatoolbox/models/engine/multi_task_segmentor.py +++ b/tiatoolbox/models/engine/multi_task_segmentor.py @@ -31,14 +31,11 @@ from shapely.geometry import box as shapely_box from shapely.strtree import STRtree +from tiatoolbox.models.dataset.dataset_abc import WSIStreamDataset from tiatoolbox.models.engine.nucleus_instance_segmentor import ( NucleusInstanceSegmentor, _process_instance_predictions, ) -from tiatoolbox.models.engine.semantic_segmentor import ( - IOSegmentorConfig, - WSIStreamDataset, -) if TYPE_CHECKING: # pragma: no cover from collections.abc import Callable @@ -47,6 +44,8 @@ from tiatoolbox.type_hints import IntBounds + from .io_config import IOInstanceSegmentorConfig, IOSegmentorConfig + # Python is yet to be able to natively pickle Object method/static method. # Only top-level function is passable to multi-processing as caller. @@ -295,19 +294,23 @@ def __init__( def _predict_one_wsi( self: MultiTaskSegmentor, wsi_idx: int, - ioconfig: IOSegmentorConfig, + ioconfig: IOInstanceSegmentorConfig, save_path: str, mode: str, ) -> None: """Make a prediction on tile/wsi. Args: - wsi_idx (int): Index of the tile/wsi to be processed within `self`. - ioconfig (IOSegmentorConfig): Object which defines I/O placement during - inference and when assembling back to full tile/wsi. - save_path (str): Location to save output prediction as well as possible + wsi_idx (int): + Index of the tile/wsi to be processed within `self`. + ioconfig (IOInstanceSegmentorConfig): + Object which defines I/O placement + during inference and when assembling back to full tile/wsi. + save_path (str): + Location to save output prediction as well as possible intermediate results. - mode (str): `tile` or `wsi` to indicate run mode. + mode (str): + `tile` or `wsi` to indicate run mode. """ cache_dir = f"{self._cache_dir}/" diff --git a/tiatoolbox/models/engine/nucleus_instance_segmentor.py b/tiatoolbox/models/engine/nucleus_instance_segmentor.py index 18d795a34..ce74355ae 100644 --- a/tiatoolbox/models/engine/nucleus_instance_segmentor.py +++ b/tiatoolbox/models/engine/nucleus_instance_segmentor.py @@ -14,16 +14,15 @@ from shapely.geometry import box as shapely_box from shapely.strtree import STRtree -from tiatoolbox.models.engine.semantic_segmentor import ( - IOSegmentorConfig, - SemanticSegmentor, - WSIStreamDataset, -) +from tiatoolbox.models.dataset.dataset_abc import WSIStreamDataset +from tiatoolbox.models.engine.semantic_segmentor import SemanticSegmentor from tiatoolbox.tools.patchextraction import PatchExtractor if TYPE_CHECKING: # pragma: no cover from collections.abc import Callable + from .io_config import IOInstanceSegmentorConfig, IOSegmentorConfig + def _process_instance_predictions( inst_dict: dict, @@ -409,7 +408,7 @@ def __init__( @staticmethod def _get_tile_info( image_shape: list[int] | np.ndarray, - ioconfig: IOSegmentorConfig, + ioconfig: IOInstanceSegmentorConfig, ) -> list[list, ...]: """Generating tile information. @@ -427,7 +426,7 @@ def _get_tile_info( image_shape (:class:`numpy.ndarray`, list(int)): The shape of WSI to extract the tile from, assumed to be in `[width, height]`. - ioconfig (:obj:IOSegmentorConfig): + ioconfig (:obj:IOInstanceSegmentorConfig): The input and output configuration objects. 
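+                Tiling of the WSI is driven by the ``tile_shape`` and
+                ``margin`` attributes of this config.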
Returns: @@ -442,7 +441,7 @@ def _get_tile_info( - :class:`numpy.ndarray` - Horizontal strip tiles - :class:`numpy.ndarray` - Removal flags - :py:obj:`list` - Tiles and flags - - :class:`numpy.ndarray` - Cross-section tiles + - :class:`numpy.ndarray` - Cross section tiles - :class:`numpy.ndarray` - Removal flags """ @@ -678,7 +677,7 @@ def _predict_one_wsi( Args: wsi_idx (int): Index of the tile/wsi to be processed within `self`. - ioconfig (IOSegmentorConfig): + ioconfig (IOInstanceSegmentorConfig): Object which defines I/O placement during inference and when assembling back to full tile/wsi. save_path (str): diff --git a/tiatoolbox/models/engine/patch_predictor.py b/tiatoolbox/models/engine/patch_predictor.py index 820f04fe9..b940598ca 100644 --- a/tiatoolbox/models/engine/patch_predictor.py +++ b/tiatoolbox/models/engine/patch_predictor.py @@ -1,219 +1,275 @@ -"""This module implements patch level prediction.""" +"""Defines the PatchPredictor engine for patch-level inference in digital pathology. -from __future__ import annotations +This module implements the PatchPredictor class, which extends the EngineABC base +class to support patch-based and whole slide image (WSI) inference using deep learning +models from TIAToolbox. It provides utilities for model initialization, post-processing, +and output management, including support for multiple output formats. -import copy -from collections import OrderedDict -from pathlib import Path -from typing import TYPE_CHECKING +Classes: + - PatchPredictor: + Engine for performing patch-level predictions. + - PredictorRunParams: + TypedDict for configuring runtime parameters. -import numpy as np -import torch -import tqdm +Example: + >>> images = [np.ndarray, np.ndarray] + >>> predictor = PatchPredictor(model="resnet18-kather100k") + >>> output = predictor.run(images, patch_mode=True) -from tiatoolbox import logger, rcParam -from tiatoolbox.models.architecture import get_pretrained_model -from tiatoolbox.models.architecture.utils import compile_model -from tiatoolbox.models.dataset.classification import PatchDataset, WSIPatchDataset -from tiatoolbox.models.engine.semantic_segmentor import IOSegmentorConfig -from tiatoolbox.models.models_abc import model_to -from tiatoolbox.utils import save_as_json -from tiatoolbox.wsicore.wsireader import VirtualWSIReader, WSIReader +""" -if TYPE_CHECKING: # pragma: no cover - from collections.abc import Callable +from __future__ import annotations - from tiatoolbox.type_hints import IntPair, Resolution, Units +from typing import TYPE_CHECKING +from typing_extensions import Unpack -class IOPatchPredictorConfig(IOSegmentorConfig): - """Contains patch predictor input and output information.""" +from tiatoolbox.utils.misc import cast_to_min_dtype - def __init__( - self: IOPatchPredictorConfig, - patch_input_shape: IntPair = None, - input_resolutions: Resolution = None, - stride_shape: IntPair = None, - **kwargs: dict, - ) -> None: - """Initialize :class:`IOPatchPredictorConfig`.""" - stride_shape = patch_input_shape if stride_shape is None else stride_shape - super().__init__( - input_resolutions=input_resolutions, - output_resolutions=[], - stride_shape=stride_shape, - patch_input_shape=patch_input_shape, - patch_output_shape=patch_input_shape, - save_resolution=None, - **kwargs, - ) +from .engine_abc import EngineABC, EngineABCRunParams +if TYPE_CHECKING: # pragma: no cover + import os + from pathlib import Path -class PatchPredictor: - r"""Patch level predictor. 
- - The models provided by tiatoolbox should give the following results: - - .. list-table:: PatchPredictor performance on the Kather100K dataset [1] - :widths: 15 15 - :header-rows: 1 - - * - Model name - - F\ :sub:`1`\ score - * - alexnet-kather100k - - 0.965 - * - resnet18-kather100k - - 0.990 - * - resnet34-kather100k - - 0.991 - * - resnet50-kather100k - - 0.989 - * - resnet101-kather100k - - 0.989 - * - resnext50_32x4d-kather100k - - 0.992 - * - resnext101_32x8d-kather100k - - 0.991 - * - wide_resnet50_2-kather100k - - 0.989 - * - wide_resnet101_2-kather100k - - 0.990 - * - densenet121-kather100k - - 0.993 - * - densenet161-kather100k - - 0.992 - * - densenet169-kather100k - - 0.992 - * - densenet201-kather100k - - 0.991 - * - mobilenet_v2-kather100k - - 0.990 - * - mobilenet_v3_large-kather100k - - 0.991 - * - mobilenet_v3_small-kather100k - - 0.992 - * - googlenet-kather100k - - 0.992 - - .. list-table:: PatchPredictor performance on the PCam dataset [2] - :widths: 15 15 - :header-rows: 1 - - * - Model name - - F\ :sub:`1`\ score - * - alexnet-pcam - - 0.840 - * - resnet18-pcam - - 0.888 - * - resnet34-pcam - - 0.889 - * - resnet50-pcam - - 0.892 - * - resnet101-pcam - - 0.888 - * - resnext50_32x4d-pcam - - 0.900 - * - resnext101_32x8d-pcam - - 0.892 - * - wide_resnet50_2-pcam - - 0.901 - * - wide_resnet101_2-pcam - - 0.898 - * - densenet121-pcam - - 0.897 - * - densenet161-pcam - - 0.893 - * - densenet169-pcam - - 0.895 - * - densenet201-pcam - - 0.891 - * - mobilenet_v2-pcam - - 0.899 - * - mobilenet_v3_large-pcam - - 0.895 - * - mobilenet_v3_small-pcam - - 0.890 - * - googlenet-pcam - - 0.867 + import dask.array as da + import numpy as np + + from tiatoolbox.annotation import AnnotationStore + from tiatoolbox.models.engine.io_config import ModelIOConfigABC + from tiatoolbox.models.models_abc import ModelABC + from tiatoolbox.wsicore import WSIReader - Args: - model (nn.Module): - Use externally defined PyTorch model for prediction with. - weights already loaded. Default is `None`. If provided, - `pretrained_model` argument is ignored. - pretrained_model (str): - Name of the existing models support by tiatoolbox for - processing the data. For a full list of pretrained models, - refer to the `docs - `_ - By default, the corresponding pretrained weights will also - be downloaded. However, you can override with your own set - of weights via the `pretrained_weights` argument. Argument - is case-insensitive. - pretrained_weights (str): - Path to the weight of the corresponding `pretrained_model`. - >>> predictor = PatchPredictor( - ... pretrained_model="resnet18-kather100k", - ... pretrained_weights="resnet18_local_weight") +class PredictorRunParams(EngineABCRunParams, total=False): + """Parameters for configuring the `PatchPredictor.run()` method. + This class extends `EngineABCRunParams` with additional parameters specific + to patch-level prediction workflows. + + Attributes: + auto_get_mask (bool): + Whether to automatically generate segmentation masks using + `wsireader.tissue_mask()` during processing. batch_size (int): - Number of images fed into the model each time. - num_loader_workers (int): - Number of workers to load the data. Take note that they will - also perform preprocessing. + Number of image patches to feed to the model in a forward pass. + class_dict (dict): + Optional dictionary mapping classification outputs to class names. + device (str): + Device to run the model on (e.g., "cpu", "cuda"). 
+ input_resolutions (list[dict]): + Resolution used for reading the image. See `WSIReader` for details. + ioconfig (ModelIOConfigABC): + Input/output configuration for patch extraction and resolution. + memory_threshold (int): + Memory usage threshold (in percentage) to trigger caching behavior. + num_workers (int): + Number of workers used in DataLoader. + output_file (str): + Output file name for saving results (e.g., .zarr or .db). + patch_input_shape (tuple[int, int]): + Shape of input patches (height, width). + return_labels (bool): + Whether to return labels with predictions. + return_probabilities (bool): + Whether to return per-class probabilities in the output. + If False, only predicted labels are returned. + scale_factor (tuple[float, float]): + Scale factor for converting annotations to baseline resolution. + Typically model_mpp / slide_mpp. + stride_shape (tuple[int, int]): + Stride used during WSI processing. Defaults to patch_input_shape. verbose (bool): Whether to output logging information. - Attributes: - img (:obj:`str` or :obj:`pathlib.Path` or :obj:`numpy.ndarray`): - A HWC image or a path to WSI. - mode (str): - Type of input to process. Choose from either `patch`, `tile` - or `wsi`. - model (nn.Module): - Defined PyTorch model. - pretrained_model (str): - Name of the existing models support by tiatoolbox for - processing the data. For a full list of pretrained models, - refer to the `docs + """ + + return_probabilities: bool + + +class PatchPredictor(EngineABC): + r"""Patch-level prediction engine for digital histology images. + + This class extends `EngineABC` to support patch-based inference using + pretrained or custom models from TIAToolbox. It supports both patch and + whole slide image (WSI) modes, and provides utilities for post-processing + and saving predictions. + + Supported Models: + .. list-table:: PatchPredictor performance on the Kather100K dataset [1]. + :widths: 15 15 + :header-rows: 1 + + * - Model name + - F\ :sub:`1`\ score + * - alexnet-kather100k + - 0.965 + * - resnet18-kather100k + - 0.990 + * - resnet34-kather100k + - 0.991 + * - resnet50-kather100k + - 0.989 + * - resnet101-kather100k + - 0.989 + * - resnext50_32x4d-kather100k + - 0.992 + * - resnext101_32x8d-kather100k + - 0.991 + * - wide_resnet50_2-kather100k + - 0.989 + * - wide_resnet101_2-kather100k + - 0.990 + * - densenet121-kather100k + - 0.993 + * - densenet161-kather100k + - 0.992 + * - densenet169-kather100k + - 0.992 + * - densenet201-kather100k + - 0.991 + * - mobilenet_v2-kather100k + - 0.990 + * - mobilenet_v3_large-kather100k + - 0.991 + * - mobilenet_v3_small-kather100k + - 0.992 + * - googlenet-kather100k + - 0.992 + + .. list-table:: PatchPredictor performance on the PCam dataset [2] + :widths: 15 15 + :header-rows: 1 + + * - Model name + - F\ :sub:`1`\ score + * - alexnet-pcam + - 0.840 + * - resnet18-pcam + - 0.888 + * - resnet34-pcam + - 0.889 + * - resnet50-pcam + - 0.892 + * - resnet101-pcam + - 0.888 + * - resnext50_32x4d-pcam + - 0.900 + * - resnext101_32x8d-pcam + - 0.892 + * - wide_resnet50_2-pcam + - 0.901 + * - wide_resnet101_2-pcam + - 0.898 + * - densenet121-pcam + - 0.897 + * - densenet161-pcam + - 0.893 + * - densenet169-pcam + - 0.895 + * - densenet201-pcam + - 0.891 + * - mobilenet_v2-pcam + - 0.899 + * - mobilenet_v3_large-pcam + - 0.895 + * - mobilenet_v3_small-pcam + - 0.890 + * - googlenet-pcam + - 0.867 + + Args: + model (str | ModelABC): + A PyTorch model instance or name of a pretrained model from TIAToolbox. 
+ If a string is provided, pretrained weights + will be downloaded unless overridden via `weights`. + The user can request pretrained models from the toolbox model zoo using + the list of pretrained models available at this `link `_ By default, the corresponding pretrained weights will also - be downloaded. However, you can override with your own set - of weights via the `pretrained_weights` argument. Argument - is case insensitive. + be downloaded. batch_size (int): - Number of images fed into the model each time. - num_loader_worker (int): - Number of workers used in torch.utils.data.DataLoader. + Number of image patches processed per forward pass. + Default is 8. + num_workers (int): + Number of workers for data loading. Default is 0. + weights (str | Path | None): + Path to model weights. If None, default weights are used. + + >>> engine = PatchPredictor( + ... model="pretrained-model", + ... weights="/path/to/pretrained-local-weights.pth" + ... ) + + device (str): + Device to run the model on (e.g., "cpu", "cuda"). Default is "cpu". verbose (bool): - Whether to output logging information. + Whether to enable verbose logging. Default is True. + - Examples: + Attributes: + images (list[str | Path] | np.ndarray): + Input image patches or WSI paths. + masks (list[str | Path] | np.ndarray): + Optional tissue masks for WSI processing. + These are only utilized when patch_mode is False. + If not provided, then a tissue mask will be automatically + generated for whole slide images. + patch_mode (bool): + Whether input is treated as patches (`True`) or WSIs (`False`). + model (ModelABC): + Loaded PyTorch model. + ioconfig (ModelIOConfigABC): + IO configuration for patch extraction and resolution. + return_labels (bool): + Whether to include labels in the output. + input_resolutions (list[dict]): + Resolution settings for model input. Supported + units are `level`, `power` and `mpp`. Keys should be "units" and + "resolution" e.g., [{"units": "mpp", "resolution": 0.25}]. Please see + :class:`WSIReader` for details. + patch_input_shape (tuple[int, int]): + Shape of input patches (height, width). Patches are at + requested read resolution, not with respect to level 0, + and must be positive. + stride_shape (tuple[int, int]): + Stride used during patch extraction. Stride is + at requested read resolution, not with respect to + level 0, and must be positive. If not provided, + `stride_shape=patch_input_shape`. + labels (list | None): + Optional labels for input images. + Only a single label per image is supported. + drop_keys (list): + Keys to exclude from model output. + output_type (str): + Format of output ("dict", "zarr", "annotationstore"). 
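+        verbose (bool):
+            Whether to output logging information.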
+ + Example: >>> # list of 2 image patches as input - >>> data = [img1, img2] - >>> predictor = PatchPredictor(pretrained_model="resnet18-kather100k") - >>> output = predictor.predict(data, mode='patch') + >>> data = ['path/img.svs', 'path/img.svs'] + >>> predictor = PatchPredictor(model="resnet18-kather100k") + >>> output = predictor.run(data, patch_mode=False) >>> # array of list of 2 image patches as input >>> data = np.array([img1, img2]) - >>> predictor = PatchPredictor(pretrained_model="resnet18-kather100k") - >>> output = predictor.predict(data, mode='patch') + >>> predictor = PatchPredictor(model="resnet18-kather100k") + >>> output = predictor.run(data, patch_mode=True) >>> # list of 2 image patch files as input >>> data = ['path/img.png', 'path/img.png'] - >>> predictor = PatchPredictor(pretrained_model="resnet18-kather100k") - >>> output = predictor.predict(data, mode='patch') + >>> predictor = PatchPredictor(model="resnet18-kather100k") + >>> output = predictor.run(data, patch_mode=True) >>> # list of 2 image tile files as input >>> tile_file = ['path/tile1.png', 'path/tile2.png'] - >>> predictor = PatchPredictor(pretraind_model="resnet18-kather100k") - >>> output = predictor.predict(tile_file, mode='tile') + >>> predictor = PatchPredictor(model="resnet18-kather100k") + >>> output = predictor.run(tile_file, patch_mode=False) >>> # list of 2 wsi files as input >>> wsi_file = ['path/wsi1.svs', 'path/wsi2.svs'] - >>> predictor = PatchPredictor(pretraind_model="resnet18-kather100k") - >>> output = predictor.predict(wsi_file, mode='wsi') + >>> predictor = PatchPredictor(model="resnet18-kather100k") + >>> output = predictor.run(wsi_file, patch_mode=False) References: [1] Kather, Jakob Nikolas, et al. "Predicting survival from colorectal cancer @@ -228,745 +284,253 @@ class PatchPredictor: def __init__( self: PatchPredictor, + model: str | ModelABC, batch_size: int = 8, - num_loader_workers: int = 0, - model: torch.nn.Module = None, - pretrained_model: str | None = None, - pretrained_weights: str | None = None, + num_workers: int = 0, + weights: str | Path | None = None, *, + device: str = "cpu", verbose: bool = True, ) -> None: - """Initialize :class:`PatchPredictor`.""" - super().__init__() - - self.imgs = None - self.mode = None - - if model is None and pretrained_model is None: - msg = "Must provide either `model` or `pretrained_model`." - raise ValueError(msg) - - if model is not None: - self.model = model - ioconfig = None # retrieve iostate from provided model ? - else: - model, ioconfig = get_pretrained_model(pretrained_model, pretrained_weights) - - self.ioconfig = ioconfig # for storing original - self._ioconfig = None # for storing runtime - self.model = ( - compile_model( # for runtime, such as after wrapping with nn.DataParallel - model, - mode=rcParam["torch_compile_mode"], - ) - ) - self.pretrained_model = pretrained_model - self.batch_size = batch_size - self.num_loader_worker = num_loader_workers - self.verbose = verbose - - @staticmethod - def merge_predictions( - img: str | Path | np.ndarray, - output: dict, - resolution: Resolution | None = None, - units: Units | None = None, - postproc_func: Callable | None = None, - *, - return_raw: bool = False, - ) -> np.ndarray: - """Merge patch level predictions to form a 2-dimensional prediction map. - - #! Improve how the below reads. - The prediction map will contain values from 0 to N, where N is - the number of classes. 
Here, 0 is the background which has not - been processed by the model and N is the number of classes - predicted by the model. + """Initialize the PatchPredictor engine. Args: - img (:obj:`str` or :obj:`pathlib.Path` or :class:`numpy.ndarray`): - A HWC image or a path to WSI. - output (dict): - Output generated by the model. - resolution (Resolution): - Resolution of merged predictions. - units (Units): - Units of resolution used when merging predictions. This - must be the same `units` used when processing the data. - postproc_func (callable): - A function to post-process raw prediction from model. By - default, internal code uses the `np.argmax` function. - return_raw (bool): - Return raw result without applying the `postproc_func` - on the assembled image. - - Returns: - :class:`numpy.ndarray`: - Merged predictions as a 2D array. - - Examples: - >>> # pseudo output dict from model with 2 patches - >>> output = { - ... 'resolution': 1.0, - ... 'units': 'baseline', - ... 'probabilities': [[0.45, 0.55], [0.90, 0.10]], - ... 'predictions': [1, 0], - ... 'coordinates': [[0, 0, 2, 2], [2, 2, 4, 4]], - ... } - >>> merged = PatchPredictor.merge_predictions( - ... np.zeros([4, 4]), - ... output, - ... resolution=1.0, - ... units='baseline' - ... ) - >>> merged - ... array([[2, 2, 0, 0], - ... [2, 2, 0, 0], - ... [0, 0, 1, 1], - ... [0, 0, 1, 1]]) - - """ - reader = WSIReader.open(img) - if isinstance(reader, VirtualWSIReader): - logger.warning( - "Image is not pyramidal hence read is forced to be " - "at `units='baseline'` and `resolution=1.0`.", - stacklevel=2, - ) - resolution = 1.0 - units = "baseline" - - canvas_shape = reader.slide_dimensions(resolution=resolution, units=units) - canvas_shape = canvas_shape[::-1] # XY to YX - - # may crash here, do we need to deal with this ? 
- output_shape = reader.slide_dimensions( - resolution=output["resolution"], - units=output["units"], - ) - output_shape = output_shape[::-1] # XY to YX - fx = np.array(canvas_shape) / np.array(output_shape) - - if "probabilities" not in output: - coordinates = output["coordinates"] - predictions = output["predictions"] - denominator = None - output = np.zeros(list(canvas_shape), dtype=np.float32) - else: - coordinates = output["coordinates"] - predictions = output["probabilities"] - num_class = np.array(predictions[0]).shape[0] - denominator = np.zeros(canvas_shape) - output = np.zeros([*list(canvas_shape), num_class], dtype=np.float32) - - for idx, bound in enumerate(coordinates): - prediction = predictions[idx] - # assumed to be in XY - # top-left for output placement - tl = np.ceil(np.array(bound[:2]) * fx).astype(np.int32) - # bot-right for output placement - br = np.ceil(np.array(bound[2:]) * fx).astype(np.int32) - output[tl[1] : br[1], tl[0] : br[0]] += prediction - if denominator is not None: - denominator[tl[1] : br[1], tl[0] : br[0]] += 1 - - # deal with overlapping regions - if denominator is not None: - output = output / (np.expand_dims(denominator, -1) + 1.0e-8) - if not return_raw: - # convert raw probabilities to predictions - if postproc_func is not None: - output = postproc_func(output) - else: - output = np.argmax(output, axis=-1) - # to make sure background is 0 while class will be 1...N - output[denominator > 0] += 1 - return output - - def _predict_engine( - self: PatchPredictor, - dataset: torch.utils.data.Dataset, - device: str = "cpu", - *, - return_probabilities: bool = False, - return_labels: bool = False, - return_coordinates: bool = False, - ) -> np.ndarray: - """Make a prediction on a dataset. The dataset may be mutated. - - Args: - dataset (torch.utils.data.Dataset): - PyTorch dataset object created using - `tiatoolbox.models.data.classification.Patch_Dataset`. - return_probabilities (bool): - Whether to return per-class probabilities. - return_labels (bool): - Whether to return labels. - return_coordinates (bool): - Whether to return patch coordinates. + model (str | ModelABC): + A PyTorch model instance or name of a pretrained model from TIAToolbox. + If a string is provided, the corresponding pretrained + weights will be downloaded unless overridden via `weights`. + batch_size (int): + Number of image patches processed per forward pass. Default is 8. + num_workers (int): + Number of workers for data loading. Default is 0. + weights (str | Path | None): Path to model weights. + If None, default weights are used. device (str): - :class:`torch.device` to run the model. - Select the device to run the model. Please see - https://pytorch.org/docs/stable/tensor_attributes.html#torch.device - for more details on input parameters for device. Default value is "cpu". - - Returns: - :class:`numpy.ndarray`: - Model predictions of the input dataset + device to run the model on (e.g., "cpu", "cuda"). Default is "cpu". + verbose (bool): + Whether to enable verbose logging. Default is True. 
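+
+        Example:
+            >>> # Minimal sketch: initialise with a toolbox pretrained model.
+            >>> predictor = PatchPredictor(
+            ...     model="resnet18-kather100k",
+            ...     batch_size=16,
+            ... )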
""" - dataset.preproc_func = self.model.preproc_func - - # preprocessing must be defined with the dataset - dataloader = torch.utils.data.DataLoader( - dataset, - num_workers=self.num_loader_worker, - batch_size=self.batch_size, - drop_last=False, - shuffle=False, + super().__init__( + model=model, + batch_size=batch_size, + num_workers=num_workers, + weights=weights, + device=device, + verbose=verbose, ) - if self.verbose: - pbar = tqdm.tqdm( - total=len(dataloader), - leave=True, - ncols=80, - ascii=True, - position=0, - ) - - # use external for testing - model = model_to(model=self.model, device=device) - - cum_output = { - "probabilities": [], - "predictions": [], - "coordinates": [], - "labels": [], - } - for _, batch_data in enumerate(dataloader): - batch_output_probabilities = self.model.infer_batch( - model, - batch_data["image"], - device=device, - ) - # We get the index of the class with the maximum probability - batch_output_predictions = self.model.postproc_func( - batch_output_probabilities, - ) - - # tolist might be very expensive - cum_output["probabilities"].extend(batch_output_probabilities.tolist()) - cum_output["predictions"].extend(batch_output_predictions.tolist()) - if return_coordinates: - cum_output["coordinates"].extend(batch_data["coords"].tolist()) - if return_labels: # be careful of `s` - # We do not use tolist here because label may be of mixed types - # and hence collated as list by torch - cum_output["labels"].extend(list(batch_data["label"])) - - if self.verbose: - pbar.update() - if self.verbose: - pbar.close() - - if not return_probabilities: - cum_output.pop("probabilities") - if not return_labels: - cum_output.pop("labels") - if not return_coordinates: - cum_output.pop("coordinates") - - return cum_output - - def _update_ioconfig( + def post_process_patches( self: PatchPredictor, - ioconfig: IOPatchPredictorConfig, - patch_input_shape: IntPair, - stride_shape: IntPair, - resolution: Resolution, - units: Units, - ) -> IOPatchPredictorConfig: - """Updates the ioconfig. + raw_predictions: da.Array, + prediction_shape: tuple[int, ...], + prediction_dtype: type, + **kwargs: Unpack[PredictorRunParams], + ) -> da.Array: + """Post-process raw patch predictions from model inference. - Args: - ioconfig (IOPatchPredictorConfig): - Input ioconfig for PatchPredictor. - patch_input_shape (IntPair): - Size of patches input to the model. Patches are at - requested read resolution, not with respect to level 0, - and must be positive. - stride_shape (IntPair): - Stride using during tile and WSI processing. Stride is - at requested read resolution, not with respect to - level 0, and must be positive. If not provided, - `stride_shape=patch_input_shape`. - resolution (Resolution): - Resolution used for reading the image. Please see - :obj:`WSIReader` for details. - units (Units): - Units of resolution used for reading the image. - - Returns: - IOPatchPredictorConfig: - Updated Patch Predictor IO configuration. - - """ - config_flag = ( - patch_input_shape is None, - resolution is None, - units is None, - ) - if ioconfig: - return ioconfig - - if self.ioconfig is None and any(config_flag): - msg = ( - "Must provide either " - "`ioconfig` or `patch_input_shape`, `resolution`, and `units`." - ) - raise ValueError( - msg, - ) - - if stride_shape is None: - stride_shape = patch_input_shape - - if self.ioconfig: - ioconfig = copy.deepcopy(self.ioconfig) - # ! 
not sure if there is a nicer way to set this - if patch_input_shape is not None: - ioconfig.patch_input_shape = patch_input_shape - if stride_shape is not None: - ioconfig.stride_shape = stride_shape - if resolution is not None: - ioconfig.input_resolutions[0]["resolution"] = resolution - if units is not None: - ioconfig.input_resolutions[0]["units"] = units - - return ioconfig - - return IOPatchPredictorConfig( - input_resolutions=[{"resolution": resolution, "units": units}], - patch_input_shape=patch_input_shape, - stride_shape=stride_shape, - ) - - @staticmethod - def _prepare_save_dir(save_dir: str | Path, imgs: list | np.ndarray) -> Path: - """Create directory if not defined and number of images is more than 1. + This method applies the model's post-processing function to the raw predictions + obtained from `infer_patches()`. The output is wrapped in a Dask array for + efficient computation and memory handling. Args: - save_dir (str or Path): - Path to output directory. - imgs (list, ndarray): - List of inputs to process. + raw_predictions (da.Array | np.ndarray): + Raw model predictions. + prediction_shape (tuple[int, ...]): + Expected shape of the prediction output. + prediction_dtype (type): + Data type of the prediction output. + **kwargs (PredictorRunParams): + Additional runtime parameters, including `return_probabilities`. Returns: - :class:`Path`: - Path to output directory. + dask.array.Array: Post-processed predictions as a Dask array. """ - if save_dir is None and len(imgs) > 1: - logger.warning( - "More than 1 WSIs detected but there is no save directory set." - "All subsequent output will be saved to current runtime" - "location under folder 'output'. Overwriting may happen!", - stacklevel=2, - ) - save_dir = Path.cwd() / "output" - elif save_dir is not None and len(imgs) > 1: - logger.warning( - "When providing multiple whole-slide images / tiles, " - "we save the outputs and return the locations " - "to the corresponding files.", - stacklevel=2, - ) - - if save_dir is not None: - save_dir = Path(save_dir) - save_dir.mkdir(parents=True, exist_ok=False) - - return save_dir - - def _predict_patch( + _ = kwargs.get("return_probabilities") + _ = prediction_shape + _ = prediction_dtype + raw_predictions = self.model.postproc_func(raw_predictions) + return cast_to_min_dtype(raw_predictions) + + def post_process_wsi( self: PatchPredictor, - imgs: list | np.ndarray, - labels: list, - device: str = "cpu", - *, - return_probabilities: bool, - return_labels: bool, - ) -> np.ndarray: - """Process patch mode. + raw_predictions: da.Array, + prediction_shape: tuple[int, ...], + prediction_dtype: type, + **kwargs: Unpack[PredictorRunParams], + ) -> da.Array: + """Post-process predictions from whole slide image (WSI) inference. + + This method refines the raw patch-level predictions obtained from WSI inference. + It typically applies spatial smoothing or other contextual operations using + neighboring patch information. Internally, it delegates to + `post_process_patches()`. Args: - imgs (list, ndarray): - List of inputs to process. when using `patch` mode, the - input must be either a list of images, a list of image - file paths or a numpy array of an image list. When using - `tile` or `wsi` mode, the input must be a list of file - paths. - labels (list): - List of labels. If using `tile` or `wsi` mode, then only - a single label per image tile or whole-slide image is - supported. - return_probabilities (bool): - Whether to return per-class probabilities. 
- return_labels (bool): - Whether to return the labels with the predictions. - device (str): - :class:`torch.device` to run the model. - Select the device to run the model. Please see - https://pytorch.org/docs/stable/tensor_attributes.html#torch.device - for more details on input parameters for device. Default value is "cpu". + raw_predictions (dask.array.Array): + Raw model predictions. + prediction_shape (tuple[int, ...]): + Expected shape of the prediction output. + prediction_dtype (type): + Data type of the prediction output. + **kwargs (PredictorRunParams): + Additional runtime parameters, including `return_probabilities`. Returns: - :class:`numpy.ndarray`: - Model predictions of the input dataset + dask.array.Array: Post-processed predictions as a Dask array. """ - if labels: - # if a labels is provided, then return with the prediction - return_labels = bool(labels) - - if labels and len(labels) != len(imgs): - msg = f"len(labels) != len(imgs) : {len(labels)} != {len(imgs)}" - raise ValueError( - msg, - ) - - # don't return coordinates if patches are already extracted - return_coordinates = False - dataset = PatchDataset(imgs, labels) - return self._predict_engine( - dataset, - return_probabilities=return_probabilities, - return_labels=return_labels, - return_coordinates=return_coordinates, - device=device, + return self.post_process_patches( + raw_predictions=raw_predictions, + prediction_shape=prediction_shape, + prediction_dtype=prediction_dtype, + **kwargs, ) - def _predict_tile_wsi( # noqa: PLR0913 + def _update_run_params( self: PatchPredictor, - imgs: list, - masks: list | None, - labels: list, - mode: str, - ioconfig: IOPatchPredictorConfig, - save_dir: str | Path, - highest_input_resolution: list[dict], - device: str = "cpu", + images: list[os.PathLike | Path | WSIReader] | np.ndarray, + masks: list[os.PathLike | Path] | np.ndarray | None = None, + labels: list | None = None, + save_dir: os.PathLike | Path | None = None, + ioconfig: ModelIOConfigABC | None = None, + output_type: str = "dict", *, - save_output: bool, - return_probabilities: bool, - merge_predictions: bool, - ) -> list | dict: - """Predict on Tile and WSIs. + overwrite: bool = False, + patch_mode: bool, + **kwargs: Unpack[PredictorRunParams], + ) -> Path | None: + """Update runtime parameters for the PatchPredictor engine. - Args: - imgs (list, ndarray): - List of inputs to process. when using `patch` mode, the - input must be either a list of images, a list of image - file paths or a numpy array of an image list. When using - `tile` or `wsi` mode, the input must be a list of file - paths. - masks (list): - List of masks. Only utilised when processing image tiles - and whole-slide images. Patches are only processed if - they are within a masked area. If not provided, then a - tissue mask will be automatically generated for - whole-slide images or the entire image is processed for - image tiles. - labels (list): - List of labels. If using `tile` or `wsi` mode, then only - a single label per image tile or whole-slide image is - supported. - mode (str): - Type of input to process. Choose from either `patch`, - `tile` or `wsi`. - return_probabilities (bool): - Whether to return per-class probabilities. - device (str): - :class:`torch.device` to run the model. - Select the device to run the model. Please see - https://pytorch.org/docs/stable/tensor_attributes.html#torch.device - for more details on input parameters for device. Default value is "cpu". 
- ioconfig (IOPatchPredictorConfig): - Patch Predictor IO configuration.. - merge_predictions (bool): - Whether to merge the predictions to form a 2-dimensional - map. This is only applicable for `mode='wsi'` or - `mode='tile'`. - save_dir (str or pathlib.Path): - Output directory when processing multiple tiles and - whole-slide images. By default, it is folder `output` - where the running script is invoked. - save_output (bool): - Whether to save output for a single file. default=False - highest_input_resolution (list(dict)): - Highest available input resolution. + This method sets internal attributes such as caching, batch size, + IO configuration, and output format based on user input and keyword arguments. + It also configures whether to include probabilities in the output. + Args: + images (list[PathLike | WSIReader] | np.ndarray): + Input images or patches. + masks (list[PathLike] | np.ndarray | None): + Optional masks for WSI processing. + labels (list | None): + Optional labels for input images. + save_dir (PathLike | None): + Directory to save output files. Required for WSI mode. + ioconfig (ModelIOConfigABC | None): + IO configuration for patch extraction and resolution. + output_type (str): + Desired output format: "dict", "zarr", or "annotationstore". + overwrite (bool): + Whether to overwrite existing output files. Default is False. + patch_mode (bool): + Whether to treat input as patches (`True`) or WSIs (`False`). + **kwargs (PredictorRunParams): + Additional runtime parameters. Returns: - dict: - Results are saved to `save_dir` and a dictionary indicating save - location for each input is returned. The dict is in the following - format: - - img_path: path of the input image. - - raw: path to save location for raw prediction, - saved in .json. - - merged: path to .npy contain merged - predictions if - `merge_predictions` is `True`. + Path | None: + Path to the save directory if applicable, otherwise None. 
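+
+        Example:
+            A minimal sketch of the probability handling implemented below:
+            when `return_probabilities` is not requested, "probabilities" is
+            appended to `self.drop_keys` so that it is excluded from the final
+            output. The pretrained alias "alexnet-kather100k" is used here as
+            an illustration only.
+
+            >>> predictor = PatchPredictor(model="alexnet-kather100k")
+            >>> _ = predictor._update_run_params(
+            ...     images=np.zeros((4, 224, 224, 3), dtype=np.uint8),
+            ...     patch_mode=True,
+            ...     return_probabilities=False,
+            ... )
+            >>> "probabilities" in predictor.drop_keys
+            True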
""" - # return coordinates of patches processed within a tile / whole-slide image - return_coordinates = True - - input_is_path_like = isinstance(imgs[0], (str, Path)) - default_save_dir = ( - imgs[0].parent / "output" if input_is_path_like else Path.cwd() + return_probabilities = kwargs.get("return_probabilities") + if not return_probabilities: + self.drop_keys.append("probabilities") + return super()._update_run_params( + images=images, + masks=masks, + labels=labels, + save_dir=save_dir, + ioconfig=ioconfig, + overwrite=overwrite, + patch_mode=patch_mode, + output_type=output_type, + **kwargs, ) - save_dir = default_save_dir if save_dir is None else Path(save_dir) - - # None if no output - outputs = None - - self._ioconfig = ioconfig - # generate a list of output file paths if number of input images > 1 - file_dict = OrderedDict() - - if len(imgs) > 1: - save_output = True - - for idx, img_path in enumerate(imgs): - img_path_ = Path(img_path) - img_label = None if labels is None else labels[idx] - img_mask = None if masks is None else masks[idx] - - dataset = WSIPatchDataset( - img_path_, - mode=mode, - mask_path=img_mask, - patch_input_shape=ioconfig.patch_input_shape, - stride_shape=ioconfig.stride_shape, - resolution=ioconfig.input_resolutions[0]["resolution"], - units=ioconfig.input_resolutions[0]["units"], - ) - output_model = self._predict_engine( - dataset, - return_labels=False, - return_probabilities=return_probabilities, - return_coordinates=return_coordinates, - device=device, - ) - output_model["label"] = img_label - # add extra information useful for downstream analysis - output_model["pretrained_model"] = self.pretrained_model - output_model["resolution"] = highest_input_resolution["resolution"] - output_model["units"] = highest_input_resolution["units"] - - outputs = [output_model] # assign to a list - merged_prediction = None - if merge_predictions: - merged_prediction = self.merge_predictions( - img_path_, - output_model, - resolution=output_model["resolution"], - units=output_model["units"], - postproc_func=self.model.postproc, - ) - outputs.append(merged_prediction) - - if save_output: - # dynamic 0 padding - img_code = f"{idx:0{len(str(len(imgs)))}d}" - - save_info = {} - save_path = save_dir / img_code - raw_save_path = f"{save_path}.raw.json" - save_info["raw"] = raw_save_path - save_as_json(output_model, raw_save_path) - if merge_predictions: - merged_file_path = f"{save_path}.merged.npy" - np.save(merged_file_path, merged_prediction) - save_info["merged"] = merged_file_path - file_dict[str(img_path_)] = save_info - - return file_dict if save_output else outputs - - def predict( # noqa: PLR0913 + + def run( self: PatchPredictor, - imgs: list, - masks: list | None = None, + images: list[os.PathLike | Path | WSIReader] | np.ndarray, + masks: list[os.PathLike | Path] | np.ndarray | None = None, labels: list | None = None, - mode: str = "patch", - ioconfig: IOPatchPredictorConfig | None = None, - patch_input_shape: tuple[int, int] | None = None, - stride_shape: tuple[int, int] | None = None, - resolution: Resolution | None = None, - units: Units = None, - device: str = "cpu", + ioconfig: ModelIOConfigABC | None = None, *, - return_probabilities: bool = False, - return_labels: bool = False, - merge_predictions: bool = False, - save_dir: str | Path | None = None, - save_output: bool = False, - ) -> np.ndarray | list | dict: - """Make a prediction for a list of input data. 
+ patch_mode: bool = True, + save_dir: os.PathLike | Path | None = None, + overwrite: bool = False, + output_type: str = "dict", + **kwargs: Unpack[PredictorRunParams], + ) -> AnnotationStore | Path | str | dict: + """Run the PatchPredictor engine on input images. + + This method orchestrates the full inference pipeline, including preprocessing, + model inference, post-processing, and saving results. It supports both patch + and whole slide image (WSI) modes. Args: - imgs (list, ndarray): - List of inputs to process. when using `patch` mode, the + images (list[PathLike | WSIReader] | np.ndarray): + Input images or patches. When using `patch` mode, the input must be either a list of images, a list of image - file paths or a numpy array of an image list. When using - `tile` or `wsi` mode, the input must be a list of file - paths. - masks (list): - List of masks. Only utilised when processing image tiles - and whole-slide images. Patches are only processed if - they are within a masked area. If not provided, then a - tissue mask will be automatically generated for - whole-slide images or the entire image is processed for - image tiles. - labels: - List of labels. If using `tile` or `wsi` mode, then only - a single label per image tile or whole-slide image is - supported. - mode (str): - Type of input to process. Choose from either `patch`, - `tile` or `wsi`. - return_probabilities (bool): - Whether to return per-class probabilities. - return_labels (bool): - Whether to return the labels with the predictions. - device (str): - :class:`torch.device` to run the model. - Select the device to run the model. Please see - https://pytorch.org/docs/stable/tensor_attributes.html#torch.device - for more details on input parameters for device. Default value is "cpu". - ioconfig (IOPatchPredictorConfig): - Patch Predictor IO configuration. - patch_input_shape (tuple): - Size of patches input to the model. Patches are at - requested read resolution, not with respect to level 0, - and must be positive. - stride_shape (tuple): - Stride using during tile and WSI processing. Stride is - at requested read resolution, not with respect to - level 0, and must be positive. If not provided, - `stride_shape=patch_input_shape`. - resolution (Resolution): - Resolution used for reading the image. Please see - :obj:`WSIReader` for details. - units (Units): - Units of resolution used for reading the image. Choose - from either `level`, `power` or `mpp`. Please see - :obj:`WSIReader` for details. - merge_predictions (bool): - Whether to merge the predictions to form a 2-dimensional - map. This is only applicable for `mode='wsi'` or - `mode='tile'`. - save_dir (str or pathlib.Path): - Output directory when processing multiple tiles and - whole-slide images. By default, it is folder `output` - where the running script is invoked. - save_output (bool): - Whether to save output for a single file. default=False + file paths or a numpy array of an image list. + masks (list[PathLike] | np.ndarray | None): + Optional masks for WSI processing. + Only utilised when patch_mode is False. + Patches are only generated within a masked area. + If not provided, then a tissue mask will be automatically + generated for whole slide images. + labels (list | None): + Optional labels for input images. + Only a single label per image is supported. + ioconfig (ModelIOConfigABC | None): + IO configuration for patch extraction and resolution. + patch_mode (bool): + Whether to treat input as patches (`True`) or WSIs (`False`). 
+            save_dir (PathLike | None):
+                Directory to save output files. Required for WSI mode.
+            overwrite (bool):
+                Whether to overwrite existing output files. Default is False.
+            output_type (str):
+                Desired output format: "dict", "zarr", or "annotationstore".
+                Default value is "dict".
+            **kwargs (PredictorRunParams):
+                Additional runtime parameters.

         Returns:
-            (:class:`numpy.ndarray` or list or dict):
-                Model predictions of the input dataset. If multiple
-                image tiles or whole-slide images are provided as input,
-                or save_output is True, then results are saved to
-                `save_dir` and a dictionary indicating save location for
-                each input is returned.
-
-                The dict has the following format:
-
-                - img_path: path of the input image.
-                - raw: path to save location for raw prediction,
-                  saved in .json.
-                - merged: path to .npy contain merged
-                  predictions if `merge_predictions` is `True`.
+            AnnotationStore | Path | str | dict:
+                - If `patch_mode` is True: returns predictions or path to saved output.
+                - If `patch_mode` is False: returns a dictionary mapping each WSI to
+                  its output path.

         Examples:
             >>> wsis = ['wsi1.svs', 'wsi2.svs']
-            >>> predictor = PatchPredictor(
-            ...     pretrained_model="resnet18-kather100k")
-            >>> output = predictor.predict(wsis, mode="wsi")
+            >>> image_patches = [np.ndarray, np.ndarray]
+            >>> predictor = PatchPredictor(model="resnet18-kather100k")
+            >>> output = predictor.run(image_patches, patch_mode=True)
+            >>> type(output)
+            ... <class 'dict'>
+            >>> output = predictor.run(
+            >>>     image_patches,
+            >>>     patch_mode=True,
+            >>>     output_type="zarr")
+            >>> output
+            ... "/path/to/Output.zarr"
+            >>> output = predictor.run(wsis, patch_mode=False)
             >>> output.keys()
             ... ['wsi1.svs', 'wsi2.svs']
             >>> output['wsi1.svs']
-            ... {'raw': '0.raw.json', 'merged': '0.merged.npy'}
-            >>> output['wsi2.svs']
-            ... {'raw': '1.raw.json', 'merged': '1.merged.npy'}
+            ... '/path/to/wsi1.db'

         """
-        if mode not in ["patch", "wsi", "tile"]:
-            msg = f"{mode} is not a valid mode. Use either `patch`, `tile` or `wsi`"
-            raise ValueError(
-                msg,
-            )
-        if mode == "patch":
-            return self._predict_patch(
-                imgs,
-                labels,
-                return_probabilities=return_probabilities,
-                return_labels=return_labels,
-                device=device,
-            )
-
-        if not isinstance(imgs, list):
-            msg = "Input to `tile` and `wsi` mode must be a list of file paths."
-            raise TypeError(
-                msg,
-            )
-
-        if mode == "wsi" and masks is not None and len(masks) != len(imgs):
-            msg = f"len(masks) != len(imgs) : {len(masks)} != {len(imgs)}"
-            raise ValueError(
-                msg,
-            )
-
-        ioconfig = self._update_ioconfig(
-            ioconfig,
-            patch_input_shape,
-            stride_shape,
-            resolution,
-            units,
-        )
-        if mode == "tile":
-            logger.warning(
-                "WSIPatchDataset only reads image tile at "
-                '`units="baseline"`. 
Resolutions will be converted ' - "to baseline value.", - stacklevel=2, - ) - ioconfig = ioconfig.to_baseline() - - fx_list = ioconfig.scale_to_highest( - ioconfig.input_resolutions, - ioconfig.input_resolutions[0]["units"], - ) - fx_list = zip(fx_list, ioconfig.input_resolutions, strict=False) - fx_list = sorted(fx_list, key=lambda x: x[0]) - highest_input_resolution = fx_list[0][1] - - save_dir = self._prepare_save_dir(save_dir, imgs) - - return self._predict_tile_wsi( - imgs=imgs, + return super().run( + images=images, masks=masks, labels=labels, - mode=mode, - return_probabilities=return_probabilities, - device=device, ioconfig=ioconfig, - merge_predictions=merge_predictions, + patch_mode=patch_mode, save_dir=save_dir, - save_output=save_output, - highest_input_resolution=highest_input_resolution, + overwrite=overwrite, + output_type=output_type, + **kwargs, ) diff --git a/tiatoolbox/models/engine/semantic_segmentor.py b/tiatoolbox/models/engine/semantic_segmentor.py index b222d0266..a33bcf028 100644 --- a/tiatoolbox/models/engine/semantic_segmentor.py +++ b/tiatoolbox/models/engine/semantic_segmentor.py @@ -1,1692 +1,1247 @@ -"""This module implements semantic segmentation.""" +"""Semantic Segmentation Engine for Whole Slide Images (WSIs) using TIAToolbox. + +This module defines the `SemanticSegmentor` class, which extends the `PatchPredictor` +engine to support semantic segmentation workflows on digital pathology images. +It leverages deep learning models from TIAToolbox to perform patch-level and +WSI-level inference, and includes utilities for preprocessing, postprocessing, +and saving predictions in various formats. + +Key Components: +--------------- +Classes: +- SemanticSegmentorRunParams: + Configuration parameters for controlling runtime behavior during segmentation. +- SemanticSegmentor: + Core engine for performing semantic segmentation on image patches or WSIs. + +Functions: +- concatenate_none: + Concatenate arrays while gracefully handling None values. +- merge_horizontal: + Incrementally merge horizontal patches and update location arrays. +- save_to_cache: + Save intermediate canvas and count arrays to Zarr cache. +- merge_vertical_chunkwise: + Merge vertically chunked canvas and count arrays into a probability map. +- store_probabilities: + Store computed probability data in Zarr or Dask arrays. +- prepare_full_batch: + Align patch-level predictions with global output locations. + +Example: +>>> from tiatoolbox.models.engine.semantic_segmentor import SemanticSegmentor +>>> segmentor = SemanticSegmentor(model="fcn_resnet50_unet-bcss") +>>> wsis = ["slide1.svs", "slide2.svs"] +>>> output = segmentor.run(wsis, patch_mode=False) +>>> +>>> patches = [np.ndarray, np.ndarray] +>>> segmentor = SemanticSegmentor(model="fcn_resnet50_unet-bcss") +>>> output = segmentor.run(patches, patch_mode=True, output_type="dict") + +Notes: +------ +- Supports both patch-based and WSI-based segmentation. +- Compatible with TIAToolbox pretrained models and custom PyTorch models. +- Outputs can be saved as dictionaries, Zarr arrays, or AnnotationStore databases. +- Includes memory-aware caching and efficient merging strategies for large-scale + inference. 
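+- The `memory_threshold` run parameter (a percentage, default 80) controls when
+  intermediate canvas and count arrays are spilled to an on-disk Zarr cache.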
+ +""" from __future__ import annotations -import copy -import logging -import shutil -from concurrent.futures import ProcessPoolExecutor +import gc from pathlib import Path from typing import TYPE_CHECKING -import cv2 -import joblib +import dask.array as da import numpy as np +import psutil import torch -import torch.distributed as dist -import torch.multiprocessing as torch_mp -import torch.utils.data as torch_data -import tqdm - -from tiatoolbox import logger, rcParam -from tiatoolbox.models.architecture import get_pretrained_model -from tiatoolbox.models.architecture.utils import ( - compile_model, - is_torch_compile_compatible, +import zarr +from dask import compute +from typing_extensions import Unpack + +from tiatoolbox import logger +from tiatoolbox.models.dataset.dataset_abc import WSIPatchDataset +from tiatoolbox.utils.misc import ( + dict_to_store_semantic_segmentor, + get_tqdm, ) -from tiatoolbox.models.models_abc import IOConfigABC, model_to -from tiatoolbox.tools.patchextraction import PatchExtractor -from tiatoolbox.utils import imread -from tiatoolbox.wsicore.wsireader import VirtualWSIReader, WSIMeta, WSIReader +from tiatoolbox.wsicore.wsireader import is_zarr + +from .patch_predictor import PatchPredictor, PredictorRunParams if TYPE_CHECKING: # pragma: no cover - from collections.abc import Callable - from multiprocessing.managers import Namespace + import os - from tiatoolbox.type_hints import IntPair, Resolution, Units + from torch.utils.data import DataLoader + from tiatoolbox.annotation import AnnotationStore + from tiatoolbox.models.engine.io_config import IOSegmentorConfig + from tiatoolbox.models.models_abc import ModelABC + from tiatoolbox.type_hints import Resolution + from tiatoolbox.wsicore import WSIReader -def _estimate_canvas_parameters( - sample_prediction: np.ndarray, - canvas_shape: np.ndarray, -) -> tuple[tuple, tuple, bool]: - """Estimates canvas parameters. - Args: - sample_prediction (:class:`numpy.ndarray`): - Patch prediction assuming to be of shape HWC. - canvas_shape (:class:`numpy.ndarray`): - HW of the supposed assembled image. +class SemanticSegmentorRunParams(PredictorRunParams, total=False): + """Runtime parameters for configuring the `SemanticSegmentor.run()` method. - Returns: - (tuple, tuple, bool): - Canvas Shape, Canvas Count and whether to add singleton dimension. + This class extends `PredictorRunParams`, which itself extends `EngineABCRunParams`, + and adds parameters specific to semantic segmentation workflows. 
- """ - if len(sample_prediction.shape) == 3: # noqa: PLR2004 - num_output_ch = sample_prediction.shape[-1] - canvas_cum_shape_ = tuple(map(int, (*tuple(canvas_shape), num_output_ch))) - canvas_count_shape_ = tuple(map(int, (*tuple(canvas_shape), 1))) - add_singleton_dim = num_output_ch == 1 - else: - canvas_cum_shape_ = tuple(map(int, (*tuple(canvas_shape), 1))) - canvas_count_shape_ = tuple(map(int, (*tuple(canvas_shape), 1))) - add_singleton_dim = True - - return canvas_cum_shape_, canvas_count_shape_, add_singleton_dim - - -def _prepare_save_output( - save_path: str | Path, - cache_count_path: str | Path, - canvas_cum_shape_: tuple[int, ...], - canvas_count_shape_: tuple[int, ...], -) -> tuple: - """Prepares for saving the cached output.""" - if save_path is not None: - save_path = Path(save_path) - cache_count_path = Path(cache_count_path) - if Path.exists(save_path) and Path.exists(cache_count_path): - cum_canvas = np.load(str(save_path), mmap_mode="r+") - count_canvas = np.load(str(cache_count_path), mmap_mode="r+") - if canvas_cum_shape_ != cum_canvas.shape: - msg = "Existing image shape in `save_path` does not match." - raise ValueError(msg) - if canvas_count_shape_ != count_canvas.shape: - msg = "Existing image shape in `cache_count_path` does not match." - raise ValueError( - msg, - ) - else: - cum_canvas = np.lib.format.open_memmap( - save_path, - mode="w+", - shape=canvas_cum_shape_, - dtype=np.float32, - ) - # assuming no more than 255 overlapping times - count_canvas = np.lib.format.open_memmap( - cache_count_path, - mode="w+", - shape=canvas_count_shape_, - dtype=np.uint8, - ) - # flush fill - count_canvas[:] = 0 - is_on_drive = True - else: - is_on_drive = False - cum_canvas = np.zeros( - shape=canvas_cum_shape_, - dtype=np.float32, - ) - # for pixel occurrence counting - count_canvas = np.zeros(canvas_count_shape_, dtype=np.float32) - - return is_on_drive, count_canvas, cum_canvas + Attributes: + auto_get_mask (bool): + Whether to automatically generate segmentation masks using + `wsireader.tissue_mask()` during processing. + batch_size (int): + Number of image patches to feed to the model in a forward pass. + class_dict (dict): + Optional dictionary mapping classification outputs to class names. + device (str): + Device to run the model on (e.g., "cpu", "cuda"). + input_resolutions (list[dict]): + Resolution used for reading the image. See `WSIReader` for details. + ioconfig (ModelIOConfigABC): + Input/output configuration for patch extraction and resolution. + memory_threshold (int): + Memory usage threshold (in percentage) to trigger caching behavior. + num_workers (int): + Number of workers used in DataLoader. + output_file (str): + Output file name for saving results (e.g., .zarr or .db). + output_resolutions (Resolution): + Resolution used for writing output predictions. + patch_input_shape (tuple[int, int]): + Shape of input patches (height, width). + patch_output_shape (tuple[int, int]): + Shape of output patches (height, width). + return_labels (bool): + Whether to return labels with predictions. + return_probabilities (bool): + Whether to return per-class probabilities. + scale_factor (tuple[float, float]): + Scale factor for converting annotations to baseline resolution. + Typically model_mpp / slide_mpp. + stride_shape (tuple[int, int]): + Stride used during WSI processing. Defaults to patch_input_shape. + verbose (bool): + Whether to output logging information. 
+    """

-class IOSegmentorConfig(IOConfigABC):
-    """Contain semantic segmentor input and output information.
+    patch_output_shape: tuple[int, int]
+    output_resolutions: Resolution
+
+
+class SemanticSegmentor(PatchPredictor):
+    r"""Semantic segmentation engine for digital histology images.
+
+    This class extends `PatchPredictor` to support semantic segmentation tasks
+    using pretrained or custom models from TIAToolbox. It supports both patch-level
+    and whole slide image (WSI) processing, and provides utilities for merging,
+    post-processing, and saving predictions.
+
+    Performance:
+        The TIAToolbox model `fcn_resnet50_unet-bcss` achieves the following
+        results on the BCSS dataset:
+
+        .. list-table:: Semantic segmentation performance on the BCSS dataset
+           :widths: 15 15 15 15 15 15 15
+           :header-rows: 1
+
+           * -
+             - Tumour
+             - Stroma
+             - Inflammatory
+             - Necrosis
+             - Other
+             - All
+           * - Amgad et al.
+             - 0.851
+             - 0.800
+             - 0.712
+             - 0.723
+             - 0.666
+             - 0.750
+           * - TIAToolbox
+             - 0.885
+             - 0.825
+             - 0.761
+             - 0.765
+             - 0.581
+             - 0.763

     Args:
-        input_resolutions (list):
-            Resolution of each input head of model inference, must be in
-            the same order as `target model.forward()`.
-        output_resolutions (list):
-            Resolution of each output head from model inference, must be
-            in the same order as target model.infer_batch().
-        patch_input_shape (:class:`numpy.ndarray`, list(int)):
-            Shape of the largest input in (height, width).
-        patch_output_shape (:class:`numpy.ndarray`, list(int)):
-            Shape of the largest output in (height, width).
-        save_resolution (dict):
-            Resolution to save all output.
+        model (str | ModelABC):
+            A PyTorch model instance or name of a pretrained model from TIAToolbox.
+            The user can request pretrained models from the toolbox model zoo;
+            the list of pretrained models is available in the TIAToolbox
+            documentation. By default, the corresponding pretrained weights
+            will also be downloaded. However, you can override with your own
+            set of weights using the `weights` parameter.
+        batch_size (int):
+            Number of image patches processed per forward pass. Default is 8.
+        num_workers (int):
+            Number of workers for data loading. Default is 0.
+        weights (str | Path | None):
+            Path to model weights. If None, default weights are used.
+
+            >>> engine = SemanticSegmentor(
+            ...    model="pretrained-model",
+            ...    weights="/path/to/pretrained-local-weights.pth"
+            ... )
+
+        device (str):
+            Device to run the model on (e.g., "cpu", "cuda"). Default is "cpu".
+        verbose (bool):
+            Whether to enable verbose logging. Default is True.

-    Examples:
-        >>> # Defining io for a network having 1 input and 1 output at the
-        >>> # same resolution
-        >>> ioconfig = IOSegmentorConfig(
-        ...     input_resolutions=[{"units": "baseline", "resolution": 1.0}],
-        ...     output_resolutions=[{"units": "baseline", "resolution": 1.0}],
-        ...     patch_input_shape=[2048, 2048],
-        ...     patch_output_shape=[1024, 1024],
-        ...     stride_shape=[512, 512],
-        ... )
+    Attributes:
+        images (list[str | Path] | np.ndarray):
+            Input image patches or WSI paths.
+        masks (list[str | Path] | np.ndarray):
+            Optional tissue masks for WSI processing.
+            These are only utilized when patch_mode is False.
+            If not provided, then a tissue mask will be automatically
+            generated for whole slide images.
+        patch_mode (bool):
+            Whether input is treated as patches (`True`) or WSIs (`False`).
+        model (ModelABC):
+            Loaded PyTorch model.
+        ioconfig (ModelIOConfigABC):
+            IO configuration for patch extraction and resolution.
+        return_labels (bool):
+            Whether to include labels in the output.
+        input_resolutions (list[dict]):
+            Resolution settings for model input. Supported
+            units are `level`, `power` and `mpp`. Keys should be "units" and
+            "resolution" e.g., [{"units": "mpp", "resolution": 0.25}]. Please see
+            :class:`WSIReader` for details.
+        patch_input_shape (tuple[int, int]):
+            Shape of input patches (height, width). Patches are at
+            requested read resolution, not with respect to level 0,
+            and must be positive.
+        stride_shape (tuple[int, int]):
+            Stride used during patch extraction. Stride is
+            at requested read resolution, not with respect to
+            level 0, and must be positive. If not provided,
+            `stride_shape=patch_input_shape`.
+        labels (list | None):
+            Optional labels for input images.
+            Only a single label per image is supported.
+        drop_keys (list):
+            Keys to exclude from model output.
+        output_type (str):
+            Format of output ("dict", "zarr", "annotationstore").
+        output_locations (list | None):
+            Coordinates of output patches used during WSI processing.

     Examples:
-        >>> # Defining io for a network having 3 input and 2 output
-        >>> # at the same resolution, the output is then merged at a
-        >>> # different resolution.
-        >>> ioconfig = IOSegmentorConfig(
-        ...     input_resolutions=[
-        ...         {"units": "mpp", "resolution": 0.25},
-        ...         {"units": "mpp", "resolution": 0.50},
-        ...         {"units": "mpp", "resolution": 0.75},
-        ...     ],
-        ...     output_resolutions=[
-        ...         {"units": "mpp", "resolution": 0.25},
-        ...         {"units": "mpp", "resolution": 0.50},
-        ...     ],
-        ...     patch_input_shape=[2048, 2048],
-        ...     patch_output_shape=[1024, 1024],
-        ...     stride_shape=[512, 512],
-        ...     save_resolution={"units": "mpp", "resolution": 4.0},
-        ... )
+        >>> # list of 2 WSI files as input
+        >>> wsis = ['path/img.svs', 'path/img.svs']
+        >>> segmentor = SemanticSegmentor(model="fcn-tissue_mask")
+        >>> output = segmentor.run(wsis, patch_mode=False)
+
+        >>> # list of 2 image patches as input
+        >>> image_patches = [np.ndarray, np.ndarray]
+        >>> segmentor = SemanticSegmentor(model="fcn-tissue_mask")
+        >>> output = segmentor.run(image_patches, patch_mode=True)
+
+        >>> # list of 2 image patch files as input
+        >>> data = ['path/img.png', 'path/img.png']
+        >>> segmentor = SemanticSegmentor(model="fcn-tissue_mask")
+        >>> output = segmentor.run(data, patch_mode=True)
+
+        >>> # list of 2 image tile files as input
+        >>> tile_file = ['path/tile1.png', 'path/tile2.png']
+        >>> segmentor = SemanticSegmentor(model="fcn-tissue_mask")
+        >>> output = segmentor.run(tile_file, patch_mode=False)
+
+        >>> # list of 2 wsi files as input
+        >>> wsis = ['path/wsi1.svs', 'path/wsi2.svs']
+        >>> segmentor = SemanticSegmentor(model="fcn_resnet50_unet-bcss")
+        >>> output = segmentor.run(wsis, patch_mode=False)
+
+    References:
+        [1] Amgad M, Elfandy H, ..., Gutman DA, Cooper LAD. Structured crowdsourcing
+        enables convolutional segmentation of histology images. Bioinformatics 2019.
+        doi: 10.1093/bioinformatics/btz083

     """

-    # We pre-define to follow enforcement, actual initialisation in init
-    input_resolutions = None
-    output_resolutions = None

     def __init__(
-        self: IOSegmentorConfig,
-        input_resolutions: list[dict],
-        output_resolutions: list[dict],
-        patch_input_shape: IntPair,
-        patch_output_shape: IntPair,
-        save_resolution: dict | None = None,
-        **kwargs: dict,
+        self: SemanticSegmentor,
+        model: str | ModelABC,
+        batch_size: int = 8,
+        num_workers: int = 0,
+        weights: str | Path | None = None,
+        *,
+        device: str = "cpu",
+        verbose: bool = True,
     ) -> None:
-        """Initialize :class:`IOSegmentorConfig`."""
-        self._kwargs = kwargs
-        self.patch_input_shape = patch_input_shape
-        self.patch_output_shape = patch_output_shape
-        self.stride_shape = None
-        self.input_resolutions = input_resolutions
-        self.output_resolutions = output_resolutions
-
-        self.resolution_unit = input_resolutions[0]["units"]
-        self.save_resolution = save_resolution
-
-        for variable, value in kwargs.items():
-            self.__setattr__(variable, value)
-
-        self._validate()
-
-        if self.resolution_unit == "mpp":
-            self.highest_input_resolution = min(
-                self.input_resolutions,
-                key=lambda x: x["resolution"],
-            )
-        else:
-            self.highest_input_resolution = max(
-                self.input_resolutions,
-                key=lambda x: x["resolution"],
-            )
+        """Initialize :class:`SemanticSegmentor`.

-    def _validate(self: IOSegmentorConfig) -> None:
-        """Validate the data format."""
-        resolutions = self.input_resolutions + self.output_resolutions
-        units = [v["units"] for v in resolutions]
-        units = np.unique(units)
-        if len(units) != 1 or units[0] not in [
-            "power",
-            "baseline",
-            "mpp",
-        ]:
-            msg = f"Invalid resolution units `{units[0]}`."
-            raise ValueError(msg)
+        Args:
+            model (str | ModelABC):
+                A PyTorch model instance or name of a pretrained model from TIAToolbox.
+                If a string is provided, the corresponding pretrained weights will be
+                downloaded unless overridden via `weights`.
+            batch_size (int):
+                Number of image patches processed per forward pass. Default is 8.
+            num_workers (int):
+                Number of workers for data loading. Default is 0.
+            weights (str | Path | None):
+                Path to model weights. If None, default weights are used.
+            device (str):
+                Device to run the model on (e.g., "cpu", "cuda"). Default is "cpu".
+            verbose (bool):
+                Whether to enable verbose logging. Default is True.

-    @staticmethod
-    def scale_to_highest(resolutions: list[dict], units: Units) -> np.ndarray:
-        """Get the scaling factor from input resolutions.
+        """
+        super().__init__(
+            model=model,
+            batch_size=batch_size,
+            num_workers=num_workers,
+            weights=weights,
+            device=device,
+            verbose=verbose,
+        )
+        self.output_locations: list | None = None
+
+    def get_dataloader(
+        self: SemanticSegmentor,
+        images: str | Path | list[str | Path] | np.ndarray,
+        masks: Path | None = None,
+        labels: list | None = None,
+        ioconfig: IOSegmentorConfig | None = None,
+        *,
+        patch_mode: bool = True,
+        auto_get_mask: bool = True,
+    ) -> torch.utils.data.DataLoader:
+        """Pre-process images and masks and return a DataLoader for inference.

-        This will convert resolutions to a scaling factor with respect to
-        the highest resolution found in the input resolutions list.
+        This method prepares the dataset and returns a PyTorch DataLoader
+        for either patch-based or WSI-based semantic segmentation. It overrides
+        the base method to support additional WSI-specific logic, including
+        patch output shape and output location tracking.
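+
+        For example (a sketch; assumes a constructed `segmentor` and an
+        :class:`IOSegmentorConfig` named `ioconfig` with `patch_input_shape`,
+        `patch_output_shape` and `stride_shape` populated):
+
+        >>> loader = segmentor.get_dataloader(
+        ...     images="path/wsi1.svs",
+        ...     ioconfig=ioconfig,
+        ...     patch_mode=False,
+        ...     auto_get_mask=True,
+        ... )
+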
         Args:
-            resolutions (list):
-                A list of resolutions where one is defined as
-                `{'resolution': value, 'unit': value}`
-            units (Units):
-                Units that the resolutions are at.
+            images (str | Path | list[str | Path] | np.ndarray):
+                Input images. Can be a list of file paths or a NumPy array
+                of image patches in NHWC format.
+            masks (Path | None):
+                Optional tissue masks for WSI processing. Only used when
+                `patch_mode` is False.
+            labels (list | None):
+                Optional labels for input images. Only one label per image is supported.
+            ioconfig (IOSegmentorConfig | None):
+                IO configuration for patch extraction and resolution.
+            patch_mode (bool):
+                Whether to treat input as patches (`True`) or WSIs (`False`).
+            auto_get_mask (bool):
+                Whether to automatically generate a tissue mask using
+                `wsireader.tissue_mask()` when `patch_mode` is False.
+                If `True`, only tissue regions are processed. If `False`,
+                all patches are processed. Default is `True`.

         Returns:
-            :class:`numpy.ndarray`:
-                A 1D array of scaling factors having the same length as
-                `resolutions`
+            torch.utils.data.DataLoader:
+                A PyTorch DataLoader configured for semantic segmentation inference.

         """
-        old_val = [v["resolution"] for v in resolutions]
-        if units not in ["baseline", "mpp", "power"]:
-            msg = (
-                f"Unknown units `{units}`. "
-                f"Units should be one of 'baseline', 'mpp' or 'power'."
-            )
-            raise ValueError(
-                msg,
-            )
+        # Overwrite when patch_mode is False.
+        if not patch_mode:
+            dataset = WSIPatchDataset(
+                input_img=images,
+                mask_path=masks,
+                patch_input_shape=ioconfig.patch_input_shape,
+                patch_output_shape=ioconfig.patch_output_shape,
+                stride_shape=ioconfig.stride_shape,
+                resolution=ioconfig.input_resolutions[0]["resolution"],
+                units=ioconfig.input_resolutions[0]["units"],
+                auto_get_mask=auto_get_mask,
+            )
-        if units == "baseline":
-            return old_val
-        if units == "mpp":
-            return np.min(old_val) / np.array(old_val)
-        return np.array(old_val) / np.max(old_val)

-    def to_baseline(self: IOSegmentorConfig) -> IOSegmentorConfig:
-        """Return a new config object converted to baseline form.
+            dataset.preproc_func = self.model.preproc_func
+            self.output_locations = dataset.outputs

-        This will return a new :class:`IOSegmentorConfig` where
-        resolutions have been converted to baseline format with the
-        highest possible resolution found in both input and output as
-        reference.
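+            # `self.output_locations` (the dataset's output patch placements)
+            # is consumed later by `infer_wsi` to merge patch predictions back
+            # into slide space.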
+ # preprocessing must be defined with the dataset + return torch.utils.data.DataLoader( + dataset, + num_workers=self.num_workers, + batch_size=self.batch_size, + drop_last=False, + shuffle=False, + ) - """ - resolutions = self.input_resolutions + self.output_resolutions - if self.save_resolution is not None: - resolutions.append(self.save_resolution) - - scale_factors = self.scale_to_highest(resolutions, self.resolution_unit) - num_input_resolutions = len(self.input_resolutions) - num_output_resolutions = len(self.output_resolutions) - - end_idx = num_input_resolutions - input_resolutions = [ - {"units": "baseline", "resolution": v} for v in scale_factors[:end_idx] - ] - end_idx = num_input_resolutions + num_output_resolutions - output_resolutions = [ - {"units": "baseline", "resolution": v} - for v in scale_factors[num_input_resolutions:end_idx] - ] - - save_resolution = None - if self.save_resolution is not None: - save_resolution = {"units": "baseline", "resolution": scale_factors[-1]} - return IOSegmentorConfig( - input_resolutions=input_resolutions, - output_resolutions=output_resolutions, - patch_input_shape=self.patch_input_shape, - patch_output_shape=self.patch_output_shape, - save_resolution=save_resolution, - **self._kwargs, + return super().get_dataloader( + images=images, + masks=masks, + labels=labels, + ioconfig=ioconfig, + patch_mode=patch_mode, ) + def infer_wsi( + self: SemanticSegmentor, + dataloader: DataLoader, + save_path: Path, + **kwargs: Unpack[SemanticSegmentorRunParams], + ) -> dict[str, da.Array]: + """Perform model inference on a whole slide image (WSI). -class WSIStreamDataset(torch_data.Dataset): - """Reading a wsi in parallel mode with persistent workers. + This method processes a WSI using the provided DataLoader, merges + patch-level predictions into a full-resolution canvas, and returns + the aggregated output. It supports memory-aware caching and optional + inclusion of coordinates and labels. - To speed up the inference process for multiple WSIs. The - `torch.utils.data.Dataloader` is set to run in persistent mode. - Normally, this will prevent workers from altering their initial - states (such as provided input etc.). To sidestep this, we use a - shared parallel workspace context manager to send data and signal - from the main thread, thus allowing each worker to load a new wsi as - well as corresponding patch information. + Args: + dataloader (DataLoader): + PyTorch DataLoader configured for WSI processing. + save_path (Path): + Path to save the intermediate output. The intermediate output + is saved in a Zarr file. + **kwargs (SemanticSegmentorRunParams): + Additional runtime parameters, including: + - return_probabilities (bool): Whether to return probability maps. + - return_labels (bool): Whether to include labels in the output. + - memory_threshold (int): Memory usage threshold to trigger disk + caching. - Args: - mp_shared_space (:class:`Namespace`): - A shared multiprocessing space, must be from - `torch.multiprocessing`. - ioconfig (:class:`IOSegmentorConfig`): - An object which contains I/O placement for patches. - wsi_paths (list): List of paths pointing to a WSI or tiles. - preproc (Callable): - Pre-processing function to be applied to a patch. - mode (str): - Either `"wsi"` or `"tile"` to indicate the format of images - in `wsi_paths`. + Returns: + dict[str, dask.array.Array]: + Dictionary containing merged prediction results: + - "probabilities": Full-resolution probability map. + - "coordinates": Patch coordinates. 
+ - "labels": Ground truth labels (if `return_labels` is True). - Examples: - >>> ioconfig = IOSegmentorConfig( - ... input_resolutions=[{"units": "baseline", "resolution": 1.0}], - ... output_resolutions=[{"units": "baseline", "resolution": 1.0}], - ... patch_input_shape=[2048, 2048], - ... patch_output_shape=[1024, 1024], - ... stride_shape=[512, 512], - ... ) - >>> mp_manager = torch_mp.Manager() - >>> mp_shared_space = mp_manager.Namespace() - >>> mp_shared_space.signal = 1 # adding variable to the shared space - >>> wsi_paths = ['A.svs', 'B.svs'] - >>> wsi_dataset = WSIStreamDataset(ioconfig, wsi_paths, mp_shared_space) + """ + # Default Memory threshold percentage is 80. + memory_threshold = kwargs.get("memory_threshold", 80) + vm = psutil.virtual_memory() - """ + keys = ["probabilities", "coordinates"] + coordinates = [] - def __init__( - self: WSIStreamDataset, - ioconfig: IOSegmentorConfig, - wsi_paths: list[str | Path], - mp_shared_space: Namespace, - preproc: Callable[[np.ndarray], np.ndarray] | None = None, - mode: str = "wsi", - ) -> None: - """Initialize :class:`WSIStreamDataset`.""" - super().__init__() - self.mode = mode - self.preproc = preproc - self.ioconfig = copy.deepcopy(ioconfig) - - if mode == "tile": - logger.warning( - "WSIPatchDataset only reads image tile at " - '`units="baseline"`. Resolutions will be converted ' - "to baseline value.", - stacklevel=2, - ) - self.ioconfig = self.ioconfig.to_baseline() - - self.mp_shared_space = mp_shared_space - self.wsi_paths = wsi_paths - self.wsi_idx = None # to be received externally via thread communication - self.reader = None - - def _get_reader(self: WSIStreamDataset, img_path: str | Path) -> WSIReader: - """Get appropriate reader for input path.""" - img_path = Path(img_path) - if self.mode == "wsi": - return WSIReader.open(img_path) - img = imread(img_path) - # initialise metadata for VirtualWSIReader. - # here, we simulate a whole-slide image, but with a single level. - metadata = WSIMeta( - mpp=np.array([1.0, 1.0]), - objective_power=10, - axes="YXS", - slide_dimensions=np.array(img.shape[:2][::-1]), - level_downsamples=[1.0], - level_dimensions=[np.array(img.shape[:2][::-1])], + # Main output dictionary + raw_predictions = dict( + zip(keys, [da.empty(shape=(0, 0))] * len(keys), strict=False) ) - return VirtualWSIReader( - img, - info=metadata, + + # Inference loop + tqdm = get_tqdm() + tqdm_loop = ( + tqdm(dataloader, leave=False, desc="Inferring patches") + if self.verbose + else dataloader ) - def __len__(self: WSIStreamDataset) -> int: - """Return the length of the instance attributes.""" - return len(self.mp_shared_space.patch_inputs) + canvas_np, output_locs_y_ = None, None + canvas, count, output_locs = None, None, None + canvas_zarr, count_zarr = None, None + + full_output_locs = ( + dataloader.dataset.full_outputs + if hasattr(dataloader.dataset, "full_outputs") + else dataloader.dataset.outputs + ) - @staticmethod - def collate_fn(batch: list | np.ndarray) -> torch.Tensor: - """Prototype to handle reading exception. + for batch_idx, batch_data in enumerate(tqdm_loop): + batch_output = self.model.infer_batch( + self.model, + batch_data["image"], + device=self.device, + ) - This will exclude any sample with `None` from the batch. As - such, wrapping `__getitem__` with try-catch and return `None` - upon exceptions will prevent crashing the entire program. But as - a side effect, the batch may not have the size as defined. 
+ batch_locs = batch_data["output_locs"].numpy() - """ - batch = [v for v in batch if v is not None] - return torch.utils.data.dataloader.default_collate(batch) - - def __getitem__(self: WSIStreamDataset, idx: int) -> tuple: - """Get an item from the dataset.""" - # ! no need to lock as we do not modify source value in shared space - if self.wsi_idx != self.mp_shared_space.wsi_idx: - self.wsi_idx = int(self.mp_shared_space.wsi_idx.item()) - self.reader = self._get_reader(self.wsi_paths[self.wsi_idx]) - - # this is in XY and at requested resolution (not baseline) - bounds = self.mp_shared_space.patch_inputs[idx] - bounds = bounds.numpy() # expected to be a torch.Tensor - - # be the same as bounds br-tl, unless bounds are of float - patch_data_ = [] - scale_factors = self.ioconfig.scale_to_highest( - self.ioconfig.input_resolutions, - self.ioconfig.resolution_unit, - ) - for idy, resolution in enumerate(self.ioconfig.input_resolutions): - resolution_bounds = np.round(bounds * scale_factors[idy]) - patch_data = self.reader.read_bounds( - resolution_bounds.astype(np.int32), - coord_space="resolution", - pad_constant_values=0, # expose this ? - **resolution, + # Interpolate outputs for masked regions + full_batch_output, full_output_locs, output_locs = prepare_full_batch( + batch_output, + batch_locs, + full_output_locs, + output_locs, + is_last=(batch_idx == (len(dataloader) - 1)), ) - if self.preproc is not None: - patch_data = patch_data.copy() - patch_data = self.preproc(patch_data) - patch_data_.append(patch_data) - if len(patch_data_) == 1: - patch_data_ = patch_data_[0] - - bound = self.mp_shared_space.patch_outputs[idx] - return patch_data_, bound - - -class SemanticSegmentor: - """Pixel-wise segmentation predictor. - - The tiatoolbox model should produce the following results on the BCSS dataset - using fcn_resnet50_unet-bcss. - - .. list-table:: Semantic segmentation performance on the BCSS dataset - :widths: 15 15 15 15 15 15 15 - :header-rows: 1 - - * - - - Tumour - - Stroma - - Inflammatory - - Necrosis - - Other - - All - * - Amgad et al. - - 0.851 - - 0.800 - - 0.712 - - 0.723 - - 0.666 - - 0.750 - * - TIAToolbox - - 0.885 - - 0.825 - - 0.761 - - 0.765 - - 0.581 - - 0.763 - - Note, if `model` is supplied in the arguments, it will ignore the - `pretrained_model` and `pretrained_weights` arguments. + canvas_np = concatenate_none(old_arr=canvas_np, new_arr=full_batch_output) + + # Determine if dataloader is moved to next row of patches + change_indices = np.where(np.diff(output_locs[:, 1]) != 0)[0] + 1 + + # If a row of patches has been processed. + if change_indices.size > 0: + canvas, count, canvas_np, output_locs, output_locs_y_ = ( + merge_horizontal( + canvas, + count, + output_locs_y_, + canvas_np, + output_locs, + change_indices, + ) + ) - Args: - model (nn.Module): - Use externally defined PyTorch model for prediction with - weights already loaded. Default is `None`. If provided, - `pretrained_model` argument is ignored. - pretrained_model (str): - Name of the existing models support by tiatoolbox for - processing the data. For a full list of pretrained models, - refer to the `docs - `_. - By default, the corresponding pretrained weights will also - be downloaded. However, you can override with your own set - of weights via the `pretrained_weights` argument. Argument - is case-insensitive. - pretrained_weights (str): - Path to the weight of the corresponding `pretrained_model`. - batch_size (int): - Number of images fed into the model each time. 
-        num_loader_workers (int):
-            Number of workers to load the data. Take note that they will
-            also perform preprocessing.
-        num_postproc_workers (int):
-            This value is there to maintain input compatibility with
-            `tiatoolbox.models.classification` and is not used.
-        verbose (bool):
-            Whether to output logging information.
-        dataset_class (obj):
-            Dataset class to be used instead of default.
-        auto_generate_mask (bool):
-            To automatically generate tile/WSI tissue mask if is not
-            provided.
+                # Refresh memory statistics so the check reflects current usage.
+                vm = psutil.virtual_memory()
+                used_percent = vm.percent
+                canvas_used_percent = (canvas.nbytes / vm.free) * 100
+                if (
+                    used_percent > memory_threshold
+                    or canvas_used_percent > memory_threshold
+                ):
+                    tqdm_loop.desc = "Spill intermediate data to disk"
+                    used_percent = (
+                        canvas_used_percent
+                        if (canvas_used_percent > memory_threshold)
+                        else used_percent
+                    )
+                    msg = (
+                        f"Current memory usage: {used_percent} % "
+                        f"exceeds specified threshold: {memory_threshold}. "
+                        f"Saving intermediate results to disk."
+                    )
+                    tqdm.write(msg)
+                    # Flush in-memory data and clear the dask graph
+                    canvas_zarr, count_zarr = save_to_cache(
+                        canvas,
+                        count,
+                        canvas_zarr,
+                        count_zarr,
+                        save_path=save_path,
+                    )
+                    canvas, count = None, None
+                    gc.collect()
+                    tqdm_loop.desc = "Inferring patches"
+
+            coordinates.append(
+                da.from_array(
+                    self._get_coordinates(batch_data),
+                )
+            )

-    Attributes:
-        process_prediction_per_batch (bool):
-            A flag to denote whether post-processing for inference
-            output is applied after each batch or after finishing an entire
-            tile or WSI.
+        canvas, count, _, _, output_locs_y_ = merge_horizontal(
+            canvas,
+            count,
+            output_locs_y_,
+            canvas_np,
+            output_locs,
+            change_indices=[len(output_locs)],
+        )

-    Examples:
-        >>> # Sample output of a network
-        >>> wsis = ['A/wsi.svs', 'B/wsi.svs']
-        >>> predictor = SemanticSegmentor(model='fcn-tissue_mask')
-        >>> output = predictor.predict(wsis, mode='wsi')
-        >>> list(output.keys())
-        [('A/wsi.svs', 'output/0.raw') , ('B/wsi.svs', 'output/1.raw')]
-        >>> # if a network have 2 output heads, each head output of 'A/wsi.svs'
-        >>> # will be respectively stored in 'output/0.raw.0', 'output/0.raw.1'
+        zarr_group = None
+        if canvas_zarr is not None:
+            canvas_zarr, count_zarr = save_to_cache(
+                canvas, count, canvas_zarr, count_zarr
+            )
+            # Wrap zarr in dask array
+            canvas = da.from_zarr(canvas_zarr, chunks=canvas_zarr.chunks)
+            count = da.from_zarr(count_zarr, chunks=count_zarr.chunks)
+            zarr_group = zarr.open(canvas_zarr.store.path, mode="a")
+
+        # Final vertical merge
+        raw_predictions["probabilities"] = merge_vertical_chunkwise(
+            canvas,
+            count,
+            output_locs_y_,
+            zarr_group,
+            save_path,
+            memory_threshold,
+        )
+        raw_predictions["coordinates"] = da.concatenate(coordinates, axis=0)

-    """
+        return raw_predictions

-    def __init__(
+    def save_predictions(
         self: SemanticSegmentor,
-        batch_size: int = 8,
-        num_loader_workers: int = 0,
-        num_postproc_workers: int = 0,
-        model: torch.nn.Module | None = None,
-        pretrained_model: str | None = None,
-        pretrained_weights: str | None = None,
-        dataset_class: Callable = WSIStreamDataset,
-        *,
-        verbose: bool = True,
-        auto_generate_mask: bool = False,
-    ) -> None:
-        """Initialize :class:`SemanticSegmentor`."""
-        super().__init__()
+        processed_predictions: dict,
+        output_type: str,
+        save_path: Path | None = None,
+        **kwargs: Unpack[SemanticSegmentorRunParams],
+    ) -> dict | AnnotationStore | Path:
+        """Save semantic segmentation predictions to disk or return them in memory.
- if model is None and pretrained_model is None: - msg = "Must provide either of `model` or `pretrained_model`" - raise ValueError(msg) + This method saves predictions in one of the supported formats: + - "dict": returns predictions as a Python dictionary. + - "zarr": saves predictions as a Zarr group and returns the path. + - "annotationstore": converts predictions to an AnnotationStore (.db file). - if model is not None: - self.model = model - # template ioconfig, usually coming from pretrained - self.ioconfig = None - else: - model, ioconfig = get_pretrained_model(pretrained_model, pretrained_weights) - self.ioconfig = ioconfig - self.model = model - - # local variables for flagging mode within class, - # subclass should have overwritten to alter some specific behavior - self.process_prediction_per_batch = True - - # for runtime, such as after wrapping with nn.DataParallel - self._cache_dir = None - self._loader = None - self._model = None - self._device = None - self._mp_shared_space = None - self._postproc_workers = None - self.num_postproc_workers = num_postproc_workers - self._futures = None - self._outputs = [] - self.imgs = None - self.masks = None - - self.dataset_class: WSIStreamDataset = dataset_class - self.model = compile_model( - model, - mode=rcParam["torch_compile_mode"], - ) - self.pretrained_model = pretrained_model - self.batch_size = batch_size - self.num_loader_workers = num_loader_workers - self.num_postproc_workers = None - self.verbose = verbose - self.auto_generate_mask = auto_generate_mask - - @staticmethod - def get_coordinates( - image_shape: tuple[int, int] | np.ndarray, - ioconfig: IOSegmentorConfig, - ) -> tuple[np.ndarray, np.ndarray]: - """Calculate patch tiling coordinates. - - By default, internally, it will call the - `PatchExtractor.get_coordinates`. To use your own approach, - either subclass to overwrite or directly assign your own - function to this name. In either cases, the function must obey - the API defined here. + If `patch_mode` is True, predictions are saved per image. If False, + predictions are merged and saved as a single output. Args: - image_shape (tuple(int), :class:`numpy.ndarray`): - This argument specifies the shape of mother image (the - image we want to extract patches from) at requested - `resolution` and `units` and it is expected to be in - (width, height) format. - ioconfig (:class:`IOSegmentorConfig`): - Object that contains information about input and output - placement of patches. Check `IOSegmentorConfig` for - details about available attributes. + processed_predictions (dict): + Dictionary containing processed model predictions. + output_type (str): + Desired output format: "dict", "zarr", or "annotationstore". + save_path (Path | None): + Path to save the output file. Required for "zarr" and "annotationstore". + **kwargs (SemanticSegmentorRunParams): + Additional runtime parameters including: + - scale_factor (tuple[float, float]): For coordinate transformation. + - class_dict (dict): Mapping of class indices to names. + - return_probabilities (bool): Whether to save probability maps. Returns: - tuple: - List of patch inputs and outputs - - - :py:obj:`list` - patch_inputs: - A list of corrdinates in `[start_x, start_y, end_x, - end_y]` format indicating the read location of the - patch in the mother image. + dict | AnnotationStore | Path: + - If output_type is "dict": returns predictions as a dictionary. + - If output_type is "zarr": returns path to saved Zarr file. 
+            - If output_type is "annotationstore": returns AnnotationStore
+              or path to .db file.

-            - :py:obj:`list` - patch_outputs:
-                A list of corrdinates in `[start_x, start_y, end_x,
-                end_y]` format indicating to write location of the
-                patch in the mother image.
+        """
+        # Conversion to annotationstore uses a different function for SemanticSegmentor
+        if output_type.lower() != "annotationstore":
+            return super().save_predictions(
+                processed_predictions, output_type, save_path=save_path, **kwargs
+            )

-        Examples:
-            >>> # API of function expected to overwrite `get_coordinates`
-            >>> def func(image_shape, ioconfig):
-            ...   patch_inputs = np.array([[0, 0, 256, 256]])
-            ...   patch_outputs = np.array([[0, 0, 256, 256]])
-            ...   return patch_inputs, patch_outputs
-            >>> segmentor = SemanticSegmentor(model='unet')
-            >>> segmentor.get_coordinates = func
+        return_probabilities = kwargs.get("return_probabilities", False)
+        output_type_ = (
+            "zarr"
+            if is_zarr(save_path.with_suffix(".zarr")) or return_probabilities
+            else "dict"
+        )

-        """
-        results = PatchExtractor.get_coordinates(
-            patch_output_shape=ioconfig.patch_output_shape,
-            image_shape=image_shape,
-            patch_input_shape=ioconfig.patch_input_shape,
-            stride_shape=ioconfig.stride_shape,
+        processed_predictions = super().save_predictions(
+            processed_predictions,
+            output_type=output_type_,
+            save_path=save_path.with_suffix(".zarr"),
+            **kwargs,
        )
-        return results[0], results[1]

-    @staticmethod
-    def filter_coordinates(
-        mask_reader: VirtualWSIReader,
-        bounds: np.ndarray,
-        resolution: Resolution | None = None,
-        units: Units | None = None,
-    ) -> np.ndarray:
-        """Indicates which coordinate is valid basing on the mask.
+        if isinstance(processed_predictions, Path):
+            processed_predictions = zarr.open(str(processed_predictions), mode="r")
+
+        # scale_factor set from kwargs
+        scale_factor = kwargs.get("scale_factor", (1.0, 1.0))
+        # class_dict set from kwargs
+        class_dict = kwargs.get("class_dict")
+
+        # Need to add support for zarr conversion.
+        save_paths = []
+
+        logger.info("Saving predictions as AnnotationStore.")
+        if self.patch_mode:
+            for i, predictions in enumerate(processed_predictions["predictions"]):
+                if isinstance(self.images[i], Path):
+                    output_path = save_path.parent / (self.images[i].stem + ".db")
+                else:
+                    output_path = save_path.parent / (str(i) + ".db")
+
+                out_file = dict_to_store_semantic_segmentor(
+                    patch_output={"predictions": predictions},
+                    scale_factor=scale_factor,
+                    class_dict=class_dict,
+                    save_path=output_path,
+                )

-        To use your own approaches, either subclass to overwrite or
-        directly assign your own function to this name. In either cases,
-        the function must obey the API defined here.
+                save_paths.append(out_file)
+        else:
+            out_file = dict_to_store_semantic_segmentor(
+                patch_output=processed_predictions,
+                scale_factor=scale_factor,
+                class_dict=class_dict,
+                save_path=save_path.with_suffix(".db"),
+            )
+            save_paths = out_file
+
+        if return_probabilities:
+            msg = (
+                "Probability maps cannot be saved as AnnotationStore. "
+                "To visualise heatmaps in the TIAToolbox Visualization tool, "
+                f"convert heatmaps in {save_path} to ome.tiff using "
+                "tiatoolbox.utils.misc.write_probability_heatmap_as_ome_tiff."
+            )
+            logger.info(msg)
+
+        return save_paths
+
+    def _update_run_params(
+        self: SemanticSegmentor,
+        images: list[os.PathLike | Path | WSIReader] | np.ndarray,
+        masks: list[os.PathLike | Path] | np.ndarray | None = None,
+        labels: list | None = None,
+        save_dir: os.PathLike | Path | None = None,
+        ioconfig: IOSegmentorConfig | None = None,
+        output_type: str = "dict",
+        *,
+        overwrite: bool = False,
+        patch_mode: bool,
+        **kwargs: Unpack[SemanticSegmentorRunParams],
+    ) -> Path | None:
+        """Update runtime parameters for the SemanticSegmentor engine.
+
+        This method sets internal attributes such as caching, batch size,
+        IO configuration, and output format based on user input and keyword arguments.
+        It also configures whether to include probabilities in the output.

        Args:
-            mask_reader (:class:`.VirtualReader`):
-                A virtual pyramidal reader of the mask related to the
-                WSI from which we want to extract the patches.
-            bounds (ndarray and np.int32):
-                Coordinates to be checked via the `func`. They must be
-                in the same resolution as requested `resolution` and
-                `units`. The shape of `coordinates` is (N, K) where N is
-                the number of coordinate sets and K is either 2 for
-                centroids or 4 for bounding boxes. When using the
-                default `func=None`, K should be 4, as we expect the
-                `coordinates` to be bounding boxes in `[start_x,
-                start_y, end_x, end_y]` format.
-            resolution (Resolution):
-                Resolution of the requested patch.
-            units (Units):
-                Units of the requested patch.
+            images (list[PathLike | WSIReader] | np.ndarray):
+                Input images or patches.
+            masks (list[PathLike] | np.ndarray | None):
+                Optional masks for WSI processing.
+            labels (list | None):
+                Optional labels for input images.
+            save_dir (PathLike | None):
+                Directory to save output files. Required for WSI mode.
+            ioconfig (IOSegmentorConfig | None):
+                IO configuration for patch extraction and resolution.
+            output_type (str):
+                Desired output format: "dict", "zarr", or "annotationstore".
+            overwrite (bool):
+                Whether to overwrite existing output files. Default is False.
+            patch_mode (bool):
+                Whether to treat input as patches (`True`) or WSIs (`False`).
+            **kwargs (SemanticSegmentorRunParams):
+                Additional runtime parameters.

        Returns:
-            :class:`numpy.ndarray`:
-                List of flags to indicate which coordinate is valid.
+            Path | None:
+                Path to the save directory if applicable, otherwise None.

-        Examples:
-            >>> # API of function expected to overwrite `filter_coordinates`
-            >>> def func(reader, bounds, resolution, units):
-            ...   # as example, only select first bound
-            ...   return np.array([1, 0])
-            >>> coords = [[0, 0, 256, 256], [128, 128, 384, 384]]
-            >>> segmentor = SemanticSegmentor(model='unet')
-            >>> segmentor.filter_coordinates = func
+        Raises:
+            ValueError:
+                If `return_labels` is requested when `patch_mode` is False.

        """
-        if not isinstance(mask_reader, VirtualWSIReader):
-            msg = "`mask_reader` should be VirtualWSIReader."
-            raise TypeError(msg)
-
-        if not isinstance(bounds, np.ndarray) or not np.issubdtype(
-            bounds.dtype,
-            np.integer,
-        ):
-            msg = "`coordinates` should be ndarray of integer type."
+        return_labels = kwargs.get("return_labels")
+
+        if return_labels and not patch_mode:
+            msg = "`return_labels` is not supported when `patch_mode` is False."
raise ValueError(msg) - mask_real_shape = mask_reader.img.shape[:2] - mask_resolution_shape = mask_reader.slide_dimensions( - resolution=resolution, - units=units, - )[::-1] - mask_real_shape = np.array(mask_real_shape) - mask_resolution_shape = np.array(mask_resolution_shape) - scale_factor = mask_real_shape / mask_resolution_shape - scale_factor = scale_factor[0] # what if ratio x != y - - def sel_func(coord: np.ndarray) -> bool: - """Accept coord as long as its box contains part of mask.""" - coord_in_real_mask = np.ceil(scale_factor * coord).astype(np.int32) - start_x, start_y, end_x, end_y = coord_in_real_mask - roi = mask_reader.img[start_y:end_y, start_x:end_x] - return np.sum(roi > 0) > 0 - - flags = [sel_func(bound) for bound in bounds] - return np.array(flags) - - @staticmethod - def get_reader( - img_path: str | Path, - mask_path: str | Path, - mode: str, - *, - auto_get_mask: bool, - ) -> tuple[WSIReader, WSIReader]: - """Define how to get reader for mask and source image.""" - img_path = Path(img_path) - reader = WSIReader.open(img_path) - - mask_reader = None - if mask_path is not None: - mask_path = Path(mask_path) - if not Path.is_file(mask_path): - msg = "`mask_path` must be a valid file path." - raise ValueError(msg) - mask = imread(mask_path) # assume to be gray - mask = cv2.cvtColor(mask, cv2.COLOR_RGB2GRAY) - mask = np.array(mask > 0, dtype=np.uint8) - - mask_reader = VirtualWSIReader(mask) - mask_reader.info = reader.info - elif auto_get_mask and mode == "wsi" and mask_path is None: - # if no mask provided and `wsi` mode, generate basic tissue - # mask on the fly - mask_reader = reader.tissue_mask(resolution=1.25, units="power") - mask_reader.info = reader.info - return reader, mask_reader - - def _predict_one_wsi( + return super()._update_run_params( + images=images, + masks=masks, + labels=labels, + save_dir=save_dir, + ioconfig=ioconfig, + overwrite=overwrite, + patch_mode=patch_mode, + output_type=output_type, + **kwargs, + ) + + def run( self: SemanticSegmentor, - wsi_idx: int, - ioconfig: IOSegmentorConfig, - save_path: str, - mode: str, - ) -> None: - """Make a prediction on tile/wsi. + images: list[os.PathLike | Path | WSIReader] | np.ndarray, + masks: list[os.PathLike | Path] | np.ndarray | None = None, + labels: list | None = None, + ioconfig: IOSegmentorConfig | None = None, + *, + patch_mode: bool = True, + save_dir: os.PathLike | Path | None = None, + overwrite: bool = False, + output_type: str = "dict", + **kwargs: Unpack[SemanticSegmentorRunParams], + ) -> AnnotationStore | Path | str | dict | list[Path]: + """Run the semantic segmentation engine on input images. + + This method orchestrates the full inference pipeline, including preprocessing, + model inference, post-processing, and saving results. It supports both + patch-level and whole slide image (WSI) modes. Args: - wsi_idx (int): - Index of the tile/wsi to be processed within `self`. - ioconfig (:class:`IOSegmentorConfig`): - Object which defines I/O placement during inference and - when assembling back to full tile/wsi. - save_path (str): - Location to save output prediction as well as possible - intermediate results. - mode (str): - Either `"tile"` or `"wsi"` to indicate run mode. + images (list[PathLike | WSIReader] | np.ndarray): + Input images or patches. Can be a list of file paths, WSIReader objects, + or a NumPy array of image patches. + masks (list[PathLike] | np.ndarray | None): + Optional masks for WSI processing. Only used when `patch_mode` is False. 
+            labels (list | None):
+                Optional labels for input images. Only one label per image is supported.
+            ioconfig (IOSegmentorConfig | None):
+                IO configuration for patch extraction and resolution.
+            patch_mode (bool):
+                Whether to treat input as patches (`True`) or WSIs (`False`). Default
+                is True.
+            save_dir (PathLike | None):
+                Directory to save output files. Required for WSI mode.
+            overwrite (bool):
+                Whether to overwrite existing output files. Default is False.
+            output_type (str):
+                Desired output format: "dict", "zarr", or "annotationstore". Default
+                is "dict".
+            **kwargs (SemanticSegmentorRunParams):
+                Additional runtime parameters to update engine attributes.
+
+        Returns:
+            AnnotationStore | Path | str | dict | list[Path]:
+                - If `patch_mode` is True: returns predictions or path to saved output.
+                - If `patch_mode` is False: returns a dictionary mapping each WSI
+                  to its output path.
+
+        Examples:
+            >>> wsis = ['wsi1.svs', 'wsi2.svs']
+            >>> image_patches = [np.zeros((224, 224, 3), dtype=np.uint8)] * 2
+            >>> segmentor = SemanticSegmentor(model="fcn-tissue_mask")
+            >>> output = segmentor.run(
+            ...     image_patches,
+            ...     patch_mode=True,
+            ...     output_type="annotationstore",
+            ... )
+            >>> output
+            ... "/path/to/Output.db"
+
+            >>> output = segmentor.run(
+            ...     image_patches,
+            ...     patch_mode=True,
+            ...     output_type="zarr"
+            ... )
+            >>> output
+            ... "/path/to/Output.zarr"
+
+            >>> output = segmentor.run(wsis, patch_mode=False, save_dir="output")
+            >>> output.keys()
+            ... ['wsi1.svs', 'wsi2.svs']
+            >>> output['wsi1.svs']
+            ... "/path/to/wsi1.db"

        """
-        cache_dir = self._cache_dir / str(wsi_idx)
-        cache_dir.mkdir(parents=True)
-
-        wsi_path = self.imgs[wsi_idx]
-        mask_path = None if self.masks is None else self.masks[wsi_idx]
-        wsi_reader, mask_reader = self.get_reader(
-            wsi_path,
-            mask_path,
-            mode,
-            auto_get_mask=self.auto_generate_mask,
+        return super().run(
+            images=images,
+            masks=masks,
+            labels=labels,
+            ioconfig=ioconfig,
+            patch_mode=patch_mode,
+            save_dir=save_dir,
+            overwrite=overwrite,
+            output_type=output_type,
+            **kwargs,
        )
-        # assume ioconfig has already been converted to `baseline` for `tile` mode
-        resolution = ioconfig.highest_input_resolution
-        wsi_proc_shape = wsi_reader.slide_dimensions(**resolution)
-
-        # * retrieve patch and tile placement
-        # this is in XY
-        (patch_inputs, patch_outputs) = self.get_coordinates(wsi_proc_shape, ioconfig)
-        if mask_reader is not None:
-            sel = self.filter_coordinates(mask_reader, patch_outputs, **resolution)
-            patch_outputs = patch_outputs[sel]
-            patch_inputs = patch_inputs[sel]
-
-        # modify the shared space so that we can update worker info
-        # without needing to re-create the worker. There should be no
-        # race-condition because only the following enumerate loop
-        # triggers the parallelism, and this portion is still in
-        # sequential execution order
-        patch_inputs = torch.from_numpy(patch_inputs).share_memory_()
-        patch_outputs = torch.from_numpy(patch_outputs).share_memory_()
-        self._mp_shared_space.patch_inputs = patch_inputs
-        self._mp_shared_space.patch_outputs = patch_outputs
-        self._mp_shared_space.wsi_idx = torch.Tensor([wsi_idx]).share_memory_()
-
-        pbar_desc = "Process Batch: "
-        pbar = tqdm.tqdm(
-            desc=pbar_desc,
-            leave=True,
-            total=len(self._loader),
-            ncols=80,
-            ascii=True,
-            position=0,
-        )
-        cum_output = []
-        for _, batch_data in enumerate(self._loader):
-            sample_datas, sample_infos = batch_data
-            batch_size = sample_infos.shape[0]
-            # ! depending on the protocol of the output within infer_batch
-            # ! this may change, how to enforce/document/expose this in a
-            # ! sensible way?
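Editor's note: since the new `run` method above delegates everything to the base engine, it may help to see how its outputs are consumed. A minimal usage sketch follows; the import path, the `wsi.svs` input and the `results` directory are illustrative assumptions, not part of this diff.

```python
# Hypothetical usage sketch for the new SemanticSegmentor.run API.
# The module path, slide file, and output directory are assumptions.
from tiatoolbox.annotation.storage import SQLiteStore
from tiatoolbox.models.engine.semantic_segmentor import SemanticSegmentor

segmentor = SemanticSegmentor(model="fcn-tissue_mask")

# WSI mode requires a save_dir; "annotationstore" yields one .db per slide.
output = segmentor.run(
    images=["wsi.svs"],            # assumed local slide
    patch_mode=False,
    save_dir="results",            # assumed writable directory
    output_type="annotationstore",
)

# Each .db file is an SQLite-backed AnnotationStore of merged regions.
store = SQLiteStore(output["wsi.svs"])
print(len(store))  # number of segmentation annotations
```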
- - # assume to return a list of L output, - # each of shape N x etc. (N=batch size) - sample_outputs = self.model.infer_batch( - self._model, - sample_datas, - device=self._device, - ) - # repackage so that it's an N list, each contains - # L x etc. output - sample_outputs = [np.split(v, batch_size, axis=0) for v in sample_outputs] - sample_outputs = list(zip(*sample_outputs, strict=False)) - - # tensor to numpy, costly? - sample_infos = sample_infos.numpy() - sample_infos = np.split(sample_infos, batch_size, axis=0) - - sample_outputs = list(zip(sample_infos, sample_outputs, strict=False)) - if self.process_prediction_per_batch: - self._process_predictions( - sample_outputs, - wsi_reader, - ioconfig, - save_path, - cache_dir, - ) - else: - cum_output.extend(sample_outputs) - pbar.update() - pbar.close() - - self._process_predictions( - cum_output, - wsi_reader, - ioconfig, - save_path, - cache_dir, - ) +def concatenate_none( + old_arr: np.ndarray | da.Array, + new_arr: np.ndarray | da.Array, +) -> np.ndarray | da.Array: + """Concatenate arrays, handling None values gracefully. - # clean up the cache directories - shutil.rmtree(cache_dir) + This utility function concatenates `new_arr` to `old_arr` along the first axis. + If `old_arr` is None, it returns `new_arr` directly. Supports both NumPy and Dask + arrays. - def _process_predictions( - self: SemanticSegmentor, - cum_batch_predictions: list, - wsi_reader: WSIReader, - ioconfig: IOSegmentorConfig, - save_path: str, - cache_dir: str, - ) -> None: - """Define how the aggregated predictions are processed. + Args: + old_arr (np.ndarray | da.Array): + Existing array to append to. Can be None. + new_arr (np.ndarray | da.Array): + New array to append. - This includes merging the prediction if necessary and also saving afterwards. - Note that items within `cum_batch_predictions` will be consumed during - the operation. + Returns: + np.ndarray | da.Array: + Concatenated array of the same type as `new_arr`. - Args: - cum_batch_predictions (list): - List of batch predictions. Each item within the list - should be of (location, patch_predictions). - wsi_reader (:class:`WSIReader`): - A reader for the image where the predictions come from. - ioconfig (:class:`IOSegmentorConfig`): - A configuration object contains input and output - information. - save_path (str): - Root path to save current WSI predictions. - cache_dir (str): - Root path to cache current WSI data. + """ + if isinstance(new_arr, np.ndarray): + return ( + new_arr if old_arr is None else np.concatenate((old_arr, new_arr), axis=0) + ) - """ - if len(cum_batch_predictions) == 0: - return - - # assume predictions is N, each item has L output element - locations, predictions = list(zip(*cum_batch_predictions, strict=False)) - # Nx4 (N x [tl_x, tl_y, br_x, br_y), denotes the location of - # output patch this can exceed the image bound at the requested - # resolution remove singleton due to split. - locations = np.array([v[0] for v in locations]) - for index, output_resolution in enumerate(ioconfig.output_resolutions): - # assume resolution index to be in the same order as L - merged_resolution = ioconfig.highest_input_resolution - merged_locations = locations - # ! 
location is w.r.t the highest resolution, hence still need conversion - if ioconfig.save_resolution is not None: - merged_resolution = ioconfig.save_resolution - output_shape = wsi_reader.slide_dimensions(**output_resolution) - merged_shape = wsi_reader.slide_dimensions(**merged_resolution) - fx = merged_shape[0] / output_shape[0] - merged_locations = np.ceil(locations * fx).astype(np.int64) - merged_shape = wsi_reader.slide_dimensions(**merged_resolution) - # 0 idx is to remove singleton without removing other axes singleton - to_merge_predictions = [v[index][0] for v in predictions] - sub_save_path = f"{save_path}.raw.{index}.npy" - sub_count_path = f"{cache_dir}/count.{index}.npy" - self.merge_prediction( - merged_shape[::-1], # XY to YX - to_merge_predictions, - merged_locations, - save_path=sub_save_path, - cache_count_path=sub_count_path, - ) + return new_arr if old_arr is None else da.concatenate([old_arr, new_arr], axis=0) - @staticmethod - def merge_prediction( - canvas_shape: tuple[int] | list[int] | np.ndarray, - predictions: list[np.ndarray], - locations: list | np.ndarray, - save_path: str | Path | None = None, - cache_count_path: str | Path | None = None, - ) -> np.ndarray: - """Merge patch-level predictions to form a 2-dimensional prediction map. - - When accumulating the raw prediction onto a same canvas (via - calling the function multiple times), `save_path` and - `cache_count_path` must be the same. If either of these two do - not exist, the function will create new files. However, if - `save_path` is `None`, the function will perform the - accumulation using CPU-RAM as storage. - Args: - canvas_shape (:class:`numpy.ndarray`): - HW of the supposed assembled image. - predictions (list): - List of :class:`np.ndarray`, each item is a patch prediction, - assuming to be of shape HWC. - locations (list): - List of :class:`np.ndarray`, each item is the location of the patch - at the same index within `predictions`. The location is - in the to be assembled canvas and of the form - `(top_left_x, top_left_y, bottom_right_x, - bottom_right_x)`. - save_path (str): - Location to save the assembled image. - cache_count_path (str): - Location to store the canvas for counting how many times - each pixel get overlapped when assembling. +def merge_batch_to_canvas( + blocks: np.ndarray, + output_locations: np.ndarray, + merged_shape: tuple[int, int, int], +) -> tuple[np.ndarray, np.ndarray]: + """Merge patch-level predictions into a single canvas. - Returns: - :class:`numpy.ndarray`: - An image contains merged data. + This function aggregates overlapping patch predictions into a unified + output canvas and maintains a count map to normalize overlapping regions. - Examples: - >>> SemanticSegmentor.merge_prediction( - ... canvas_shape=[4, 4], - ... predictions=[ - ... np.full((2, 2), 1), - ... np.full((2, 2), 2)], - ... locations=[ - ... [0, 0, 2, 2], - ... [2, 2, 4, 4]], - ... save_path=None, - ... ) - ... array([[1, 1, 0, 0], - ... [1, 1, 0, 0], - ... [0, 0, 2, 2], - ... [0, 0, 2, 2]]) + Args: + blocks (np.ndarray): + Array of predicted blocks with shape (N, H, W, C), where N is the + number of patches. + output_locations (np.ndarray): + Array of coordinates for each block in the format + [start_x, start_y, end_x, end_y] with shape (N, 4). + merged_shape (tuple[int, int, int]): + Shape of the final merged canvas (H, W, C). - """ - canvas_shape = np.array(canvas_shape) + Returns: + tuple[np.ndarray, np.ndarray]: + - canvas: Merged prediction map of shape (H, W, C). 
+            - count: Count map indicating how many times each pixel was updated,
+              shape (H, W, 1).

-        sample_prediction = predictions[0]
+    """
+    canvas = np.zeros(merged_shape, dtype=blocks.dtype)
+    count = np.zeros((*merged_shape[:2], 1), dtype=np.uint8)
+    for i, block in enumerate(blocks):
+        xs, ys, xe, ye = output_locations[i]
+        if not np.any(block):
+            continue
+        # To deal with edge cases
+        canvas[0 : ye - ys, xs:xe, :] += block[0 : ye - ys, 0 : xe - xs, :]
+        count[ys:ye, xs:xe, 0] += 1
+    return canvas, count
+
+
+def merge_horizontal(
+    canvas: None | da.Array,
+    count: None | da.Array,
+    output_locs_y_: np.ndarray,
+    canvas_np: np.ndarray,
+    output_locs: np.ndarray,
+    change_indices: np.ndarray | list[np.ndarray],
+) -> tuple[da.Array, da.Array, np.ndarray, np.ndarray, np.ndarray]:
+    """Merge horizontal patches incrementally for each row of patches.
+
+    This function processes segments of the NumPy patch arrays (`canvas_np` and
+    `output_locs`) based on `change_indices`, merging them horizontally and appending
+    the results to Dask arrays. It also updates the vertical output locations
+    (`output_locs_y_`) for downstream vertical merging.

-        if len(sample_prediction.shape) not in (2, 3):
-            msg = f"Prediction is no HW or HWC: {sample_prediction.shape}."
-            raise ValueError(msg)
+    Args:
+        canvas (None | da.Array):
+            Existing Dask array for canvas data, or None if uninitialized.
+        count (None | da.Array):
+            Existing Dask array for count data, or None if uninitialized.
+        output_locs_y_ (np.ndarray):
+            Array tracking vertical output locations for merged patches.
+        canvas_np (np.ndarray):
+            NumPy array of canvas patches to be merged.
+        output_locs (np.ndarray):
+            Array of output locations for each patch.
+        change_indices (np.ndarray | list[np.ndarray]):
+            Indices indicating where to flush and merge patches.

-        (
-            canvas_cum_shape_,
-            canvas_count_shape_,
-            add_singleton_dim,
-        ) = _estimate_canvas_parameters(sample_prediction, canvas_shape)
+    Returns:
+        tuple:
+            Updated canvas and count Dask arrays, along with the remaining
+            canvas_np, output_locs, and output_locs_y_ arrays after processing.

-        is_on_drive, count_canvas, cum_canvas = _prepare_save_output(
-            save_path,
-            cache_count_path,
-            canvas_cum_shape_,
-            canvas_count_shape_,
-        )
+    """
+    start_idx = 0
+    for c_idx in change_indices:
+        output_locs_ = output_locs[: c_idx - start_idx]
+        canvas_np_ = canvas_np[: c_idx - start_idx]

-        def index(arr: np.ndarray, tl: np.ndarray, br: np.ndarray) -> np.ndarray:
-            """Helper to shorten indexing."""
-            return arr[tl[0] : br[0], tl[1] : br[1]]
-
-        patch_infos = list(zip(locations, predictions, strict=False))
-        for _, patch_info in enumerate(patch_infos):
-            # position is assumed to be in XY coordinate
-            (bound_in_wsi, prediction) = patch_info
-            # convert to XY to YX, and in tl, br
-            tl_in_wsi = np.array(bound_in_wsi[:2][::-1])
-            br_in_wsi = np.array(bound_in_wsi[2:][::-1])
-            old_tl_in_wsi = tl_in_wsi.copy()
-
-            # need to do conversion
-            patch_shape_in_wsi = tuple(br_in_wsi - tl_in_wsi)
-            # conversion to make cv2 happy
-            prediction = prediction.astype(np.float32)
-            prediction = cv2.resize(prediction, patch_shape_in_wsi[::-1])
-            # ! cv2 resize will remove singleton !
- if add_singleton_dim: - prediction = prediction[..., None] - - sel = tl_in_wsi < 0 - tl_in_wsi[sel] = 0 - - if np.any(tl_in_wsi >= canvas_shape): - continue - - sel = br_in_wsi > canvas_shape - br_in_wsi[sel] = canvas_shape[sel] - - # re-calibrate the position in case patch passing the image bound - br_in_patch = br_in_wsi - old_tl_in_wsi - patch_actual_shape = br_in_wsi - tl_in_wsi - tl_in_patch = br_in_patch - patch_actual_shape - - # now cropping the prediction region - patch_pred = prediction[ - tl_in_patch[0] : br_in_patch[0], - tl_in_patch[1] : br_in_patch[1], - ] - - patch_count = np.ones(patch_pred.shape[:2])[..., None] - if not is_on_drive: - index(cum_canvas, tl_in_wsi, br_in_wsi)[:] += patch_pred - index(count_canvas, tl_in_wsi, br_in_wsi)[:] += patch_count - else: - old_avg_pred = np.array(index(cum_canvas, tl_in_wsi, br_in_wsi)) - old_count = np.array(index(count_canvas, tl_in_wsi, br_in_wsi)) - # ! there will be precision error, but we have to live with this - new_count = old_count + patch_count - # retrieve old raw probabilities after summation - old_raw_pred = old_avg_pred * old_count - new_avg_pred = (old_raw_pred + patch_pred) / new_count - index(cum_canvas, tl_in_wsi, br_in_wsi)[:] = new_avg_pred - index(count_canvas, tl_in_wsi, br_in_wsi)[:] = new_count - if not is_on_drive: - cum_canvas /= count_canvas + 1.0e-6 - return cum_canvas - - @staticmethod - def _prepare_save_dir(save_dir: str | Path | None) -> tuple[Path, Path]: - """Prepare save directory and cache.""" - if save_dir is None: - logger.warning( - "Segmentor will only output to directory. " - "All subsequent output will be saved to current runtime " - "location under folder 'output'. Overwriting may happen! ", - stacklevel=2, - ) - save_dir = Path.cwd() / "output" + batch_xs = np.min(output_locs[:, 0], axis=0) + batch_xe = np.max(output_locs[:, 2], axis=0) - save_dir = Path(save_dir).resolve() - if save_dir.is_dir(): - msg = f"`save_dir` already exists! {save_dir}" - raise ValueError(msg) - save_dir.mkdir(parents=True) - cache_dir = Path(f"{save_dir}/cache") - Path.mkdir(cache_dir, parents=True) + merged_shape = (canvas_np_.shape[1], batch_xe - batch_xs, canvas_np.shape[3]) - return save_dir, cache_dir + canvas_merge, count_merge = merge_batch_to_canvas( + blocks=canvas_np_, + output_locations=output_locs_, + merged_shape=merged_shape, + ) - def _update_ioconfig( - self: SemanticSegmentor, - ioconfig: IOSegmentorConfig, - mode: str, - patch_input_shape: IntPair, - patch_output_shape: IntPair, - stride_shape: IntPair, - resolution: Resolution, - units: Units, - ) -> IOSegmentorConfig: - """Update ioconfig according to input parameters. + canvas_merge = da.from_array(canvas_merge, chunks=canvas_merge.shape) + count_merge = da.from_array(count_merge, chunks=count_merge.shape) - Args: - ioconfig (:class:`IOSegmentorConfig`): - Object defines information about input and output - placement of patches. When provided, - `patch_input_shape`, `patch_output_shape`, - `stride_shape`, `resolution`, and `units` arguments are - ignored. Otherwise, those arguments will be internally - converted to a :class:`IOSegmentorConfig` object. - mode (str): - Type of input to process. Choose from either `tile` or - `wsi`. - patch_input_shape (tuple): - Size of patches input to the model. The values - are at requested read resolution and must be positive. - patch_output_shape (tuple): - Size of patches output by the model. The values are at - the requested read resolution and must be positive. 
- stride_shape (tuple): - Stride using during tile and WSI processing. The values - are at requested read resolution and must be positive. - If not provided, `stride_shape=patch_input_shape` is - used. - resolution (Resolution): - Resolution used for reading the image. - units (Units): - Units of resolution used for reading the image. + canvas = concatenate_none(old_arr=canvas, new_arr=canvas_merge) + count = concatenate_none(old_arr=count, new_arr=count_merge) - Returns: - :class:`IOSegmentorConfig`: - Updated ioconfig. + output_locs_y_ = concatenate_none( + old_arr=output_locs_y_, new_arr=output_locs[:, (1, 3)] + ) - """ - if patch_output_shape is None: - patch_output_shape = patch_input_shape - if stride_shape is None: - stride_shape = patch_output_shape - - if ioconfig is None and patch_input_shape is None: - if self.ioconfig is None: - msg = ( - "Must provide either `ioconfig` or `patch_input_shape` " - "and `patch_output_shape`" - ) - raise ValueError( - msg, - ) - ioconfig = copy.deepcopy(self.ioconfig) - elif ioconfig is None: - ioconfig = IOSegmentorConfig( - input_resolutions=[{"resolution": resolution, "units": units}], - output_resolutions=[{"resolution": resolution, "units": units}], - patch_input_shape=patch_input_shape, - patch_output_shape=patch_output_shape, - stride_shape=stride_shape, - ) - if mode == "tile": - logger.warning( - "WSIPatchDataset only reads image tile at " - '`units="baseline"`. Resolutions will be converted ' - "to baseline value.", - stacklevel=2, - ) - return ioconfig.to_baseline() + canvas_np = canvas_np[c_idx - start_idx :] + output_locs = output_locs[c_idx - start_idx :] + start_idx = c_idx - return ioconfig + return canvas, count, canvas_np, output_locs, output_locs_y_ - def _prepare_workers(self: SemanticSegmentor) -> None: - """Prepare number of workers.""" - self._postproc_workers = None - if self.num_postproc_workers is not None: - self._postproc_workers = ProcessPoolExecutor( - max_workers=self.num_postproc_workers, - ) - def _memory_cleanup(self: SemanticSegmentor) -> None: - """Memory clean up.""" - self.imgs = None - self.masks = None - self._cache_dir = None - self._model = None - self._loader = None - self._device = None - self._futures = None - self._mp_shared_space = None - if self._postproc_workers is not None: - self._postproc_workers.shutdown() - self._postproc_workers = None - - def _predict_wsi_handle_exception( - self: SemanticSegmentor, - imgs: list, - wsi_idx: int, - img_path: str | Path, - mode: str, - ioconfig: IOSegmentorConfig, - save_dir: str | Path, - *, - crash_on_exception: bool, - ) -> None: - """Predict on multiple WSIs. +def save_to_cache( + canvas: da.Array, + count: da.Array, + canvas_zarr: zarr.Array, + count_zarr: zarr.Array, + save_path: str | Path = "temp.zarr", +) -> tuple[zarr.Array, zarr.Array]: + """Save computed canvas and count arrays to Zarr cache. - Args: - imgs (list, ndarray): - List of inputs to process. When using `"patch"` mode, - the input must be either a list of images, a list of - image file paths or a numpy array of an image list. When - using `"tile"` or `"wsi"` mode, the input must be a list - of file paths. - wsi_idx (int): - index of current WSI being processed. - img_path(str or Path): - Path to current image. - mode (str): - Type of input to process. Choose from either `tile` or - `wsi`. - ioconfig (:class:`IOSegmentorConfig`): - Object defines information about input and output - placement of patches. 
When provided, - `patch_input_shape`, `patch_output_shape`, - `stride_shape`, `resolution`, and `units` arguments are - ignored. Otherwise, those arguments will be internally - converted to a :class:`IOSegmentorConfig` object. - save_dir (str or Path): - Output directory when processing multiple tiles and - whole-slide images. By default, it is folder `output` - where the running script is invoked. - crash_on_exception (bool): - If `True`, the running loop will crash if there is any - error during processing a WSI. Otherwise, the loop will - move on to the next wsi for processing. + This function computes the given Dask arrays (`canvas` and `count`), resizes the + corresponding Zarr datasets to accommodate the new data, and appends the results. + If the Zarr datasets do not exist, it initializes them within the specified + Zarr group. - Returns: - list: - A list of tuple(input_path, save_path) where - `input_path` is the path of the input wsi while - `save_path` corresponds to the output predictions. + Args: + canvas (da.Array): + Dask array representing image or feature data. + count (da.Array): + Dask array representing count or normalization data. + canvas_zarr (zarr.Array): + Existing Zarr dataset for canvas data. If None, a new one is created. + count_zarr (zarr.Array): + Existing Zarr dataset for count data. If None, a new one is created. + save_path (str | Path): + Path to the Zarr group for saving datasets. Defaults to "temp.zarr". - """ - try: - wsi_save_path = save_dir / f"{wsi_idx}" - self._predict_one_wsi(wsi_idx, ioconfig, str(wsi_save_path), mode) - - # Do not use dict with file name as key, because it can be - # overwritten. It may be user intention to provide files with a - # same name multiple times (maybe they have different root path) - self._outputs.append([str(img_path), str(wsi_save_path)]) - - # ? will this corrupt old version if control + c midway? - map_file_path = save_dir / "file_map.dat" - # backup old version first - if Path.exists(map_file_path): - old_map_file_path = save_dir / "file_map_old.dat" - shutil.copy(map_file_path, old_map_file_path) - joblib.dump(self._outputs, map_file_path) - - # verbose mode, error by passing ? - logging.info("Finish: %d", wsi_idx / len(imgs)) - logging.info("--Input: %s", str(img_path)) - logging.info("--Output: %s", str(wsi_save_path)) - # prevent deep source check because this is bypass and - # delegating error message - except Exception as err: # skipcq: PYL-W0703 - wsi_save_path = save_dir.joinpath(f"{wsi_idx}") - if crash_on_exception: - raise err # noqa: TRY201 - logging.exception("Crashed on %s", wsi_save_path) - - def predict( # noqa: PLR0913 - self: SemanticSegmentor, - imgs: list, - masks: list | None = None, - mode: str = "tile", - ioconfig: IOSegmentorConfig = None, - patch_input_shape: IntPair = None, - patch_output_shape: IntPair = None, - stride_shape: IntPair = None, - resolution: Resolution = 1.0, - units: Units = "baseline", - save_dir: str | Path | None = None, - device: str = "cpu", - *, - crash_on_exception: bool = False, - ) -> list[tuple[Path, Path]]: - """Make a prediction for a list of input data. - - By default, if the input model at the object instantiation time - is a pretrained model in the toolbox as well as - `patch_input_shape`, `patch_output_shape`, `stride_shape`, - `resolution`, `units` and `ioconfig` are `None`. The method will - use the `ioconfig` retrieved together with the pretrained model. 
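Editor's note: the canvas/count bookkeeping that `merge_batch_to_canvas` and `merge_horizontal` build on is easy to check in isolation. The toy NumPy re-implementation below is an illustration of the accumulate-then-normalise idea only; it is not the exact function above (which additionally shifts rows to patch-local y coordinates).

```python
# Toy sketch: overlapping patches are summed onto a canvas while a count
# map records coverage; dividing by the count averages the overlaps.
import numpy as np

blocks = np.stack([np.full((2, 2, 1), 1.0), np.full((2, 2, 1), 3.0)])
# [start_x, start_y, end_x, end_y]; the two patches overlap by one column.
locs = np.array([[0, 0, 2, 2], [1, 0, 3, 2]])

canvas = np.zeros((2, 3, 1), dtype=np.float32)
count = np.zeros((2, 3, 1), dtype=np.uint8)
for block, (xs, ys, xe, ye) in zip(blocks, locs):
    canvas[ys:ye, xs:xe] += block
    count[ys:ye, xs:xe] += 1

print((canvas / np.maximum(count, 1)).squeeze())
# [[1. 2. 3.]
#  [1. 2. 3.]]   <- the shared middle column averages (1 + 3) / 2
```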
- Otherwise, either `patch_input_shape`, `patch_output_shape`, - `stride_shape`, `resolution`, `units` or `ioconfig` must be set - else a `Value Error` will be raised. + Returns: + tuple[zarr.Array, zarr.Array]: + Updated Zarr datasets for canvas and count arrays. - Args: - imgs (list, ndarray): - List of inputs to process. When using `"patch"` mode, - the input must be either a list of images, a list of - image file paths or a numpy array of an image list. When - using `"tile"` or `"wsi"` mode, the input must be a list - of file paths. - masks (list): - List of masks. Only utilised when processing image tiles - and whole-slide images. Patches are only processed if - they are within a masked area. If not provided, then a - tissue mask will be automatically generated for - whole-slide images or the entire image is processed for - image tiles. - mode (str): - Type of input to process. Choose from either `tile` or - `wsi`. - ioconfig (:class:`IOSegmentorConfig`): - Object defines information about input and output - placement of patches. When provided, - `patch_input_shape`, `patch_output_shape`, - `stride_shape`, `resolution`, and `units` arguments are - ignored. Otherwise, those arguments will be internally - converted to a :class:`IOSegmentorConfig` object. - device (str): - :class:`torch.device` to run the model. - Select the device to run the model. Please see - https://pytorch.org/docs/stable/tensor_attributes.html#torch.device - for more details on input parameters for device. Default value is "cpu". - patch_input_shape (tuple): - Size of patches input to the model. The values - are at requested read resolution and must be positive. - patch_output_shape (tuple): - Size of patches output by the model. The values are at - the requested read resolution and must be positive. - stride_shape (tuple): - Stride using during tile and WSI processing. The values - are at requested read resolution and must be positive. - If not provided, `stride_shape=patch_input_shape` is - used. - resolution (float): - Resolution used for reading the image. - units (Units): - Units of resolution used for reading the image. Choose - from either `"level"`, `"power"` or `"mpp"`. - save_dir (str or pathlib.Path): - Output directory when processing multiple tiles and - whole-slide images. By default, it is folder `output` - where the running script is invoked. - crash_on_exception (bool): - If `True`, the running loop will crash if there is any - error during processing a WSI. Otherwise, the loop will - move on to the next wsi for processing. + """ + computed_values = compute(*[canvas, count]) + canvas_computed, count_computed = computed_values + + chunk_shape = tuple(chunk[0] for chunk in canvas.chunks) + if canvas_zarr is None: + zarr_group = zarr.open(str(save_path), mode="w") + + canvas_zarr = zarr_group.create_dataset( + name="canvas", + shape=(0, *canvas_computed.shape[1:]), + chunks=(chunk_shape[0], *canvas_computed.shape[1:]), + dtype=canvas_computed.dtype, + overwrite=True, + ) - Returns: - list: - A list of tuple(input_path, save_path) where - `input_path` is the path of the input wsi while - `save_path` corresponds to the output predictions. 
+ count_zarr = zarr_group.create_dataset( + name="count", + shape=(0, *count_computed.shape[1:]), + dtype=count_computed.dtype, + chunks=(chunk_shape[0], *count_computed.shape[1:]), + overwrite=True, + ) - Examples: - >>> # Sample output of a network - >>> wsis = ['A/wsi.svs', 'B/wsi.svs'] - >>> predictor = SemanticSegmentor(model='fcn-tissue_mask') - >>> output = predictor.predict(wsis, mode='wsi') - >>> list(output.keys()) - [('A/wsi.svs', 'output/0.raw') , ('B/wsi.svs', 'output/1.raw')] - >>> # if a network have 2 output heads, each head output of 'A/wsi.svs' - >>> # will be respectively stored in 'output/0.raw.0', 'output/0.raw.1' + canvas_zarr.resize( + (canvas_zarr.shape[0] + canvas_computed.shape[0], *canvas_zarr.shape[1:]) + ) + canvas_zarr[-canvas_computed.shape[0] :] = canvas_computed - """ - if mode not in ["wsi", "tile"]: - msg = f"{mode} is not a valid mode. Use either `tile` or `wsi`." - raise ValueError(msg) + count_zarr.resize( + (count_zarr.shape[0] + count_computed.shape[0], *count_zarr.shape[1:]) + ) + count_zarr[-count_computed.shape[0] :] = count_computed - save_dir, self._cache_dir = self._prepare_save_dir(save_dir) + return canvas_zarr, count_zarr - ioconfig = self._update_ioconfig( - ioconfig, - mode, - patch_input_shape, - patch_output_shape, - stride_shape, - resolution, - units, - ) - # use external for testing - self._device = device - self._model = model_to(model=self.model, device=device) +def merge_vertical_chunkwise( + canvas: da.Array, + count: da.Array, + output_locs_y_: np.ndarray, + zarr_group: zarr.Group, + save_path: Path, + memory_threshold: int = 80, +) -> da.Array: + """Merge vertically chunked canvas and count arrays into a single probability map. - # workers should be > 0 else Value Error will be thrown - self._prepare_workers() + This function processes vertically stacked image blocks (`canvas`) and their + associated count arrays to compute normalized probabilities. It handles overlapping + regions between chunks by applying seam folding and trimming halos to ensure smooth + transitions. If a Zarr group is provided, the result is stored incrementally. - mp_manager = torch_mp.Manager() - mp_shared_space = mp_manager.Namespace() - self._mp_shared_space = mp_shared_space + Args: + canvas (da.Array): + Dask array containing image data split into vertical chunks. + count (da.Array): + Dask array containing count data corresponding to the canvas. + output_locs_y_ (np.ndarray): + Array of shape (N, 2) specifying vertical output locations + for each chunk, used to compute overlaps. + zarr_group (zarr.Group): + Zarr group to store the merged probability dataset. + save_path (Path): + Path to save the intermediate output. The intermediate output + is saved in a Zarr file. + memory_threshold (int): + Memory usage threshold (in percentage) to trigger caching behavior. - ds = self.dataset_class( - ioconfig=ioconfig, - preproc=self.model.preproc_func, - wsi_paths=imgs, - mp_shared_space=mp_shared_space, - mode=mode, - ) + Returns: + da.Array: + A merged Dask array of normalized probabilities, either loaded from Zarr + or constructed in memory. 
- loader = torch_data.DataLoader( - ds, - drop_last=False, - batch_size=self.batch_size, - num_workers=self.num_loader_workers, - persistent_workers=self.num_loader_workers > 0, + """ + y0s, y1s = np.unique(output_locs_y_[:, 0]), np.unique(output_locs_y_[:, 1]) + overlaps = np.append(y1s[:-1] - y0s[1:], 0) + + num_chunks = canvas.numblocks[0] + probabilities_zarr, probabilities_da = None, None + chunk_shape = tuple(chunk[0] for chunk in canvas.chunks) + + tqdm = get_tqdm() + tqdm_loop = tqdm(overlaps, leave=False, desc="Merging rows") + + used_percent = 0 + + curr_chunk = canvas.blocks[0, 0].compute() + curr_count = count.blocks[0, 0].compute() + next_chunk = canvas.blocks[1, 0].compute() if num_chunks > 1 else None + next_count = count.blocks[1, 0].compute() if num_chunks > 1 else None + + for i, overlap in enumerate(tqdm_loop): + if next_chunk is not None and overlap > 0: + curr_chunk[-overlap:] += next_chunk[:overlap] + curr_count[-overlap:] += next_count[:overlap] + + # Normalize + curr_count = np.where(curr_count == 0, 1, curr_count) + probabilities = curr_chunk / curr_count.astype(np.float32) + + probabilities_zarr, probabilities_da = store_probabilities( + probabilities=probabilities, + chunk_shape=chunk_shape, + probabilities_zarr=probabilities_zarr, + probabilities_da=probabilities_da, + zarr_group=zarr_group, ) - self._loader = loader - self.imgs = imgs - self.masks = masks - - # contain input / output prediction mapping - self._outputs = [] - # ? what will happen if this crash midway? - # => may not be able to retrieve the result dict - for wsi_idx, img_path in enumerate(imgs): - self._predict_wsi_handle_exception( - imgs=imgs, - wsi_idx=wsi_idx, - img_path=img_path, - mode=mode, - ioconfig=ioconfig, - save_dir=save_dir, - crash_on_exception=crash_on_exception, + if probabilities_da is not None: + vm = psutil.virtual_memory() + used_percent = (probabilities_da.nbytes / vm.free) * 100 + if probabilities_zarr is None and used_percent > memory_threshold: + msg = ( + f"Current Memory usage: {used_percent} % " + f"exceeds specified threshold: {memory_threshold}. " + f"Saving intermediate results to disk." + ) + tqdm.write(msg) + zarr_group = zarr.open(str(save_path), mode="a") + probabilities_zarr = zarr_group.create_dataset( + name="probabilities", + shape=probabilities_da.shape, + chunks=(chunk_shape[0], *probabilities.shape[1:]), + dtype=probabilities.dtype, + overwrite=True, ) + probabilities_zarr[:] = probabilities_da.compute() - # clean up the cache directories - try: - shutil.rmtree(self._cache_dir) - except PermissionError: # pragma: no cover - logger.warning("Unable to remove %s", self._cache_dir) + probabilities_da = None - self._memory_cleanup() + if next_chunk is not None: + curr_chunk, curr_count = next_chunk[overlap:], next_count[overlap:] - if ( - device == "cuda" - and torch.cuda.device_count() > 1 - and is_torch_compile_compatible() - ): # pragma: no cover - dist.destroy_process_group() + if i + 2 < num_chunks: + next_chunk = canvas.blocks[i + 2, 0].compute() + next_count = count.blocks[i + 2, 0].compute() + else: + next_chunk, next_count = None, None + + if probabilities_zarr: + if "canvas" in zarr_group: + del zarr_group["canvas"] + if "count" in zarr_group: + del zarr_group["count"] + return da.from_zarr( + probabilities_zarr, chunks=(chunk_shape[0], *probabilities.shape[1:]) + ) - return self._outputs + return probabilities_da -class DeepFeatureExtractor(SemanticSegmentor): - """Generic CNN Feature Extractor. 
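Editor's note: the seam folding performed by `merge_vertical_chunkwise` above can be pictured with two adjacent row-chunks. A minimal NumPy sketch, assuming a fixed two-row overlap and unit count maps:

```python
# Toy illustration of seam folding: the overlapping rows of adjacent
# vertical chunks are summed before normalising by the count map.
import numpy as np

curr_chunk = np.ones((4, 3, 1), dtype=np.float32)        # covers rows 0-3
next_chunk = np.ones((4, 3, 1), dtype=np.float32) * 3.0  # covers rows 2-5
curr_count = np.ones((4, 3, 1), dtype=np.float32)
next_count = np.ones((4, 3, 1), dtype=np.float32)
overlap = 2  # rows 2-3 are shared between the chunks

curr_chunk[-overlap:] += next_chunk[:overlap]
curr_count[-overlap:] += next_count[:overlap]

probabilities = curr_chunk / np.where(curr_count == 0, 1, curr_count)
print(probabilities[:, 0, 0])  # [1. 1. 2. 2.] - seam rows are averaged
```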
+def store_probabilities( + probabilities: np.ndarray, + chunk_shape: tuple[int, ...], + probabilities_zarr: zarr.Array | None, + probabilities_da: da.Array | None, + zarr_group: zarr.Group | None, +) -> tuple[zarr.Array | None, da.Array | None]: + """Store computed probability data into a Zarr dataset or accumulate in memory. - AN engine for using any CNN model as a feature extractor. Note, if - `model` is supplied in the arguments, it will ignore the - `pretrained_model` and `pretrained_weights` arguments. + If a Zarr group is provided, the function appends the given probability array + to the 'probabilities' dataset, resizing as needed. Otherwise, it concatenates + the array into an existing Dask array for in-memory accumulation. Args: - model (nn.Module): - Use externally defined PyTorch model for prediction with - weights already loaded. Default is `None`. If provided, - `pretrained_model` argument is ignored. - pretrained_model (str): - Name of the existing models support by tiatoolbox for - processing the data. By default, the corresponding - pretrained weights will also be downloaded. However, you can - override with your own set of weights via the - `pretrained_weights` argument. Argument is case-insensitive. - Refer to - :class:`tiatoolbox.models.architecture.vanilla.CNNBackbone` - for list of supported pretrained models. - pretrained_weights (str): - Path to the weight of the corresponding `pretrained_model`. - batch_size (int): - Number of images fed into the model each time. - num_loader_workers (int): - Number of workers to load the data. Take note that they will - also perform preprocessing. - num_postproc_workers (int): - This value is there to maintain input compatibility with - `tiatoolbox.models.classification` and is not used. - verbose (bool): - Whether to output logging information. - dataset_class (obj): - Dataset class to be used instead of default. - auto_generate_mask(bool): - To automatically generate tile/WSI tissue mask if is not - provided. + probabilities (np.ndarray): + Computed probability array to store. + chunk_shape (tuple[int, ...]): + Chunk shape used for Zarr dataset creation. + probabilities_zarr (zarr.Array | None): + Existing Zarr dataset, or None to initialize. + probabilities_da (da.Array | None): + Existing Dask array for in-memory accumulation. + zarr_group (zarr.Group | None): + Zarr group used to create or access the dataset. - Examples: - >>> # Sample output of a network - >>> from tiatoolbox.models.architecture.vanilla import CNNBackbone - >>> wsis = ['A/wsi.svs', 'B/wsi.svs'] - >>> # create resnet50 with pytorch pretrained weights - >>> model = CNNBackbone('resnet50') - >>> predictor = DeepFeatureExtractor(model=model) - >>> output = predictor.predict(wsis, mode='wsi') - >>> list(output.keys()) - [('A/wsi.svs', 'output/0') , ('B/wsi.svs', 'output/1')] - >>> # If a network have 2 output heads, for 'A/wsi.svs', - >>> # there will be 3 outputs, and they are respectively stored at - >>> # 'output/0.position.npy' # will always be output - >>> # 'output/0.features.0.npy' # output of head 0 - >>> # 'output/0.features.1.npy' # output of head 1 - >>> # Each file will contain a same number of items, and the item at each - >>> # index corresponds to 1 patch. The item in `.*position.npy` will - >>> # be the corresponding patch bounding box. The box coordinates are at - >>> # the inference resolution defined within the provided `ioconfig`. + Returns: + tuple[zarr.Array | None, da.Array | None]: + Updated Zarr dataset and/or Dask array. 
""" + if zarr_group is not None: + if probabilities_zarr is None: + probabilities_zarr = zarr_group.create_dataset( + name="probabilities", + shape=(0, *probabilities.shape[1:]), + chunks=(chunk_shape[0], *probabilities.shape[1:]), + dtype=probabilities.dtype, + ) - def __init__( - self: DeepFeatureExtractor, - batch_size: int = 8, - num_loader_workers: int = 0, - num_postproc_workers: int = 0, - model: torch.nn.Module | None = None, - pretrained_model: str | None = None, - pretrained_weights: str | None = None, - dataset_class: Callable = WSIStreamDataset, - *, - verbose: bool = True, - auto_generate_mask: bool = False, - ) -> None: - """Initialize :class:`DeepFeatureExtractor`.""" - super().__init__( - batch_size=batch_size, - num_loader_workers=num_loader_workers, - num_postproc_workers=num_postproc_workers, - model=model, - pretrained_model=pretrained_model, - pretrained_weights=pretrained_weights, - verbose=verbose, - auto_generate_mask=auto_generate_mask, - dataset_class=dataset_class, + probabilities_zarr.resize( + ( + probabilities_zarr.shape[0] + probabilities.shape[0], + *probabilities_zarr.shape[1:], + ) + ) + probabilities_zarr[-probabilities.shape[0] :] = probabilities + else: + probabilities_da = concatenate_none( + old_arr=probabilities_da, + new_arr=da.from_array( + probabilities, chunks=(chunk_shape[0], *probabilities.shape[1:]) + ), ) - self.process_prediction_per_batch = False - - def _process_predictions( - self: DeepFeatureExtractor, - cum_batch_predictions: list, - wsi_reader: WSIReader, # skipcq: PYL-W0613 # noqa: ARG002 - ioconfig: IOSegmentorConfig, - save_path: str, - cache_dir: str, # skipcq: PYL-W0613 # noqa: ARG002 - ) -> None: - """Define how the aggregated predictions are processed. - This includes merging the prediction if necessary and also - saving afterward. + return probabilities_zarr, probabilities_da - Args: - cum_batch_predictions (list): - List of batch predictions. Each item within the list - should be of (location, patch_predictions). - wsi_reader (:class:`WSIReader`): - A reader for the image where the predictions come from. - Not used here. Added for consistency with the API. - ioconfig (:class:`IOSegmentorConfig`): - A configuration object contains input and output - information. - save_path (str): - Root path to save current WSI predictions. - cache_dir (str): - Root path to cache current WSI data. - Not used here. Added for consistency with the API. - """ - # assume prediction_list is N, each item has L output elements - location_list, prediction_list = list(zip(*cum_batch_predictions, strict=False)) - # Nx4 (N x [tl_x, tl_y, br_x, br_y), denotes the location of output - # patch, this can exceed the image bound at the requested resolution - # remove singleton due to split. 
- location_list = np.array([v[0] for v in location_list]) - np.save(f"{save_path}.position.npy", location_list) - for idx, _ in enumerate(ioconfig.output_resolutions): - # assume resolution idx to be in the same order as L - # 0 idx is to remove singleton without removing other axes singleton - prediction_list = [v[idx][0] for v in prediction_list] - prediction_list = np.array(prediction_list) - np.save(f"{save_path}.features.{idx}.npy", prediction_list) - - def predict( # noqa: PLR0913 - self: DeepFeatureExtractor, - imgs: list, - masks: list | None = None, - mode: str = "tile", - ioconfig: IOSegmentorConfig | None = None, - patch_input_shape: IntPair | None = None, - patch_output_shape: IntPair | None = None, - stride_shape: IntPair = None, - resolution: Resolution = 1.0, - units: Units = "baseline", - save_dir: str | Path | None = None, - device: str = "cpu", - *, - crash_on_exception: bool = False, - ) -> list[tuple[Path, Path]]: - """Make a prediction for a list of input data. - - By default, if the input model at the time of object - instantiation is a pretrained model in the toolbox as well as - `patch_input_shape`, `patch_output_shape`, `stride_shape`, - `resolution`, `units` and `ioconfig` are `None`. The method will - use the `ioconfig` retrieved together with the pretrained model. - Otherwise, either `patch_input_shape`, `patch_output_shape`, - `stride_shape`, `resolution`, `units` or `ioconfig` must be set - - else a `Value Error` will be raised. +def prepare_full_batch( + batch_output: np.ndarray, + batch_locs: np.ndarray, + full_output_locs: np.ndarray, + output_locs: np.ndarray, + *, + is_last: bool, +) -> tuple[np.ndarray, np.ndarray, np.ndarray]: + """Prepare full-sized output and count arrays for a batch of patch predictions. - Args: - imgs (list, ndarray): - List of inputs to process. When using `"patch"` mode, - the input must be either a list of images, a list of - image file paths or a numpy array of an image list. When - using `"tile"` or `"wsi"` mode, the input must be a list - of file paths. - masks (list): - List of masks. Only utilised when processing image tiles - and whole-slide images. Patches are only processed if - they are within a masked area. If not provided, then a - tissue mask will be automatically generated for each - whole-slide image or all image tiles in the entire image - are processed. - mode (str): - Type of input to process. Choose from either `tile` or - `wsi`. - ioconfig (:class:`IOSegmentorConfig`): - Object that defines information about input and output - placement of patches. When provided, - `patch_input_shape`, `patch_output_shape`, - `stride_shape`, `resolution`, and `units` arguments are - ignored. Otherwise, those arguments will be internally - converted to a :class:`IOSegmentorConfig` object. - device (str): - :class:`torch.device` to run the model. - Select the device to run the model. Please see - https://pytorch.org/docs/stable/tensor_attributes.html#torch.device - for more details on input parameters for device. Default value is "cpu". - patch_input_shape (IntPair): - Size of patches input to the model. The values are at - requested read resolution and must be positive. - patch_output_shape (tuple): - Size of patches output by the model. The values are at - the requested read resolution and must be positive. - stride_shape (tuple): - Stride using during tile and WSI processing. The values - are at requested read resolution and must be positive. - If not provided, `stride_shape=patch_input_shape` is - used. 
-            resolution (Resolution):
-                Resolution used for reading the image.
-            units (Units):
-                Units of resolution used for reading the image.
-            save_dir (str):
-                Output directory when processing multiple tiles and
-                whole-slide images. By default, it is folder `output`
-                where the running script is invoked.
-            crash_on_exception (bool):
-                If `True`, the running loop will crash if there is any
-                error during processing a WSI. Otherwise, the loop will
-                move on to the next wsi for processing.
+    This function aligns patch-level predictions with global output locations when
+    a mask (e.g., auto_get_mask) is applied. It initializes full-sized arrays and
+    fills them using matched indices. If the batch is the last in the sequence,
+    it pads the arrays to cover remaining locations.

-        Returns:
-            list:
-                A list of tuple(input_path, save_path) where
-                `input_path` is the path of the input wsi while
-                `save_path` corresponds to the output predictions.
+    Args:
+        batch_output (np.ndarray):
+            Patch-level model predictions of shape (N, H, W, C).
+        batch_locs (np.ndarray):
+            Output locations corresponding to `batch_output`.
+        full_output_locs (np.ndarray):
+            Remaining global output locations to be matched.
+        output_locs (np.ndarray):
+            Accumulated output location array across batches.
+        is_last (bool):
+            Flag indicating whether this is the final batch.

-        Examples:
-            >>> # Sample output of a network
-            >>> from tiatoolbox.models.architecture.vanilla import CNNBackbone
-            >>> wsis = ['A/wsi.svs', 'B/wsi.svs']
-            >>> # create resnet50 with pytorch pretrained weights
-            >>> model = CNNBackbone('resnet50')
-            >>> predictor = DeepFeatureExtractor(model=model)
-            >>> output = predictor.predict(wsis, mode='wsi')
-            >>> list(output.keys())
-            [('A/wsi.svs', 'output/0') , ('B/wsi.svs', 'output/1')]
-            >>> # If a network have 2 output heads, for 'A/wsi.svs',
-            >>> # there will be 3 outputs, and they are respectively stored at
-            >>> # 'output/0.position.npy' # will always be output
-            >>> # 'output/0.features.0.npy' # output of head 0
-            >>> # 'output/0.features.1.npy' # output of head 1
-            >>> # Each file will contain a same number of items, and the item at each
-            >>> # index corresponds to 1 patch. The item in `.*position.npy` will
-            >>> # be the corresponding patch bounding box. The box coordinates are at
-            >>> # the inference resolution defined within the provided `ioconfig`.
+    Returns:
+        tuple[np.ndarray, np.ndarray, np.ndarray]:
+            - full_batch_output: Full-sized output array with predictions placed.
+            - full_output_locs: Updated remaining global output locations.
+            - output_locs: Updated accumulated output locations.
- """ - return super().predict( - imgs=imgs, - masks=masks, - mode=mode, - device=device, - ioconfig=ioconfig, - patch_input_shape=patch_input_shape, - patch_output_shape=patch_output_shape, - stride_shape=stride_shape, - resolution=resolution, - units=units, - save_dir=save_dir, - crash_on_exception=crash_on_exception, + """ + # Use np.intersect1d once numpy version is upgraded to 2.0 + full_output_dict = {tuple(row): i for i, row in enumerate(full_output_locs)} + matches = [full_output_dict[tuple(row)] for row in batch_locs] + + total_size = np.max(matches).astype(np.uint16) + 1 + + # Initialize full output array + full_batch_output = np.zeros( + shape=(total_size, *batch_output.shape[1:]), + dtype=batch_output.dtype, + ) + + # Place matching outputs using matching indices + full_batch_output[matches] = batch_output + + output_locs = concatenate_none( + old_arr=output_locs, new_arr=full_output_locs[:total_size] + ) + full_output_locs = full_output_locs[total_size:] + + if is_last: + output_locs = concatenate_none(old_arr=output_locs, new_arr=full_output_locs) + full_batch_output = concatenate_none( + old_arr=full_batch_output, + new_arr=np.zeros( + shape=(len(full_output_locs), *batch_output.shape[1:]), dtype=np.uint8 + ), ) + + return full_batch_output, full_output_locs, output_locs diff --git a/tiatoolbox/models/models_abc.py b/tiatoolbox/models/models_abc.py index 4e1f1d755..dcca370f5 100644 --- a/tiatoolbox/models/models_abc.py +++ b/tiatoolbox/models/models_abc.py @@ -9,6 +9,7 @@ import torch import torch._dynamo import torch.distributed as dist +from torch import nn from torch.nn.parallel import DistributedDataParallel from tiatoolbox.models.architecture.utils import is_torch_compile_compatible @@ -22,29 +23,29 @@ import numpy as np -class IOConfigABC(ABC): - """Define an abstract class for holding predictor I/O information. +def load_torch_model(model: nn.Module, weights: str | Path) -> nn.Module: + """Helper function to load a torch model. - Enforcing such that following attributes must always be defined by - the subclass. - - """ + Args: + model (torch.nn.Module): + A torch model. + weights (str or Path): + Path to pretrained weights. - @property - @abstractmethod - def input_resolutions(self: IOConfigABC) -> None: - """Abstract method to update input_resolution.""" - raise NotImplementedError + Returns: + torch.nn.Module: + Torch model with pretrained weights loaded on CPU. - @property - @abstractmethod - def output_resolutions(self: IOConfigABC) -> None: - """Abstract method to update output_resolutions.""" - raise NotImplementedError + """ + # ! assume to be saved in single GPU mode + # always load on to the CPU + saved_state_dict = torch.load(weights, map_location="cpu") + model.load_state_dict(saved_state_dict, strict=True) + return model def model_to(model: torch.nn.Module, device: str = "cpu") -> torch.nn.Module: - """Transfers model to specified device e.g., "cpu" or "cuda". + """Transfers model to cpu/gpu. Args: model (torch.nn.Module): @@ -54,7 +55,7 @@ def model_to(model: torch.nn.Module, device: str = "cpu") -> torch.nn.Module: Returns: torch.nn.Module: - The model after being moved to specified device. + The model after being moved to cpu/gpu. """ torch_device = torch.device(device) @@ -103,10 +104,8 @@ def forward( @staticmethod @abstractmethod def infer_batch( - model: torch.nn.Module, - batch_data: np.ndarray, - device: str, - ) -> None: + model: nn.Module, batch_data: np.ndarray | torch.Tensor, *, device: str + ) -> np.ndarray | tuple[np.ndarray, ...] 
| dict: """Run inference on an input batch. Contains logic for forward operation as well as I/O aggregation. @@ -114,13 +113,15 @@ def infer_batch( Args: model (nn.Module): PyTorch defined model. - batch_data (np.ndarray): + batch_data (np.ndarray | torch.Tensor): A batch of data generated by `torch.utils.data.DataLoader`. device (str): - Transfers model to the specified device. Default is "cpu". + Transfers model to the specified device. Returns: + np.ndarray: + The inference results as a numpy array. dict: Returns a dictionary of predictions and other expected outputs depending on the network architecture. @@ -209,7 +210,7 @@ def to( # type: ignore[override] """Transfers model to cpu/gpu. Args: - model (torch.nn.Module): + self (ModelABC): PyTorch defined model. device (str): Transfers model to the specified device. Default is "cpu". diff --git a/tiatoolbox/utils/exceptions.py b/tiatoolbox/utils/exceptions.py index db74af710..2f9f2a126 100644 --- a/tiatoolbox/utils/exceptions.py +++ b/tiatoolbox/utils/exceptions.py @@ -33,3 +33,23 @@ def __init__( ) -> None: """Initialize :class:`MethodNotSupportedError`.""" super().__init__(message) + + +class DimensionMismatchError(Exception): + """Raise dimension mismatch error. + + Args: + expected_dims (list or tuple) : Expected dimensions. + actual_dims (list or tuple) : Actual dimensions. + + """ + + def __init__( + self: DimensionMismatchError, + expected_dims: list | tuple, + actual_dims: list | tuple, + ) -> None: + """Initialize :class:`DimensionMismatchError`.""" + self.expected_dims = expected_dims + self.actual_dims = actual_dims + super().__init__(f"Expected dimensions {expected_dims}, but got {actual_dims}.") diff --git a/tiatoolbox/utils/misc.py b/tiatoolbox/utils/misc.py index a81098acd..56c6a3ea7 100644 --- a/tiatoolbox/utils/misc.py +++ b/tiatoolbox/utils/misc.py @@ -11,8 +11,8 @@ from typing import IO, TYPE_CHECKING, cast import cv2 +import dask.array as da import joblib -import numcodecs import numpy as np import pandas as pd import requests @@ -24,10 +24,12 @@ from shapely.geometry import Polygon from shapely.geometry import shape as feature2geometry from skimage import exposure -from tqdm import trange +from tqdm import notebook as tqdm_notebook +from tqdm import tqdm, trange from tiatoolbox import logger from tiatoolbox.annotation.storage import Annotation, AnnotationStore, SQLiteStore +from tiatoolbox.utils.env_detection import is_notebook from tiatoolbox.utils.exceptions import FileNotSupportedError if TYPE_CHECKING: # pragma: no cover @@ -163,7 +165,7 @@ def imwrite(image_path: PathLike, img: np.ndarray) -> None: def imread(image_path: PathLike, *, as_uint8: bool | None = None) -> np.ndarray: - """Read an image as a NumPy array. + """Read an image as :class:`numpy.ndarray`. 
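+
+    A minimal usage sketch (the file name here is illustrative):
+
+    >>> from tiatoolbox.utils.misc import imread
+    >>> img = imread("sample.png")  # doctest: +SKIP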
     Args:
         image_path (PathLike):
@@ -1204,6 +1206,41 @@ def add_from_dat(
     store.append_many(anns)
 
 
+def patch_predictions_as_annotations(
+    preds: list | np.ndarray,
+    keys: list,
+    class_dict: dict,
+    class_probs: list | np.ndarray,
+    patch_coords: list,
+    classes_predicted: list,
+    labels: list,
+) -> list:
+    """Helper function to generate annotations from patch predictions."""
+    annotations = []
+    for i, _ in enumerate(patch_coords):
+        if "probabilities" in keys:
+            props = {
+                f"prob_{class_dict[j]}": class_probs[i][j] for j in classes_predicted
+            }
+        else:
+            props = {}
+        if "labels" in keys:
+            props["label"] = class_dict[labels[i]]
+        if len(preds) > 0:
+            props["type"] = class_dict[preds[i]]
+        annotations.append(Annotation(Polygon.from_bounds(*patch_coords[i]), props))
+
+    return annotations
+
+
+def get_zarr_array(zarr_array: zarr.core.Array | np.ndarray | list) -> np.ndarray:
+    """Convert a zarr array, list, or numpy array into a numpy array."""
+    if isinstance(zarr_array, zarr.core.Array):
+        return zarr_array[:]
+
+    return np.array(zarr_array).astype(float)
+
+
 def process_contours(
     contours: list[np.ndarray],
     hierarchy: np.ndarray,
@@ -1332,12 +1369,11 @@ def dict_to_store_semantic_segmentor(
             for each patch.
 
     """
-    preds = patch_output["predictions"]
+    preds = da.from_array(patch_output["predictions"], chunks="auto")
 
     # Get the number of unique predictions
-    layer_list = np.unique(preds)
-
-    layer_list = np.delete(layer_list, np.where(layer_list == 0))
+    layer_list = da.unique(preds).compute()
+    layer_list = layer_list[layer_list != 0]
 
     store = SQLiteStore()
 
@@ -1346,12 +1382,13 @@ def dict_to_store_semantic_segmentor(
     annotations_list: list[Annotation] = []
 
     for type_class in layer_list:
-        layer = np.where(preds == type_class, 1, 0)
+        layer = da.where(preds == type_class, 1, 0).astype("uint8").compute()
         contours, hierarchy = cv2.findContours(
-            layer.astype("uint8"),
+            layer,
             cv2.RETR_CCOMP,
             cv2.CHAIN_APPROX_NONE,
         )
+        contours = cast("list[np.ndarray]", contours)
 
         annotations_list_ = process_contours(contours, hierarchy, scale_factor)
 
@@ -1374,19 +1411,19 @@
     return store
 
 
-def dict_to_store(
-    patch_output: dict,
-    scale_factor: tuple[int, int],
+def dict_to_store_patch_predictions(
+    patch_output: dict | zarr.Group,
+    scale_factor: tuple[float, float],
     class_dict: dict | None = None,
     save_path: Path | None = None,
 ) -> AnnotationStore | Path:
-    """Converts (and optionally saves) output of TIAToolbox engines as AnnotationStore.
+    """Converts output of TIAToolbox PatchPredictor engine to AnnotationStore.
 
     Args:
-        patch_output (dict):
-            A dictionary in the TIAToolbox Engines output format. Important
-            keys are "probabilities", "predictions", "coordinates", and "labels".
-        scale_factor (tuple[int, int]):
+        patch_output (dict | zarr.Group):
+            A dictionary with "probabilities", "predictions", "coordinates",
+            and "labels" keys.
+        scale_factor (tuple[float, float]):
             The scale factor to use when loading the annotations. All coordinates
             will be multiplied by this factor to allow conversion of annotations
             saved at non-baseline resolution to baseline.
@@ -1408,45 +1445,50 @@
         # we cant create annotations without coordinates
         msg = "Patch output must contain coordinates."
         raise ValueError(msg)
+
     # get relevant keys
-    class_probs = patch_output.get("probabilities", [])
-    preds = patch_output.get("predictions", [])
+    class_probs = get_zarr_array(patch_output.get("probabilities", []))
+    preds = get_zarr_array(patch_output.get("predictions", []))
+
     patch_coords = np.array(patch_output.get("coordinates", []))
     if not np.all(np.array(scale_factor) == 1):
         patch_coords = patch_coords * (np.tile(scale_factor, 2))  # to baseline mpp
+
     labels = patch_output.get("labels", [])
     # get classes to consider
     if len(class_probs) == 0:
         classes_predicted = np.unique(preds).tolist()
     else:
         classes_predicted = range(len(class_probs[0]))
+
     if class_dict is None:
         # if no class dict create a default one
-        class_dict = {i: i for i in np.unique(preds + labels).tolist()}
+        if len(class_probs) == 0:
+            class_dict = {i: i for i in np.unique(np.append(preds, labels)).tolist()}
+        else:
+            class_dict = {i: i for i in range(len(class_probs[0]))}
 
     # find what keys we need to save
     keys = ["predictions"]
     keys = keys + [key for key in ["probabilities", "labels"] if key in patch_output]
 
     # put patch predictions into a store
-    annotations = []
-    for i, pred in enumerate(preds):
-        if "probabilities" in keys:
-            props = {
-                f"prob_{class_dict[j]}": class_probs[i][j] for j in classes_predicted
-            }
-        else:
-            props = {}
-        if "labels" in keys:
-            props["label"] = class_dict[labels[i]]
-        props["type"] = class_dict[pred]
-        annotations.append(Annotation(Polygon.from_bounds(*patch_coords[i]), props))
+    annotations = patch_predictions_as_annotations(
+        preds.astype(float),
+        keys,
+        class_dict,
+        class_probs.astype(float),
+        patch_coords.astype(float),
+        classes_predicted,
+        labels,
+    )
+
     store = SQLiteStore()
-    keys = store.append_many(annotations, [str(i) for i in range(len(annotations))])
+    _ = store.append_many(annotations, [str(i) for i in range(len(annotations))])
 
     # if a save director is provided, then dump store into a file
     if save_path:
-        # ensure parent directory exisits
+        # ensure parent directory exists
         save_path.parent.absolute().mkdir(parents=True, exist_ok=True)
         # ensure proper db extension
         save_path = save_path.parent.absolute() / (save_path.stem + ".db")
@@ -1462,6 +1504,27 @@ def _tiles(
     colormap: int = cv2.COLORMAP_JET,
     level: int = 0,
 ) -> Iterator[np.ndarray]:
+    """Generate color-mapped tiles from an input image or Zarr array.
+
+    This function iterates over the input image in non-overlapping tiles of the
+    specified size, optionally downsampling by a power-of-two factor (`level`),
+    and applies a colormap to each tile before yielding it.
+
+    Args:
+        in_img (np.ndarray | zarr.core.Array):
+            Input image or Zarr array to be tiled.
+        tile_size (tuple[int, int]):
+            Height and width of each tile.
+        colormap (int, optional):
+            OpenCV colormap to apply to each tile. Defaults to cv2.COLORMAP_JET.
+        level (int, optional):
+            Downsampling factor as a power of two. Defaults to 0 (no downsampling).
+
+    Yields:
+        np.ndarray:
+            A color-mapped tile extracted from the input image.
+
+    """
     for y in trange(0, in_img.shape[0], tile_size[0]):
         for x in range(0, in_img.shape[1], tile_size[1]):
             in_img_ = in_img[
@@ -1567,44 +1630,42 @@ def write_probability_heatmap_as_ome_tiff(
     logger.info(msg)
 
 
-def dict_to_zarr(
-    raw_predictions: dict,
-    save_path: Path,
-    **kwargs: dict,
-) -> Path:
-    """Saves the output of TIAToolbox engines to a zarr file.
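+
+# A usage sketch for the helper below (illustrative only; `items` stands in
+# for any iterable):
+#
+#     for item in get_tqdm()(items, desc="processing"):
+#         ...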
+def get_tqdm() -> type[tqdm]:
+    """Return the appropriate tqdm class for the current environment."""
+    if is_notebook():  # pragma: no cover
+        return tqdm_notebook.tqdm
+    return tqdm
 
-    Args:
-        raw_predictions (dict):
-            A dictionary in the TIAToolbox Engines output format.
-        save_path (str or Path):
-            Path to save the zarr file.
-        **kwargs (dict):
-            Keyword Args to update patch_pred_store_zarr attributes.
+
+def cast_to_min_dtype(array: np.ndarray | da.Array) -> np.ndarray | da.Array:
+    """Cast the input array to the minimal dtype required to represent its values.
+
+    This function determines the maximum value in the array and casts the array
+    to the smallest unsigned integer type (or boolean) that can accommodate all
+    values. It supports both NumPy and Dask arrays and preserves the input type
+    in the output.
+
+    For Dask arrays, the maximum value is evaluated with ``.compute()`` before
+    the target dtype is selected.
+
+    Args:
+        array (np.ndarray | da.Array):
+            Input array containing non-negative integer values.
 
     Returns:
-        Path to zarr file storing the patch predictor output
+        (np.ndarray or da.Array):
+            A copy of the input array cast to the minimal required dtype.
+            - If the maximum value is 1, the array is cast to boolean.
+            - Otherwise, it is cast to the smallest suitable unsigned integer type.
 
     """
-    # Default values for Compressor and Chunks set if not received from kwargs.
-    compressor = (
-        kwargs["compressor"] if "compressor" in kwargs else numcodecs.Zstd(level=1)
-    )
-    chunks = kwargs.get("chunks", 10000)
-
-    # ensure proper zarr extension
-    save_path = save_path.parent.absolute() / (save_path.stem + ".zarr")
-
-    # save to zarr
-    predictions_array = np.array(raw_predictions["predictions"])
-    z = zarr.open(
-        save_path,
-        mode="w",
-        shape=predictions_array.shape,
-        chunks=chunks,
-        compressor=compressor,
-    )
-    z[:] = predictions_array
+    is_dask = isinstance(array, da.Array)
+    max_value = da.max(array) if is_dask else np.max(array)
+    max_value = max_value.compute() if is_dask else max_value
 
-    return save_path
+    if max_value == 1:
+        return array.astype(bool)
+
+    dtypes = [np.uint8, np.uint16, np.uint32, np.uint64]
+    for dtype in dtypes:
+        if max_value <= np.iinfo(dtype).max:
+            return array.astype(dtype)
+
+    # Fallback: keep the original dtype if no unsigned integer type fits.
+    return array
diff --git a/tiatoolbox/utils/transforms.py b/tiatoolbox/utils/transforms.py
index bb9f5670d..8fba6fee9 100644
--- a/tiatoolbox/utils/transforms.py
+++ b/tiatoolbox/utils/transforms.py
@@ -95,7 +95,7 @@ def imresize(
     img: np.ndarray,
     scale_factor: float | tuple[float, float] | None = None,
     output_size: int | tuple[int, int] | None = None,
-    interpolation: str = "optimise",
+    interpolation: str | int = "optimise",
 ) -> np.ndarray:
     """Resize input image.