import torch

import comfy.utils
from comfy import model_management


@torch.inference_mode()
def dynamic_tiled_upscale_with_custom_feather(
    samples,
    function,
    tile_size=512,
    overlap=32,
    output_device="cpu",
    pbar=None,
    feather=0,
    target_height=None,
    target_width=None,
    resample_method="lanczos",
):
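    """Upscale ``samples`` tile-by-tile with ``function`` and blend the tiles.

    The input is scanned in ``tile_size`` windows advancing by
    ``tile_size - overlap``. Each tile is run through ``function``, resized to
    its destination rectangle on the ``target_height`` x ``target_width``
    canvas if needed, and accumulated under a mask whose edges ramp linearly
    over the feather width. Dividing the accumulation by the summed mask
    weights normalizes overlapping regions into a seamless crossfade.

    ``feather`` is in output pixels; 0 derives the feather width from
    ``overlap`` scaled to output resolution. Returns a tensor of shape
    [B, C, target_height, target_width] on ``output_device``.
    """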
    if samples.ndim != 4:
        raise ValueError("Expected samples with shape [B, C, H, W].")

    batch_size, channels, in_height, in_width = samples.shape

    if target_height is None or target_width is None:
        raise ValueError("target_height and target_width must be provided.")

    tile_size = int(tile_size)
    if tile_size <= 0:
        raise ValueError("tile_size must be positive.")

    # Clamp overlap below tile_size so the scan always advances.
    overlap = max(0, int(overlap))
    if overlap >= tile_size:
        overlap = tile_size - 1 if tile_size > 1 else 0

    tile_step = tile_size - overlap if tile_size > overlap else tile_size

    scale_y_global = float(target_height) / float(in_height)
    scale_x_global = float(target_width) / float(in_width)

    blended_output = None
    for batch_index in range(batch_size):
        source = samples[batch_index : batch_index + 1]

        output_for_batch = None
        weight_for_batch = None

        y_position = 0
        while y_position < in_height:
            x_position = 0
            while x_position < in_width:
                y_end = min(y_position + tile_size, in_height)
                x_end = min(x_position + tile_size, in_width)

                # Run the model on one tile; edge tiles may be smaller
                # than tile_size.
                tile_source = source[:, :, y_position:y_end, x_position:x_end]
                tile_output_native = function(tile_source).to(output_device)

                # Allocate the accumulation buffers lazily, once the model's
                # output channel count is known.
                if output_for_batch is None:
                    out_channels = tile_output_native.shape[1]
                    output_for_batch = torch.zeros(
                        (1, out_channels, target_height, target_width),
                        device=output_device,
                        dtype=tile_output_native.dtype,
                    )
                    weight_for_batch = torch.zeros_like(output_for_batch)

                    if blended_output is None:
                        blended_output = torch.zeros(
                            (batch_size, out_channels, target_height, target_width),
                            device=output_device,
                            dtype=tile_output_native.dtype,
                        )

                # Map the tile's input rectangle into output coordinates so
                # the canvas is exactly target_height x target_width even for
                # non-integer scale factors.
                out_y_start = int(round(y_position * target_height / in_height))
                out_y_end = int(round(y_end * target_height / in_height))
                out_x_start = int(round(x_position * target_width / in_width))
                out_x_end = int(round(x_end * target_width / in_width))

                tile_target_height = max(1, out_y_end - out_y_start)
                tile_target_width = max(1, out_x_end - out_x_start)

                # Resize the model output to its destination rectangle when
                # the model's native scale does not land on it exactly.
                if (
                    tile_output_native.shape[2] != tile_target_height
                    or tile_output_native.shape[3] != tile_target_width
                ):
                    tile_output = comfy.utils.common_upscale(
                        tile_output_native,
                        tile_target_width,
                        tile_target_height,
                        resample_method,
                        "disabled",
                    )
                else:
                    tile_output = tile_output_native

                mask = torch.ones_like(tile_output)

                # feather <= 0 means auto: derive the feather width from the
                # overlap, scaled into output pixels.
                if feather is None or feather <= 0:
                    feather_pixels_y = int(round(overlap * scale_y_global))
                    feather_pixels_x = int(round(overlap * scale_x_global))
                else:
                    feather_pixels_y = int(feather)
                    feather_pixels_x = int(feather)

                # Ramp the mask linearly from 1/feather to 1 across each edge,
                # clamped to half the tile so opposite ramps never overlap.
                if feather_pixels_y > 0:
                    feather_pixels_y = min(feather_pixels_y, tile_output.shape[2] // 2)
                    for t in range(feather_pixels_y):
                        weight_value = float(t + 1) / float(feather_pixels_y)
                        mask[:, :, t, :].mul_(weight_value)
                        mask[:, :, tile_output.shape[2] - 1 - t, :].mul_(weight_value)

                if feather_pixels_x > 0:
                    feather_pixels_x = min(feather_pixels_x, tile_output.shape[3] // 2)
                    for t in range(feather_pixels_x):
                        weight_value = float(t + 1) / float(feather_pixels_x)
                        mask[:, :, :, t].mul_(weight_value)
                        mask[:, :, :, tile_output.shape[3] - 1 - t].mul_(weight_value)

                out_y_end = out_y_start + tile_output.shape[2]
                out_x_end = out_x_start + tile_output.shape[3]

                output_for_batch[:, :, out_y_start:out_y_end, out_x_start:out_x_end] += (
                    tile_output * mask
                )
                weight_for_batch[:, :, out_y_start:out_y_end, out_x_start:out_x_end] += mask

                if pbar is not None:
                    pbar.update(1)

                # Stop once a tile has touched the far edge; advancing again
                # would re-process a sliver already covered by this tile and
                # overshoot the progress total from get_tiled_scale_steps.
                if x_end >= in_width:
                    break
                x_position += tile_step

            if y_end >= in_height:
                break
            y_position += tile_step

        # Guard against division by zero anywhere the mask never landed, then
        # normalize the accumulation by the summed mask weights.
        weight_for_batch = torch.where(
            weight_for_batch == 0.0,
            torch.ones_like(weight_for_batch),
            weight_for_batch,
        )
        output_for_batch = output_for_batch / weight_for_batch

        blended_output[batch_index : batch_index + 1] = output_for_batch

    return blended_output


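# Worked illustration of the blend normalization (assumed numbers, for
# intuition only): with a feather width of 4, the second row of an overlap
# gets weight (1 + 1) / 4 = 0.5 from the entering tile's top ramp and
# (4 - 1) / 4 = 0.75 from the previous tile's bottom ramp. The accumulators
# then hold 0.5 * b + 0.75 * a against a summed weight of 1.25, so the final
# division produces a 40/60 crossfade that shifts smoothly across the seam.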
class WASTiledImageUpscaleWithModel:
    @classmethod
    def INPUT_TYPES(cls):
        return {
            "required": {
                "upscale_model": ("UPSCALE_MODEL", {}),
                "image": ("IMAGE", {}),
                "upscale_factor": (
                    "FLOAT",
                    {
                        "default": 4.0,
                        "min": 1.0,
                        "max": 16.0,
                        "step": 0.1,
                        "tooltip": "Final scale relative to input image size. Output resolution ~= input * upscale_factor.",
                    },
                ),
                "tile_size": (
                    "INT",
                    {
                        "default": 512,
                        "min": 64,
                        "max": 4096,
                        "step": 16,
                        "tooltip": "Tile size in input pixels. Larger tiles are faster but use more VRAM.",
                    },
                ),
                "overlap": (
                    "INT",
                    {
                        "default": 32,
                        "min": 0,
                        "max": 1024,
                        "step": 1,
                        "tooltip": "Tile overlap in input pixels. Higher overlap reduces seams but increases compute.",
                    },
                ),
                "feather": (
                    "INT",
                    {
                        "default": 0,
                        "min": 0,
                        "max": 4096,
                        "step": 1,
                        "tooltip": "Feather width in output pixels for tile blending. 0 = auto from overlap.",
                    },
                ),
                "resample_method": (
                    [
                        "nearest-exact",
                        "bilinear",
                        "area",
                        "bicubic",
                        "lanczos",
                    ],
                    {
                        "default": "lanczos",
                        "tooltip": "Resampling kernel used to reach the final upscale_factor resolution.",
                    },
                ),
            }
        }

    RETURN_TYPES = ("IMAGE",)
    FUNCTION = "upscale"
    CATEGORY = "image/upscaling"

    def upscale(
        self,
        upscale_model,
        image,
        upscale_factor,
        tile_size,
        overlap,
        feather,
        resample_method,
    ):
        device = model_management.get_torch_device()

        scale_estimate = getattr(upscale_model, "scale", 4.0)
        element_size = image.element_size()

        # Rough VRAM estimate (model weights + per-tile activations + the
        # input image), mirroring the heuristic in ComfyUI's built-in
        # ImageUpscaleWithModel node.
        memory_required = model_management.module_size(upscale_model.model)
        memory_required += (
            tile_size * tile_size * 3
        ) * element_size * max(scale_estimate, 1.0) * 384.0
        memory_required += image.nelement() * element_size

        model_management.free_memory(memory_required, device)

        upscale_model.to(device)

        batch_size, in_h, in_w, _ = image.shape

        upscale_factor = float(upscale_factor)
        if upscale_factor < 1.0:
            upscale_factor = 1.0

        target_height = max(1, int(round(in_h * upscale_factor)))
        target_width = max(1, int(round(in_w * upscale_factor)))

        # IMAGE tensors are [B, H, W, C]; the model expects [B, C, H, W].
        input_image = image.movedim(-1, -3).to(device)

        current_tile_size = int(tile_size)
        minimum_tile_size = 64

        upscale_result = None
        # Accumulate the full-resolution canvas on the intermediate device so
        # a large output cannot itself exhaust VRAM during the retry loop.
        output_device = model_management.intermediate_device()

        oom = True
        last_exception = None

        # Retry with progressively smaller tiles on out-of-memory errors.
        while oom:
            try:
                steps = input_image.shape[0] * comfy.utils.get_tiled_scale_steps(
                    input_image.shape[3],
                    input_image.shape[2],
                    tile_x=current_tile_size,
                    tile_y=current_tile_size,
                    overlap=overlap,
                )
                progress = comfy.utils.ProgressBar(steps)

                upscale_result = dynamic_tiled_upscale_with_custom_feather(
                    samples=input_image,
                    function=lambda a: upscale_model(a),
                    tile_size=current_tile_size,
                    overlap=overlap,
                    output_device=output_device,
                    pbar=progress,
                    feather=feather,
                    target_height=target_height,
                    target_width=target_width,
                    resample_method=resample_method,
                )

                oom = False
            except model_management.OOM_EXCEPTION as exception:
                last_exception = exception
                current_tile_size //= 2
                if current_tile_size < minimum_tile_size:
                    upscale_model.to("cpu")
                    raise last_exception

        upscale_model.to("cpu")

        upscale_result = torch.clamp(
            upscale_result.movedim(-3, -1), min=0.0, max=1.0
        )

        return (upscale_result,)


NODE_CLASS_MAPPINGS = {
    "WASTiledImageUpscaleWithModel": WASTiledImageUpscaleWithModel,
}

NODE_DISPLAY_NAME_MAPPINGS = {
    "WASTiledImageUpscaleWithModel": "Tiled Image Upscale (With Model)",
}
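

# Minimal smoke test of the tiling helper, assuming an identity function as a
# hypothetical stand-in for a real upscale model (illustration only; running
# this file directly still requires the ComfyUI environment for the imports
# above). With matching input and target sizes every tile keeps its shape, so
# only the feather/normalization path is exercised and the output should
# round-trip to the input.
if __name__ == "__main__":
    x = torch.rand(1, 3, 96, 96)
    out = dynamic_tiled_upscale_with_custom_feather(
        samples=x,
        function=lambda t: t,  # identity stand-in for upscale_model(...)
        tile_size=64,
        overlap=16,
        target_height=96,
        target_width=96,
    )
    assert out.shape == (1, 3, 96, 96)
    assert torch.allclose(out, x, atol=1e-5)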