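fix: share the Python preprocessing pipeline between adapters and use it for NPU devices in the OpenVINO adapter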

mgumowsk · mgumowsk · commit 6774f62dcd56 · 2025-10-02T12:36:21.000+02:00
diff --git a/src/model_api/adapters/onnx_adapter.py b/src/model_api/adapters/onnx_adapter.py
@@ -1,17 +1,16 @@
 #
-# Copyright (C) 2020-2024 Intel Corporation
+# Copyright (C) 2020-2025 Intel Corporation
 # SPDX-License-Identifier: Apache-2.0
 #
 
 from __future__ import annotations
 
 import sys
-from functools import partial, reduce
 from typing import Any, Callable
 
 import numpy as np
 
-from .utils import INTERPOLATION_TYPES, RESIZE_TYPES, InputTransform
+from .utils import setup_python_preprocessing_pipeline
 
 try:
     import onnx
@@ -145,30 +144,17 @@ def embed_preprocessing(
         """
         Adds external preprocessing steps done before ONNX model execution.
         """
-        preproc_funcs = [np.squeeze]
-        if resize_mode != "crop":
-            if resize_mode == "fit_to_window_letterbox":
-                resize_fn = partial(
-                    RESIZE_TYPES[resize_mode],
-                    size=target_shape,
-                    interpolation=INTERPOLATION_TYPES[interpolation_mode],
-                    pad_value=pad_value,
-                )
-            else:
-                resize_fn = partial(
-                    RESIZE_TYPES[resize_mode],
-                    size=target_shape,
-                    interpolation=INTERPOLATION_TYPES[interpolation_mode],
-                )
-        else:
-            resize_fn = partial(RESIZE_TYPES[resize_mode], size=target_shape)
-        preproc_funcs.append(resize_fn)
-        input_transform = InputTransform(brg2rgb, mean, scale)
-        preproc_funcs.extend((input_transform.__call__, partial(change_layout, layout=layout)))
-
-        self.preprocessor = reduce(
-            lambda f, g: lambda x: f(g(x)),
-            reversed(preproc_funcs),
+        self.preprocessor = setup_python_preprocessing_pipeline(
+            layout=layout,
+            resize_mode=resize_mode,
+            interpolation_mode=interpolation_mode,
+            target_shape=target_shape,
+            pad_value=pad_value,
+            dtype=dtype,
+            brg2rgb=brg2rgb,
+            mean=mean,
+            scale=scale,
+            input_idx=input_idx,
         )
 
     def get_model(self):
@@ -227,18 +213,3 @@ def get_shape_from_onnx(onnx_shape):
         if isinstance(item, str):
             onnx_shape[i] = -1
     return tuple(onnx_shape)
-
-
-def change_layout(image, layout):
-    """Changes the input image layout to fit the layout of the model input layer.
-
-    Args:
-        inputs (ndarray): a single image as 3D array in HWC layout
-
-    Returns:
-        - the image with layout aligned with the model layout
-    """
-    if "CHW" in layout:
-        image = image.transpose((2, 0, 1))  # HWC->CHW
-        image = image.reshape((1, *image.shape))
-    return image
diff --git a/src/model_api/adapters/openvino_adapter.py b/src/model_api/adapters/openvino_adapter.py
@@ -41,6 +41,7 @@
     resize_image,
     resize_image_letterbox,
     resize_image_with_aspect,
+    setup_python_preprocessing_pipeline,
 )
 
 
@@ -143,6 +144,8 @@ def __init__(
         )
         self.is_onnx_file = False
         self.onnx_metadata = {}
+        self.preprocessor = lambda arg: arg
+        self.use_python_preprocessing = False
 
         if isinstance(self.model_path, (str, Path)):
             if Path(self.model_path).suffix == ".onnx" and weights_path:
@@ -280,11 +283,17 @@ def copy_raw_result(self, request):
         return {key: request.get_tensor(key).data.copy() for key in self.get_output_layers()}
 
     def infer_sync(self, dict_data: dict[str, ndarray]) -> dict[str, ndarray]:
+        if self.use_python_preprocessing:
+            # Build a new dict so the caller's inputs are not overwritten in place.
+            dict_data = {key: self.preprocessor(value) for key, value in dict_data.items()}
         self.infer_request = self.async_queue[self.async_queue.get_idle_request_id()]
         self.infer_request.infer(dict_data)
         return self.get_raw_result(self.infer_request)
 
     def infer_async(self, dict_data, callback_data) -> None:
+        if self.use_python_preprocessing:
+            # Build a new dict so the caller's inputs are not overwritten in place.
+            dict_data = {key: self.preprocessor(value) for key, value in dict_data.items()}
         self.async_queue.start_async(dict_data, callback_data)
 
     def set_callback(self, callback_fn: Callable):
@@ -347,8 +356,26 @@ def embed_preprocessing(
         input_idx: int = 0,
     ) -> None:
         """
-        Embeds OpenVINO PrePostProcessor module into the model.
+        Embeds preprocessing into the model, or sets up Python preprocessing for NPU devices.
         """
+        # Check if we should use Python preprocessing for NPU devices
+        devices = parse_devices(self.device)
+        if any("NPU" in dev.upper() for dev in devices):
+            self.preprocessor = setup_python_preprocessing_pipeline(
+                layout=layout,
+                resize_mode=resize_mode,
+                interpolation_mode=interpolation_mode,
+                target_shape=target_shape,
+                pad_value=pad_value,
+                dtype=dtype,
+                brg2rgb=brg2rgb,
+                mean=mean,
+                scale=scale,
+                input_idx=input_idx,
+            )
+            self.use_python_preprocessing = True
+            return
+
         ppp = PrePostProcessor(self.model)
 
         # Change the input type to the 8-bit image
diff --git a/src/model_api/adapters/utils.py b/src/model_api/adapters/utils.py
@@ -517,6 +517,81 @@ def crop_resize_ocv(image: np.ndarray, size: tuple[int, int]) -> np.ndarray:
     return cv2.resize(cropped_frame, size)
 
 
+def setup_python_preprocessing_pipeline(
+    layout: str,
+    resize_mode: str,
+    interpolation_mode: str,
+    target_shape: tuple[int, ...],
+    pad_value: int,
+    dtype: type = int,
+    brg2rgb: bool = False,
+    mean: list[Any] | None = None,
+    scale: list[Any] | None = None,
+    input_idx: int = 0,
+) -> Callable:
+    """
+    Builds a Python preprocessing callable for model adapters.
+
+    The callable applies, in order: ``np.squeeze``, the resize selected by
+    ``resize_mode``, ``InputTransform(brg2rgb, mean, scale)`` and ``change_layout``.
+
+    Args:
+        layout: Target layout for the input (e.g., "NCHW", "NHWC")
+        resize_mode: Key of ``RESIZE_TYPES`` ("crop", "standard", "fit_to_window", "fit_to_window_letterbox")
+        interpolation_mode: Key of ``INTERPOLATION_TYPES``; not looked up when ``resize_mode`` is "crop"
+        target_shape: Target size, passed to the resize function as ``size``
+        pad_value: Padding value, passed only to the "fit_to_window_letterbox" resize
+        dtype: Not used by this pipeline; kept for interface compatibility
+        brg2rgb: Whether to convert BGR to RGB
+        mean: Mean values for normalization
+        scale: Scale values for normalization
+        input_idx: Not used by this pipeline; kept for interface compatibility
+
+    Returns:
+        Callable: A preprocessing function that can be applied to input data
+
+    Raises:
+        KeyError: If ``resize_mode`` is not a key of ``RESIZE_TYPES``
+    """
+    from functools import partial
+
+    resize_impl = RESIZE_TYPES[resize_mode]
+    # "crop" takes only the target size; other modes also take the interpolation,
+    # and only the letterbox mode accepts a padding value.
+    resize_kwargs = {"size": target_shape}
+    if resize_mode != "crop":
+        resize_kwargs["interpolation"] = INTERPOLATION_TYPES[interpolation_mode]
+    if resize_mode == "fit_to_window_letterbox":
+        resize_kwargs["pad_value"] = pad_value
+
+    input_transform = InputTransform(brg2rgb, mean, scale)
+    steps = (np.squeeze, partial(resize_impl, **resize_kwargs), input_transform, partial(change_layout, layout=layout))
+
+    def preprocess(data):
+        """Runs every preprocessing step on ``data`` in pipeline order."""
+        for step in steps:
+            data = step(data)
+        return data
+
+    return preprocess
+
+
+def change_layout(image, layout):
+    """Rearranges an image so that it matches the layout of the model input layer.
+
+    Args:
+        image (ndarray): a single image as 3D array in HWC layout
+        layout (str): target layout; the image is altered only when it contains "CHW"
+
+    Returns:
+        ndarray: the CHW image with a leading axis of size 1, or the input unchanged
+    """
+    if "CHW" not in layout:
+        return image
+    chw_image = image.transpose((2, 0, 1))  # HWC->CHW
+    return chw_image.reshape((1, *chw_image.shape))  # prepend the batch axis
+
+
 RESIZE_TYPES: dict[str, Callable] = {
     "crop": crop_resize_ocv,
     "standard": resize_image_ocv,