diff --git a/.github/workflows/test_accuracy.yml b/.github/workflows/test_accuracy.yml index 0ce9dc10..37e81794 100644 --- a/.github/workflows/test_accuracy.yml +++ b/.github/workflows/test_accuracy.yml @@ -42,17 +42,8 @@ jobs: mkdir build && cd build pip install nanobind==2.4.0 pip install typing_extensions==4.12.2 - cmake ../tests/cpp/accuracy/ + cmake ../tests/cpp make -j - - name: Build CPP-PY Bindings - run: | - source venv/bin/activate - pip install src/cpp/py_bindings - name: Run CPP Test run: | build/test_accuracy -d data -p tests/python/accuracy/public_scope.json - - name: Run CPP-PY Bindings Test - run: | - source venv/bin/activate - pip list - pytest --data=./data --config=./tests/python/accuracy/public_scope.json tests/cpp/accuracy/test_bindings.py diff --git a/.github/workflows/test_precommit.yml b/.github/workflows/test_precommit.yml index 5ae39dcb..45961b40 100644 --- a/.github/workflows/test_precommit.yml +++ b/.github/workflows/test_precommit.yml @@ -47,81 +47,6 @@ jobs: github_token: ${{ secrets.GITHUB_TOKEN}} # missingInclude: cppcheck can't find stl, openvino, opencv other_options: --suppress=missingInclude -Isrc/cpp/models/include -Isrc/cpp/utils/include -Isrc/cpp/pipelines/include --check-config - CPP-Precommit: - runs-on: ubuntu-22.04 - steps: - - uses: actions/checkout@v3 - - uses: actions/setup-python@v4 - with: - python-version: "3.10" - cache: pip - - name: Create and start a virtual environment - run: | - python -m venv venv - source venv/bin/activate - - name: Install dependencies - run: | - source venv/bin/activate - python -m pip install --upgrade pip - pip install src/python/[tests,build] --extra-index-url https://download.pytorch.org/whl/cpu - - sudo bash src/cpp/install_dependencies.sh - - name: Prepare test data - run: | - source venv/bin/activate - python tests/cpp/precommit/prepare_data.py -d data -p tests/cpp/precommit/public_scope.json - - name: Build - run: | - mkdir build && cd build - pip install nanobind==2.4.0 - pip 
install typing_extensions==4.12.2 - cmake ../tests/cpp/precommit/ - cmake --build . -j $((`nproc`*2+2)) - - name: Run test - run: | - build/test_sanity -d data -p tests/cpp/precommit/public_scope.json && build/test_model_config -d data - CPP-Windows-Precommit: - runs-on: windows-latest - steps: - - uses: actions/checkout@v3 - - uses: actions/setup-python@v4 - with: - python-version: 3.9 - cache: pip - - name: Create and start a virtual environment - shell: bash - run: | - python -m venv venv - source venv/Scripts/activate - - name: Install dependencies - shell: bash - run: | - source venv/Scripts/activate - python -m pip install --upgrade pip - pip install src/python/[tests,build] --extra-index-url https://download.pytorch.org/whl/cpu - curl https://storage.openvinotoolkit.org/repositories/openvino/packages/2024.6/windows/w_openvino_toolkit_windows_2024.6.0.17404.4c0f47d2335_x86_64.zip --output w_openvino_toolkit_windows.zip - unzip w_openvino_toolkit_windows.zip - rm w_openvino_toolkit_windows.zip - curl -L https://github.com/opencv/opencv/releases/download/4.10.0/opencv-4.10.0-windows.exe --output opencv-4.10.0-windows.exe - ./opencv-4.10.0-windows.exe -oopencv -y - rm opencv-4.10.0-windows.exe - - name: Prepare test data - shell: bash - run: | - source venv/Scripts/activate - python tests/cpp/precommit/prepare_data.py -d data -p tests/cpp/precommit/public_scope.json - - name: Build - shell: bash - run: | - mkdir build && cd build - MSYS_NO_PATHCONV=1 cmake ../examples/cpp/ -DOpenVINO_DIR=$GITHUB_WORKSPACE/w_openvino_toolkit_windows_2024.6.0.17404.4c0f47d2335_x86_64/runtime/cmake -DOpenCV_DIR=$GITHUB_WORKSPACE/opencv/opencv/build -DCMAKE_CXX_FLAGS=/WX - cmake --build . --config Release -j $((`nproc`*2+2)) - - name: Run sync sample - shell: cmd - # .\w_openvino_toolkit_windows_2023.0.0.10926.b4452d56304_x86_64\setupvars.bat exits with 0 code without moving to a next command. 
Set PATH manually - run: | - set PATH=opencv\opencv\build\x64\vc16\bin;w_openvino_toolkit_windows_2024.6.0.17404.4c0f47d2335_x86_64\runtime\bin\intel64\Release;w_openvino_toolkit_windows_2024.6.0.17404.4c0f47d2335_x86_64\runtime\3rdparty\tbb\bin;%PATH% - .\build\Release\synchronous_api.exe .\data\otx_models\detection_model_with_xai_head.xml .\data\BloodImage_00007.jpg serving_api: strategy: fail-fast: false diff --git a/examples/cpp/CMakeLists.txt b/examples/cpp/CMakeLists.txt index fe22571f..f2e10985 100644 --- a/examples/cpp/CMakeLists.txt +++ b/examples/cpp/CMakeLists.txt @@ -94,5 +94,4 @@ find_package(OpenCV REQUIRED COMPONENTS imgcodecs) add_subdirectory(../../src/cpp ${Samples_BINARY_DIR}/src/cpp) -add_example(NAME asynchronous_api SOURCES ./asynchronous_api/main.cpp DEPENDENCIES model_api) -add_example(NAME synchronous_api SOURCES ./synchronous_api/main.cpp DEPENDENCIES model_api) +add_example(NAME synchronous_api SOURCES ./main.cpp DEPENDENCIES model_api) diff --git a/examples/cpp/synchronous_api/README.md b/examples/cpp/README.md similarity index 100% rename from examples/cpp/synchronous_api/README.md rename to examples/cpp/README.md diff --git a/examples/cpp/asynchronous_api/README.md b/examples/cpp/asynchronous_api/README.md deleted file mode 100644 index 88e44483..00000000 --- a/examples/cpp/asynchronous_api/README.md +++ /dev/null @@ -1,55 +0,0 @@ -# Synchronous API example - -This example demonstrates how to use a C++ API of OpenVINO Model API for asynchronous inference and its basic steps: - -- Instantiate a model -- Set a callback to grab inference results -- Model inference -- Model batch inference -- Process results of the batch inference - -## Prerequisites - -- Install third party dependencies by running the following script: - - ```bash - chmod +x ../../../src/cpp/install_dependencies.sh - sudo ../../../src/cpp/install_dependencies.sh - ``` - -- Build example: - - - Create `build` folder and navigate into it: - - ```bash - mkdir build && cd 
build - ``` - - - Run cmake: - - ```bash - cmake ../ - ``` - - - Build: - - ```bash - make -j - ``` - -- Download a model by running a Python code with Model API, see Python [example](../../python/asynchronous_api/README.md): - - ```python - from model_api.models import DetectionModel - - model = DetectionModel.create_model("ssd_mobilenet_v1_fpn_coco", - download_dir="tmp") - ``` - -## Run example - -To run the example, please execute the following command: - -```bash -./asynchronous_api ./tmp/public/ssd_mobilenet_v1_fpn_coco/FP16/ssd_mobilenet_v1_fpn_coco.xml -``` diff --git a/examples/cpp/asynchronous_api/main.cpp b/examples/cpp/asynchronous_api/main.cpp deleted file mode 100644 index f8edc2cc..00000000 --- a/examples/cpp/asynchronous_api/main.cpp +++ /dev/null @@ -1,88 +0,0 @@ -/* - * Copyright (C) 2020-2024 Intel Corporation - * SPDX-License-Identifier: Apache-2.0 - */ -#include -#include -#include -#include - -#include -#include -#include -#include -#include -#include -#include -#include -#include - -int main(int argc, char* argv[]) try { - if (argc != 3) { - throw std::runtime_error(std::string{"Usage: "} + argv[0] + " "); - } - - cv::Mat image = cv::imread(argv[2]); - cv::cvtColor(image, image, cv::COLOR_BGR2RGB); - - if (!image.data) { - throw std::runtime_error{"Failed to read the image"}; - } - - // Instantiate Object Detection model - auto model = DetectionModel::create_model(argv[1], - {}, - "", - false); // works with SSD models. Download it using Python Model API - // Define number of parallel infer requests. Is this number is set to 0, OpenVINO will determine it automatically to - // obtain optimal performance. 
- size_t num_requests = 0; - static ov::Core core; - model->load(core, "CPU", num_requests); - - std::cout << "Async inference will be carried out by " << model->getNumAsyncExecutors() << " parallel executors\n"; - // Prepare batch data - std::vector data; - for (size_t i = 0; i < 3; i++) { - data.push_back(ImageInputData(image)); - } - - // Batch inference is done by processing batch with num_requests parallel infer requests - std::cout << "Starting batch inference\n"; - auto results = model->inferBatch(data); - - std::cout << "Batch mode inference results:\n"; - for (const auto& result : results) { - for (auto& obj : result->objects) { - std::cout << " " << std::left << std::setw(9) << obj.confidence << " " << obj.label << "\n"; - } - std::cout << std::string(10, '-') << "\n"; - } - std::cout << "Batch mode inference done\n"; - std::cout << "Async mode inference results:\n"; - - // Set callback to grab results once the inference is done - model->setCallback([](std::unique_ptr result, const ov::AnyMap& callback_args) { - auto det_result = std::unique_ptr(static_cast(result.release())); - - // callback_args can contain arbitrary data - size_t id = callback_args.find("id")->second.as(); - - std::cout << "Request with id " << id << " is finished\n"; - for (auto& obj : det_result->objects) { - std::cout << " " << std::left << std::setw(9) << obj.confidence << " " << obj.label << "\n"; - } - std::cout << std::string(10, '-') << "\n"; - }); - - for (size_t i = 0; i < 3; i++) { - model->inferAsync(image, {{"id", i}}); - } - model->awaitAll(); -} catch (const std::exception& error) { - std::cerr << error.what() << '\n'; - return 1; -} catch (...) 
{ - std::cerr << "Non-exception object thrown\n"; - return 1; -} diff --git a/examples/cpp/synchronous_api/main.cpp b/examples/cpp/main.cpp similarity index 78% rename from examples/cpp/synchronous_api/main.cpp rename to examples/cpp/main.cpp index 1f79a035..47d2eaf9 100644 --- a/examples/cpp/synchronous_api/main.cpp +++ b/examples/cpp/main.cpp @@ -1,12 +1,11 @@ /* - * Copyright (C) 2020-2024 Intel Corporation + * Copyright (C) 2020-2025 Intel Corporation * SPDX-License-Identifier: Apache-2.0 */ -#include -#include -#include #include +#include +#include #include #include @@ -31,13 +30,13 @@ int main(int argc, char* argv[]) try { } // Instantiate Object Detection model - auto model = DetectionModel::create_model(argv[1]); // works with SSD models. Download it using Python Model API + auto model = DetectionModel::load(argv[1], {}); // works with SSD models. Download it using Python Model API // Run the inference - auto result = model->infer(image); + auto result = model.infer(image); // Process detections - for (auto& obj : result->objects) { + for (auto& obj : result.objects) { std::cout << " " << std::left << std::setw(9) << obj.label << " | " << std::setw(10) << obj.confidence << " | " << std::setw(4) << int(obj.x) << " | " << std::setw(4) << int(obj.y) << " | " << std::setw(4) << int(obj.x + obj.width) << " | " << std::setw(4) << int(obj.y + obj.height) << "\n"; diff --git a/examples/python/asynchronous_api/run.py b/examples/python/asynchronous_api/run.py index 8385b2a9..f0667a3e 100644 --- a/examples/python/asynchronous_api/run.py +++ b/examples/python/asynchronous_api/run.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 # -# Copyright (C) 2020-2024 Intel Corporation +# Copyright (C) 2020-2025 Intel Corporation # SPDX-License-Identifier: Apache-2.0 # diff --git a/examples/python/serving_api/run.py b/examples/python/serving_api/run.py index 99299164..213029dc 100755 --- a/examples/python/serving_api/run.py +++ b/examples/python/serving_api/run.py @@ -1,6 +1,6 @@ 
#!/usr/bin/env python3 # -# Copyright (C) 2020-2024 Intel Corporation +# Copyright (C) 2020-2025 Intel Corporation # SPDX-License-Identifier: Apache-2.0 # diff --git a/examples/python/synchronous_api/run.py b/examples/python/synchronous_api/run.py index 3f3d6806..d45dd03a 100755 --- a/examples/python/synchronous_api/run.py +++ b/examples/python/synchronous_api/run.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 # -# Copyright (C) 2020-2024 Intel Corporation +# Copyright (C) 2020-2025 Intel Corporation # SPDX-License-Identifier: Apache-2.0 # diff --git a/examples/python/visual_prompting/run.py b/examples/python/visual_prompting/run.py index 793e1504..0eab9175 100644 --- a/examples/python/visual_prompting/run.py +++ b/examples/python/visual_prompting/run.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 # -# Copyright (C) 2020-2024 Intel Corporation +# Copyright (C) 2020-2025 Intel Corporation # SPDX-License-Identifier: Apache-2.0 # diff --git a/examples/python/zsl_visual_prompting/run.py b/examples/python/zsl_visual_prompting/run.py index 439c1765..9873e6f3 100644 --- a/examples/python/zsl_visual_prompting/run.py +++ b/examples/python/zsl_visual_prompting/run.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 # -# Copyright (C) 2020-2024 Intel Corporation +# Copyright (C) 2020-2025 Intel Corporation # SPDX-License-Identifier: Apache-2.0 # diff --git a/src/cpp/CMakeLists.txt b/src/cpp/CMakeLists.txt index 880f211a..215bf2aa 100644 --- a/src/cpp/CMakeLists.txt +++ b/src/cpp/CMakeLists.txt @@ -1,106 +1,24 @@ -# Copyright (C) 2018-2025 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 -# - cmake_minimum_required(VERSION 3.26) -# Multi config generators such as Visual Studio ignore CMAKE_BUILD_TYPE. 
Multi config generators are configured with -# CMAKE_CONFIGURATION_TYPES, but limiting options in it completely removes such build options -get_property(GENERATOR_IS_MULTI_CONFIG_VAR GLOBAL PROPERTY GENERATOR_IS_MULTI_CONFIG) -if(NOT GENERATOR_IS_MULTI_CONFIG_VAR AND NOT DEFINED CMAKE_BUILD_TYPE) - message(STATUS "CMAKE_BUILD_TYPE not defined, 'Release' will be used") - # Setting CMAKE_BUILD_TYPE as CACHE must go before project(). Otherwise project() sets its value and set() doesn't take an effect - set(CMAKE_BUILD_TYPE Release CACHE STRING "Choose the type of build, options are: None Debug Release RelWithDebInfo MinSizeRel ...") -endif() - -set(model_api_VERSION 0.0.0) +set(vision_api_VERSION 0.0.0) -project(model_api - VERSION ${model_api_VERSION} +project(vision_api + VERSION ${vision_api_VERSION} DESCRIPTION "OpenVINO Vision API" HOMEPAGE_URL "https://github.com/openvinotoolkit/model_api/" LANGUAGES CXX C) -if(WIN32) - if(NOT "${CMAKE_SIZEOF_VOID_P}" EQUAL "8") - message(FATAL_ERROR "Only 64-bit supported on Windows") - endif() - - add_definitions(-DNOMINMAX) -endif() - find_package(OpenCV REQUIRED COMPONENTS core imgproc) find_package(OpenVINO REQUIRED COMPONENTS Runtime Threading) -include(FetchContent) -FetchContent_Declare(json GIT_REPOSITORY https://github.com/nlohmann/json.git - GIT_TAG d41ca94fa85d5119852e2f7a3f94335cc7cb0486 # PR #4709, fixes cmake deprecation warnings - ) -FetchContent_MakeAvailable(json) - -file(GLOB MODELS_SOURCES ./models/src/*.cpp) -file(GLOB MODELS_HEADERS ./models/include/models/*.h) -file(GLOB_RECURSE UTILS_HEADERS ./utils/include/*) -file(GLOB_RECURSE UTILS_SOURCES ./utils/src/*.cpp) -file(GLOB_RECURSE ADAPTERS_HEADERS ./adapters/include/*) -file(GLOB_RECURSE ADAPTERS_SOURCES ./adapters/src/*.cpp) -file(GLOB_RECURSE TILERS_HEADERS ./tilers/include/tilers/*.h) -file(GLOB_RECURSE TILERS_SOURCES ./tilers/src/*.cpp) +file(GLOB TASK_SOURCES src/tasks/**/*.cpp) +file(GLOB TASKS_SOURCES src/tasks/*.cpp) +file(GLOB UTILS_SOURCES 
src/utils/*.cpp) +file(GLOB ADAPTERS_SOURCES src/adapters/*.cpp) -# Create named folders for the sources within the .vcproj -# Empty name lists them directly under the .vcproj -source_group("models/src" FILES ${MODELS_SOURCES}) -source_group("models/include" FILES ${MODELS_HEADERS}) -source_group("utils/src" FILES ${UTILS_SOURCES}) -source_group("utils/include" FILES ${UTILS_HEADERS}) -source_group("adapters/src" FILES ${ADAPTERS_SOURCES}) -source_group("adapters/include" FILES ${ADAPTERS_HEADERS}) -source_group("tilers/src" FILES ${TILERS_SOURCES}) -source_group("tilers/include" FILES ${TILERS_HEADERS}) +add_library(model_api STATIC ${TASK_SOURCES} ${TASKS_SOURCES} ${UTILS_SOURCES} ${ADAPTERS_SOURCES} ${TILERS_SOURCES}) -add_library(model_api STATIC ${MODELS_SOURCES} ${UTILS_SOURCES} ${ADAPTERS_SOURCES} ${TILERS_SOURCES}) -target_include_directories(model_api PUBLIC "$" "$" "$" "$" "$") target_link_libraries(model_api PUBLIC openvino::runtime opencv_core opencv_imgproc) -target_link_libraries(model_api PRIVATE $) -set_target_properties(model_api PROPERTIES CXX_STANDARD 17) -set_target_properties(model_api PROPERTIES CXX_STANDARD_REQUIRED ON) -if(MSVC) - target_compile_options(model_api PRIVATE /wd4251 /wd4275 /wd4267 # disable some warnings - /W3 # Specify the level of warnings to be generated by the compiler - /EHsc) # Enable standard C++ stack unwinding, assume functions with extern "C" never throw -elseif(CMAKE_CXX_COMPILER_ID MATCHES "^GNU|(Apple)?Clang$") - target_compile_options(model_api PRIVATE -Wall -Wextra -Wpedantic) - set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fPIC") -endif() - -include(GenerateExportHeader) - -generate_export_header(model_api) -set_property(TARGET model_api PROPERTY VERSION ${model_api_VERSION}) -set_property(TARGET model_api PROPERTY SOVERSION 3) -set_property(TARGET model_api PROPERTY INTERFACE_model_api_MAJOR_VERSION 3) -set_property(TARGET model_api APPEND PROPERTY COMPATIBLE_INTERFACE_STRING model_api_MAJOR_VERSION) - 
-install(TARGETS model_api EXPORT model_apiTargets - LIBRARY DESTINATION lib COMPONENT Devel - ARCHIVE DESTINATION lib COMPONENT Devel - RUNTIME DESTINATION bin COMPONENT Devel - INCLUDES DESTINATION include) -install(DIRECTORY "${CMAKE_CURRENT_SOURCE_DIR}/models/include/" "${CMAKE_CURRENT_SOURCE_DIR}/utils/include/" "${CMAKE_CURRENT_SOURCE_DIR}/adapters/include/" "${CMAKE_CURRENT_SOURCE_DIR}/tilers/include/" - DESTINATION include COMPONENT Devel) - -include(CMakePackageConfigHelpers) -write_basic_package_version_file("${CMAKE_CURRENT_BINARY_DIR}/model_apiConfigVersion.cmake" VERSION ${model_api_VERSION} COMPATIBILITY AnyNewerVersion) - -export(EXPORT model_apiTargets FILE "${CMAKE_CURRENT_BINARY_DIR}/model_apiTargets.cmake") -configure_file(cmake/model_apiConfig.cmake "${CMAKE_CURRENT_BINARY_DIR}/model_apiConfig.cmake" COPYONLY) - -set(ConfigPackageLocation lib/cmake/model_api) -install(EXPORT model_apiTargets FILE model_apiTargets.cmake DESTINATION ${ConfigPackageLocation}) -install(FILES cmake/model_apiConfig.cmake "${CMAKE_CURRENT_BINARY_DIR}/model_apiConfigVersion.cmake" - DESTINATION ${ConfigPackageLocation} COMPONENT Devel) - -set(CPACK_PACKAGE_VERSION ${model_api_VERSION}) -include(CPack) +target_include_directories(model_api PUBLIC ${PROJECT_SOURCE_DIR}/include) diff --git a/src/cpp/cmake/model_apiConfig.cmake b/src/cpp/cmake/model_apiConfig.cmake deleted file mode 100644 index 570679ce..00000000 --- a/src/cpp/cmake/model_apiConfig.cmake +++ /dev/null @@ -1,7 +0,0 @@ -include(CMakeFindDependencyMacro) -find_dependency(OpenCV COMPONENTS core imgproc) -find_dependency(OpenVINO COMPONENTS Runtime) - -include("${CMAKE_CURRENT_LIST_DIR}/model_apiTargets.cmake") - -check_required_components() diff --git a/src/cpp/adapters/include/adapters/inference_adapter.h b/src/cpp/include/adapters/inference_adapter.h similarity index 97% rename from src/cpp/adapters/include/adapters/inference_adapter.h rename to src/cpp/include/adapters/inference_adapter.h index 
8d28e84e..9911f655 100644 --- a/src/cpp/adapters/include/adapters/inference_adapter.h +++ b/src/cpp/include/adapters/inference_adapter.h @@ -1,5 +1,5 @@ /* - * Copyright (C) 2020-2024 Intel Corporation + * Copyright (C) 2020-2025 Intel Corporation * SPDX-License-Identifier: Apache-2.0 */ diff --git a/src/cpp/adapters/include/adapters/openvino_adapter.h b/src/cpp/include/adapters/openvino_adapter.h similarity index 95% rename from src/cpp/adapters/include/adapters/openvino_adapter.h rename to src/cpp/include/adapters/openvino_adapter.h index 7e1db1ac..7713ae93 100644 --- a/src/cpp/adapters/include/adapters/openvino_adapter.h +++ b/src/cpp/include/adapters/openvino_adapter.h @@ -1,5 +1,5 @@ /* - * Copyright (C) 2020-2024 Intel Corporation + * Copyright (C) 2020-2025 Intel Corporation * SPDX-License-Identifier: Apache-2.0 */ @@ -12,7 +12,7 @@ #include #include "adapters/inference_adapter.h" -#include "utils/async_infer_queue.hpp" +#include "utils/async_infer_queue.h" class OpenVINOInferenceAdapter : public InferenceAdapter { public: @@ -46,7 +46,9 @@ class OpenVINOInferenceAdapter : public InferenceAdapter { // Depends on the implementation details but we should share the model state in this class std::vector inputNames; std::vector outputNames; - ov::CompiledModel compiledModel; std::unique_ptr asyncQueue; ov::AnyMap modelConfig; // the content of model_info section of rt_info + +public: + ov::CompiledModel compiledModel; }; diff --git a/src/cpp/include/tasks/detection.h b/src/cpp/include/tasks/detection.h new file mode 100644 index 00000000..e5405133 --- /dev/null +++ b/src/cpp/include/tasks/detection.h @@ -0,0 +1,77 @@ +/* + * Copyright (C) 2020-2025 Intel Corporation + * SPDX-License-Identifier: Apache-2.0 + */ + +#pragma once + +#include +#include +#include + +#include "adapters/inference_adapter.h" +#include "tasks/detection/ssd.h" +#include "tasks/results.h" +#include "utils/tiling.h" +#include "utils/vision_pipeline.h" + +class DetectionModel { +public: + 
std::unique_ptr> pipeline; + + DetectionModel(std::unique_ptr algorithm, const ov::AnyMap& configuration) : algorithm(std::move(algorithm)) { + auto config = this->algorithm->adapter->getModelConfig(); + if (configuration.count("tiling") && configuration.at("tiling").as()) { + if (!utils::config_contains_tiling_info(config)) { + throw std::runtime_error("Model config does not contain tiling properties."); + } + pipeline = std::make_unique>( + this->algorithm->adapter, + utils::get_tiling_info_from_config(config), + [&](cv::Mat image) { + return preprocess(image); + }, + [&](InferenceResult result) { + return postprocess(result); + }, + [&](DetectionResult& result, const cv::Rect& coord) { + return postprocess_tile(result, coord); + }, + [&](const std::vector& tiles_results, + const cv::Size& image_size, + const std::vector& tile_coords, + const utils::TilingInfo& tiling_info) { + return merge_tiling_results(tiles_results, image_size, tile_coords, tiling_info); + }); + } else { + pipeline = std::make_unique>( + this->algorithm->adapter, + [&](cv::Mat image) { + return preprocess(image); + }, + [&](InferenceResult result) { + return postprocess(result); + }); + } + } + + InferenceInput preprocess(cv::Mat); + DetectionResult postprocess(InferenceResult); + DetectionResult postprocess_tile(DetectionResult& result, const cv::Rect& coord); + DetectionResult merge_tiling_results(const std::vector& tiles_results, + const cv::Size& image_size, + const std::vector& tile_coords, + const utils::TilingInfo& tiling_info); + ov::Tensor merge_saliency_maps(const std::vector& tiles_results, + const cv::Size& image_size, + const std::vector& tile_coords, + const utils::TilingInfo& tiling_info); + + static DetectionModel load(const std::string& model_path, const ov::AnyMap& configuration = {}); + + DetectionResult infer(cv::Mat image); + std::vector inferBatch(std::vector image); + +private: + std::unique_ptr algorithm; +}; diff --git a/src/cpp/include/tasks/detection/ssd.h 
b/src/cpp/include/tasks/detection/ssd.h new file mode 100644 index 00000000..a51311f9 --- /dev/null +++ b/src/cpp/include/tasks/detection/ssd.h @@ -0,0 +1,60 @@ +/* + * Copyright (C) 2020-2025 Intel Corporation + * SPDX-License-Identifier: Apache-2.0 + */ + +#pragma once + +#include + +#include "adapters/inference_adapter.h" +#include "tasks/results.h" +#include "utils/config.h" +#include "utils/preprocessing.h" + +enum SSDOutputMode { single, multi }; + +class NumAndStep { +public: + size_t detectionsNum, objectSize; + + static inline NumAndStep fromSingleOutput(const ov::Shape& shape); + static inline NumAndStep fromMultipleOutputs(const ov::Shape& boxesShape); +}; + +constexpr float box_area_threshold = 1.0f; + +class SSD { +public: + std::shared_ptr adapter; + + SSD(std::shared_ptr adapter, cv::Size input_shape) : adapter(adapter), input_shape(input_shape) { + auto config = adapter->getModelConfig(); + labels = utils::get_from_any_maps("labels", config, {}, labels); + confidence_threshold = utils::get_from_any_maps("confidence_threshold", config, {}, confidence_threshold); + } + std::map preprocess(cv::Mat); + DetectionResult postprocess(InferenceResult& infResult); + + static cv::Size serialize(std::shared_ptr ov_model); + + SSDOutputMode output_mode; + +private: + static void prepareSingleOutput(std::shared_ptr ov_model); + static void prepareMultipleOutputs(std::shared_ptr ov_model); + + DetectionResult postprocessSingleOutput(InferenceResult& infResult); + DetectionResult postprocessMultipleOutputs(InferenceResult& infResult); + + float confidence_threshold = 0.5f; + + std::vector labels; + std::vector filterOutXai(const std::vector&); + + std::vector output_names = {}; + utils::RESIZE_MODE resize_mode = utils::RESIZE_FILL; + ov::Layout layout; + cv::InterpolationFlags interpolation_mode; + cv::Size input_shape; +}; diff --git a/src/cpp/include/tasks/instance_segmentation.h b/src/cpp/include/tasks/instance_segmentation.h new file mode 100644 index 
00000000..1e72488e --- /dev/null +++ b/src/cpp/include/tasks/instance_segmentation.h @@ -0,0 +1,60 @@ +/* + * Copyright (C) 2020-2025 Intel Corporation + * SPDX-License-Identifier: Apache-2.0 + */ + +#pragma once + +#include +#include + +#include "adapters/inference_adapter.h" +#include "tasks/results.h" +#include "utils/config.h" +#include "utils/vision_pipeline.h" + +class InstanceSegmentation { +public: + std::shared_ptr adapter; + VisionPipeline pipeline; + + InstanceSegmentation(std::shared_ptr adapter, cv::Size input_shape) + : adapter(adapter), + input_shape(input_shape) { + pipeline = VisionPipeline( + adapter, + [&](cv::Mat image) { + return preprocess(image); + }, + [&](InferenceResult result) { + return postprocess(result); + }); + + auto config = adapter->getModelConfig(); + labels = utils::get_from_any_maps("labels", config, {}, labels); + confidence_threshold = utils::get_from_any_maps("confidence_threshold", config, {}, confidence_threshold); + } + + static cv::Size serialize(std::shared_ptr& ov_model); + static InstanceSegmentation load(const std::string& model_path); + + InstanceSegmentationResult infer(cv::Mat image); + std::vector inferBatch(std::vector image); + + std::map preprocess(cv::Mat); + InstanceSegmentationResult postprocess(InferenceResult& infResult); + + static std::vector getRotatedRectangles(const InstanceSegmentationResult& result); + static std::vector getContours(const std::vector& objects); + + bool postprocess_semantic_masks = true; + +private: + std::vector labels; + std::string getLabelName(size_t labelID) { + return labelID < labels.size() ? 
labels[labelID] : std::string("Label #") + std::to_string(labelID); + } + + cv::Size input_shape; + float confidence_threshold = 0.5f; +}; diff --git a/src/cpp/include/tasks/results.h b/src/cpp/include/tasks/results.h new file mode 100644 index 00000000..42c47d3b --- /dev/null +++ b/src/cpp/include/tasks/results.h @@ -0,0 +1,148 @@ +/* + * Copyright (C) 2020-2025 Intel Corporation + * SPDX-License-Identifier: Apache-2.0 + */ + +#pragma once + +#include +#include + +class InferenceResult { +public: + std::map data; + cv::Size inputImageSize; +}; + +struct DetectedObject : public cv::Rect2f { + size_t labelID; + std::string label; + float confidence; + + friend std::ostream& operator<<(std::ostream& os, const DetectedObject& detection) { + return os << int(detection.x) << ", " << int(detection.y) << ", " << int(detection.x + detection.width) << ", " + << int(detection.y + detection.height) << ", " << detection.labelID << " (" << detection.label + << "): " << std::fixed << std::setprecision(3) << detection.confidence; + } +}; + +struct DetectionResult { + DetectionResult() {} + std::vector objects; + ov::Tensor saliency_map, feature_vector; // Contain "saliency_map" and "feature_vector" model outputs if such exist + + friend std::ostream& operator<<(std::ostream& os, const DetectionResult& prediction) { + for (const DetectedObject& obj : prediction.objects) { + os << obj << "; "; + } + try { + os << prediction.saliency_map.get_shape() << "; "; + } catch (ov::Exception&) { + os << "[0]; "; + } + try { + os << prediction.feature_vector.get_shape(); + } catch (ov::Exception&) { + os << "[0]"; + } + return os; + } + + explicit operator std::string() { + std::stringstream ss; + ss << *this; + return ss.str(); + } +}; + +struct Contour { + std::string label; + float probability; + std::vector shape; + + friend std::ostream& operator<<(std::ostream& os, const Contour& contour) { + return os << contour.label << ": " << std::fixed << std::setprecision(3) << contour.probability
<< ", " + << contour.shape.size(); + } +}; + +struct SemanticSegmentationResult { + SemanticSegmentationResult() {} + cv::Mat resultImage; + cv::Mat soft_prediction; + cv::Mat saliency_map; + ov::Tensor feature_vector; + + friend std::ostream& operator<<(std::ostream& os, const SemanticSegmentationResult& prediction) { + cv::Mat predicted_mask[] = {prediction.resultImage}; + int nimages = 1; + int* channels = nullptr; + cv::Mat mask; + cv::Mat outHist; + int dims = 1; + int histSize[] = {256}; + float range[] = {0, 256}; + const float* ranges[] = {range}; + cv::calcHist(predicted_mask, nimages, channels, mask, outHist, dims, histSize, ranges); + + os << std::fixed << std::setprecision(3); + for (int i = 0; i < range[1]; ++i) { + const float count = outHist.at(i); + if (count > 0) { + os << i << ": " << count / prediction.resultImage.total() << ", "; + } + } + os << '['; + for (int i = 0; i < prediction.soft_prediction.dims; ++i) { + os << prediction.soft_prediction.size[i] << ','; + } + os << prediction.soft_prediction.channels() << "], ["; + if (prediction.saliency_map.data) { + for (int i = 0; i < prediction.saliency_map.dims; ++i) { + os << prediction.saliency_map.size[i] << ','; + } + os << prediction.saliency_map.channels() << "], "; + } else { + os << "0], "; + } + try { + os << prediction.feature_vector.get_shape(); + } catch (ov::Exception&) { + os << "[0]"; + } + return os; + } + explicit operator std::string() { + std::stringstream ss; + ss << *this; + return ss.str(); + } +}; + +struct SegmentedObject : DetectedObject { + cv::Mat mask; + + friend std::ostream& operator<<(std::ostream& os, const SegmentedObject& prediction) { + return os << static_cast(prediction) << ", " << cv::countNonZero(prediction.mask > 0.5); + } +}; + +struct SegmentedObjectWithRects : SegmentedObject { + cv::RotatedRect rotated_rect; + + SegmentedObjectWithRects(const SegmentedObject& segmented_object) : SegmentedObject(segmented_object) {} + + friend std::ostream& 
operator<<(std::ostream& os, const SegmentedObjectWithRects& prediction) { + os << static_cast(prediction) << std::fixed << std::setprecision(3); + auto rect = prediction.rotated_rect; + os << ", RotatedRect: " << rect.center.x << ' ' << rect.center.y << ' ' << rect.size.width << ' ' + << rect.size.height << ' ' << rect.angle; + return os; + } +}; + +struct InstanceSegmentationResult { + std::vector segmentedObjects; + std::vector> saliency_map; + ov::Tensor feature_vector; +}; diff --git a/src/cpp/include/tasks/semantic_segmentation.h b/src/cpp/include/tasks/semantic_segmentation.h new file mode 100644 index 00000000..f2b97cd9 --- /dev/null +++ b/src/cpp/include/tasks/semantic_segmentation.h @@ -0,0 +1,59 @@ +/* + * Copyright (C) 2020-2025 Intel Corporation + * SPDX-License-Identifier: Apache-2.0 + */ + +#pragma once +#include +#include + +#include "adapters/inference_adapter.h" +#include "tasks/results.h" +#include "utils/config.h" +#include "utils/preprocessing.h" +#include "utils/vision_pipeline.h" + +class SemanticSegmentation { +public: + VisionPipeline pipeline; + std::shared_ptr adapter; + SemanticSegmentation(std::shared_ptr adapter) : adapter(adapter) { + pipeline = VisionPipeline( + adapter, + [&](cv::Mat image) { + return preprocess(image); + }, + [&](InferenceResult result) { + return postprocess(result); + }); + + auto config = adapter->getModelConfig(); + labels = utils::get_from_any_maps("labels", config, {}, labels); + soft_threshold = utils::get_from_any_maps("soft_threshold", config, {}, soft_threshold); + blur_strength = utils::get_from_any_maps("blur_strength", config, {}, blur_strength); + } + + static cv::Size serialize(std::shared_ptr& ov_model); + static SemanticSegmentation load(const std::string& model_path); + + std::map preprocess(cv::Mat); + SemanticSegmentationResult postprocess(InferenceResult& infResult); + std::vector getContours(const SemanticSegmentationResult& result); + + SemanticSegmentationResult infer(cv::Mat image); + 
std::vector inferBatch(std::vector image); + +private: + cv::Mat create_hard_prediction_from_soft_prediction(cv::Mat, float threshold, int blur_strength); + + // from config + int blur_strength = -1; + float soft_threshold = -std::numeric_limits::infinity(); + bool return_soft_prediction = true; + + std::vector labels; + + std::string getLabelName(size_t labelID) { + return labelID < labels.size() ? labels[labelID] : std::string("Label #") + std::to_string(labelID); + } +}; diff --git a/src/cpp/utils/include/utils/async_infer_queue.hpp b/src/cpp/include/utils/async_infer_queue.h similarity index 68% rename from src/cpp/utils/include/utils/async_infer_queue.hpp rename to src/cpp/include/utils/async_infer_queue.h index 1dd38aa4..033a1f0e 100644 --- a/src/cpp/utils/include/utils/async_infer_queue.hpp +++ b/src/cpp/include/utils/async_infer_queue.h @@ -1,18 +1,7 @@ /* -// Copyright (C) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. 
-*/ + * Copyright (C) 2020-2025 Intel Corporation + * SPDX-License-Identifier: Apache-2.0 + */ #include #include diff --git a/src/cpp/include/utils/config.h b/src/cpp/include/utils/config.h new file mode 100644 index 00000000..6319a62c --- /dev/null +++ b/src/cpp/include/utils/config.h @@ -0,0 +1,136 @@ +/* + * Copyright (C) 2020-2025 Intel Corporation + * SPDX-License-Identifier: Apache-2.0 + */ + +#pragma once + +#include +#include +namespace utils { +template +Type get_from_any_maps(const std::string& key, + const ov::AnyMap& top_priority, + const ov::AnyMap& mid_priority, + Type low_priority) { + auto topk_iter = top_priority.find(key); + if (topk_iter != top_priority.end()) { + return topk_iter->second.as(); + } + topk_iter = mid_priority.find(key); + if (topk_iter != mid_priority.end()) { + return topk_iter->second.as(); + } + return low_priority; +} + +inline bool model_has_embedded_processing(std::shared_ptr model) { + if (model->has_rt_info("model_info")) { + auto model_info = model->get_rt_info("model_info"); + auto iter = model_info.find("embedded_processing"); + if (iter != model_info.end()) { + return iter->second.as() == "YES"; + } + } + + return false; +} + +inline cv::Size get_input_shape_from_model_info(std::shared_ptr model) { + cv::Size result; + if (model->has_rt_info("model_info")) { + auto model_info = model->get_rt_info("model_info"); + { + auto iter = model_info.find("orig_height"); + if (iter != model_info.end()) { + result.height = iter->second.as(); + } + } + { + auto iter = model_info.find("orig_width"); + if (iter != model_info.end()) { + result.width = iter->second.as(); + } + } + } + + return result; +} +struct IntervalCondition { + using DimType = size_t; + using IndexType = size_t; + using ConditionChecker = std::function; + + template + constexpr IntervalCondition(IndexType i1, IndexType i2, Cond c) + : impl([=](IndexType i0, const ov::PartialShape& shape) { + return c(shape[i0].get_max_length(), shape[i1].get_max_length()) && + 
c(shape[i0].get_max_length(), shape[i2].get_max_length()); + }) {} + bool operator()(IndexType i0, const ov::PartialShape& shape) const { + return impl(i0, shape); + } + +private: + ConditionChecker impl; +}; + +template