openvinotoolkit
diff --git a/demos/common/cpp/utils/include/utils/common.hpp b/demos/common/cpp/utils/include/utils/common.hpp
Lines changed: 2 additions & 2 deletions
diff --git a/demos/common/cpp/utils/include/utils/ocv_common.hpp b/demos/common/cpp/utils/include/utils/ocv_common.hpp
Lines changed: 87 additions & 22 deletions
diff --git a/demos/gaze_estimation_demo/cpp/include/eye_state_estimator.hpp b/demos/gaze_estimation_demo/cpp/include/eye_state_estimator.hpp
Lines changed: 3 additions & 3 deletions
diff --git a/demos/gaze_estimation_demo/cpp/include/face_detector.hpp b/demos/gaze_estimation_demo/cpp/include/face_detector.hpp
Lines changed: 5 additions & 6 deletions
diff --git a/demos/gaze_estimation_demo/cpp/include/gaze_estimator.hpp b/demos/gaze_estimation_demo/cpp/include/gaze_estimator.hpp
Lines changed: 3 additions & 3 deletions
diff --git a/demos/gaze_estimation_demo/cpp/include/head_pose_estimator.hpp b/demos/gaze_estimation_demo/cpp/include/head_pose_estimator.hpp
Lines changed: 3 additions & 3 deletions
diff --git a/demos/gaze_estimation_demo/cpp/include/ie_wrapper.hpp b/demos/gaze_estimation_demo/cpp/include/ie_wrapper.hpp
Lines changed: 18 additions & 18 deletions
@@ -36,7 +36,7 @@
 #endif
 
 template <typename T, std::size_t N>
-constexpr std::size_t arraySize(const T (&)[N]) noexcept {
+constexpr std::size_t arraySize(const T(&)[N]) noexcept {
     return N;
 }
 
@@ -221,7 +221,7 @@ inline void showAvailableDevices() {
     std::cout << std::endl;
 }
 
-inline std::string fileNameNoExt(const std::string &filepath) {
+inline std::string fileNameNoExt(const std::string& filepath) {
     auto pos = filepath.rfind('.');
     if (pos == std::string::npos) return filepath;
     return filepath.substr(0, pos);
 
@@ -14,10 +14,12 @@
 #include "utils/common.hpp"
 #include "utils/shared_blob_allocator.h"
 
+#include "openvino/openvino.hpp"
 
-/**
-* @brief Get cv::Mat value in the correct format.
-*/
+
+ /**
+ * @brief Get cv::Mat value in the correct format.
+ */
 template <typename T>
 static const T getMatValue(const cv::Mat& mat, size_t h, size_t w, size_t c) {
     switch (mat.type()) {
@@ -48,9 +50,11 @@ static UNUSED void matToBlob(const cv::Mat& mat, const InferenceEngine::Blob::Pt
     }
     int batchOffset = batchIndex * width * height * channels;
 
-    cv::Mat resizedMat(mat);
+    cv::Mat resizedMat;
     if (static_cast<int>(width) != mat.size().width || static_cast<int>(height) != mat.size().height) {
         cv::resize(mat, resizedMat, cv::Size(width, height));
+    } else {
+        resizedMat = mat;
     }
 
     InferenceEngine::LockedMemory<void> blobMapped = InferenceEngine::as<InferenceEngine::MemoryBlob>(blob)->wmap();
@@ -61,10 +65,9 @@ static UNUSED void matToBlob(const cv::Mat& mat, const InferenceEngine::Blob::Pt
                 for (size_t w = 0; w < width; w++)
                     blobData[batchOffset + c * width * height + h * width + w] =
                         getMatValue<float_t>(resizedMat, h, w, c);
-    }
-    else {
+    } else {
         uint8_t* blobData = blobMapped.as<uint8_t*>();
-        if ((resizedMat.type() & CV_MAT_DEPTH_MASK) == CV_32F) {
+        if (resizedMat.depth() == CV_32F) {
             throw std::runtime_error("Conversion of cv::Mat from float_t to uint8_t is forbidden");
         }
         for (size_t c = 0; c < channels; c++)
@@ -75,14 +78,62 @@ static UNUSED void matToBlob(const cv::Mat& mat, const InferenceEngine::Blob::Pt
     }
 }
 
+/**
+* @brief Resize and copy image data from cv::Mat object to a given Tensor object.
+* @param mat - given cv::Mat object with an image data (1 or 3 channels).
+* @param tensor - Tensor object to be filled with the image data; its shape is indexed here as NCHW.
+* @param batchIndex - batch index of the image inside of the tensor (not range-checked here).
+* @throws std::runtime_error on channel count mismatch, unsupported channel count or CV_32F to uint8_t conversion.
+*/
+static UNUSED void matToTensor(const cv::Mat& mat, const ov::runtime::Tensor& tensor, int batchIndex = 0) {
+    const ov::Shape tensorShape = tensor.get_shape();
+    const ov::Layout layout("NCHW");  // dimensions below are looked up with a fixed NCHW layout
+    const size_t width = tensorShape[ov::layout::width_idx(layout)];
+    const size_t height = tensorShape[ov::layout::height_idx(layout)];
+    const size_t channels = tensorShape[ov::layout::channels_idx(layout)];
+    if (static_cast<size_t>(mat.channels()) != channels) {
+        throw std::runtime_error("The number of channels for net input and image must match");
+    }
+    if (channels != 1 && channels != 3) {
+        throw std::runtime_error("Unsupported number of channels");
+    }
+    const size_t batchOffset = static_cast<size_t>(batchIndex) * width * height * channels;  // no narrowing to int
+
+    cv::Mat resizedMat;
+    if (static_cast<int>(width) != mat.size().width || static_cast<int>(height) != mat.size().height) {
+        cv::resize(mat, resizedMat, cv::Size(width, height));
+    } else {
+        resizedMat = mat;  // sizes already match: reuse the input without resizing
+    }
+
+    if (tensor.get_element_type() == ov::element::f32) {
+        float_t* tensorData = tensor.data<float_t>();
+        for (size_t c = 0; c < channels; c++)
+            for (size_t h = 0; h < height; h++)
+                for (size_t w = 0; w < width; w++)
+                    tensorData[batchOffset + c * width * height + h * width + w] =
+                        getMatValue<float_t>(resizedMat, h, w, c);
+    } else {  // every non-f32 tensor is written through a uint8_t pointer
+        uint8_t* tensorData = tensor.data<uint8_t>();
+        if (resizedMat.depth() == CV_32F) {
+            throw std::runtime_error("Conversion of cv::Mat from float_t to uint8_t is forbidden");
+        }
+        for (size_t c = 0; c < channels; c++)
+            for (size_t h = 0; h < height; h++)
+                for (size_t w = 0; w < width; w++)
+                    tensorData[batchOffset + c * width * height + h * width + w] =
+                        getMatValue<uint8_t>(resizedMat, h, w, c);
+    }
+}
+
 /**
  * @brief Wraps data stored inside of a passed cv::Mat object by new Blob pointer.
  * @note: No memory allocation is happened. The blob just points to already existing
  *        cv::Mat data.
  * @param mat - given cv::Mat object with an image data.
  * @return resulting Blob pointer.
  */
-static UNUSED InferenceEngine::Blob::Ptr wrapMat2Blob(const cv::Mat &mat) {
+static UNUSED InferenceEngine::Blob::Ptr wrapMat2Blob(const cv::Mat& mat) {
     auto matType = mat.type() & CV_MAT_DEPTH_MASK;
     if (matType != CV_8U && matType != CV_32F) {
         throw std::runtime_error("Unsupported mat type for wrapping");
@@ -104,21 +155,34 @@ static UNUSED InferenceEngine::Blob::Ptr wrapMat2Blob(const cv::Mat &mat) {
     InferenceEngine::Precision precision = isMatFloat ?
         InferenceEngine::Precision::FP32 : InferenceEngine::Precision::U8;
     InferenceEngine::TensorDesc tDesc(precision,
-                                      {1, channels, height, width},
-                                      InferenceEngine::Layout::NHWC);
+        { 1, channels, height, width },
+        InferenceEngine::Layout::NHWC);
 
     InferenceEngine::Blob::Ptr blob;
     if (isMatFloat) {
         blob = InferenceEngine::make_shared_blob<float>(tDesc, std::make_shared<SharedBlobAllocator>(mat));
-    }
-    else {
+    } else {
         blob = InferenceEngine::make_shared_blob<uint8_t>(tDesc, std::make_shared<SharedBlobAllocator>(mat));
     }
 
     blob->allocate();
     return blob;
 }
 
+/**
+ * @brief Wraps data stored inside of a passed cv::Mat object by a new Tensor object.
+ * @note: No pixel data is copied here: the tensor is constructed over mat.data with shape
+ *        {1, height, width, channels}, so the cv::Mat presumably has to outlive the tensor.
+ * @note: OPENVINO_ASSERT fails if the mat depth is not CV_8U or if the mat is not dense.
+ * @param mat - given cv::Mat object with an image data.
+ * @return resulting u8 Tensor object.
+ */
+static UNUSED ov::runtime::Tensor wrapMat2Tensor(const cv::Mat& mat) {
+    // The tensor below is always created as u8, so any other depth would be misinterpreted.
+    OPENVINO_ASSERT(mat.depth() == CV_8U, "Unsupported mat type for wrapping");
+
+    const size_t channels = mat.channels();
+    const size_t height = mat.size().height;
+    const size_t width = mat.size().width;
+
+    const size_t strideH = mat.step.buf[0];
+    const size_t strideW = mat.step.buf[1];
+
+    // Dense: a pixel step equal to the channel count and a row step equal to channels * width.
+    const bool is_dense = strideW == channels && strideH == channels * width;
+    OPENVINO_ASSERT(is_dense, "Doesn't support conversion from not dense cv::Mat");
+
+    return ov::runtime::Tensor(ov::element::u8, ov::Shape{ 1, height, width, channels }, mat.data);
+}
+
 /**
  * @brief Puts text message on the frame, highlights the text with a white border to make it distinguishable from
  *        the background.
@@ -131,12 +195,12 @@ static UNUSED InferenceEngine::Blob::Ptr wrapMat2Blob(const cv::Mat &mat) {
  * @param thickness - thickness of the lines used to draw a text.
  */
 inline void putHighlightedText(const cv::Mat& frame,
-                               const std::string& message,
-                               cv::Point position,
-                               int fontFace,
-                               double fontScale,
-                               cv::Scalar color,
-                               int thickness) {
+    const std::string& message,
+    cv::Point position,
+    int fontFace,
+    double fontScale,
+    cv::Scalar color,
+    int thickness) {
     cv::putText(frame, message, position, fontFace, fontScale, cv::Scalar(255, 255, 255), thickness + 1);
     cv::putText(frame, message, position, fontFace, fontScale, color, thickness);
 }
@@ -153,7 +217,7 @@ class OutputTransform {
         float inputWidth = static_cast<float>(inputSize.width);
         float inputHeight = static_cast<float>(inputSize.height);
         scaleFactor = std::min(outputResolution.height / inputHeight, outputResolution.width / inputWidth);
-        newResolution = cv::Size{static_cast<int>(inputWidth * scaleFactor), static_cast<int>(inputHeight * scaleFactor)};
+        newResolution = cv::Size{ static_cast<int>(inputWidth * scaleFactor), static_cast<int>(inputHeight * scaleFactor) };
         return newResolution;
     }
 
@@ -197,20 +261,21 @@ class InputTransform {
 public:
     InputTransform() : reverseInputChannels(false), isTrivial(true) {}
 
-    InputTransform(bool reverseInputChannels, const std::string &meanValues, const std::string &scaleValues) :
+    InputTransform(bool reverseInputChannels, const std::string& meanValues, const std::string& scaleValues) :
         reverseInputChannels(reverseInputChannels),
         isTrivial(!reverseInputChannels && meanValues.empty() && scaleValues.empty()),
         means(meanValues.empty() ? cv::Scalar(0.0, 0.0, 0.0) : string2Vec(meanValues)),
         stdScales(scaleValues.empty() ? cv::Scalar(1.0, 1.0, 1.0) : string2Vec(scaleValues)) {
     }
 
-    cv::Scalar string2Vec(const std::string &string) {
+    cv::Scalar string2Vec(const std::string& string) {
         const auto& strValues = split(string, ' ');
         std::vector<float> values;
         try {
             for (auto& str : strValues)
                 values.push_back(std::stof(str));
-        } catch (const std::invalid_argument&) {
+        }
+        catch (const std::invalid_argument&) {
             throw std::runtime_error("Invalid parameter --mean_values or --scale_values is provided.");
         }
         if (values.size() != 3) {
 
@@ -1,4 +1,4 @@
-// Copyright (C) 2018 Intel Corporation
+// Copyright (C) 2018-2022 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 
@@ -15,7 +15,7 @@
 namespace gaze_estimation {
 class EyeStateEstimator: public BaseEstimator {
 public:
-    EyeStateEstimator(InferenceEngine::Core& ie,
+    EyeStateEstimator(ov::runtime::Core& ie,
                       const std::string& modelPath,
                       const std::string& deviceName);
     void estimate(const cv::Mat& image, FaceInferenceResults& outputResults) override;
@@ -28,6 +28,6 @@ class EyeStateEstimator: public BaseEstimator {
     void rotateImageAroundCenter(const cv::Mat& srcImage, cv::Mat& dstImage, float angle) const;
 
     IEWrapper ieWrapper;
-    std::string inputBlobName, outputBlobName;
+    std::string inputTensorName, outputTensorName;
 };
 }  // namespace gaze_estimation
@@ -1,4 +1,4 @@
-// Copyright (C) 2018 Intel Corporation
+// Copyright (C) 2018-2022 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 
@@ -8,7 +8,6 @@
 #include <vector>
 #include <map>
 
-#include <inference_engine.hpp>
 #include <opencv2/core/core.hpp>
 
 #include "face_inference_results.hpp"
@@ -17,7 +16,7 @@
 namespace gaze_estimation {
 class FaceDetector {
 public:
-    FaceDetector(InferenceEngine::Core& ie,
+    FaceDetector(ov::runtime::Core& ie,
                  const std::string& modelPath,
                  const std::string& deviceName,
                  double detectionConfidenceThreshold,
@@ -29,9 +28,9 @@ class FaceDetector {
 
 private:
     IEWrapper ieWrapper;
-    std::string inputBlobName;
-    std::vector<unsigned long> inputBlobDims;
-    std::string outputBlobName;
+    std::string inputTensorName;
+    ov::Shape inputTensorDims;
+    std::string outputTensorName;
     std::size_t numTotalDetections;
 
     double detectionThreshold;
 
@@ -1,4 +1,4 @@
-// Copyright (C) 2018 Intel Corporation
+// Copyright (C) 2018-2022 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 
@@ -15,7 +15,7 @@
 namespace gaze_estimation {
 class GazeEstimator: public BaseEstimator {
 public:
-    GazeEstimator(InferenceEngine::Core& ie,
+    GazeEstimator(ov::runtime::Core& ie,
                   const std::string& modelPath,
                   const std::string& deviceName,
                   bool doRollAlign = true);
@@ -27,7 +27,7 @@ class GazeEstimator: public BaseEstimator {
 
 private:
     IEWrapper ieWrapper;
-    std::string outputBlobName;
+    std::string outputTensorName;
     bool rollAlign;
 
     void rotateImageAroundCenter(const cv::Mat& srcImage, cv::Mat& dstImage, float angle) const;
 
@@ -1,4 +1,4 @@
-// Copyright (C) 2018 Intel Corporation
+// Copyright (C) 2018-2022 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 
@@ -15,7 +15,7 @@
 namespace gaze_estimation {
 class HeadPoseEstimator: public BaseEstimator {
 public:
-    HeadPoseEstimator(InferenceEngine::Core& ie,
+    HeadPoseEstimator(ov::runtime::Core& ie,
                       const std::string& modelPath,
                       const std::string& deviceName);
     void estimate(const cv::Mat& image,
@@ -26,6 +26,6 @@ class HeadPoseEstimator: public BaseEstimator {
 
 private:
     IEWrapper ieWrapper;
-    std::string inputBlobName;
+    std::string inputTensorName;
 };
 }  // namespace gaze_estimation
@@ -1,4 +1,4 @@
-// Copyright (C) 2018 Intel Corporation
+// Copyright (C) 2018-2022 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 
@@ -16,40 +16,40 @@
 namespace gaze_estimation {
 class IEWrapper {
 public:
-    IEWrapper(InferenceEngine::Core& ie,
+    IEWrapper(ov::runtime::Core& core,
               const std::string& modelPath,
               const std::string& modelType,
               const std::string& deviceName);
-    // For setting input blobs containing images
-    void setInputBlob(const std::string& blobName, const cv::Mat& image);
-    // For setting input blobs containing vectors of data
-    void setInputBlob(const std::string& blobName, const std::vector<float>& data);
+    // For setting input tensors containing images
+    void setInputTensor(const std::string& tensorName, const cv::Mat& image);
+    // For setting input tensors containing vectors of data
+    void setInputTensor(const std::string& tensorName, const std::vector<float>& data);
 
-    // Get output blob content as a vector given its name
-    void getOutputBlob(const std::string& blobName, std::vector<float>& output);
+    // Get output tensor content as a vector given its name
+    void getOutputTensor(const std::string& tensorName, std::vector<float>& output);
 
-    const std::map<std::string, std::vector<unsigned long>>& getInputBlobDimsInfo() const;
-    const std::map<std::string, std::vector<unsigned long>>& getOutputBlobDimsInfo() const;
+    const std::map<std::string, ov::Shape>& getInputTensorDimsInfo() const;
+    const std::map<std::string, ov::Shape>& getOutputTensorDimsInfo() const;
 
     std::string expectSingleInput() const;
     std::string expectSingleOutput() const;
 
-    void expectImageInput(const std::string& blobName) const;
+    void expectImageInput(const std::string& tensorName) const;
 
-    void reshape(const std::map<std::string, std::vector<unsigned long>>& newBlobsDimsInfo);
+    void reshape(const std::map<std::string, ov::Shape>& newTensorsDimsInfo);
 
     void infer();
 
 private:
     std::string modelPath;
     std::string modelType;
     std::string deviceName;
-    InferenceEngine::Core& ie;
-    InferenceEngine::CNNNetwork network;
-    InferenceEngine::ExecutableNetwork executableNetwork;
-    InferenceEngine::InferRequest request;
-    std::map<std::string, std::vector<unsigned long>> inputBlobsDimsInfo;
-    std::map<std::string, std::vector<unsigned long>> outputBlobsDimsInfo;
+    ov::runtime::Core core;
+    std::shared_ptr<ov::Model> model;
+    ov::runtime::CompiledModel compiled_model;
+    ov::runtime::InferRequest infer_request;
+    std::map<std::string, ov::Shape> input_tensors_dims_info;
+    std::map<std::string, ov::Shape> output_tensors_dims_info;
 
     void setExecPart();
 };
Original file line number	Diff line number	Diff line change
`@@ -36,7 +36,7 @@`
`36`	`36`	`#endif`
`37`	`37`
`38`	`38`	`template <typename T, std::size_t N>`
`39`		`-constexpr std::size_t arraySize(const T (&)[N]) noexcept {`
	`39`	`+constexpr std::size_t arraySize(const T(&)[N]) noexcept {`
`40`	`40`	`return N;`
`41`	`41`	`}`
`42`	`42`
`@@ -221,7 +221,7 @@ inline void showAvailableDevices() {`
`221`	`221`	`std::cout << std::endl;`
`222`	`222`	`}`
`223`	`223`
`224`		`-inline std::string fileNameNoExt(const std::string &filepath) {`
	`224`	`+inline std::string fileNameNoExt(const std::string& filepath) {`
`225`	`225`	`auto pos = filepath.rfind('.');`
`226`	`226`	`if (pos == std::string::npos) return filepath;`
`227`	`227`	`return filepath.substr(0, pos);`