Added NN examples

Erol444 · Erol444 · commit 8d6a6d338f91 · 2022-01-17T17:31:32.000-08:00
diff --git a/docs/source/_static/images/examples/normalize_model.png b/docs/source/_static/images/examples/normalize_model.png
diff --git a/docs/source/samples/NeuralNetwork/concat_multi_input.rst b/docs/source/samples/NeuralNetwork/concat_multi_input.rst
@@ -0,0 +1,38 @@
+Multi-Input Frame Concationation
+================================
+
+Example concatenates all 3 inputs with a simple custom NN created with PyTorch (`link here <https://github.com/luxonis/depthai-experiments/blob/master/gen2-custom-models/generate_model/pytorch_concat.py>`__, `tutorial here <https://docs.luxonis.com/en/latest/pages/tutorials/creating-custom-nn-models/>`__).
+It uses multiple input :ref:`NeuralNetwork` feature and links all 3 camera streams directly to the NN node.
+
+Demo
+####
+
+.. image:: https://user-images.githubusercontent.com/18037362/134209980-09c6e2f9-8a26-45d5-a6ad-c31d9e2816e1.png
+
+Setup
+#####
+
+.. include::  /includes/install_from_pypi.rst
+
+Source code
+###########
+
+.. tabs::
+
+    .. tab:: Python
+
+        Also `available on GitHub <https://github.com/luxonis/depthai-python/blob/main/examples/NeuralNetwork/concat_multiple_input.py>`__
+
+        .. literalinclude:: ../../../../examples/NeuralNetwork/concat_multi_input.py
+           :language: python
+           :linenos:
+
+    .. tab:: C++
+
+        Also `available on GitHub <https://github.com/luxonis/depthai-core/blob/main/examples/src/concat_multiple_input.cpp>`__
+
+        .. literalinclude:: ../../../../depthai-core/examples/src/concat_multi_input.cpp
+           :language: cpp
+           :linenos:
+
+.. include::  /includes/footer-short.rst
diff --git a/docs/source/samples/NeuralNetwork/normalization_multi_input.rst b/docs/source/samples/NeuralNetwork/normalization_multi_input.rst
@@ -0,0 +1,46 @@
+Multi-Input Frame Normalization
+===============================
+
+This example shows how you can normalize a frame before sending it to another NN. Many neural network models
+require frames with RGB values (pixels) in range between :code:`-0.5` to :code:`0.5`. :ref:`ColorCamera`'s preview outputs
+values between :code:`0` and :code:`255`. Simple custom NN, created with PyTorch (`link here <https://github.com/luxonis/depthai-experiments/blob/master/gen2-custom-models/generate_model/pytorch_normalize.py>`__, `tutorial here <https://docs.luxonis.com/en/latest/pages/tutorials/creating-custom-nn-models/>`__),
+allows users to specify mean and scale factors that will apply for all frame values (pixels).
+
+.. math::
+
+   output = (input - mean) / scale
+
+.. image:: /_static/images/examples/normalize)model.png
+
+On the host, values are converted back to :code:`0`-:code:`255`, so they can be displayed by OpenCV.
+
+.. note::
+    This is just a demo, for normalization you should look into OpenVINO's `model optimizer <https://docs.openvinotoolkit.org/latest/openvino_docs_MO_DG_prepare_model_convert_model_Converting_Model_General.html>`__ arguments :code:`--mean_values` and :code:`--scale_values`.
+
+Setup
+#####
+
+.. include::  /includes/install_from_pypi.rst
+
+Source code
+###########
+
+.. tabs::
+
+    .. tab:: Python
+
+        Also `available on GitHub <https://github.com/luxonis/depthai-python/blob/main/examples/NeuralNetwork/normalization_multiple_input.py>`__
+
+        .. literalinclude:: ../../../../examples/NeuralNetwork/normalization_multi_input.py
+           :language: python
+           :linenos:
+
+    .. tab:: C++
+
+        Also `available on GitHub <https://github.com/luxonis/depthai-core/blob/main/examples/src/normalization_multiple_input.cpp>`__
+
+        .. literalinclude:: ../../../../depthai-core/examples/src/normalization_multi_input.cpp
+           :language: cpp
+           :linenos:
+
+.. include::  /includes/footer-short.rst
diff --git a/examples/NeuralNetwork/concat_multi_input.py b/examples/NeuralNetwork/concat_multi_input.py
@@ -0,0 +1,73 @@
+#!/usr/bin/env python3
+
+from pathlib import Path
+import sys
+import numpy as np
+import cv2
+import depthai as dai
+SHAPE = 300
+
+# Get argument first
+nnPath = str((Path(__file__).parent / Path('../models/concat_openvino_2021.4_6shave.blob')).resolve().absolute())
+if len(sys.argv) > 1:
+    nnPath = sys.argv[1]
+
+if not Path(nnPath).exists():
+    import sys
+    raise FileNotFoundError(f'Required file/s not found, please run "{sys.executable} install_requirements.py"')
+
+p = dai.Pipeline()
+p.setOpenVINOVersion(dai.OpenVINO.VERSION_2021_4)
+
+camRgb = p.createColorCamera()
+camRgb.setPreviewSize(SHAPE, SHAPE)
+camRgb.setInterleaved(False)
+camRgb.setColorOrder(dai.ColorCameraProperties.ColorOrder.BGR)
+
+left = p.create(dai.node.MonoCamera)
+left.setBoardSocket(dai.CameraBoardSocket.LEFT)
+left.setResolution(dai.MonoCameraProperties.SensorResolution.THE_400_P)
+
+# ImageManip for cropping (face detection NN requires input image of 300x300) and to change frame type
+manipLeft = p.create(dai.node.ImageManip)
+manipLeft.initialConfig.setResize(300, 300)
+manipLeft.initialConfig.setFrameType(dai.RawImgFrame.Type.BGR888p)
+left.out.link(manipLeft.inputImage)
+
+right = p.create(dai.node.MonoCamera)
+right.setBoardSocket(dai.CameraBoardSocket.RIGHT)
+right.setResolution(dai.MonoCameraProperties.SensorResolution.THE_400_P)
+
+# ImageManip for cropping (face detection NN requires input image of 300x300) and to change frame type
+manipRight = p.create(dai.node.ImageManip)
+manipRight.initialConfig.setResize(300, 300)
+manipRight.initialConfig.setFrameType(dai.RawImgFrame.Type.BGR888p)
+right.out.link(manipRight.inputImage)
+
+# NN that detects faces in the image
+nn = p.createNeuralNetwork()
+nn.setBlobPath(nnPath)
+nn.setNumInferenceThreads(2)
+
+manipLeft.out.link(nn.inputs['img1'])
+camRgb.preview.link(nn.inputs['img2'])
+manipRight.out.link(nn.inputs['img3'])
+
+# Send bouding box from the NN to the host via XLink
+nn_xout = p.createXLinkOut()
+nn_xout.setStreamName("nn")
+nn.out.link(nn_xout.input)
+
+# Pipeline is defined, now we can connect to the device
+with dai.Device(p) as device:
+    qNn = device.getOutputQueue(name="nn", maxSize=4, blocking=False)
+    shape = (3, SHAPE, SHAPE * 3)
+
+    while True:
+        inNn = np.array(qNn.get().getData())
+        frame = inNn.view(np.float16).reshape(shape).transpose(1, 2, 0).astype(np.uint8).copy()
+
+        cv2.imshow("Concat", frame)
+
+        if cv2.waitKey(1) == ord('q'):
+            break
diff --git a/examples/NeuralNetwork/normalization_multi_input.py b/examples/NeuralNetwork/normalization_multi_input.py
@@ -0,0 +1,78 @@
+#!/usr/bin/env python3
+
+from pathlib import Path
+import sys
+import numpy as np
+import cv2
+import depthai as dai
+SHAPE = 300
+
+# Get argument first
+nnPath = str((Path(__file__).parent / Path('../models/normalize_openvino_2021.4_4shave.blob')).resolve().absolute())
+if len(sys.argv) > 1:
+    nnPath = sys.argv[1]
+
+if not Path(nnPath).exists():
+    import sys
+    raise FileNotFoundError(f'Required file/s not found, please run "{sys.executable} install_requirements.py"')
+
+p = dai.Pipeline()
+p.setOpenVINOVersion(dai.OpenVINO.VERSION_2021_4)
+
+camRgb = p.createColorCamera()
+# Model expects values in FP16, as we have compiled it with `-ip FP16`
+camRgb.setFp16(True)
+camRgb.setInterleaved(False)
+camRgb.setPreviewSize(SHAPE, SHAPE)
+
+nn = p.createNeuralNetwork()
+nn.setBlobPath(nnPath)
+nn.setNumInferenceThreads(2)
+
+script = p.create(dai.node.Script)
+script.setScript("""
+# Run script only once
+# Model formula:
+# output = (input - mean) / scale
+
+# This configuration will subtract all frame values (pixels) by 127.5
+# 0.0 .. 255.0 -> -127.5 .. 127.5
+data = NNData(2)
+data.setLayer("mean", [127.5])
+node.io['mean'].send(data)
+
+# This configuration will divide all frame values (pixels) by 255.0
+# -127.5 .. 127.5 -> -0.5 .. 0.5
+data = NNData(2)
+data.setLayer("scale", [255.0])
+node.io['scale'].send(data)
+""")
+
+# Re-use the initial values for multiplier/addend
+script.outputs['mean'].link(nn.inputs['mean'])
+nn.inputs['mean'].setWaitForMessage(False)
+
+script.outputs['scale'].link(nn.inputs['scale'])
+nn.inputs['scale'].setWaitForMessage(False)
+# Always wait for the new frame before starting inference
+camRgb.preview.link(nn.inputs['frame'])
+
+# Send normalized frame values to host
+nn_xout = p.createXLinkOut()
+nn_xout.setStreamName("nn")
+nn.out.link(nn_xout.input)
+
+# Pipeline is defined, now we can connect to the device
+with dai.Device(p) as device:
+    qNn = device.getOutputQueue(name="nn", maxSize=4, blocking=False)
+    shape = (3, SHAPE, SHAPE)
+    while True:
+        inNn = np.array(qNn.get().getData())
+        # Get back the frame. It's currently normalized to -1.0 - 1.0
+        frame = inNn.view(np.float16).reshape(shape).transpose(1, 2, 0)
+        # To get original frame back (0-255), we add multiply all frame values (pixels) by 255 and then add 127.5 to them.
+        frame = (frame * 255.0 + 127.5).astype(np.uint8)
+        cv2.imshow("Original frame", frame)
+
+        if cv2.waitKey(1) == ord('q'):
+            break
diff --git a/examples/models/concat-model/model.yml b/examples/models/concat-model/model.yml
@@ -0,0 +1,25 @@
+# Copyright (c) 2021 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  concat-model
+task_type: image_inpainting # Just random task type, so it's supported by model downloader
+files:
+  - name: concat_openvino_2021.4_6shave.blob
+    size: 1024
+    sha256: 6ac3023ea8dac9b7501ead0f9b2c2a4495d2791a58b7049de065246455cf87be
+    source: https://artifacts.luxonis.com/artifactory/luxonis-depthai-data-local/network/concat_openvino_2021.4_6shave.blob
+
+framework: dldt
+license: https://raw.githubusercontent.com/openvinotoolkit/open_model_zoo/master/LICENSE
diff --git a/examples/models/normalization-model/model.yml b/examples/models/normalization-model/model.yml
@@ -0,0 +1,25 @@
+# Copyright (c) 2021 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  normalization-model
+task_type: image_inpainting # Just random task type, so it's supported by model downloader
+files:
+  - name: normalize_openvino_2021.4_4shave.blob
+    size: 1216
+    sha256:   9b5dc4b375ed9218c2910284556f8152cbfcc0130e7b7a42d9a9991eae8be23a
+    source: https://artifacts.luxonis.com/artifactory/luxonis-depthai-data-local/network/normalize_openvino_2021.4_4shave.blob
+
+framework: dldt
+license: https://raw.githubusercontent.com/openvinotoolkit/open_model_zoo/master/LICENSE