import argparse
import sys
from functools import lru_cache

import cv2
import json
import numpy as np

from picamera2 import MappedArray, Picamera2
from picamera2.devices import IMX500
from picamera2.devices.imx500 import (NetworkIntrinsics,
                                      postprocess_nanodet_detection)
from libcamera import Transform

from pubsub import pub


class Detection:
    def __init__(self, imx500, picam2, selfref, coords, category, conf, metadata):
        """Create a Detection object, recording the bounding box, category and confidence."""
        self.category = category
        self.conf = conf
        self.box = imx500.convert_inference_coords(coords, metadata, picam2)
        self.piCamImx500 = selfref

    def display(self):
        label = f"{self.piCamImx500.get_labels()[int(self.category)]} ({self.conf:.2f}): {self.box}"
        print(label)
        print("")

    def json_out(self):
        return {
            'category': self.piCamImx500.get_labels()[int(self.category)],
            'confidence': self.conf,
            'box': self.box
        }


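# Illustrative only: a single Detection serialised via json_out() produces a
# dict roughly like the one below; the label text and values depend on the
# loaded model, label file and scene.
#   {'category': 'person', 'confidence': 0.87, 'box': (57, 32, 180, 254)}
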
class PiCamImx500:
    def __init__(self, **kwargs):
        self.last_detections = []
        self.last_results = []

        self.args = PiCamImx500.get_args()

        # This must be called before instantiation of Picamera2
        self.imx500 = IMX500(self.args.model)
        self.intrinsics = self.imx500.network_intrinsics
        if not self.intrinsics:
            self.intrinsics = NetworkIntrinsics()
            self.intrinsics.task = "object detection"
        elif self.intrinsics.task != "object detection":
            print("Network is not an object detection task", file=sys.stderr)
            sys.exit(1)

        # Override intrinsics from command-line args
        for key, value in vars(self.args).items():
            if key == 'labels' and value is not None:
                with open(value, 'r') as f:
                    self.intrinsics.labels = f.read().splitlines()
            elif hasattr(self.intrinsics, key) and value is not None:
                setattr(self.intrinsics, key, value)

        # Defaults
        if self.intrinsics.labels is None:
            with open("assets/coco_labels.txt", "r") as f:
                self.intrinsics.labels = f.read().splitlines()
        self.intrinsics.update_with_defaults()

        # if self.args.print_intrinsics:
        #     print(self.intrinsics)
        #     exit()

        self.picam2 = Picamera2(self.imx500.camera_num)
        config = self.picam2.create_preview_configuration(
            controls={"FrameRate": self.intrinsics.inference_rate},
            buffer_count=12,
            transform=Transform(vflip=False, hflip=False))

        self.imx500.show_network_fw_progress_bar()
        self.picam2.start(config, show_preview=False)

        if self.intrinsics.preserve_aspect_ratio:
            self.imx500.set_auto_aspect_ratio()

        self.picam2.pre_callback = self.draw_detections

        pub.subscribe(self.scan, 'vision:detect')

    def scan(self, captures=1):
        """Run one or more captures, publish the detections on 'vision:detections' and return them."""
        json_array = []
        for _ in range(captures):
            self.last_results = self.parse_detections(self.picam2.capture_metadata())
            this_capture = [obj.json_out() for obj in self.last_results]
            if captures > 1:
                json_array.append(this_capture)
            else:
                json_array = this_capture

        pub.sendMessage('vision:detections', data=json_array)
        return json_array

    def parse_detections(self, metadata: dict):
        """Parse the output tensor into a number of detected objects, scaled to the ISP output."""
        bbox_normalization = self.intrinsics.bbox_normalization
        threshold = self.args.threshold
        iou = self.args.iou
        max_detections = self.args.max_detections

        np_outputs = self.imx500.get_outputs(metadata, add_batch=True)
        input_w, input_h = self.imx500.get_input_size()
        if np_outputs is None:
            return self.last_detections
        if self.intrinsics.postprocess == "nanodet":
            boxes, scores, classes = \
                postprocess_nanodet_detection(outputs=np_outputs[0], conf=threshold, iou_thres=iou,
                                              max_out_dets=max_detections)[0]
            from picamera2.devices.imx500.postprocess import scale_boxes
            boxes = scale_boxes(boxes, 1, 1, input_h, input_w, False, False)
        else:
            boxes, scores, classes = np_outputs[0][0], np_outputs[1][0], np_outputs[2][0]
            if bbox_normalization:
                boxes = boxes / input_h

            # Regroup the (N, 4) box array into one 4-value tuple per detection
            boxes = np.array_split(boxes, 4, axis=1)
            boxes = zip(*boxes)

        self.last_detections = [
            Detection(self.imx500, self.picam2, self, box, category, score, metadata)
            for box, score, category in zip(boxes, scores, classes)
            if score > threshold
        ]
        return self.last_detections

    @lru_cache
    def get_labels(self):
        labels = self.intrinsics.labels

        if self.intrinsics.ignore_dash_labels:
            labels = [label for label in labels if label and label != "-"]
        return labels

    def draw_detections(self, request, stream="main"):
        """Draw the detections for this request onto the ISP output."""
        detections = self.last_results
        if detections is None:
            return
        labels = self.get_labels()
        with MappedArray(request, stream) as m:
            for detection in detections:
                x, y, w, h = detection.box
                label = f"{labels[int(detection.category)]} ({detection.conf:.2f})"

                # Calculate text size and position
                (text_width, text_height), baseline = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, 0.5, 1)
                text_x = x + 5
                text_y = y + 15

                # Create a copy of the array to draw the background with opacity
                overlay = m.array.copy()

                # Draw the background rectangle on the overlay
                cv2.rectangle(overlay,
                              (text_x, text_y - text_height),
                              (text_x + text_width, text_y + baseline),
                              (255, 255, 255),  # Background color (white)
                              cv2.FILLED)

                alpha = 0.30
                cv2.addWeighted(overlay, alpha, m.array, 1 - alpha, 0, m.array)

                # Draw text on top of the background
                cv2.putText(m.array, label, (text_x, text_y),
                            cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 255), 1)

                # Draw detection box
                cv2.rectangle(m.array, (x, y), (x + w, y + h), (0, 255, 0, 0), thickness=2)

            if self.intrinsics.preserve_aspect_ratio:
                b_x, b_y, b_w, b_h = self.imx500.get_roi_scaled(request)
                color = (255, 0, 0)  # red
                cv2.putText(m.array, "ROI", (b_x + 5, b_y + 15), cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 1)
                cv2.rectangle(m.array, (b_x, b_y), (b_x + b_w, b_y + b_h), (255, 0, 0, 0))

    @staticmethod
    def get_args():
        parser = argparse.ArgumentParser()
        parser.add_argument("--model", type=str, help="Path of the model",
                            default="/usr/share/imx500-models/imx500_network_ssd_mobilenetv2_fpnlite_320x320_pp.rpk")
        parser.add_argument("--fps", type=int, help="Frames per second")
        parser.add_argument("--bbox-normalization", action=argparse.BooleanOptionalAction, help="Normalize bbox")
        parser.add_argument("--threshold", type=float, default=0.55, help="Detection threshold")
        parser.add_argument("--iou", type=float, default=0.65, help="Set iou threshold")
        parser.add_argument("--max-detections", type=int, default=10, help="Set max detections")
        parser.add_argument("--ignore-dash-labels", action=argparse.BooleanOptionalAction, help="Remove '-' labels")
        parser.add_argument("--postprocess", choices=["", "nanodet"],
                            default=None, help="Run post process of type")
        parser.add_argument("-r", "--preserve-aspect-ratio", action=argparse.BooleanOptionalAction,
                            help="Preserve the pixel aspect ratio of the input tensor")
        parser.add_argument("--labels", type=str,
                            help="Path to the labels file")
        parser.add_argument("--print-intrinsics", action="store_true",
                            help="Print JSON network_intrinsics then exit")
        return parser.parse_args()


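# Example invocation (the script filename here is only a placeholder; all flags
# are defined in PiCamImx500.get_args above):
#   python3 picam_imx500.py --threshold 0.6 --labels assets/coco_labels.txt
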
if __name__ == "__main__":
    mycam = PiCamImx500()

    # while True:
    print(mycam.scan(1))
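
    # Minimal pubsub-driven sketch: the listener name below is illustrative, but
    # the topic names match those wired up in PiCamImx500.__init__ and scan(),
    # so publishing 'vision:detect' triggers a scan and the JSON-ready results
    # come back on 'vision:detections'.
    def print_detections(data):
        print(data)

    pub.subscribe(print_detections, 'vision:detections')
    pub.sendMessage('vision:detect', captures=1)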