add 280riscv yolov8

wangWking · wangWking · commit 404b6160ec54 · 2025-04-08T12:01:27.000+08:00
diff --git a/libraries/offset/myCobot 280 for RISCV_yolov8.txt b/libraries/offset/myCobot 280 for RISCV_yolov8.txt
@@ -0,0 +1 @@
+['170', '15', '65']
diff --git a/libraries/pyqtFile/AiKit_auto.py b/libraries/pyqtFile/AiKit_auto.py
@@ -632,6 +632,7 @@ def setupUi(self, AiKit_UI):
         self.comboBox_function.addItem("")
         self.comboBox_function.addItem("")
         self.comboBox_function.addItem("")
+        self.comboBox_function.addItem("")
         self.horizontalLayout_14.addWidget(self.comboBox_function)
         self.horizontalLayout_14.setStretch(0, 1)
         self.horizontalLayout_14.setStretch(1, 2)
@@ -975,6 +976,7 @@ def retranslateUi(self, AiKit_UI):
         self.comboBox_function.setItemText(2, _translate("AiKit_UI", "QR code recognition"))
         self.comboBox_function.setItemText(3, _translate("AiKit_UI", "Keypoints"))
         self.comboBox_function.setItemText(4, _translate("AiKit_UI", "yolov5"))
+        self.comboBox_function.setItemText(5, _translate("AiKit_UI", "yolov8"))
         self.func_lab_11.setText(_translate("AiKit_UI", "Add New Pictures"))
         self.add_img_btn.setText(_translate("AiKit_UI", "Add"))
         self.exit_add_btn.setText(_translate("AiKit_UI", "Exit"))
diff --git a/libraries/pyqtFile/AiKit_auto.ui b/libraries/pyqtFile/AiKit_auto.ui
@@ -1367,6 +1367,11 @@ border-style: outset;</string>
                      <string>yolov5</string>
                     </property>
                    </item>
+                   <item>
+                    <property name="text">
+                     <string>yolov8</string>
+                    </property>
+                   </item>
                   </widget>
                  </item>
                 </layout>
diff --git a/libraries/yolov8File/yolov8_detect.py b/libraries/yolov8File/yolov8_detect.py
@@ -0,0 +1,241 @@
+import os
+import cv2
+import numpy as np
+import onnxruntime as ort
+
+
+class YOLODetection:
+    def __init__(self, model_path, labels_path):
+        """
+        Load the class labels and open an inference session for the model.
+
+        :param model_path: path of the ONNX model handed to ``init_infer_session``
+        :param labels_path: text file with one class name per line; line ``i``
+            is the name of class index ``i``
+        """
+        # Directory two levels above this file.
+        self.path = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+        self.model_path = model_path
+        self.labels_path = labels_path
+        # Minimum class score for a detection to be kept by ``postprocess``.
+        self.class_conf = 0.3
+        # IoU at or above which ``nms`` suppresses a lower-scored box.
+        self.nms_thresh = 0.45
+        # Read the labels inside a context manager so the file handle is
+        # closed deterministically instead of being left to the garbage collector.
+        with open(self.labels_path, 'r') as labels_file:
+            self.labels = [line.strip() for line in labels_file]
+        self.infer_session = self.init_infer_session()
+        # Number of dummy inferences performed by ``warm_up``.
+        self.warm_up_times = 1
+        self.input_name = self.infer_session.get_inputs()[0].name
+        self.output_name = self.infer_session.get_outputs()[0].name
+        # Dimensions 2 and 3 of the first model input; used as (height, width),
+        # matching the [batch, channel, height, width] tensor built by ``preprocess``.
+        self.input_size = self.infer_session.get_inputs()[0].shape[2:4]
+
+    def init_infer_session(self):
+        """
+        Build the ONNX Runtime session used for every inference call.
+
+        :return: an ``ort.InferenceSession`` for ``self.model_path``
+        """
+        options = ort.SessionOptions()
+        # Cap the threads used inside a single operator at 4.
+        options.intra_op_num_threads = 4
+
+        # Load the ONNX model.
+        return ort.InferenceSession(self.model_path, sess_options=options)
+
+    def warm_up(self):
+        """
+        Run ``self.warm_up_times`` throw-away inferences on a random tensor.
+
+        The tensor is float32 with shape ``(1, 3, height, width)`` taken from
+        ``self.input_size``; the inference results are discarded.
+        """
+        height, width = self.input_size[0], self.input_size[1]
+        dummy_batch = np.random.rand(1, 3, height, width).astype(np.float32)
+
+        for _ in range(self.warm_up_times):
+            self.infer_session.run([self.output_name], {self.input_name: dummy_batch})
+
+    def infer(self, image):
+        """
+        Run the full detection pipeline on one frame.
+
+        :param image: input frame (array with height and width as its first two
+            dimensions); it is not modified
+        :return: ``(center_x, center_y, class_ids, result_img)`` where the center
+            is the one reported by ``convert_rect_list``, ``class_ids`` holds the
+            class index of every detection kept by NMS and ``result_img`` is an
+            annotated copy of the frame; ``None`` when ``convert_rect_list``
+            reports no center
+        """
+        img = image.copy()
+
+        # Pre-process the frame into the network input tensor.
+        input_tensor = self.preprocess(img, self.input_size)
+        # Run inference.
+        outputs = self.infer_session.run([self.output_name], {self.input_name: input_tensor})
+        output = outputs[0]
+        # Dimension 1 is the number of values per anchor, dimension 2 the number of anchors.
+        offset = output.shape[1]
+        anchors = output.shape[2]
+
+        # Post-process: decode boxes, then suppress overlapping ones.
+        dets = self.postprocess(image, output, anchors, offset, self.class_conf, self.input_size)
+        dets = self.nms(dets)
+
+        # Compute the center once and reuse it instead of converting the
+        # detection list a second time.
+        center = self.convert_rect_list(dets)
+        if not center:
+            return None
+
+        center_x, center_y = center
+        # Draw the detections.
+        result_img = self.draw_result(img, dets, self.labels)
+        # Class index of every detected object.
+        class_ids = [int(det[4]) for det in dets]
+        return center_x, center_y, class_ids, result_img
+
+    def preprocess(self, image, input_size=(320, 320)):
+        """
+        Letterbox a frame to the network input size and convert it to a tensor.
+
+        The frame is scaled by a single ratio so that it fits inside
+        ``input_size``, converted from BGR to RGB, padded with black borders up
+        to ``input_size``, scaled to the 0..1 range and reordered to
+        ``[batch, channel, height, width]``.
+
+        :param image: frame whose first two dimensions are (height, width)
+        :param input_size: (height, width) of the network input
+        :return: float32 array of shape ``(1, channels, height, width)``
+        """
+        src_h, src_w = image.shape[:2]
+        target_h, target_w = input_size[0], input_size[1]
+        border_value = (0, 0, 0)
+
+        # One scale ratio for both axes keeps the aspect ratio.
+        scale = min(target_h / src_h, target_w / src_w)
+        resized_wh = (int(round(src_w * scale)), int(round(src_h * scale)))
+
+        # Total padding per axis, split evenly between the two sides.
+        pad_x = (target_w - resized_wh[0]) / 2
+        pad_y = (target_h - resized_wh[1]) / 2
+
+        if (src_w, src_h) != resized_wh:  # resize only when the size changes
+            image = cv2.resize(image, resized_wh, interpolation=cv2.INTER_LINEAR)
+        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+
+        # The -0.1 / +0.1 nudges send an odd padding pixel to the bottom/right side.
+        pad_top = int(round(pad_y - 0.1))
+        pad_bottom = int(round(pad_y + 0.1))
+        pad_left = int(round(pad_x - 0.1))
+        pad_right = int(round(pad_x + 0.1))
+        image = cv2.copyMakeBorder(image, pad_top, pad_bottom, pad_left, pad_right,
+                                   cv2.BORDER_CONSTANT, value=border_value)  # add border
+
+        # Normalize to 0..1.
+        tensor = image.astype(np.float32) / 255.0
+        # Reorder to match the model input [batch, channel, height, width].
+        tensor = np.transpose(tensor, (2, 0, 1))
+        return np.expand_dims(tensor, axis=0)
+
+    def postprocess(self, image, output, anchors, offset, conf_threshold, input_size=(320, 320)):
+        """
+        Decode the raw model output into boxes in original-image pixel coordinates.
+
+        The letterbox scale and padding are recomputed from ``image`` and
+        ``input_size`` with the same formulas ``preprocess`` uses and are then
+        removed from every box. An anchor is kept only when its best class score
+        is above ``conf_threshold`` and its best class is not index 0.
+
+        :param image: original frame; only ``image.shape[:2]`` (height, width) is read
+        :param output: raw model output; after ``squeeze()`` it is indexed as
+            ``[row, anchor]`` with rows 0-3 holding center x, center y, width and
+            height, and rows 4..offset-1 holding the per-class scores
+        :param anchors: number of anchor columns to read
+        :param offset: number of rows per anchor (4 box values plus class scores)
+        :param conf_threshold: minimum best-class score for an anchor to be kept
+        :param input_size: (height, width) of the network input
+        :return: list of ``[x1, y1, x2, y2, class_index, score]`` rows (all floats);
+            coordinates are truncated to whole pixels and clamped to be >= 0
+        """
+        img_h, img_w = image.shape[:2]
+        net_h, net_w = input_size[0], input_size[1]
+
+        # Letterbox geometry: scale ratio, scaled size, per-side padding.
+        scale = min(net_h / img_h, net_w / img_w)
+        scaled_w = int(round(img_w * scale))
+        scaled_h = int(round(img_h * scale))
+        pad_x = (net_w - scaled_w) / 2
+        pad_y = (net_h - scaled_h) / 2
+
+        # Drop the singleton dimensions of the output.
+        preds = output.squeeze()
+
+        # Best class and its score for every anchor.
+        class_scores = preds[4:offset, :anchors]
+        best_class = np.argmax(class_scores, axis=0)
+        best_score = class_scores[best_class, np.arange(anchors)]
+
+        # Keep confident anchors and exclude class 0 ('person' in the COCO label
+        # list) so that a hand in view is not picked up as an object.
+        keep = (best_score > conf_threshold) & (best_class != 0)
+        cx = preds[0, :anchors][keep]
+        cy = preds[1, :anchors][keep]
+        half_w = preds[2, :anchors][keep] / 2
+        half_h = preds[3, :anchors][keep] / 2
+        kept_class = best_class[keep]
+        kept_score = best_score[keep]
+
+        # Undo the letterbox: remove the padding, then divide by the scale.
+        x1 = np.maximum(0, ((cx - half_w) - pad_x) / scale).astype(int)
+        x2 = np.maximum(0, ((cx + half_w) - pad_x) / scale).astype(int)
+        y1 = np.maximum(0, ((cy - half_h) - pad_y) / scale).astype(int)
+        y2 = np.maximum(0, ((cy + half_h) - pad_y) / scale).astype(int)
+
+        # Assemble one row per detection.
+        return np.column_stack((x1, y1, x2, y2, kept_class, kept_score)).tolist()
+
+    def nms(self, dets):
+        """
+        Per-class non-maximum suppression.
+
+        Within each class the detections are visited from highest to lowest
+        score; a detection is kept and every remaining detection of that class
+        whose IoU with it is not below ``self.nms_thresh`` is discarded.
+
+        :param dets: sequence of ``[x1, y1, x2, y2, class_index, score]`` rows
+        :return: list of kept rows (NumPy arrays), grouped by ascending class
+            index and ordered by descending score inside each class; an empty
+            list when ``dets`` is empty, so the return type is always a list
+        """
+        if len(dets) == 0:
+            # Return the same container type as the non-empty path.
+            return []
+
+        dets_array = np.array(dets)
+        final_dets = []
+
+        # Process each class independently.
+        for label in np.unique(dets_array[:, 4]):
+            # Detections of the current class, highest score first.
+            dets_class = dets_array[dets_array[:, 4] == label]
+            dets_class = dets_class[np.argsort(-dets_class[:, 5])]
+
+            while dets_class.shape[0] > 0:
+                # The best remaining detection is always kept.
+                best = dets_class[0]
+                final_dets.append(best)
+                if dets_class.shape[0] == 1:
+                    break
+
+                # Keep only the boxes that overlap the best one by less than the threshold.
+                ious = self.calculate_iou(best, dets_class[1:])
+                dets_class = dets_class[1:][ious < self.nms_thresh]
+
+        return final_dets
+
+    def calculate_iou(self, box, boxes):
+        """
+        Compute the IoU between one box and a set of boxes.
+
+        Only the first four values of each row are read, so rows may carry
+        extra columns (``nms`` passes 6-value detection rows). When the union
+        area is zero the division yields NaN.
+
+        :param box: single box ``[x1, y1, x2, y2, ...]``
+        :param boxes: array of N boxes, one ``[x1, y1, x2, y2, ...]`` row each
+        :return: array of N IoU values
+        """
+        # Corners of the overlap rectangle.
+        left = np.maximum(box[0], boxes[:, 0])
+        top = np.maximum(box[1], boxes[:, 1])
+        right = np.minimum(box[2], boxes[:, 2])
+        bottom = np.minimum(box[3], boxes[:, 3])
+
+        # Negative extents mean no overlap, hence the clamp at zero.
+        overlap_w = np.maximum(0, right - left)
+        overlap_h = np.maximum(0, bottom - top)
+        intersection = overlap_w * overlap_h
+
+        # Union = both areas minus the part counted twice.
+        single_area = (box[2] - box[0]) * (box[3] - box[1])
+        many_areas = (boxes[:, 2] - boxes[:, 0]) * (boxes[:, 3] - boxes[:, 1])
+        union = single_area + many_areas - intersection
+
+        return intersection / union
+
+    # Visualize the results
+    def draw_result(self, image, dets, class_names, color=(0, 255, 0), thickness=2):
+        """
+        Draw every detection on a copy of the frame.
+
+        Each detection gets its bounding box, a filled red dot at the box
+        center and a ``"<class name>: <score>"`` caption 10 pixels above the
+        box's top-left corner.
+
+        :param image: frame to annotate; it is copied, not modified
+        :param dets: iterable of ``[x1, y1, x2, y2, class_index, score]`` rows
+        :param class_names: sequence mapping class index to display name
+        :param color: color of the box and caption, in OpenCV channel order
+        :param thickness: line thickness of the box and caption
+        :return: the annotated copy
+        """
+        annotated = image.copy()
+
+        for det in dets:
+            x1, y1, x2, y2, label, score = det
+            x1, y1, x2, y2 = int(x1), int(y1), int(x2), int(y2)
+            # Center of the box.
+            center_x, center_y = (x1 + x2) // 2, (y1 + y2) // 2
+            # Honor the caller-supplied color and thickness; the defaults
+            # reproduce the previously hard-coded green, 2-pixel style.
+            cv2.rectangle(annotated, (x1, y1), (x2, y2), color, thickness)
+            # Mark the center point.
+            cv2.circle(annotated, (center_x, center_y), 5, (0, 0, 255), -1)
+            cv2.putText(annotated, f'{class_names[int(label)]}: {score:.2f}', (x1, y1 - 10),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.9, color, thickness)
+
+        return annotated
+
+    def convert_rect_list(self, original_list):
+        """
+        Return the center point of the last detection in the list.
+
+        The center is ``x1 + (x2 - x1) // 2`` and ``y1 + (y2 - y1) // 2``.
+
+        :param original_list: iterable of ``[x1, y1, x2, y2, class_index, score]`` rows
+        :return: ``(center_x, center_y)`` of the last row, or ``None`` when the
+            list is empty or the two center coordinates do not sum to more than 0
+        """
+        last_cx = 0
+        last_cy = 0
+        for x1, y1, x2, y2, label, prob in original_list:
+            # Every row overwrites the previous one, so only the last survives.
+            last_cx = x1 + (x2 - x1) // 2
+            last_cy = y1 + (y2 - y1) // 2
+
+        # A sum of zero doubles as the "nothing detected" marker.
+        if last_cx + last_cy > 0:
+            return last_cx, last_cy
+        return None
diff --git a/libraries/yolov8File/yolov8_label.txt b/libraries/yolov8File/yolov8_label.txt
@@ -0,0 +1,80 @@
+person
+bicycle
+car
+motorbike
+aeroplane
+bus
+train
+truck
+boat
+traffic light
+fire hydrant
+stop sign
+parking meter
+bench
+bird
+cat
+dog
+horse
+sheep
+cow
+elephant
+bear
+zebra
+giraffe
+backpack
+umbrella
+handbag
+tie
+suitcase
+frisbee
+skis
+snowboard
+sports ball
+kite
+baseball bat
+baseball glove
+skateboard
+surfboard
+tennis racket
+bottle
+wine glass
+cup
+fork
+knife
+spoon
+bowl
+banana
+apple
+sandwich
+orange
+broccoli
+carrot
+hot dog
+pizza
+donut
+cake
+chair
+sofa
+pottedplant
+bed
+diningtable
+toilet
+tvmonitor
+laptop
+mouse
+remote
+keyboard
+cell phone
+microwave
+oven
+toaster
+sink
+refrigerator
+book
+clock
+vase
+scissors
+teddy bear
+hair drier
+toothbrush
diff --git a/libraries/yolov8File/yolov8n.q.onnx b/libraries/yolov8File/yolov8n.q.onnx
diff --git a/main.py b/main.py