open-edge-platform · ashwinvaidya17 · Nov 4, 2024 · Nov 1, 2024 · Nov 1, 2024
@@ -11,25 +11,26 @@
 from .instance_segmentation import MaskRCNNModel
 from .keypoint_detection import KeypointDetectionModel, TopDownKeypointDetectionPipeline
 from .model import Model
-from .sam_models import SAMDecoder, SAMImageEncoder
-from .segmentation import SalientObjectDetectionModel, SegmentationModel
-from .ssd import SSD
-from .utils import (
+from .result_types import (
     AnomalyResult,
     ClassificationResult,
     Contour,
     DetectedKeypoints,
     Detection,
     DetectionResult,
-    DetectionWithLandmarks,
     ImageResultWithSoftPrediction,
     InstanceSegmentationResult,
-    OutputTransform,
     PredictedMask,
     SegmentedObject,
     SegmentedObjectWithRects,
     VisualPromptingResult,
     ZSLVisualPromptingResult,
+)
+from .sam_models import SAMDecoder, SAMImageEncoder
+from .segmentation import SalientObjectDetectionModel, SegmentationModel
+from .ssd import SSD
+from .utils import (
+    OutputTransform,
     add_rotated_rects,
     get_contours,
 )
@@ -62,8 +63,6 @@
     "ClassificationModel",
     "Contour",
     "DetectionModel",
-    "DetectionWithLandmarks",
-    "ImageMattingWithBackground",
     "ImageModel",
     "ImageResultWithSoftPrediction",
     "InstanceSegmentationResult",
@@ -77,11 +76,9 @@
     "MaskRCNNModel",
     "Model",
     "OutputTransform",
-    "PortraitBackgroundMatting",
     "SalientObjectDetectionModel",
     "SegmentationModel",
     "SSD",
-    "VideoBackgroundMatting",
     "YOLO",
     "YoloV3ONNX",
     "YoloV4",
@@ -95,7 +92,6 @@
     "Prompt",
     "Detection",
     "DetectionResult",
-    "DetectionWithLandmarks",
     "DetectedKeypoints",
     "classification_models",
     "detection_models",

@@ -12,8 +12,9 @@
 from model_api.adapters.utils import RESIZE_TYPES, InputTransform
 
 from .model import Model
+from .result_types import ClassificationResult
 from .types import BooleanValue, ListValue, NumericalValue, StringValue
-from .utils import ClassificationResult, load_labels
+from .utils import load_labels
 
 if TYPE_CHECKING:
     from model_api.adapters.inference_adapter import InferenceAdapter

@@ -17,8 +17,8 @@
 from model_api.adapters.inference_adapter import InferenceAdapter
 
 from .image_model import ImageModel
+from .result_types import AnomalyResult
 from .types import ListValue, NumericalValue, StringValue
-from .utils import AnomalyResult
 
 
 class AnomalyDetection(ImageModel):

@@ -17,8 +17,8 @@
 from model_api.adapters.inference_adapter import InferenceAdapter
 
 from .image_model import ImageModel
+from .result_types import ClassificationResult
 from .types import BooleanValue, ListValue, NumericalValue, StringValue
-from .utils import ClassificationResult
 
 
 class ClassificationModel(ImageModel):

@@ -7,8 +7,9 @@
 import numpy as np
 
 from .image_model import ImageModel
+from .result_types import InstanceSegmentationResult, SegmentedObject
 from .types import BooleanValue, ListValue, NumericalValue, StringValue
-from .utils import InstanceSegmentationResult, SegmentedObject, load_labels
+from .utils import load_labels
 
 
 class MaskRCNNModel(ImageModel):

@@ -10,8 +10,8 @@
 import numpy as np
 
 from .image_model import ImageModel
+from .result_types import DetectedKeypoints, Detection
 from .types import ListValue
-from .utils import DetectedKeypoints, Detection
 
 
 class KeypointDetectionModel(ImageModel):

@@ -0,0 +1,247 @@
+#
+# Copyright (C) 2024 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+#
+
+from __future__ import annotations  # TODO: remove when Python3.9 support is dropped
+
+from typing import NamedTuple
+
+import cv2 as cv
+import numpy as np
+
+
+class AnomalyResult(NamedTuple):
+    """Results for anomaly models."""
+
+    anomaly_map: np.ndarray | None = None
+    pred_boxes: np.ndarray | None = None
+    pred_label: str | None = None
+    pred_mask: np.ndarray | None = None
+    pred_score: float | None = None
+
+    def _compute_min_max(self, tensor: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
+        """Computes min and max values of the tensor."""
+        return tensor.min(), tensor.max()
+
+    def __str__(self) -> str:
+        assert self.anomaly_map is not None
+        assert self.pred_mask is not None
+        anomaly_map_min, anomaly_map_max = self._compute_min_max(self.anomaly_map)
+        pred_mask_min, pred_mask_max = self._compute_min_max(self.pred_mask)
+        return (
+            f"anomaly_map min:{anomaly_map_min} max:{anomaly_map_max};"
+            f"pred_score:{np.round(self.pred_score, 1) if self.pred_score else 0.0};"
+            f"pred_label:{self.pred_label};"
+            f"pred_mask min:{pred_mask_min} max:{pred_mask_max};"
+        )
+
+
+class ClassificationResult(NamedTuple):
+    """Results for classification models."""
+
+    top_labels: list[tuple[int, str, float]] | None = None
+    saliency_map: np.ndarray | None = None
+    feature_vector: np.ndarray | None = None
+    raw_scores: np.ndarray | None = None
+
+    def __str__(self) -> str:
+        assert self.top_labels is not None
+        labels = ", ".join(f"{idx} ({label}): {confidence:.3f}" for idx, label, confidence in self.top_labels)
+        return (
+            f"{labels}, {_array_shape_to_str(self.saliency_map)}, {_array_shape_to_str(self.feature_vector)}, "
+            f"{_array_shape_to_str(self.raw_scores)}"
+        )
+
+
+class Detection:
+    def __init__(self, xmin, ymin, xmax, ymax, score, id, str_label=None):
+        self.xmin: int = xmin
+        self.ymin: int = ymin
+        self.xmax: int = xmax
+        self.ymax: int = ymax
+        self.score: float = score
+        self.id: int = int(id)
+        self.str_label: str | None = str_label
+
+    def __str__(self):
+        return f"{self.xmin}, {self.ymin}, {self.xmax}, {self.ymax}, {self.id} ({self.str_label}): {self.score:.3f}"
+
+
+class DetectionResult(NamedTuple):
+    """Result for detection model."""
+
+    objects: list[Detection] | None = None
+    saliency_map: np.ndarray | None = None
+    feature_vector: np.ndarray | None = None
+
+    def __str__(self):
+        assert self.objects is not None
+        obj_str = "; ".join(str(obj) for obj in self.objects)
+        if obj_str:
+            obj_str += "; "
+        return f"{obj_str}{_array_shape_to_str(self.saliency_map)}; {_array_shape_to_str(self.feature_vector)}"
+
+
+class SegmentedObject(Detection):
+    def __init__(self, xmin, ymin, xmax, ymax, score, id, str_label, mask):
+        super().__init__(xmin, ymin, xmax, ymax, score, id, str_label)
+        self.mask = mask
+
+    def __str__(self):
+        return f"{super().__str__()}, {(self.mask > 0.5).sum()}"
+
+
+class SegmentedObjectWithRects(SegmentedObject):
+    def __init__(self, segmented_object, rotated_rect):
+        super().__init__(
+            segmented_object.xmin,
+            segmented_object.ymin,
+            segmented_object.xmax,
+            segmented_object.ymax,
+            segmented_object.score,
+            segmented_object.id,
+            segmented_object.str_label,
+            segmented_object.mask,
+        )
+        self.rotated_rect = rotated_rect
+
+    def __str__(self):
+        res = super().__str__()
+        rect = self.rotated_rect
+        res += f", RotatedRect: {rect[0][0]:.3f} {rect[0][1]:.3f} {rect[1][0]:.3f} {rect[1][1]:.3f} {rect[2]:.3f}"
+        return res
+
+
+class InstanceSegmentationResult(NamedTuple):
+    segmentedObjects: list[SegmentedObject | SegmentedObjectWithRects]
+    # Contain per class saliency_maps and "feature_vector" model output if feature_vector exists
+    saliency_map: list[np.ndarray]
+    feature_vector: np.ndarray
+
+    def __str__(self):
+        obj_str = "; ".join(str(obj) for obj in self.segmentedObjects)
+        filled = 0
+        for cls_map in self.saliency_map:
+            if cls_map.size:
+                filled += 1
+        prefix = f"{obj_str}; " if len(obj_str) else ""
+        return prefix + f"{filled}; [{','.join(str(i) for i in self.feature_vector.shape)}]"
+
+
+class VisualPromptingResult(NamedTuple):
+    upscaled_masks: list[np.ndarray] | None = None
+    processed_mask: list[np.ndarray] | None = None
+    low_res_masks: list[np.ndarray] | None = None
+    iou_predictions: list[np.ndarray] | None = None
+    scores: list[np.ndarray] | None = None
+    labels: list[np.ndarray] | None = None
+    hard_predictions: list[np.ndarray] | None = None
+    soft_predictions: list[np.ndarray] | None = None
+    best_iou: list[float] | None = None
+
+    def _compute_min_max(self, tensor: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
+        return tensor.min(), tensor.max()
+
+    def __str__(self) -> str:
+        assert self.hard_predictions is not None
+        assert self.upscaled_masks is not None
+        upscaled_masks_min, upscaled_masks_max = self._compute_min_max(
+            self.upscaled_masks[0],
+        )
+
+        return (
+            f"upscaled_masks min:{upscaled_masks_min:.3f} max:{upscaled_masks_max:.3f};"
+            f"hard_predictions shape:{self.hard_predictions[0].shape};"
+        )
+
+
+class PredictedMask(NamedTuple):
+    mask: list[np.ndarray]
+    points: list[np.ndarray] | np.ndarray
+    scores: list[float] | np.ndarray
+
+    def __str__(self) -> str:
+        obj_str = ""
+        obj_str += f"mask sum: {np.sum(sum(self.mask))}; "
+
+        if isinstance(self.points, list):
+            for i, point in enumerate(self.points):
+                obj_str += "["
+                obj_str += ", ".join(str(round(c, 2)) for c in point)
+                obj_str += "] "
+                obj_str += "iou: " + f"{float(self.scores[i]):.3f} "
+        else:
+            for i in range(self.points.shape[0]):
+                point = self.points[i]
+                obj_str += "["
+                obj_str += ", ".join(str(round(c, 2)) for c in point)
+                obj_str += "] "
+                obj_str += "iou: " + f"{float(self.scores[i]):.3f} "
+
+        return obj_str.strip()
+
+
+class ZSLVisualPromptingResult(NamedTuple):
+    data: dict[int, PredictedMask]
+
+    def __str__(self) -> str:
+        return ", ".join(str(self.data[k]) for k in self.data)
+
+    def get_mask(self, label: int) -> PredictedMask:
+        """Returns a mask belonging to a given label"""
+        return self.data[label]
+
+
+class DetectedKeypoints(NamedTuple):
+    keypoints: np.ndarray
+    scores: np.ndarray
+
+    def __str__(self):
+        return (
+            f"keypoints: {self.keypoints.shape}, "
+            f"keypoints_x_sum: {np.sum(self.keypoints[:, :1]):.3f}, "
+            f"scores: {self.scores.shape}"
+        )
+
+
+class Contour(NamedTuple):
+    label: str
+    probability: float
+    shape: list[tuple[int, int]]
+
+    def __str__(self):
+        return f"{self.label}: {self.probability:.3f}, {len(self.shape)}"
+
+
+class ImageResultWithSoftPrediction(NamedTuple):
+    resultImage: np.ndarray
+    soft_prediction: np.ndarray
+    # Contain per class saliency_maps and "feature_vector" model output if feature_vector exists
+    saliency_map: np.ndarray  # Requires return_soft_prediction==True
+    feature_vector: np.ndarray
+
+    def __str__(self):
+        outHist = cv.calcHist(
+            [self.resultImage.astype(np.uint8)],
+            channels=None,
+            mask=None,
+            histSize=[256],
+            ranges=[0, 255],
+        )
+        hist = ""
+        for i, count in enumerate(outHist):
+            if count > 0:
+                hist += f"{i}: {count[0] / self.resultImage.size:.3f}, "
+        return (
+            f"{hist}{_array_shape_to_str(self.soft_prediction)}, "
+            f"{_array_shape_to_str(self.saliency_map)}, "
+            f"{_array_shape_to_str(self.feature_vector)}"
+        )
+
+
+def _array_shape_to_str(array: np.ndarray | None) -> str:
+    if array is not None:
+        return f"[{','.join(str(i) for i in array.shape)}]"
+    else:
+        return "[]"
@@ -11,8 +11,9 @@
 import numpy as np
 
 from .image_model import ImageModel
+from .result_types import Contour, ImageResultWithSoftPrediction
 from .types import BooleanValue, ListValue, NumericalValue, StringValue
-from .utils import Contour, ImageResultWithSoftPrediction, load_labels
+from .utils import load_labels
 
 
 def create_hard_prediction_from_soft_prediction(

@@ -6,7 +6,7 @@
 import numpy as np
 
 from .detection_model import DetectionModel
-from .utils import Detection, DetectionResult
+from .result_types import Detection, DetectionResult
 
 
 class SSD(DetectionModel):