Schema - V2 (#1396)

yarden-yagil-sony · yarden-sony · web-flow · commit 516061b5fef7 · 2025-04-01T17:17:18.000+03:00
* add box decode to op set names

---------

Co-authored-by: yarden-sony <yardeny-sony@sony.com>
diff --git a/model_compression_toolkit/target_platform_capabilities/schema/mct_current_schema.py b/model_compression_toolkit/target_platform_capabilities/schema/mct_current_schema.py
@@ -1,4 +1,4 @@
-import model_compression_toolkit.target_platform_capabilities.schema.v1 as schema
+import model_compression_toolkit.target_platform_capabilities.schema.v2 as schema
 
 OperatorSetNames = schema.OperatorSetNames
 Signedness = schema.Signedness
diff --git a/model_compression_toolkit/target_platform_capabilities/schema/v2.py b/model_compression_toolkit/target_platform_capabilities/schema/v2.py
@@ -0,0 +1,177 @@
+# Copyright 2025 Sony Semiconductor Israel, Inc. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+import pprint
+from enum import Enum
+from typing import Dict, Any, Tuple, Optional
+
+from pydantic import BaseModel, root_validator
+
+from mct_quantizers import QuantizationMethod
+from model_compression_toolkit.constants import FLOAT_BITWIDTH
+from model_compression_toolkit.logger import Logger
+from model_compression_toolkit.target_platform_capabilities.schema.v1 import (
+    Signedness,
+    AttributeQuantizationConfig,
+    OpQuantizationConfig,
+    QuantizationConfigOptions,
+    TargetPlatformModelComponent,
+    OperatorsSetBase,
+    OperatorsSet,
+    OperatorSetGroup,
+    Fusing)
+
+
+class OperatorSetNames(str, Enum):
+    """
+    String-valued enumeration of the operator set names defined by this schema.
+
+    Each member is also a ``str`` (the class derives from both ``str`` and ``Enum``),
+    and its ``value`` is the name string of the operator set.
+    """
+    CONV = "Conv"
+    DEPTHWISE_CONV = "DepthwiseConv2D"
+    CONV_TRANSPOSE = "ConvTranspose"
+    FULLY_CONNECTED = "FullyConnected"
+    CONCATENATE = "Concatenate"
+    STACK = "Stack"
+    UNSTACK = "Unstack"
+    GATHER = "Gather"
+    # NOTE(review): the value reads "Expend", not "Expand". It looks like a typo, but the
+    # string is the member's runtime value - confirm nothing depends on it before changing.
+    EXPAND = "Expend"
+    BATCH_NORM = "BatchNorm"
+    L2NORM = "L2Norm"
+    RELU = "ReLU"
+    RELU6 = "ReLU6"
+    LEAKY_RELU = "LeakyReLU"
+    ELU = "Elu"
+    HARD_TANH = "HardTanh"
+    ADD = "Add"
+    SUB = "Sub"
+    MUL = "Mul"
+    DIV = "Div"
+    MIN = "Min"
+    MAX = "Max"
+    PRELU = "PReLU"
+    ADD_BIAS = "AddBias"
+    SWISH = "Swish"
+    SIGMOID = "Sigmoid"
+    SOFTMAX = "Softmax"
+    LOG_SOFTMAX = "LogSoftmax"
+    TANH = "Tanh"
+    GELU = "Gelu"
+    HARDSIGMOID = "HardSigmoid"
+    HARDSWISH = "HardSwish"
+    FLATTEN = "Flatten"
+    GET_ITEM = "GetItem"
+    RESHAPE = "Reshape"
+    UNSQUEEZE = "Unsqueeze"
+    SQUEEZE = "Squeeze"
+    PERMUTE = "Permute"
+    TRANSPOSE = "Transpose"
+    DROPOUT = "Dropout"
+    SPLIT_CHUNK = "SplitChunk"
+    MAXPOOL = "MaxPool"
+    AVGPOOL = "AvgPool"
+    SIZE = "Size"
+    SHAPE = "Shape"
+    EQUAL = "Equal"
+    ARGMAX = "ArgMax"
+    TOPK = "TopK"
+    FAKE_QUANT = "FakeQuant"
+    COMBINED_NON_MAX_SUPPRESSION = "CombinedNonMaxSuppression"
+    BOX_DECODE = "BoxDecode"
+    ZERO_PADDING2D = "ZeroPadding2D"
+    CAST = "Cast"
+    RESIZE = "Resize"
+    PAD = "Pad"
+    FOLD = "Fold"
+    STRIDED_SLICE = "StridedSlice"
+    SSD_POST_PROCESS = "SSDPostProcess"
+
+    @classmethod
+    def get_values(cls):
+        """
+        Get the string values of all members.
+
+        Returns:
+            list: The ``value`` of every member, in definition order.
+        """
+        return [v.value for v in cls]
+
+
+class TargetPlatformCapabilities(BaseModel):
+    """
+    Represents the hardware configuration used for quantized model inference.
+
+    Instances are frozen (``Config.frozen`` is set).
+
+    Attributes:
+        default_qco (QuantizationConfigOptions): Default quantization configuration options for the model.
+            Must contain exactly one quantization configuration.
+        operator_set (Optional[Tuple[OperatorsSet, ...]]): Tuple of operator sets within the model.
+            Operator set names must be unique.
+        fusing_patterns (Optional[Tuple[Fusing, ...]]): Tuple of fusing patterns for the model.
+        tpc_minor_version (Optional[int]): Minor version of the Target Platform Configuration.
+        tpc_patch_version (Optional[int]): Patch version of the Target Platform Configuration.
+        tpc_platform_type (Optional[str]): Type of the platform for the Target Platform Configuration.
+        add_metadata (bool): Flag to determine if metadata should be added. Defaults to True.
+        name (Optional[str]): Name of the Target Platform Model. Defaults to "default_tpc".
+        is_simd_padding (bool): Indicates if SIMD padding is applied. Defaults to False.
+        SCHEMA_VERSION (int): Version of the schema for the Target Platform Model. Defaults to 2.
+    """
+    default_qco: QuantizationConfigOptions
+    operator_set: Optional[Tuple[OperatorsSet, ...]]
+    fusing_patterns: Optional[Tuple[Fusing, ...]]
+    tpc_minor_version: Optional[int]
+    tpc_patch_version: Optional[int]
+    tpc_platform_type: Optional[str]
+    add_metadata: bool = True
+    name: Optional[str] = "default_tpc"
+    is_simd_padding: bool = False
+
+    SCHEMA_VERSION: int = 2
+
+    class Config:
+        frozen = True
+
+    @root_validator(allow_reuse=True)
+    def validate_after_initialization(cls, values: Dict[str, Any]) -> Dict[str, Any]:
+        """
+        Perform cross-field validation after the individual fields were validated.
+
+        Checks that `default_qco` holds exactly one quantization configuration and that
+        all operator sets in `operator_set` have distinct names. Violations are reported
+        through `Logger.critical`.
+
+        Args:
+            values (Dict[str, Any]): The field values of the target platform model.
+
+        Returns:
+            Dict[str, Any]: The validated values, unchanged.
+        """
+        # Validate `default_qco`.
+        # With pydantic v1 semantics a post root validator also runs when field validation
+        # failed, and the failed field is then absent from `values`. Skip the check in that
+        # case so pydantic reports its own validation error instead of this validator
+        # crashing with an AttributeError on None.
+        default_qco = values.get('default_qco')
+        if default_qco is not None and len(default_qco.quantization_configurations) != 1:
+            Logger.critical("Default QuantizationConfigOptions must contain exactly one option.")  # pragma: no cover
+
+        # Validate `operator_set` uniqueness
+        operator_set = values.get('operator_set')
+        if operator_set is not None:
+            # Names may be given either as OperatorSetNames members or as plain strings;
+            # compare them by their string form.
+            opsets_names = [
+                op.name.value if isinstance(op.name, OperatorSetNames) else op.name
+                for op in operator_set
+            ]
+            if len(set(opsets_names)) != len(opsets_names):
+                Logger.critical("Operator Sets must have unique names.")  # pragma: no cover
+
+        return values
+
+    def get_info(self) -> Dict[str, Any]:
+        """
+        Get a dictionary summarizing the TargetPlatformCapabilities properties.
+
+        Returns:
+            Dict[str, Any]: The model name, the info of each operator set and the info of
+            each fusing pattern. A missing or empty operator set / fusing pattern tuple is
+            reported as an empty list.
+        """
+        return {
+            "Model name": self.name,
+            "Operators sets": [o.get_info() for o in self.operator_set] if self.operator_set else [],
+            "Fusing patterns": [f.get_info() for f in self.fusing_patterns] if self.fusing_patterns else [],
+        }
+
+    def show(self):
+        """
+        Display the TargetPlatformCapabilities.
+
+        Pretty-prints the dictionary returned by `get_info`, keeping its key order.
+        """
+        pprint.pprint(self.get_info(), sort_dicts=False)
diff --git a/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/attach2keras.py b/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/attach2keras.py
@@ -93,6 +93,7 @@ def __init__(self):
             OperatorSetNames.TOPK: [tf.nn.top_k],
             OperatorSetNames.FAKE_QUANT: [tf.quantization.fake_quant_with_min_max_vars],
             OperatorSetNames.COMBINED_NON_MAX_SUPPRESSION: [tf.image.combined_non_max_suppression],
+            OperatorSetNames.BOX_DECODE: [],  # no such operator in keras
             OperatorSetNames.ZERO_PADDING2D: [ZeroPadding2D],
             OperatorSetNames.CAST: [tf.cast],
             OperatorSetNames.STRIDED_SLICE: [tf.strided_slice],
diff --git a/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/attach2pytorch.py b/model_compression_toolkit/target_platform_capabilities/targetplatform2framework/attach2pytorch.py
@@ -97,7 +97,8 @@ def __init__(self):
             OperatorSetNames.L2NORM: [LayerFilterParams(torch.nn.functional.normalize,
                                                         Eq('p', 2) | Eq('p', None))],
             OperatorSetNames.SSD_POST_PROCESS: [],  # no such operator in pytorch
-            OperatorSetNames.COMBINED_NON_MAX_SUPPRESSION: []  # no such operator in pytorch
+            OperatorSetNames.COMBINED_NON_MAX_SUPPRESSION: [],  # no such operator in pytorch
+            OperatorSetNames.BOX_DECODE: []  # no such operator in pytorch
         }
 
         pytorch_linear_attr_mapping = {KERNEL_ATTR: DefaultDict(default_value=PYTORCH_KERNEL),
diff --git a/tests/common_tests/helpers/tpcs_for_tests/v4/tpc.py b/tests/common_tests/helpers/tpcs_for_tests/v4/tpc.py
@@ -14,8 +14,7 @@
 # ==============================================================================
 from typing import List, Tuple
 
-import model_compression_toolkit as mct
-import model_compression_toolkit.target_platform_capabilities.schema.v1 as schema
+import model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema as schema
 from mct_quantizers import QuantizationMethod
 from model_compression_toolkit.constants import FLOAT_BITWIDTH
 from model_compression_toolkit.target_platform_capabilities.constants import KERNEL_ATTR, BIAS_ATTR, WEIGHTS_N_BITS, \
diff --git a/tests_pytest/_fw_tests_common_base/base_tpc_attach2fw_test.py b/tests_pytest/_fw_tests_common_base/base_tpc_attach2fw_test.py
@@ -51,7 +51,7 @@ def setup_method(self):
 
     def test_attach2fw_init(self):
         # verify built-in opset to operator mapping structure
-        assert len(self.attach2fw._opset2layer) == 57  # number of built-in operator sets
+        assert len(self.attach2fw._opset2layer) == 58  # number of built-in operator sets
         assert all(opset in self.attach2fw._opset2layer for opset in list(schema.OperatorSetNames))
         assert all(isinstance(key, schema.OperatorSetNames) for key in self.attach2fw._opset2layer.keys())
         assert all(isinstance(value, list) for value in self.attach2fw._opset2layer.values())
diff --git a/tests_pytest/common_tests/unit_tests/core/quantization/quantization_params_selection/test_qarams_activations_computation.py b/tests_pytest/common_tests/unit_tests/core/quantization/quantization_params_selection/test_qarams_activations_computation.py
@@ -33,7 +33,7 @@
     get_activations_qparams
 )
 from model_compression_toolkit.target_platform_capabilities import Signedness, OpQuantizationConfig
-from model_compression_toolkit.target_platform_capabilities.schema.v1 import AttributeQuantizationConfig
+from model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema import AttributeQuantizationConfig
 
 
 class TestActivationQParams:

Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,4 @@`
`1`		`-import model_compression_toolkit.target_platform_capabilities.schema.v1 as schema`
	`1`	`+import model_compression_toolkit.target_platform_capabilities.schema.v2 as schema`
`2`	`2`
`3`	`3`	`OperatorSetNames = schema.OperatorSetNames`
`4`	`4`	`Signedness = schema.Signedness`
Original file line number	Diff line number	Diff line change
`@@ -97,7 +97,8 @@ def __init__(self):`
`97`	`97`	`OperatorSetNames.L2NORM: [LayerFilterParams(torch.nn.functional.normalize,`
`98`	`98`	`Eq('p', 2) \| Eq('p', None))],`
`99`	`99`	`OperatorSetNames.SSD_POST_PROCESS: [], # no such operator in pytorch`
`100`		`- OperatorSetNames.COMBINED_NON_MAX_SUPPRESSION: [] # no such operator in pytorch`
	`100`	`+ OperatorSetNames.COMBINED_NON_MAX_SUPPRESSION: [], # no such operator in pytorch`
	`101`	`+ OperatorSetNames.BOX_DECODE: [] # no such operator in pytorch`
`101`	`102`	`}`
`102`	`103`
`103`	`104`	`pytorch_linear_attr_mapping = {KERNEL_ATTR: DefaultDict(default_value=PYTORCH_KERNEL),`
Original file line number	Diff line number	Diff line change
`@@ -33,7 +33,7 @@`
`33`	`33`	`get_activations_qparams`
`34`	`34`	`)`
`35`	`35`	`from model_compression_toolkit.target_platform_capabilities import Signedness, OpQuantizationConfig`
`36`		`-from model_compression_toolkit.target_platform_capabilities.schema.v1 import AttributeQuantizationConfig`
	`36`	`+from model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema import AttributeQuantizationConfig`
`37`	`37`
`38`	`38`
`39`	`39`	`class TestActivationQParams:`