Commit e1eadd0

Add unit layer tests, MBNetV3 test, and mark tests into two categories
1 parent e36a703 commit e1eadd0

11 files changed: +282 −146 lines


.github/workflows/CI.yml

Lines changed: 2 additions & 4 deletions
@@ -36,9 +36,7 @@ jobs:
           pip install -e .
       - name: Run Tests
         run: |
-          pytest Tests/TestSimpleCNN.py
-          pytest Tests/TestSimpleMHA.py
-          pytest Tests/TestSimpleNN.py
+          pytest -m SingleLayerTests
 
   model-tests:
     runs-on: ubuntu-latest
@@ -55,4 +53,4 @@ jobs:
           pip install -e .
       - name: Run Tests
         run: |
-          pytest Tests/TestMnist.py
+          pytest -m ModelTests
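Selecting tests with pytest -m works cleanly only if the two markers are registered; unregistered markers trigger PytestUnknownMarkWarning. A minimal sketch of one way to register them in a conftest.py, as an assumption (the repository may instead declare them in pytest.ini or pyproject.toml, which this commit does not show):

# conftest.py (hypothetical): register the custom markers used by the CI split
def pytest_configure(config):
    config.addinivalue_line(
        "markers",
        "SingleLayerTests: fast unit tests that export a single quantized layer",
    )
    config.addinivalue_line(
        "markers",
        "ModelTests: slower end-to-end tests that export a full quantized model",
    )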

DeepQuant/ExportBrevitas.py

Lines changed: 12 additions & 21 deletions
@@ -95,12 +95,12 @@ def exportBrevitas(
         exampleInput
     )  # Compute original model output on example input for validation
 
-    export_onnx_qcdq(  # Export original model to ONNX format with QCDQ (Quant-Cast-DeQuant) nodes
-        model,  # Model to export
-        args=exampleInput,  # Example input for tracing
-        export_path=EXPORT_FOLDER / "1_model_qcdq_original.onnx",
-        opset_version=13,
-    )
+    # export_onnx_qcdq(  # Export original model to ONNX format with QCDQ (Quant-Cast-DeQuant) nodes
+    #     model,  # Model to export
+    #     args=exampleInput,  # Example input for tracing
+    #     export_path=EXPORT_FOLDER / "1_model_qcdq_original.onnx",
+    #     opset_version=13,
+    # )
 
     ###############################################################################
     # 2. Injection of New Modules
@@ -151,12 +151,12 @@ def exportBrevitas(
     print("\n=== 2. Network after the Injection of New Modules ===\n")
     printer.print_tabular(fxModel)
 
-    export_onnx_qcdq(  # Export transformed model to ONNX
-        fxModel,  # Transformed model
-        args=exampleInput,
-        export_path=EXPORT_FOLDER / "2_model_qcdq_transformed.onnx",
-        opset_version=13,
-    )
+    # export_onnx_qcdq(  # Export transformed model to ONNX
+    #     fxModel,  # Transformed model
+    #     args=exampleInput,
+    #     export_path=EXPORT_FOLDER / "2_model_qcdq_transformed.onnx",
+    #     opset_version=13,
+    # )
 
     ###############################################################################
     # 3. Extraction of Parameters & Split of Quant Nodes
@@ -274,15 +274,6 @@ def exportBrevitas(
             f"{RED} ✗ Modification of Dequant Nodes changed the output significantly{ENDC}"
         )
 
-    # try:
-    #     tracer = NodeTracer(debug=True)
-    #     tracer.trace(fx_model_unified, example_input)
-    #     if debug:
-    #         print(f"{BLUE} ✓ Tracing completed{ENDC}")
-    # except Exception as e:
-    #     print(f"{RED} ✗ Tracing failed: {str(e)}{ENDC}")
-    #     print("This doesn't affect the validity of the exported model")
-
     import numpy as np
     import onnxruntime as ort
     import onnx
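The numpy, onnxruntime, and onnx imports kept at the end of this hunk feed the numerical validation of the exported graph. A minimal sketch of that kind of check, assuming onnxruntime is installed; the helper name, path handling, and tolerance below are illustrative and not part of this commit:

import numpy as np
import onnxruntime as ort
import torch

def checkOnnxAgainstTorch(model, exampleInput, onnxPath, atol=1e-5):
    # Reference output from the quantized PyTorch model
    with torch.no_grad():
        torchOut = model(exampleInput)
    if hasattr(torchOut, "value"):  # unwrap a Brevitas QuantTensor if one is returned
        torchOut = torchOut.value

    # Output of the exported ONNX graph, computed with onnxruntime
    session = ort.InferenceSession(str(onnxPath))
    inputName = session.get_inputs()[0].name
    onnxOut = session.run(None, {inputName: exampleInput.numpy()})[0]

    # Element-wise comparison within the given tolerance
    return np.allclose(torchOut.numpy(), onnxOut, atol=atol)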

Tests/TestConv.py

Lines changed: 60 additions & 0 deletions
@@ -0,0 +1,60 @@
+# Copyright 2025 ETH Zurich and University of Bologna.
+# Licensed under the Apache License, Version 2.0, see LICENSE for details.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Victor Jung <[email protected]>
+# Federico Brancasi <[email protected]>
+
+
+import pytest
+import torch
+import torch.nn as nn
+import brevitas.nn as qnn
+from brevitas.quant.scaled_int import (
+    Int8ActPerTensorFloat,
+    Int32Bias,
+    Int8WeightPerTensorFloat,
+)
+from DeepQuant.ExportBrevitas import exportBrevitas
+
+
+class QuantConvNet(nn.Module):
+
+    convAndLinQuantParams = {
+        "bias": True,
+        "weight_bit_width": 4,
+        "bias_quant": Int32Bias,
+        "input_quant": Int8ActPerTensorFloat,
+        "weight_quant": Int8WeightPerTensorFloat,
+        "output_quant": Int8ActPerTensorFloat,
+        "return_quant_tensor": True,
+    }
+
+    def __init__(self, in_channels: int = 1) -> None:
+        super().__init__()
+        self.inputQuant = qnn.QuantIdentity(return_quant_tensor=True)
+
+        self.conv1 = qnn.QuantConv2d(
+            in_channels=in_channels,
+            out_channels=16,
+            kernel_size=3,
+            padding=1,
+            **QuantConvNet.convAndLinQuantParams
+        )
+
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+
+        x = self.inputQuant(x)
+        x = self.conv1(x)
+
+        return x
+
+
+@pytest.mark.SingleLayerTests
+def deepQuantTestConv() -> None:
+
+    torch.manual_seed(42)
+
+    model = QuantConvNet().eval()
+    sampleInput = torch.randn(1, 1, 28, 28)
+    exportBrevitas(model, sampleInput, debug=True)

Tests/TestLinear.py

Lines changed: 59 additions & 0 deletions
@@ -0,0 +1,59 @@
+# Copyright 2025 ETH Zurich and University of Bologna.
+# Licensed under the Apache License, Version 2.0, see LICENSE for details.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Federico Brancasi <[email protected]>
+
+
+import pytest
+
+### PyTorch Imports ###
+import torch
+import torch.nn as nn
+
+### Brevitas Import ###
+import brevitas.nn as qnn
+from brevitas.quant.scaled_int import (
+    Int8ActPerTensorFloat,
+    Int32Bias,
+    Int8WeightPerTensorFloat,
+)
+from DeepQuant.ExportBrevitas import exportBrevitas
+
+
+class QuantLinearNet(nn.Module):
+
+    def __init__(self, in_features: int = 16, hidden_features: int = 32) -> None:
+        super().__init__()
+
+        self.inputQuant = qnn.QuantIdentity(return_quant_tensor=True)
+
+        self.linear1 = qnn.QuantLinear(
+            in_features=in_features,
+            out_features=hidden_features,
+            bias=True,
+            weight_bit_width=4,
+            bias_quant=Int32Bias,
+            output_quant=Int8ActPerTensorFloat,
+            input_quant=Int8ActPerTensorFloat,
+            weight_quant=Int8WeightPerTensorFloat,
+            return_quant_tensor=True,
+        )
+
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+
+        x = self.inputQuant(x)
+        x = self.linear1(x)
+
+        return x
+
+
+@pytest.mark.SingleLayerTests
+def deepQuantTestLinear() -> None:
+
+    torch.manual_seed(42)
+
+    model = QuantLinearNet().eval()
+    sampleInput = torch.randn(1, 4, 16)
+
+    exportBrevitas(model, sampleInput, debug=True)
Lines changed: 5 additions & 3 deletions
@@ -5,6 +5,7 @@
 # Federico Brancasi <[email protected]>
 
 
+import pytest
 import torch
 import torch.nn as nn
 import brevitas.nn as qnn
@@ -19,7 +20,7 @@
 )
 
 
-class SimpleQuantMHA(nn.Module):
+class QuantMHSANet(nn.Module):
 
     def __init__(self, embed_dim: int, num_heads: int) -> None:
         """
@@ -65,11 +66,12 @@ def forward(self, x: Tensor) -> Tensor:
         return out
 
 
-def deepQuantTestSimpleQuantMHA() -> None:
+@pytest.mark.SingleLayerTests
+def deepQuantTestMHSA() -> None:
 
     torch.manual_seed(42)
 
-    model = SimpleQuantMHA(embed_dim=16, num_heads=4).eval()
+    model = QuantMHSANet(embed_dim=16, num_heads=4).eval()
     sampleInput = torch.randn(10, 2, 16)
 
     exportBrevitas(model, sampleInput, debug=True)

Tests/TestMobileNetV3Small.py

Lines changed: 124 additions & 0 deletions
@@ -0,0 +1,124 @@
+# Copyright 2025 ETH Zurich and University of Bologna.
+# Licensed under the Apache License, Version 2.0, see LICENSE for details.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Victor Jung <[email protected]>
+
+import pytest
+import torch
+import torch.nn as nn
+import torchvision.models as models
+from brevitas.graph.quantize import preprocess_for_quantize
+from brevitas.graph.per_input import AdaptiveAvgPoolToAvgPool
+import brevitas.nn as qnn
+from brevitas.quant import (
+    Int8ActPerTensorFloat,
+    Int8WeightPerTensorFloat,
+    Int32Bias,
+    Uint8ActPerTensorFloat,
+)
+from brevitas.graph.quantize import quantize
+
+from DeepQuant.ExportBrevitas import exportBrevitas
+
+
+def prepareMBNetV3Model() -> nn.Module:
+    """
+    Prepare a quantized MobileNetV3Small model for testing.
+    Steps:
+    1) Load the torchvision MobileNetV3Small.
+    2) Convert it to eval mode.
+    3) Preprocess and adapt average pooling.
+    4) Quantize it using Brevitas.
+
+    Returns:
+        A quantized MobileNetV3Small model ready for export tests.
+    """
+    baseModel = models.mobilenet_v3_small(weights=models.MobileNet_V3_Small_Weights.IMAGENET1K_V1)
+    baseModel = baseModel.eval()
+
+    computeLayerMap = {
+        nn.Conv2d: (
+            qnn.QuantConv2d,
+            {
+                "input_quant": Int8ActPerTensorFloat,
+                "weight_quant": Int8WeightPerTensorFloat,
+                "output_quant": Int8ActPerTensorFloat,
+                "bias_quant": Int32Bias,
+                "bias": True,
+                "return_quant_tensor": True,
+                "output_bit_width": 8,
+                "weight_bit_width": 4,
+            },
+        ),
+        nn.Linear: (
+            qnn.QuantLinear,
+            {
+                "input_quant": Int8ActPerTensorFloat,
+                "weight_quant": Int8WeightPerTensorFloat,
+                "output_quant": Int8ActPerTensorFloat,
+                "bias_quant": Int32Bias,
+                "bias": True,
+                "return_quant_tensor": True,
+                "output_bit_width": 8,
+                "weight_bit_width": 4,
+            },
+        ),
+    }
+
+    quantActMap = {
+        nn.ReLU: (
+            qnn.QuantReLU,
+            {
+                "act_quant": Uint8ActPerTensorFloat,
+                "return_quant_tensor": True,
+                "bit_width": 8,
+            },
+        ),
+    }
+
+    quantIdentityMap = {
+        "signed": (
+            qnn.QuantIdentity,
+            {
+                "act_quant": Int8ActPerTensorFloat,
+                "return_quant_tensor": True,
+                "bit_width": 8,
+            },
+        ),
+        "unsigned": (
+            qnn.QuantIdentity,
+            {
+                "act_quant": Uint8ActPerTensorFloat,
+                "return_quant_tensor": True,
+                "bit_width": 8,
+            },
+        ),
+    }
+
+    baseModel = preprocess_for_quantize(
+        baseModel, equalize_iters=20, equalize_scale_computation="range"
+    )
+    baseModel = AdaptiveAvgPoolToAvgPool().apply(
+        baseModel, torch.ones(1, 3, 224, 224)
+    )
+
+    quantizedModel = quantize(
+        graph_model=baseModel,
+        compute_layer_map=computeLayerMap,
+        quant_act_map=quantActMap,
+        quant_identity_map=quantIdentityMap,
+    )
+
+    return quantizedModel
+
+
+@pytest.mark.ModelTests
+def deepQuantTestMobileNetV3Small() -> None:
+
+    torch.manual_seed(42)
+
+    quantizedModel = prepareMBNetV3Model()
+    sampleInput = torch.randn(1, 3, 224, 224)
+
+    exportBrevitas(quantizedModel, sampleInput, debug=True)
