NXP backend: Improve quantization annotation process

roman-janik-nxp · StrycekSimon · commit 338c6374234d · 2025-07-01T09:05:48.000+02:00
- fixes multiple subsequent nodes with SharedSpecPattern problem
diff --git a/backends/nxp/quantizer/neutron_quantizer.py b/backends/nxp/quantizer/neutron_quantizer.py
@@ -10,7 +10,6 @@
 from executorch.backends.nxp.aten_passes.neutron_aten_pass_manager import (
     NeutronAtenPassManager,
 )
-
 from executorch.backends.nxp.quantizer.patterns import (
     AddmmPattern,
     AvgPoolPattern,
@@ -24,6 +23,7 @@
     ReluInPlacePattern,
     ReluPattern,
     ReshapePattern,
+    SharedSpecPattern,
     SoftMaxPattern,
 )
 from executorch.backends.nxp.quantizer.utils import (
@@ -202,9 +202,34 @@ def __init__(self):
                 NeutronAtenQuantizer(AvgPoolPattern(), static_qconfig),
             ]
         )
+        self.op_to_quantizer = {
+            pt: q for q in self.quantizers for pt in q.pattern.partition_types()
+        }
+        self.op_to_applied_quantizer = {
+            pt: False for q in self.quantizers for pt in q.pattern.partition_types()
+        }
 
     def transform_for_annotation(
         self, model: torch.fx.GraphModule
     ) -> torch.fx.GraphModule:
         pass_runner = NeutronAtenPassManager()
         return pass_runner(model).graph_module
+
+    def annotate(self, model: torch.fx.GraphModule) -> torch.fx.GraphModule:
+        nodes = list(model.graph.nodes)
+        for node in nodes:
+            if (
+                node.target not in self.op_to_quantizer
+                or self.op_to_applied_quantizer[node.target]
+            ):
+                continue
+            else:
+                quantizer = self.op_to_quantizer[node.target]
+                quantizer.annotate(model)
+                if not isinstance(quantizer.pattern, SharedSpecPattern):
+                    self.op_to_applied_quantizer[node.target] = True
+
+        return model
+
+    def validate(self, model: torch.fx.GraphModule) -> None:
+        return super().validate(model)