Commit 4655850

jackzhxng authored and facebook-github-bot committed
Enable kwarg inputs for pt2e quantize (#7436)
Summary: For quantizing models that have kwarg forward() inputs, such as TorchTune Llama models.

Test Plan: N/A

Reviewed By: tarun292

Differential Revision: D70206003

Pulled By: jackzhxng
1 parent 4b85ee2 commit 4655850

File tree

1 file changed (+4, -1 lines changed)

extension/llm/export/builder.py

Lines changed: 4 additions & 1 deletion

@@ -360,7 +360,10 @@ def pt2e_quantize(self, quantizers: Optional[List[Quantizer]]) -> "LLMEdgeManage
                 logging.info(
                     "No calibration provided, using dummy input to calibrate..."
                 )
-                m(*self.example_inputs)
+                if self.example_kwarg_inputs:
+                    m(*self.example_inputs, **self.example_kwarg_inputs)
+                else:
+                    m(*self.example_inputs)
                 m = convert_pt2e(m)
                 DuplicateDynamicQuantChainPass()(m)
                 self.pre_autograd_graph_module = m
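
For context, below is a minimal, self-contained sketch of the calibration flow this change enables: forwarding keyword arguments during the pt2e calibration pass. The toy model, tensor shapes, input names, and quantizer choice are illustrative assumptions, not the ExecuTorch builder itself, and the XNNPACKQuantizer import path may differ across PyTorch/ExecuTorch versions.

# A minimal sketch (assumed toy model, input names, shapes, and quantizer;
# not the ExecuTorch builder itself) of calibrating a pt2e-prepared model
# whose forward() also takes keyword inputs, e.g. TorchTune Llama models.
import torch
from torch.ao.quantization.quantize_pt2e import convert_pt2e, prepare_pt2e
from torch.ao.quantization.quantizer.xnnpack_quantizer import (
    XNNPACKQuantizer,
    get_symmetric_quantization_config,
)


class TinyModel(torch.nn.Module):
    def __init__(self):
        super().__init__()
        self.linear = torch.nn.Linear(8, 8)

    def forward(self, tokens, input_pos=None):
        # input_pos is passed by keyword, mirroring models whose forward()
        # expects kwargs in addition to positional inputs.
        out = self.linear(tokens)
        if input_pos is not None:
            out = out + input_pos
        return out


example_inputs = (torch.randn(1, 8),)
example_kwarg_inputs = {"input_pos": torch.zeros(1, 8)}

# Capture the pre-autograd graph with both positional and keyword example inputs.
m = torch.export.export_for_training(
    TinyModel(), example_inputs, kwargs=example_kwarg_inputs
).module()

quantizer = XNNPACKQuantizer().set_global(get_symmetric_quantization_config())
m = prepare_pt2e(m, quantizer)

# Calibration forward pass: forward kwargs when present, as the patched builder does.
if example_kwarg_inputs:
    m(*example_inputs, **example_kwarg_inputs)
else:
    m(*example_inputs)

m = convert_pt2e(m)

Before this change, the dummy-input calibration path called m(*self.example_inputs) only, so any example_kwarg_inputs were dropped and models requiring keyword inputs could not be calibrated that way.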
