Skip to content

Commit 37c57d4

Browse files
committed
up
1 parent f680066 commit 37c57d4

File tree

1 file changed

+1
-3
lines changed

1 file changed

+1
-3
lines changed

extension/llm/export/builder.py

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -350,7 +350,7 @@ def calibrate_template(
350350
print(f"{task}: {res}")
351351
logging.info("Calibration finish...")
352352

353-
def pt2e_quantize(self, quantizers: Optional[Quantizer]) -> "LLMEdgeManager":
353+
def pt2e_quantize(self, quantizers: Optional[List[Quantizer]]) -> "LLMEdgeManager":
354354
"""
355355
Quantize the model via pt2e flow and retrieve LLMEdgeManager including the quantized model.
356356
Args:
@@ -367,9 +367,7 @@ def pt2e_quantize(self, quantizers: Optional[Quantizer]) -> "LLMEdgeManager":
367367
with torch.nn.attention.sdpa_kernel([SDPBackend.MATH]), torch.no_grad():
368368
if self.verbose:
369369
logging.info(f"Applied quantizers: {quantizers}")
370-
371370
composed_quantizer = ComposableQuantizer(quantizers)
372-
373371
assert (
374372
self.pre_autograd_graph_module is not None
375373
), "Please run export() first"

0 commit comments

Comments
 (0)