diff --git a/examples/llm_ptq/hf_ptq.py b/examples/llm_ptq/hf_ptq.py index 119a34f2..86e847ac 100755 --- a/examples/llm_ptq/hf_ptq.py +++ b/examples/llm_ptq/hf_ptq.py @@ -93,6 +93,7 @@ def auto_quantize( qformat in [ "fp8", + "int8_sq", "int4_awq", "nvfp4", "nvfp4_awq",