Prefer gptqmodel, falling back to auto_gptq, when exporting a GPTQ model to OpenVINO

notsyncing · notsyncing · commit d642dded054d · 2025-05-09T22:26:20.000+08:00
diff --git a/optimum/exporters/openvino/__main__.py b/optimum/exporters/openvino/__main__.py
@@ -39,6 +39,7 @@
     _infer_library_from_model_name_or_path,
     _OpenClipForZeroShotImageClassification,
 )
+from optimum.utils import is_auto_gptq_available, is_gptqmodel_available
 
 from .utils import (
     _MAX_UNCOMPRESSED_SIZE,
@@ -344,7 +345,12 @@ def main_export(
                 orig_post_init_model = GPTQQuantizer.post_init_model
 
                 def post_init_model(self, model):
-                    from auto_gptq import exllama_set_max_input_length
+                    if is_gptqmodel_available():
+                        from gptqmodel import exllama_set_max_input_length
+                    elif is_auto_gptq_available():
+                        from auto_gptq import exllama_set_max_input_length
+                    else:
+                        raise ValueError("neither auto_gptq nor gptqmodel is available")
 
                     class StoreAttr(object):
                         pass