Commit e14b2a2

[rls2.6] Re-align order of WOQ.from_weight() (#3481)

* Re-align order of woq.from_weight
* Update woq_linear.py

1 parent: 88a794f

File tree: 2 files changed, +3 −2 lines


intel_extension_for_pytorch/llm/quantization/woq_linear.py (2 additions, 1 deletion)

```diff
@@ -70,8 +70,9 @@ def from_weight(
             bias,
             group_size,
             g_idx,
-            dtype,
             quant_method,
+            dtype,
+            **kwargs
         )
         return cls(woq_linear_impl)

```

intel_extension_for_pytorch/nn/modules/weight_only_quantization.py (1 addition, 1 deletion)

```diff
@@ -372,8 +372,8 @@ def from_weight(
        bias: Optional[torch.Tensor] = None,
        group_size: int = -1,
        g_idx: Optional[torch.Tensor] = None,
-       dtype: int = 0,
        quant_method: QuantMethod = QuantMethod.GPTQ_GEMM,
+       dtype: QuantDtype = QuantDtype.INT4,
        **kwargs,
    ):
        r"""Create a weight-only quantized module from weight
```
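The bug this commit fixes is a positional-argument mismatch: the wrapper in woq_linear.py forwards its arguments positionally, so once the target signature puts `quant_method` before `dtype`, the wrapper's call order must be re-aligned to match, or `dtype` silently lands in the `quant_method` slot. A minimal sketch of the pattern, using hypothetical stand-in names rather than the actual IPEX classes:

```python
from enum import Enum

# Hypothetical stand-ins for the real IPEX enums; names only mirror the diff.
class QuantMethod(Enum):
    GPTQ_GEMM = 0

class QuantDtype(Enum):
    INT4 = 0

# Callee: after the fix, quant_method precedes dtype in the signature.
def _impl_from_weight(bias, group_size, g_idx,
                      quant_method=QuantMethod.GPTQ_GEMM,
                      dtype=QuantDtype.INT4, **kwargs):
    return {"quant_method": quant_method, "dtype": dtype}

# Wrapper that forwards positionally: its argument order must match the
# callee's, which is exactly what the re-alignment in this commit ensures.
def from_weight(bias, group_size, g_idx,
                quant_method=QuantMethod.GPTQ_GEMM,
                dtype=QuantDtype.INT4, **kwargs):
    return _impl_from_weight(bias, group_size, g_idx,
                             quant_method, dtype, **kwargs)

cfg = from_weight(None, -1, None, QuantMethod.GPTQ_GEMM, QuantDtype.INT4)
assert cfg["dtype"] is QuantDtype.INT4
```

Forwarding with explicit keywords (`dtype=dtype, quant_method=quant_method`) would make the wrapper immune to such reorderings, at the cost of slightly more verbose call sites.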

0 commit comments