Skip to content

Commit cafe58f

Browse files
committed
fix format
Signed-off-by: jiqing-feng <[email protected]>
1 parent 47589cd commit cafe58f

File tree

2 files changed

+5
-27
lines changed

2 files changed

+5
-27
lines changed

bitsandbytes/backends/cpu_xpu_common.py

Lines changed: 5 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -6,8 +6,8 @@
66

77
from bitsandbytes.functional import (
88
QuantState,
9-
get_4bit_type,
109
create_dynamic_map,
10+
get_4bit_type,
1111
)
1212

1313
try:
@@ -361,15 +361,14 @@ def quantize_4bit_impl(
361361
for i in range(len(INT8_QUANT_TABLE)):
362362
out_uint8[scaled_A > INT8_QUANT_TABLE[i]] = i
363363

364-
if quant_type != "int8":
364+
if quant_type == "int8":
365+
out = out_uint8
366+
code = torch.Tensor(INT8_QUANT_TABLE, device=A.device)
367+
else:
365368
if out_uint8.size(-1) % 2:
366369
out_uint8 = torch.nn.functional.pad(out_uint8, (0, 1), value=0)
367370
out[:] = out_uint8[1::2].bitwise_left_shift(4).bitwise_or_(out_uint8[::2])
368-
369371
code = get_4bit_type(quant_type, device=A.device)
370-
else:
371-
out = out_uint8
372-
code = torch.Tensor(INT8_QUANT_TABLE, device=A.device)
373372

374373
if compress_statistics:
375374
offset = absmax.mean()

bitsandbytes/functional.py

Lines changed: 0 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -728,27 +728,6 @@ def quantize_blockwise(
728728
else:
729729
quant_state = QuantState(absmax=absmax, code=code, blocksize=blocksize, dtype=A.dtype)
730730

731-
732-
n = A.numel()
733-
blocks = n // blocksize
734-
blocks += 1 if n % blocksize > 0 else 0
735-
rem = n % blocksize
736-
has_rem = rem > 0
737-
# Scale tensor to [-1, 1]
738-
A_reshaped = A.reshape(n)
739-
A_com = A_reshaped[: n - rem]
740-
A_com_reshaped = A_com.reshape(n // blocksize, blocksize)
741-
absmax[: blocks - has_rem] = torch.abs(A_com_reshaped).max(dim=-1)[0]
742-
scaled_A = torch.clamp(A_com_reshaped * (1 / absmax[: blocks - has_rem].view(-1, 1)), -1, 1)
743-
scaled_A = scaled_A.reshape(-1)
744-
if has_rem:
745-
absmax[-1] = torch.abs(A_reshaped[n - rem :]).max()
746-
scaled_A_rem = torch.clamp(A_reshaped[n - rem :] * (1 / absmax[-1]), -1, 1)
747-
scaled_A = torch.cat([scaled_A, scaled_A_rem], dim=0)
748-
B = torch.empty(A.shape, dtype=torch.uint8, device=A.device)
749-
for i in range(len(code)):
750-
B[scaled_A > code[i]] = i
751-
752731
return out, quant_state
753732

754733

0 commit comments

Comments (0)