
Commit c00402f

Fixed a bug in absmax float conversion.
1 parent 6747525 commit c00402f

File tree

2 files changed: +2 −1 lines changed


CHANGELOG.md

Lines changed: 1 addition & 0 deletions
```diff
@@ -268,6 +268,7 @@ Features:
 Bug fixes:
 - Fixed a bug where the default type of absmax was undefined which leads to errors if the default type is different than torch.float32. # 553
 - Fixed a missing scipy dependency in requirements.txt. #544
+- Fixed a bug, where a view operation could cause an error in 8-bit layers.

 Documentation:
 - Improved documentation for GPUs that do not support 8-bit matmul. #529
```

bitsandbytes/functional.py

Lines changed: 1 addition & 1 deletion
```diff
@@ -685,10 +685,10 @@ def dequantize_blockwise(

     absmax, code, blocksize, nested, dtype, offset, state2 = quant_state

-    if absmax.dtype != torch.float32: absmax = absmax.float()
     if nested:
         absmax = dequantize_blockwise(absmax, state2)
         absmax += offset
+    if absmax.dtype != torch.float32: absmax = absmax.float()

     if out is None:
         out = torch.empty(A.shape, dtype=dtype, device=A.device)
```
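The reordering matters because, when `nested` is true, `absmax` holds 8-bit quantization codes rather than float magnitudes; casting to float32 before the nested dequantization corrupts the codes. A minimal sketch of the ordering issue, using numpy in place of torch and a hypothetical `dequantize_codes` helper (not the bitsandbytes API):

```python
import numpy as np

def dequantize_codes(codes: np.ndarray, codebook: np.ndarray) -> np.ndarray:
    # Map uint8 quantization codes back to the float values they encode.
    # Hypothetical stand-in for the nested dequantize_blockwise step.
    return codebook[codes]

codebook = np.linspace(-1.0, 1.0, 256, dtype=np.float16)  # 8-bit code -> value
codes = np.array([0, 128, 255], dtype=np.uint8)           # nested-quantized absmax

# Buggy order: casting `codes` to float32 first yields 0.0, 128.0, 255.0 --
# meaningless magnitudes that are no longer valid codebook indices.
# Fixed order (as in this commit): dequantize the nested state first,
# then upcast the result to float32.
absmax = dequantize_codes(codes, codebook)
absmax = absmax.astype(np.float32)
```

With this ordering, `absmax` recovers the encoded endpoints (−1.0 and 1.0 here) in full float32 precision.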
