We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 632262f · commit 7ba303f · Copy full SHA for 7ba303f
bitsandbytes/backends/npu.py
@@ -90,7 +90,7 @@ def quantize_4bit(
90
A: torch.Tensor,
91
absmax: Optional[torch.Tensor] = None,
92
out: Optional[torch.Tensor] = None,
93
- blocksize=64,
+ blocksize: Optional[int] = None,
94
compress_statistics=False,
95
quant_type: Literal["fp4", "nf4"] = "nf4",
96
quant_storage=torch.uint8,
0 commit comments