We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6aa9866, commit d3e14ef (Copy full SHA for d3e14ef)
dequant.py
@@ -23,7 +23,7 @@ def dequantize_tensor(tensor, dtype=None, dequant_dtype=None):
23
return dequantize(tensor.data, qtype, oshape, dtype=dequant_dtype).to(dtype)
24
else:
25
# this is incredibly slow
26
- tqdm.write(f"Falling back to numpy dequant for qtype: {getattr(qtype, "name", repr(qtype))}")
+ tqdm.write(f"Falling back to numpy dequant for qtype: {getattr(qtype, 'name', repr(qtype))}")
27
new = gguf.quants.dequantize(tensor.cpu().numpy(), qtype)
28
return torch.from_numpy(new).to(tensor.device, dtype=dtype)
29
0 commit comments