Skip to content

Commit 52a1bcb

Browse files
committed
update
1 parent af381ad commit 52a1bcb

File tree

2 files changed

+2
-1
lines changed

2 files changed

+2
-1
lines changed

src/diffusers/quantizers/gguf/gguf_quantizer.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -37,7 +37,7 @@ def __init__(self, quantization_config, **kwargs):
37 37   super().__init__(quantization_config, **kwargs)
38 38
39 39   self.compute_dtype = quantization_config.compute_dtype
40    - self.pre_quantized = True
   40 + self.pre_quantized = quantization_config.pre_quantized
41 41
42 42   def validate_environment(self, *args, **kwargs):
43 43   if not is_accelerate_available() or is_accelerate_version("<", "0.26.0"):

src/diffusers/quantizers/quantization_config.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -397,6 +397,7 @@ def __init__(self, compute_dtype=None, quant_storage=None):
397 397   self.quant_method = QuantizationMethod.GGUF
398 398   self.compute_dtype = compute_dtype
399 399   self.quant_storage = quant_storage
    400 + self.pre_quantized = True
400 401
401 402   if self.compute_dtype is None:
402 403   self.compute_dtype = torch.float32

0 commit comments

Comments
 (0)