File tree: 1 file changed, +2 -1 lines changed
vllm/model_executor/layers/quantization/utils: 1 file changed, +2 -1 lines changed
Original file line number | Diff line number | Diff line change
11# SPDX-License-Identifier: Apache-2.0
22# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
33from copy import deepcopy
4+ from fractions import Fraction
45from typing import Optional , Union
56
67import regex as re
@@ -29,7 +30,7 @@ def override_config(config: QuantizationConfig, prefix: str):
2930 if isinstance (desc_act , bool ):
3031 config .desc_act = desc_act
3132
32- config .pack_factor = 32 // config .weight_bits # packed into int32
33+ config .pack_factor = Fraction ( 32 , config .weight_bits ) # packed into int32
3334 if config .get_name () == "gptq_marlin" :
3435 is_sym = get_dynamic_override (config , prefix , "sym" , config .is_sym )
3536 if isinstance (is_sym , bool ):
You can’t perform that action at this time.
0 commit comments