Skip to content

Commit 5bf185a

Browse files
authored
[Bugfix] gptq_marlin: Ensure g_idx_sort_indices is not a Parameter (#5108)
1 parent 4fbcb0f commit 5bf185a

File tree

1 file changed

+4
-8
lines changed

1 file changed

+4
-8
lines changed

vllm/model_executor/layers/quantization/gptq_marlin.py

Lines changed: 4 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -298,14 +298,10 @@ def create_weights(
298 298               },
299 299           )
300 300
301     -         g_idx_sort_indices = Parameter(
302     -             torch.empty(
303     -                 g_idx.shape,
304     -                 dtype=torch.int32,
305     -             ),
306     -             requires_grad=False,
    301 +         g_idx_sort_indices = torch.empty(
    302 +             g_idx.shape,
    303 +             dtype=torch.int32,
307 304           )
308     -         set_weight_attrs(g_idx_sort_indices, extra_weight_attrs)
309 305
310 306           # Scales
311 307           scales = Parameter(
@@ -356,9 +352,9 @@ def create_weights(
356 352
357 353           layer.register_parameter("qweight", qweight)
358 354           layer.register_parameter("g_idx", g_idx)
359     -         layer.register_parameter("g_idx_sort_indices", g_idx_sort_indices)
360 355           layer.register_parameter("scales", scales)
361 356           layer.register_parameter("qzeros", qzeros)
    357 +         layer.g_idx_sort_indices = g_idx_sort_indices
362 358           layer.workspace = workspace
363 359           layer.input_size_per_partition = input_size_per_partition
364 360           layer.output_size_per_partition = output_size_per_partition

0 commit comments

Comments
 (0)