File tree Expand file tree Collapse file tree 1 file changed +4
-8
lines changed
vllm/model_executor/layers/quantization Expand file tree Collapse file tree 1 file changed +4
-8
lines changed Original file line number Diff line number Diff line change @@ -298,14 +298,10 @@ def create_weights(
298
298
},
299
299
)
300
300
301
- g_idx_sort_indices = Parameter (
302
- torch .empty (
303
- g_idx .shape ,
304
- dtype = torch .int32 ,
305
- ),
306
- requires_grad = False ,
301
+ g_idx_sort_indices = torch .empty (
302
+ g_idx .shape ,
303
+ dtype = torch .int32 ,
307
304
)
308
- set_weight_attrs (g_idx_sort_indices , extra_weight_attrs )
309
305
310
306
# Scales
311
307
scales = Parameter (
@@ -356,9 +352,9 @@ def create_weights(
356
352
357
353
layer .register_parameter ("qweight" , qweight )
358
354
layer .register_parameter ("g_idx" , g_idx )
359
- layer .register_parameter ("g_idx_sort_indices" , g_idx_sort_indices )
360
355
layer .register_parameter ("scales" , scales )
361
356
layer .register_parameter ("qzeros" , qzeros )
357
+ layer .g_idx_sort_indices = g_idx_sort_indices
362
358
layer .workspace = workspace
363
359
layer .input_size_per_partition = input_size_per_partition
364
360
layer .output_size_per_partition = output_size_per_partition
You can’t perform that action at this time.
0 commit comments