Fix #1474 - AssertionError: assert param_slice.shape == loaded_weight.shape (#1631)

lihuahua123 · web-flow · commit eb825c1e7401 · 2023-11-12T15:53:12.000-08:00
diff --git a/vllm/model_executor/models/gpt_j.py b/vllm/model_executor/models/gpt_j.py
@@ -250,7 +250,7 @@ def load_weights(self,
                 if att_weight_name not in name:
                     continue
                 param = state_dict[name.replace(att_weight_name, "qkv_proj")]
-                shard_size = param.shape[1]
+                shard_size = param.shape[0] // 3
                 loaded_weight = loaded_weight[shard_size * tp_rank:shard_size *
                                               (tp_rank + 1)]
                 param_slice = param.data[shard_size * stride_id:shard_size *