Commit b574ebf

author wangzaijun committed: fix all
1 parent b4ef3b8 commit b574ebf

16 files changed, +61 -71 lines changed


lightllm/common/basemodel/layer_weights/meta_weights/__init__.py

Lines changed: 0 additions & 3 deletions
@@ -2,12 +2,9 @@
 from .mm_weight import (
     MMWeightPack,
     MMWeightTpl,
-    MultiMMWeightTpl,
     ROWMMWeight,
     COLMMWeight,
-    MultiROWMMWeight,
     ROWBMMWeight,
-    AWQMultiMMWeightTpl,
 )
 from .norm_weight import NormWeight, GEMMANormWeight, TpNormWeight
 from .fused_moe_weight_tp import FusedMoeWeightTP
Lines changed: 0 additions & 3 deletions
@@ -1,13 +1,10 @@
 from .mm_weight import (
     MMWeightPack,
     MMWeightTpl,
-    MultiMMWeightTpl,
-    AWQMultiMMWeightTpl,
 )
 from .mm_factory import (
     MMWeight,
     ROWMMWeight,
-    MultiROWMMWeight,
     ROWBMMWeight,
     COLMMWeight,
 )
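
Taken together, the two hunks above drop MultiMMWeightTpl, MultiROWMMWeight, and AWQMultiMMWeightTpl from the meta_weights exports; the per-model files below migrate their callers onto the unified classes. A minimal call-shape sketch of the new convention, mirroring the llama hunks further down (the wrapper name _init_qkv_sketch is illustrative only, and the snippet assumes an initialized lightllm layer-weight object that provides self.data_type_, self.quant_cfg, and self.layer_num_, so it is not runnable on its own):

from lightllm.common.basemodel.layer_weights.meta_weights import ROWMMWeight


def _init_qkv_sketch(self):
    # Single tensor: weight_names / bias_names take one name
    # (previously the keywords were weight_name / bias_name).
    self.q_proj = ROWMMWeight(
        weight_names=self._q_weight_name,
        data_type=self.data_type_,
        bias_names=self._q_bias_name,
        quant_cfg=self.quant_cfg,
        layer_num=self.layer_num_,
        name="q_proj",
    )
    # Fused tensors: pass a list of names; this replaces the removed MultiROWMMWeight.
    self.kv_proj = ROWMMWeight(
        weight_names=[self._k_weight_name, self._v_weight_name],
        data_type=self.data_type_,
        bias_names=[self._k_bias_name, self._v_bias_name],
        quant_cfg=self.quant_cfg,
        layer_num=self.layer_num_,
        name="kv_proj",
    )

Both the single-name and the list form go through the same ROWMMWeight entry point, which is what allows the Multi* variants to disappear from the package.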

lightllm/common/basemodel/layer_weights/transformer_layer_weight.py

Lines changed: 2 additions & 2 deletions
@@ -2,7 +2,7 @@
 
 # from lightllm.common.layers.mm import MM
 from .base_layer_weight import BaseLayerWeight
-from .meta_weights import BaseWeight, MultiMMWeightTpl
+from .meta_weights import BaseWeight, MMWeightTpl
 from lightllm.utils.log_utils import init_logger
 
 logger = init_logger(__name__)
@@ -36,7 +36,7 @@ def load_hf_weights(self, weights):
         """
         for attr_name in dir(self):
             attr = getattr(self, attr_name, None)
-            if isinstance(attr, MultiMMWeightTpl):
+            if isinstance(attr, MMWeightTpl) and len(attr.weight_names) >= 2:
                 with self.lock:
                     attr.load_hf_weights(weights)
             elif isinstance(attr, BaseWeight):
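
With MultiMMWeightTpl removed, the loader above now decides whether an attribute is a fused multi-weight by the length of its weight_names. A self-contained toy sketch of that dispatch, using nothing beyond the standard library (RowWeightSketch and its fields are invented for illustration and are not lightllm classes):

from typing import List, Union


class RowWeightSketch:
    """Toy stand-in for MMWeightTpl: one class serves single and fused weights."""

    def __init__(self, weight_names: Union[str, List[str]]):
        # Normalize to a list so one code path covers both cases.
        self.weight_names = [weight_names] if isinstance(weight_names, str) else list(weight_names)

    @property
    def is_fused(self) -> bool:
        # Mirrors the new `len(attr.weight_names) >= 2` test in load_hf_weights.
        return len(self.weight_names) >= 2


q = RowWeightSketch("q_proj.weight")
kv = RowWeightSketch(["k_proj.weight", "v_proj.weight"])
print(q.is_fused, kv.is_fused)  # False True

Presumably the real MMWeightTpl normalizes a single weight_names string the same way, so the length check cleanly separates fused weights (whose loads the code still guards with self.lock) from plain ones.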

lightllm/models/bloom/layer_weights/transformer_layer_weight.py

Lines changed: 4 additions & 4 deletions
@@ -108,17 +108,17 @@ def load_hf_weights(self, weights):
 
     def _init_ffn(self):
         self.gate_up_proj = ROWMMWeight(
-            weight_name=self._gate_up_weight_name,
+            weight_names=self._gate_up_weight_name,
             data_type=self.data_type_,
-            bias_name=self._gate_up_bias_name,
+            bias_names=self._gate_up_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="gate_up_proj",
         )
         self.down_proj = COLMMWeight(
-            weight_name=self._down_weight_name,
+            weight_names=self._down_weight_name,
             data_type=self.data_type_,
-            bias_name=self._down_bias_name,
+            bias_names=self._down_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="down_proj",

lightllm/models/deepseek2/layer_weights/transformer_layer_weight.py

Lines changed: 13 additions & 14 deletions
@@ -6,7 +6,6 @@
 from lightllm.utils.envs_utils import enable_env_vars, get_env_start_args
 from lightllm.common.basemodel.layer_weights.meta_weights import (
     ROWMMWeight,
-    MultiROWMMWeight,
     COLMMWeight,
     NormWeight,
     FusedMoeWeightTP,
@@ -142,14 +141,14 @@ def load_hf_weights(self, weights):
     def _init_qkvo(self):
         if self.q_lora_rank is None:
             self.q_weight_ = ROWMMWeight(
-                weight_name=f"model.layers.{self.layer_num_}.self_attn.q_proj.weight",
+                weight_names=f"model.layers.{self.layer_num_}.self_attn.q_proj.weight",
                 data_type=self.data_type_,
                 quant_cfg=self.quant_cfg,
                 layer_num=self.layer_num_,
                 name="q_weight",
             )
             self.kv_a_proj_with_mqa_ = ROWMMWeight(
-                weight_name=f"model.layers.{self.layer_num_}.self_attn.kv_a_proj_with_mqa.weight",
+                weight_names=f"model.layers.{self.layer_num_}.self_attn.kv_a_proj_with_mqa.weight",
                 data_type=self.data_type_,
                 quant_cfg=self.quant_cfg,
                 layer_num=self.layer_num_,
@@ -158,7 +157,7 @@ def _init_qkvo(self):
                 tp_world_size=1,
             )
         else:
-            self.qkv_a_proj_with_mqa_ = MultiROWMMWeight(
+            self.qkv_a_proj_with_mqa_ = ROWMMWeight(
                 weight_names=[
                     f"model.layers.{self.layer_num_}.self_attn.q_a_proj.weight",
                     f"model.layers.{self.layer_num_}.self_attn.kv_a_proj_with_mqa.weight",
@@ -171,37 +170,37 @@ def _init_qkvo(self):
                 tp_world_size=1,
             )
             self.q_b_proj_ = ROWMMWeight(
-                weight_name=f"model.layers.{self.layer_num_}.self_attn.q_b_proj.weight",
+                weight_names=f"model.layers.{self.layer_num_}.self_attn.q_b_proj.weight",
                 data_type=self.data_type_,
                 quant_cfg=self.quant_cfg,
                 layer_num=self.layer_num_,
                 name="q_b_proj",
             )
         self.k_b_proj_ = ROWBMMWeight(
-            weight_name=f"model.layers.{self.layer_num_}.self_attn.k_b_proj.weight",
+            weight_names=f"model.layers.{self.layer_num_}.self_attn.k_b_proj.weight",
             data_type=self.data_type_,
             quant_cfg=None,
             layer_num=self.layer_num_,
             name="k_b_proj",
         )
         self.v_b_proj_ = ROWBMMWeight(
-            weight_name=f"model.layers.{self.layer_num_}.self_attn.v_b_proj.weight",
+            weight_names=f"model.layers.{self.layer_num_}.self_attn.v_b_proj.weight",
             data_type=self.data_type_,
             quant_cfg=None,
             layer_num=self.layer_num_,
             name="v_b_proj",
         )
         if self.enable_cc_method:
             self.cc_kv_b_proj_ = ROWMMWeight(
-                weight_name=f"model.layers.{self.layer_num_}.self_attn.kv_b_proj.weight",
+                weight_names=f"model.layers.{self.layer_num_}.self_attn.kv_b_proj.weight",
                 data_type=self.data_type_,
                 quant_cfg=self.quant_cfg,
                 layer_num=self.layer_num_,
                 name="cc_kv_b_proj",
             )
 
         self.o_weight_ = COLMMWeight(
-            weight_name=f"model.layers.{self.layer_num_}.self_attn.o_proj.weight",
+            weight_names=f"model.layers.{self.layer_num_}.self_attn.o_proj.weight",
             data_type=self.data_type_,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
@@ -211,7 +210,7 @@ def _init_qkvo(self):
     def _load_mlp(self, mlp_prefix):
         moe_mode = os.getenv("MOE_MODE", "TP")
         if self.is_moe and moe_mode == "EP":
-            self.gate_up_proj = MultiROWMMWeight(
+            self.gate_up_proj = ROWMMWeight(
                 weight_names=[f"{mlp_prefix}.gate_proj.weight", f"{mlp_prefix}.up_proj.weight"],
                 data_type=self.data_type_,
                 quant_cfg=self.quant_cfg,
@@ -221,7 +220,7 @@ def _load_mlp(self, mlp_prefix):
                 tp_world_size=1,
             )
             self.down_proj = COLMMWeight(
-                weight_name=f"{mlp_prefix}.down_proj.weight",
+                weight_names=f"{mlp_prefix}.down_proj.weight",
                 data_type=self.data_type_,
                 quant_cfg=self.quant_cfg,
                 layer_num=self.layer_num_,
@@ -230,15 +229,15 @@ def _load_mlp(self, mlp_prefix):
                 tp_world_size=1,
             )
         else:
-            self.gate_up_proj = MultiROWMMWeight(
+            self.gate_up_proj = ROWMMWeight(
                 weight_names=[f"{mlp_prefix}.gate_proj.weight", f"{mlp_prefix}.up_proj.weight"],
                 data_type=self.data_type_,
                 quant_cfg=self.quant_cfg,
                 layer_num=self.layer_num_,
                 name="gate_up_proj",
             )
             self.down_proj = COLMMWeight(
-                weight_name=f"{mlp_prefix}.down_proj.weight",
+                weight_names=f"{mlp_prefix}.down_proj.weight",
                 data_type=self.data_type_,
                 quant_cfg=self.quant_cfg,
                 layer_num=self.layer_num_,
@@ -248,7 +247,7 @@ def _load_mlp(self, mlp_prefix):
     def _init_moe(self):
         moe_intermediate_size = self.network_config_["moe_intermediate_size"]
         self.moe_gate = ROWMMWeight(
-            weight_name=f"model.layers.{self.layer_num_}.mlp.gate.weight",
+            weight_names=f"model.layers.{self.layer_num_}.mlp.gate.weight",
             data_type=self.data_type_,
             layer_num=self.layer_num_,
             name="moe_gate",

lightllm/models/gemma3/layer_weights/transformer_layer_weight.py

Lines changed: 8 additions & 8 deletions
@@ -28,17 +28,17 @@ def _init_weight_names(self):
 
     def _init_ffn(self):
         self.gate_proj = ROWMMWeight(
-            weight_name=self._gate_weight_name,
+            weight_names=self._gate_weight_name,
             data_type=self.data_type_,
-            bias_name=self._gate_bias_name,
+            bias_names=self._gate_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="gate_proj",
         )
         self.up_proj = ROWMMWeight(
-            weight_name=self._up_weight_name,
+            weight_names=self._up_weight_name,
             data_type=self.data_type_,
-            bias_name=self._up_bias_name,
+            bias_names=self._up_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="up_proj",
@@ -47,17 +47,17 @@ def _init_ffn(self):
 
     def _init_qkv(self):
         self.k_proj = ROWMMWeight(
-            weight_name=self._k_weight_name,
+            weight_names=self._k_weight_name,
             data_type=self.data_type_,
-            bias_name=self._k_bias_name,
+            bias_names=self._k_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="k_proj",
         )
         self.v_proj = ROWMMWeight(
-            weight_name=self._v_weight_name,
+            weight_names=self._v_weight_name,
             data_type=self.data_type_,
-            bias_name=self._v_bias_name,
+            bias_names=self._v_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="v_proj",

lightllm/models/gemma_2b/layer_weights/transformer_layer_weight.py

Lines changed: 4 additions & 4 deletions
@@ -2,7 +2,7 @@
 import math
 import numpy as np
 from lightllm.models.llama.layer_weights.transformer_layer_weight import LlamaTransformerLayerWeight
-from lightllm.common.basemodel.layer_weights.meta_weights import GEMMANormWeight, ROWMMWeight, MultiROWMMWeight
+from lightllm.common.basemodel.layer_weights.meta_weights import GEMMANormWeight, ROWMMWeight
 
 
 class Gemma_2bTransformerLayerWeight(LlamaTransformerLayerWeight):
@@ -12,14 +12,14 @@ def __init__(self, layer_num, data_type, network_config, mode=[], quant_cfg=None
 
     def _init_qkv(self):
         self.q_proj = ROWMMWeight(
-            weight_name=self._q_weight_name,
+            weight_names=self._q_weight_name,
             data_type=self.data_type_,
-            bias_name=self._q_bias_name,
+            bias_names=self._q_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="q_proj",
         )
-        self.kv_proj = MultiROWMMWeight(
+        self.kv_proj = ROWMMWeight(
             weight_names=[self._k_weight_name, self._v_weight_name],
             data_type=self.data_type_,
             bias_names=[self._k_bias_name, self._v_bias_name],

lightllm/models/gpt_oss/layer_weights/transformer_layer_weight.py

Lines changed: 2 additions & 2 deletions
@@ -30,10 +30,10 @@ def _init_moe(self):
         assert moe_mode in ["TP"], "For now, GPT-OSS type model only support MOE TP mode."
 
         self.moe_gate = ROWMMWeight(
-            weight_name=self._router_weight_name,
+            weight_names=self._router_weight_name,
             data_type=self.data_type_,
             layer_num=self.layer_num_,
-            bias_name=self._router_bias_name,
+            bias_names=self._router_bias_name,
             name="moe_gate",
             tp_rank=0,
             tp_world_size=1,

lightllm/models/llama/layer_weights/transformer_layer_weight.py

Lines changed: 9 additions & 9 deletions
@@ -2,7 +2,7 @@
 import math
 import numpy as np
 from lightllm.common.basemodel import TransformerLayerWeight
-from lightllm.common.basemodel.layer_weights.meta_weights import ROWMMWeight, COLMMWeight, NormWeight, MultiROWMMWeight
+from lightllm.common.basemodel.layer_weights.meta_weights import ROWMMWeight, COLMMWeight, NormWeight
 
 
 class LlamaTransformerLayerWeight(TransformerLayerWeight):
@@ -58,14 +58,14 @@ def _init_weight_names(self):
 
     def _init_qkv(self):
         self.q_proj = ROWMMWeight(
-            weight_name=self._q_weight_name,
+            weight_names=self._q_weight_name,
             data_type=self.data_type_,
-            bias_name=self._q_bias_name,
+            bias_names=self._q_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="q_proj",
         )
-        self.kv_proj = MultiROWMMWeight(
+        self.kv_proj = ROWMMWeight(
             weight_names=[self._k_weight_name, self._v_weight_name],
             data_type=self.data_type_,
             bias_names=[self._k_bias_name, self._v_bias_name],
@@ -76,16 +76,16 @@ def _init_qkv(self):
 
     def _init_o(self):
         self.o_proj = COLMMWeight(
-            weight_name=self._o_weight_name,
+            weight_names=self._o_weight_name,
             data_type=self.data_type_,
-            bias_name=self._o_bias_name,
+            bias_names=self._o_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="o_proj",
         )
 
     def _init_ffn(self):
-        self.gate_up_proj = MultiROWMMWeight(
+        self.gate_up_proj = ROWMMWeight(
             weight_names=[self._gate_weight_name, self._up_weight_name],
             data_type=self.data_type_,
             bias_names=[self._gate_bias_name, self._up_bias_name],
@@ -94,9 +94,9 @@ def _init_ffn(self):
             name="gate_up_proj",
         )
         self.down_proj = COLMMWeight(
-            weight_name=self._down_weight_name,
+            weight_names=self._down_weight_name,
            data_type=self.data_type_,
-            bias_name=self._down_bias_name,
+            bias_names=self._down_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="down_proj",

lightllm/models/mixtral/layer_weights/transformer_layer_weight.py

Lines changed: 2 additions & 2 deletions
@@ -39,9 +39,9 @@ def _init_moe(self):
         split_inter_size = inter_size // self.tp_world_size_
 
         self.moe_gate = ROWMMWeight(
-            weight_name=self.moe_gate_weight_name,
+            weight_names=self.moe_gate_weight_name,
             data_type=self.data_type_,
-            bias_name=self.moe_gate_bias_name,
+            bias_names=self.moe_gate_bias_name,
             quant_cfg=self.quant_cfg,
             layer_num=self.layer_num_,
             name="moe_gate",
