Skip to content

Commit fb140f1

Browse files
committed
fix
1 parent 6e880c1 commit fb140f1

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

lightllm/models/qwen3_moe/layer_infer/transformer_layer_infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -86,7 +86,6 @@ def _get_qkv(
8686
def _tpsp_get_qkv(
8787
self,
8888
input: torch.Tensor,
89-
cache_kv,
9089
infer_state: LlamaInferStateInfo,
9190
layer_weight: Qwen3MOETransformerLayerWeight,
9291
) -> torch.Tensor:
@@ -100,6 +99,7 @@ def _tpsp_get_qkv(
10099

101100
input = input.view(-1, self.embed_dim_)
102101
q = layer_weight.q_proj.mm(input)
102+
cache_kv = self._pre_cache_kv(infer_state=infer_state, layer_weight=layer_weight)
103103
cache_kv = layer_weight.kv_proj.mm(
104104
input, out=cache_kv.view(-1, (self.tp_k_head_num_ + self.tp_v_head_num_) * self.head_dim_)
105105
).view(-1, (self.tp_k_head_num_ + self.tp_v_head_num_), self.head_dim_)

0 commit comments

Comments
 (0)