Skip to content

Commit bbe9731

Browse files
authored
2.4_fix_mtp_forward_meta (#5977)
1 parent 3e69022 commit bbe9731

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

fastdeploy/spec_decode/mtp.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1014,7 +1014,9 @@ def _propose_cuda(self, step_use_cudagraph: bool = False, is_dummy_run: bool = F
1014 | 1014 |   # 4. Compute logits, Sample
1015 | 1015 |   logits = self.model.compute_logits(hidden_states, forward_meta=self.forward_meta)
1016 | 1016 |   if self.enable_logprob and self.enable_draft_logprob and substep == 0:
1017 |      | - first_token_logits = self.model.compute_logits(self.model_inputs["first_token_hidden_states"])
     | 1017 | + first_token_logits = self.model.compute_logits(
     | 1018 | + self.model_inputs["first_token_hidden_states"], forward_meta=self.forward_meta
     | 1019 | + )
1018 | 1020 |
1019 | 1021 |   speculate_get_logits(
1020 | 1022 |   self.model_inputs["draft_logits"],

0 commit comments

Comments
 (0)