Skip to content

Commit b614a6a

Browse files
committed
fix
Signed-off-by: wangli <wangli858794774@gmail.com>
1 parent 0f8cc23 commit b614a6a

File tree

1 file changed

+0
-6
lines changed

1 file changed

+0
-6
lines changed

vllm_ascend/spec_decode/eagle_proposer.py

Lines changed: 0 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -89,12 +89,6 @@ class SpecDecodeBaseProposer(EagleProposer):
89 89
_runnable: ACLGraphWrapper | Callable
90 90

91 91
def __init__(self, vllm_config: VllmConfig, device: torch.device, pass_hidden_states_to_model: bool, runner=None):
92-
# vllm.EagleProposer.__init__ hardcodes pass_hidden_states_to_model=True
93-
# when calling vllm.SpecDecodeBaseProposer.__init__, so the derived
94-
# attributes (net_num_new_slots_per_request, needs_extra_input_slots) and
95-
# the dependent buffers (is_rejected_token_mask, is_masked_token_mask) may
96-
# be computed/initialized incorrectly when pass_hidden_states_to_model=False.
97-
# We fix this up after super().__init__ completes.
98 92
super().__init__(vllm_config, device, runner)
99 93

100 94
self.use_async_scheduling = self.vllm_config.scheduler_config.async_scheduling

0 commit comments

Comments
 (0)