Skip to content

Commit e684eb5

Browse files
committed
Add check to cache sampling tensors only when do_penalties is set
1 parent b38c808 commit e684eb5

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

vllm/worker/hpu_model_runner.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4024,7 +4024,8 @@ def try_revert_dummy_output_tokens():
4024 4024   if self.do_mark_step:
4025 4025       htorch.core.mark_step()
4026 4026   if hasattr(self.model.sampler, '_sampling_tensors') and \
4027      -         self.model.sampler._sampling_tensors is not None:
     4027 +         self.model.sampler._sampling_tensors is not None and \
     4028 +         self.model.sampler._do_penalties:
4028 4029       sampling_tensors = self.model.sampler._sampling_tensors
4029 4030       if sampling_tensors.prompt_tokens.numel() > 0:
4030 4031           # Cache the prompt_tokens tensor that's already on HPU

0 commit comments

Comments
 (0)