Skip to content

Commit 9602070

Browse files
committed
debug cruft
Signed-off-by: Sage Moore <[email protected]>
1 parent 756d721 commit 9602070

File tree

1 file changed

+0
-3
lines changed

1 file changed

+0
-3
lines changed

vllm/v1/worker/gpu_model_runner.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1740,8 +1740,6 @@ def execute_model(
1740 1740   uniform_decode=uniform_decode)
1741 1741   cudagraph_runtime_mode, batch_descriptor = \
1742 1742   self.cudagraph_dispatcher.dispatch(batch_descriptor)
1743      -
1744      - logger.info(f"NUM TOKENS: {num_input_tokens} cudagraph_runtime_mode {cudagraph_runtime_mode} UBATCHING {ubatch_slices is not None}")
1745 1743
1746 1744   # Run the model.
1747 1745   # Use persistent buffers for CUDA graphs.
@@ -3133,7 +3131,6 @@ def initialize_cudagraph_capture(self) -> None:
3133 3131
3134 3132   # Trigger cudagraph dispatching keys initialization here (after
3135 3133   # initializing attn backends).
3136      - logger.info(f"INITIALIZING KEYS FOR MODE: {self.compilation_config.cudagraph_mode}")
3137 3134   self.cudagraph_dispatcher.initialize_cudagraph_keys(
3138 3135   self.compilation_config.cudagraph_mode,
3139 3136   self.uniform_decode_query_len)

0 commit comments

Comments
 (0)