Remove debug logging cruft from gpu_model_runner

SageMoore · SageMoore · commit 9602070690a5 · 2025-09-03T19:19:25.000Z
Signed-off-by: Sage Moore <sage@neuralmagic.com>
diff --git a/vllm/v1/worker/gpu_model_runner.py b/vllm/v1/worker/gpu_model_runner.py
@@ -1740,8 +1740,6 @@ def execute_model(
                                            uniform_decode=uniform_decode)
         cudagraph_runtime_mode, batch_descriptor = \
             self.cudagraph_dispatcher.dispatch(batch_descriptor)
-        
-        logger.info(f"NUM TOKENS: {num_input_tokens} cudagraph_runtime_mode {cudagraph_runtime_mode} UBATCHING {ubatch_slices is not None}")
 
         # Run the model.
         # Use persistent buffers for CUDA graphs.
@@ -3133,7 +3131,6 @@ def initialize_cudagraph_capture(self) -> None:
 
         # Trigger cudagraph dispatching keys initialization here (after
         # initializing attn backends).
-        logger.info(f"INITIALIZING KEYS FOR MODE: {self.compilation_config.cudagraph_mode}")
         self.cudagraph_dispatcher.initialize_cudagraph_keys(
             self.compilation_config.cudagraph_mode,
             self.uniform_decode_query_len)