Skip to content

Commit 04dc491

Browse files
Log not important
Signed-off-by: Diego-Castan <[email protected]>
1 parent 3ee4333 commit 04dc491

File tree

1 file changed

+1
-0
lines changed

1 file changed

+1
-0
lines changed

vllm/v1/worker/gpu_worker.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -383,6 +383,7 @@ def compile_cuda_graph(input_size: int):
383 383
# but users still want to compile for better performance,
384 384
# e.g. for the max-num-batched token size in chunked prefill.
385 385
warmup_sizes = self.vllm_config.compilation_config.compile_sizes.copy()
386 +
logger.info("Warm up sizes %s", str(warmup_sizes))
386 387
if not self.model_config.enforce_eager:
387 388
warmup_sizes = [
388 389
x for x in warmup_sizes if x not in

0 commit comments

Comments
 (0)