File tree Expand file tree Collapse file tree 1 file changed +2
-0
lines changed Expand file tree Collapse file tree 1 file changed +2
-0
lines changed Original file line number Diff line number Diff line change @@ -369,9 +369,11 @@ def execute_model(
369
369
if scheduler_output .total_num_scheduled_tokens not in self ._token_compiled_cudagraphs and scheduler_output .total_num_scheduled_tokens != 0 :
370
370
logger .info ("DIEGO: CUDAgraph in execution time for %d input tokens" , scheduler_output .total_num_scheduled_tokens )
371
371
self ._token_compiled_cudagraphs .add (scheduler_output .total_num_scheduled_tokens )
372
+ gc .freeze ()
372
373
start_time = time .perf_counter ()
373
374
self .model_runner ._dummy_run (scheduler_output .total_num_scheduled_tokens , capture_attn_cudagraph = False , skip_eplb = True )
374
375
end_time = time .perf_counter ()
376
+ gc .unfreeze ()
375
377
elapsed_time = end_time - start_time
376
378
logger .info ("Graph capturing finished in %.3f secs" , elapsed_time )
377
379
You can’t perform that action at this time.
0 commit comments