1 file changed: +2 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -1737,7 +1737,7 @@ def _dummy_run(
17371737 # has num_tokens in total.
17381738 assert num_tokens <= self .scheduler_config .max_num_batched_tokens
17391739 max_num_reqs = self .scheduler_config .max_num_seqs
1740- num_reqs = max_num_reqs if num_tokens >= max_num_reqs else num_tokens
1740+ num_reqs = min ( num_tokens , max_num_reqs )
17411741 min_tokens_per_req = num_tokens // num_reqs
17421742 num_scheduled_tokens_list = [min_tokens_per_req ] * num_reqs
17431743 num_scheduled_tokens_list [- 1 ] += num_tokens % num_reqs
@@ -1765,7 +1765,7 @@ def _dummy_run(
17651765 self .kv_cache_config .kv_cache_groups ):
17661766 attn_metadata_i = (
17671767 self .attn_metadata_builders [kv_cache_group_id ].build (
1768- num_reqs = num_tokens ,
1768+ num_reqs = num_reqs ,
17691769 num_actual_tokens = num_tokens ,
17701770 max_query_len = num_tokens ,
17711771 common_prefix_len = 0 ,
You can’t perform that action at this time.
0 commit comments