@@ -115,12 +115,6 @@ class SchedulerConfig:
115
115
(e.g., beam search), recomputation is not currently supported. In
116
116
such a case, we use swapping instead."""
117
117
118
- num_scheduler_steps : int = 1
119
- """Maximum number of forward steps per scheduler call."""
120
-
121
- multi_step_stream_outputs : bool = True
122
- """If False, then multi-step will stream outputs at the end of all steps"""
123
-
124
118
send_delta_data : bool = False
125
119
"""Private API. If used, scheduler sends delta data to
126
120
workers instead of an entire data. It should be enabled only
@@ -193,16 +187,7 @@ def __post_init__(self) -> None:
193
187
194
188
if self .max_num_batched_tokens is None :
195
189
if self .enable_chunked_prefill :
196
- if self .num_scheduler_steps > 1 :
197
- # Multi-step Chunked-Prefill doesn't allow prompt-chunking
198
- # for now. Have max_num_batched_tokens set to max_model_len
199
- # so we don't reject sequences on account of a short
200
- # max_num_batched_tokens.
201
- self .max_num_batched_tokens = max (
202
- self .max_model_len , DEFAULT_MAX_NUM_BATCHED_TOKENS )
203
- else :
204
- self .max_num_batched_tokens = (
205
- DEFAULT_MAX_NUM_BATCHED_TOKENS )
190
+ self .max_num_batched_tokens = DEFAULT_MAX_NUM_BATCHED_TOKENS
206
191
else :
207
192
# If max_model_len is too short, use
208
193
# DEFAULT_MAX_NUM_BATCHED_TOKENS as the default value
@@ -293,12 +278,6 @@ def _verify_args(self) -> Self:
293
278
f"({ self .num_lookahead_slots } ) must be greater than or "
294
279
"equal to 0." )
295
280
296
- if self .num_scheduler_steps < 1 :
297
- raise ValueError (
298
- "num_scheduler_steps "
299
- f"({ self .num_scheduler_steps } ) must be greater than or "
300
- "equal to 1." )
301
-
302
281
if self .max_num_partial_prefills < 1 :
303
282
raise ValueError (
304
283
f"max_num_partial_prefills ({ self .max_num_partial_prefills } ) "
@@ -323,7 +302,3 @@ def _verify_args(self) -> Self:
323
302
f"max_num_partial_prefills ({ self .max_num_partial_prefills } )." )
324
303
325
304
return self
326
-
327
- @property
328
- def is_multi_step (self ) -> bool :
329
- return self .num_scheduler_steps > 1
0 commit comments