7
7
from vllm .sampling_params import SamplingParams
8
8
from vllm .v1 .core .sched .output import (CachedRequestData , NewRequestData ,
9
9
SchedulerOutput )
10
- from vllm .v1 .sample .metadata import SamplingMetadata
11
10
from vllm .v1 .worker .tpu_model_runner import (TPUModelRunner ,
12
11
_get_padded_token_len ,
13
12
_get_paddings )
@@ -113,12 +112,6 @@ def _is_req_added(model_runner, req_id: str) -> bool:
113
112
return req_id in model_runner .requests
114
113
115
114
116
- def _is_sampling_metadata_changed (model_runner ,
117
- sampling_metadata_before : SamplingMetadata ):
118
- return model_runner .input_batch .sampling_metadata is not (
119
- sampling_metadata_before )
120
-
121
-
122
115
def _is_req_state_block_table_match (model_runner , req_id : str ) -> bool :
123
116
req_index = model_runner .input_batch .req_id_to_index [req_id ]
124
117
block_table = model_runner .input_batch .block_table
@@ -136,10 +129,8 @@ def test_update_states_new_request(model_runner):
136
129
# new req
137
130
scheduler_output = _schedule_new_request (req_id )
138
131
139
- metadata_before = model_runner .input_batch .sampling_metadata
140
132
model_runner ._update_states (scheduler_output )
141
133
142
- assert _is_sampling_metadata_changed (model_runner , metadata_before )
143
134
assert _is_req_added (model_runner , req_id )
144
135
assert _is_req_scheduled (model_runner , req_id )
145
136
assert _is_req_state_block_table_match (model_runner , req_id )
@@ -170,9 +161,7 @@ def test_update_states_request_finished(model_runner):
170
161
grammar_bitmask = None ,
171
162
)
172
163
173
- metadata_before = model_runner .input_batch .sampling_metadata
174
164
model_runner ._update_states (scheduler_output )
175
- assert _is_sampling_metadata_changed (model_runner , metadata_before )
176
165
assert not _is_req_added (model_runner , req_id )
177
166
assert not _is_req_scheduled (model_runner , req_id )
178
167
@@ -229,9 +218,7 @@ def test_update_states_request_resumed(model_runner):
229
218
grammar_bitmask = None ,
230
219
)
231
220
232
- metadata_before = model_runner .input_batch .sampling_metadata
233
221
model_runner ._update_states (scheduler_output )
234
- assert _is_sampling_metadata_changed (model_runner , metadata_before )
235
222
assert _is_req_added (model_runner , req_id )
236
223
assert _is_req_scheduled (model_runner , req_id )
237
224
assert _is_req_state_block_table_match (model_runner , req_id )
@@ -262,9 +249,7 @@ def test_update_states_no_changes(model_runner):
262
249
grammar_bitmask = None ,
263
250
)
264
251
265
- metadata_before = model_runner .input_batch .sampling_metadata
266
252
model_runner ._update_states (scheduler_output )
267
- assert not _is_sampling_metadata_changed (model_runner , metadata_before )
268
253
assert _is_req_added (model_runner , req_id )
269
254
assert _is_req_scheduled (model_runner , req_id )
270
255
assert _is_req_state_block_table_match (model_runner , req_id )
@@ -299,8 +284,7 @@ def test_update_states_request_unscheduled(model_runner):
299
284
grammar_bitmask = None ,
300
285
)
301
286
302
- metadata_before = model_runner ._update_states (scheduler_output )
303
- assert _is_sampling_metadata_changed (model_runner , metadata_before )
287
+ model_runner ._update_states (scheduler_output )
304
288
305
289
assert _is_req_added (model_runner , req_ids [0 ])
306
290
assert _is_req_scheduled (model_runner , req_ids [0 ])
0 commit comments