Skip to content

Commit 71683ca

Browse files
authored
[V0 Deprecation] Remove multi-step scheduling (#22138)
Signed-off-by: Woosuk Kwon <[email protected]>
Signed-off-by: Woosuk Kwon <[email protected]>
1 parent: e188592 · commit: 71683ca

37 files changed: 57 additions (+57) and 3465 deletions (-3465).

.buildkite/nightly-benchmarks/tests/genai-perf-tests.json

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,6 @@
1212
"vllm_server_parameters": {
1313
"disable_log_stats": "",
1414
"gpu_memory_utilization": 0.9,
15-
"num_scheduler_steps": 10,
1615
"max_num_seqs": 512,
1716
"dtype": "bfloat16"
1817
},

.buildkite/nightly-benchmarks/tests/nightly-tests.json

Lines changed: 0 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -36,7 +36,6 @@
3636
"vllm_server_parameters": {
3737
"disable_log_stats": "",
3838
"gpu_memory_utilization": 0.9,
39-
"num_scheduler_steps": 10,
4039
"max_num_seqs": 512,
4140
"dtype": "bfloat16"
4241
},
@@ -90,7 +89,6 @@
9089
"vllm_server_parameters": {
9190
"disable_log_stats": "",
9291
"gpu_memory_utilization": 0.9,
93-
"num_scheduler_steps": 10,
9492
"max_num_seqs": 512,
9593
"dtype": "bfloat16"
9694
},
@@ -144,7 +142,6 @@
144142
"vllm_server_parameters": {
145143
"disable_log_stats": "",
146144
"gpu_memory_utilization": 0.9,
147-
"num_scheduler_steps": 10,
148145
"max_num_seqs": 512,
149146
"dtype": "bfloat16"
150147
},
@@ -195,7 +192,6 @@
195192
"vllm_server_parameters": {
196193
"disable_log_stats": "",
197194
"gpu_memory_utilization": 0.9,
198-
"num_scheduler_steps": 10,
199195
"max_num_seqs": 512,
200196
"dtype": "bfloat16"
201197
},
@@ -248,7 +244,6 @@
248244
"vllm_server_parameters": {
249245
"disable_log_stats": "",
250246
"gpu_memory_utilization": 0.9,
251-
"num_scheduler_steps": 10,
252247
"max_num_seqs": 512,
253248
"dtype": "bfloat16"
254249
},
@@ -301,7 +296,6 @@
301296
"vllm_server_parameters": {
302297
"disable_log_stats": "",
303298
"gpu_memory_utilization": 0.9,
304-
"num_scheduler_steps": 10,
305299
"max_num_seqs": 512,
306300
"dtype": "bfloat16"
307301
},

.buildkite/test-pipeline.yaml

Lines changed: 0 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -67,7 +67,6 @@ steps:
6767
- python3 standalone_tests/lazy_imports.py
6868
- pytest -v -s mq_llm_engine # MQLLMEngine
6969
- pytest -v -s async_engine # AsyncLLMEngine
70-
- NUM_SCHEDULER_STEPS=4 pytest -v -s async_engine/test_async_llm_engine.py
7170
- pytest -v -s test_inputs.py
7271
- pytest -v -s test_outputs.py
7372
- pytest -v -s multimodal
@@ -773,27 +772,6 @@ steps:
773772
- pytest -v -s models/test_oot_registration.py # it needs a clean process
774773
- pytest -v -s plugins/lora_resolvers # unit tests for in-tree lora resolver plugins
775774

776-
- label: Multi-step Tests (4 GPUs) # 36min
777-
mirror_hardwares: [amdexperimental]
778-
working_dir: "/vllm-workspace/tests"
779-
num_gpus: 4
780-
source_file_dependencies:
781-
- vllm/model_executor/layers/sampler.py
782-
- vllm/sequence.py
783-
- vllm/worker/worker_base.py
784-
- vllm/worker/worker.py
785-
- vllm/worker/multi_step_worker.py
786-
- vllm/worker/model_runner_base.py
787-
- vllm/worker/model_runner.py
788-
- vllm/worker/multi_step_model_runner.py
789-
- vllm/engine
790-
- tests/multi_step
791-
commands:
792-
# this test is quite flaky
793-
# TODO: investigate and fix.
794-
# - pytest -v -s multi_step/test_correctness_async_llm.py
795-
- pytest -v -s multi_step/test_correctness_llm.py
796-
797775
- label: Pipeline Parallelism Test # 45min
798776
mirror_hardwares: [amdexperimental]
799777
working_dir: "/vllm-workspace/tests"

.github/CODEOWNERS

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -36,7 +36,6 @@ CMakeLists.txt @tlrmchlsmth @LucasWilkinson
3636
/tests/entrypoints @DarkLight1337 @robertgshaw2-redhat @simon-mo @aarnphm
3737
/tests/kernels @tlrmchlsmth @WoosukKwon @yewentao256
3838
/tests/models @DarkLight1337 @ywang96
39-
/tests/multi_step @alexm-redhat @comaniac
4039
/tests/multimodal @DarkLight1337 @ywang96
4140
/tests/prefix_caching @comaniac @KuntaiDu
4241
/tests/quantization @mgoin @robertgshaw2-redhat @yewentao256

0 commit comments

Comments (0)