70
70
- VLLM_ATTENTION_BACKEND=XFORMERS pytest -v -s basic_correctness/test_chunked_prefill.py
71
71
- VLLM_ATTENTION_BACKEND=FLASH_ATTN pytest -v -s basic_correctness/test_chunked_prefill.py
72
72
- VLLM_TEST_ENABLE_ARTIFICIAL_PREEMPT=1 pytest -v -s basic_correctness/test_preemption.py
73
-
73
+
74
74
- label : Core Test # 10min
75
75
mirror_hardwares : [amd]
76
76
fast_check : true
@@ -90,8 +90,11 @@ steps:
90
90
commands :
91
91
- pip install -e ./plugins/vllm_add_dummy_model
92
92
- pip install git+https://github.com/EleutherAI/lm-evaluation-harness.git@a4987bba6e9e9b3f22bd3a6c1ecf0abd04fd5622#egg=lm_eval[api]
93
- - pytest -v -s entrypoints/llm --ignore=entrypoints/llm/test_lazy_outlines.py
93
+ - pytest -v -s entrypoints/llm --ignore=entrypoints/llm/test_lazy_outlines.py --ignore=entrypoints/llm/test_generate.py --ignore=entrypoints/llm/test_generate_multiple_loras.py --ignore=entrypoints/llm/test_guided_generate.py
94
94
- pytest -v -s entrypoints/llm/test_lazy_outlines.py # it needs a clean process
95
+ - pytest -v -s entrypoints/llm/test_generate.py # it needs a clean process
96
+ - pytest -v -s entrypoints/llm/test_generate_multiple_loras.py # it needs a clean process
97
+ - pytest -v -s entrypoints/llm/test_guided_generate.py # it needs a clean process
95
98
- pytest -v -s entrypoints/openai
96
99
- pytest -v -s entrypoints/test_chat_utils.py
97
100
- pytest -v -s entrypoints/offline_mode # Needs to avoid interference with other tests
@@ -207,6 +210,21 @@ steps:
207
210
command : pytest -v -s lora --shard-id=$$BUILDKITE_PARALLEL_JOB --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT --ignore=lora/test_long_context.py
208
211
parallelism : 4
209
212
213
+ - label : "PyTorch Fullgraph Smoke Test"
214
+ fast_check : true
215
+ source_file_dependencies :
216
+ - vllm/
217
+ - tests/compile
218
+ commands :
219
+ - pytest -v -s compile/test_full_graph_smoke.py
220
+
221
+ - label : "PyTorch Fullgraph Test"
222
+ source_file_dependencies :
223
+ - vllm/
224
+ - tests/compile
225
+ commands :
226
+ - pytest -v -s compile/test_full_graph.py
227
+
210
228
- label : Kernels Test %N # 30min each
211
229
mirror_hardwares : [amd]
212
230
source_file_dependencies :
@@ -352,7 +370,7 @@ steps:
352
370
- tests/distributed/
353
371
- vllm/compilation
354
372
commands :
355
- - pytest -v -s ./compile/test_full_graph.py
373
+ - pytest -v -s ./compile/test_full_graph_multi_gpu.py
356
374
- pytest -v -s ./compile/test_wrapper.py
357
375
- VLLM_TEST_SAME_HOST=1 torchrun --nproc-per-node=4 distributed/test_same_node.py | grep -q 'Same node test passed'
358
376
- TARGET_TEST_SUITE=L4 pytest basic_correctness/ -v -s -m distributed_2_gpus
0 commit comments