Skip to content

Commit 4ea4381

Browse files
Feng-xiaosuo and Matrix_K
authored and committed
Merge branch 'vllm-project:main' into main
Signed-off-by: Matrix_K <zhangke144@huawei.com>
2 parents bebf158 + bdb6531 commit 4ea4381

File tree

232 files changed

+10651
-3392
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

232 files changed

+10651
-3392
lines changed

.github/workflows/_e2e_nightly_multi_node.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -32,7 +32,7 @@ on:
3232
description: how many pods will be pulled up via lws.yaml, indicates number of nodes we need
3333
vllm_version:
3434
required: false
35-
default: "v0.17.0"
35+
default: "v0.18.0"
3636
type: string
3737
description: vllm version to use
3838
vllm_ascend_remote_url:

.github/workflows/_e2e_nightly_single_node.yaml

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -39,7 +39,7 @@ on:
3939
vllm_version:
4040
required: false
4141
type: string
42-
default: "v0.17.0"
42+
default: "v0.18.0"
4343
is_pr_test:
4444
required: true
4545
type: boolean
@@ -88,6 +88,7 @@ jobs:
8888
if: ${{ inputs.is_pr_test }}
8989
run: |
9090
pip uninstall -y vllm vllm-ascend || true
91+
cp -r /vllm-workspace/vllm-ascend/benchmark /tmp/aisbench-backup || true
9192
rm -rf /vllm-workspace/vllm /vllm-workspace/vllm-ascend
9293
9394
- name: Checkout vllm-project/vllm repo
@@ -125,15 +126,16 @@ jobs:
125126
env:
126127
PIP_EXTRA_INDEX_URL: https://mirrors.huaweicloud.com/ascend/repos/pypi
127128
run: |
129+
git config --global --add safe.directory /vllm-workspace/vllm-ascend
128130
pip install uc-manager
129131
uv pip install -r requirements-dev.txt
130132
uv pip install -v -e .
131133
132134
- name: Install aisbench
133135
if: ${{ inputs.is_pr_test }}
134-
shell: bash -l {0}
136+
shell: bash -l {0}
135137
run: |
136-
git clone -b v3.0-20250930-master --depth 1 https://gitee.com/aisbench/benchmark.git /vllm-workspace/vllm-ascend/benchmark
138+
cp -r /tmp/aisbench-backup /vllm-workspace/vllm-ascend/benchmark
137139
cd /vllm-workspace/vllm-ascend/benchmark
138140
pip install pytest asyncio pytest-asyncio
139141
pip install -e . -r requirements/api.txt -r requirements/extra.txt

.github/workflows/_e2e_nightly_single_node_models.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -84,6 +84,7 @@ jobs:
8484
pip config set global.index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple
8585
apt-get update -y
8686
apt install git -y
87+
git config --global --add safe.directory /__w/vllm-ascend/vllm-ascend
8788
git config --global url."https://gh-proxy.test.osinfra.cn/https://github.com/".insteadOf https://github.com/
8889
8990
- name: Checkout vllm-project/vllm-ascend repo

.github/workflows/_e2e_test.yaml

Lines changed: 121 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -56,6 +56,7 @@ jobs:
5656
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
5757
apt-get update -y
5858
apt install git -y
59+
git config --global --add safe.directory /__w/vllm-ascend/vllm-ascend
5960
6061
- name: Install system dependencies
6162
run: |
@@ -92,20 +93,33 @@ jobs:
9293
env:
9394
PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256
9495
VLLM_WORKER_MULTIPROC_METHOD: spawn
96+
shell: bash
9597
run: |
98+
set -o pipefail
9699
if [ "${{ inputs.continue_on_error }}" = "true" ]; then
97100
python3 .github/workflows/scripts/run_suite.py \
98101
--suite e2e-singlecard-light \
99102
--auto-partition-id "${{ matrix.part }}" \
100103
--auto-partition-size 1 \
101104
--auto-upgrade-estimated-times \
102-
--continue-on-error
105+
--continue-on-error \
106+
2>&1 | tee /tmp/e2e-singlecard-light-part${{ matrix.part }}.log
103107
else
104108
python3 .github/workflows/scripts/run_suite.py \
105109
--suite e2e-singlecard-light \
106110
--auto-partition-id "${{ matrix.part }}" \
107-
--auto-partition-size 1
111+
--auto-partition-size 1 \
112+
2>&1 | tee /tmp/e2e-singlecard-light-part${{ matrix.part }}.log
108113
fi
114+
exit ${PIPESTATUS[0]}
115+
116+
- name: Summarize singlecard-light failure
117+
if: ${{ always() }}
118+
run: |
119+
python3 .github/workflows/scripts/ci_log_summary.py \
120+
--step-name "Run singlecard-light test" \
121+
--log-file /tmp/e2e-singlecard-light-part${{ matrix.part }}.log \
122+
--output "$GITHUB_STEP_SUMMARY"
109123
110124
111125
- name: Upload timing data
@@ -148,6 +162,7 @@ jobs:
148162
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
149163
apt-get update -y
150164
apt install git -y
165+
git config --global --add safe.directory /__w/vllm-ascend/vllm-ascend
151166
152167
- name: Install system dependencies
153168
run: |
@@ -183,20 +198,33 @@ jobs:
183198
env:
184199
VLLM_WORKER_MULTIPROC_METHOD: spawn
185200
PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256
201+
shell: bash
186202
run: |
203+
set -o pipefail
187204
if [ "${{ inputs.continue_on_error }}" = "true" ]; then
188205
python3 .github/workflows/scripts/run_suite.py \
189206
--suite e2e-singlecard \
190207
--auto-partition-id "${{ matrix.part }}" \
191208
--auto-partition-size 2 \
192209
--auto-upgrade-estimated-times \
193-
--continue-on-error
210+
--continue-on-error \
211+
2>&1 | tee /tmp/e2e-singlecard-full-part${{ matrix.part }}.log
194212
else
195213
python3 .github/workflows/scripts/run_suite.py \
196214
--suite e2e-singlecard \
197215
--auto-partition-id "${{ matrix.part }}" \
198-
--auto-partition-size 2
216+
--auto-partition-size 2 \
217+
2>&1 | tee /tmp/e2e-singlecard-full-part${{ matrix.part }}.log
199218
fi
219+
exit ${PIPESTATUS[0]}
220+
221+
- name: Summarize singlecard-full failure
222+
if: ${{ always() }}
223+
run: |
224+
python3 .github/workflows/scripts/ci_log_summary.py \
225+
--step-name "Run singlecard-full test" \
226+
--log-file /tmp/e2e-singlecard-full-part${{ matrix.part }}.log \
227+
--output "$GITHUB_STEP_SUMMARY"
200228
201229
- name: Upload timing data
202230
uses: actions/upload-artifact@v4
@@ -237,6 +265,7 @@ jobs:
237265
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
238266
apt-get update -y
239267
apt install git -y
268+
git config --global --add safe.directory /__w/vllm-ascend/vllm-ascend
240269
241270
- name: Install system dependencies
242271
run: |
@@ -271,20 +300,33 @@ jobs:
271300
- name: Run vllm-project/vllm-ascend test (light)
272301
env:
273302
VLLM_WORKER_MULTIPROC_METHOD: spawn
303+
shell: bash
274304
run: |
305+
set -o pipefail
275306
if [ "${{ inputs.continue_on_error }}" = "true" ]; then
276307
python3 .github/workflows/scripts/run_suite.py \
277308
--suite e2e-2card-light \
278309
--auto-partition-id "${{ matrix.part }}" \
279310
--auto-partition-size 1 \
280311
--auto-upgrade-estimated-times \
281-
--continue-on-error
312+
--continue-on-error \
313+
2>&1 | tee /tmp/e2e-2card-light-part${{ matrix.part }}.log
282314
else
283315
python3 .github/workflows/scripts/run_suite.py \
284316
--suite e2e-2card-light \
285317
--auto-partition-id "${{ matrix.part }}" \
286-
--auto-partition-size 1
318+
--auto-partition-size 1 \
319+
2>&1 | tee /tmp/e2e-2card-light-part${{ matrix.part }}.log
287320
fi
321+
exit ${PIPESTATUS[0]}
322+
323+
- name: Summarize multicard-2-light failure
324+
if: ${{ always() }}
325+
run: |
326+
python3 .github/workflows/scripts/ci_log_summary.py \
327+
--step-name "Run multicard-2-light test" \
328+
--log-file /tmp/e2e-2card-light-part${{ matrix.part }}.log \
329+
--output "$GITHUB_STEP_SUMMARY"
288330
289331
290332
- name: Upload timing data
@@ -326,6 +368,7 @@ jobs:
326368
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
327369
apt-get update -y
328370
apt install git -y
371+
git config --global --add safe.directory /__w/vllm-ascend/vllm-ascend
329372
330373
- name: Install system dependencies
331374
run: |
@@ -360,20 +403,33 @@ jobs:
360403
- name: Run vllm-project/vllm-ascend test (full)
361404
env:
362405
VLLM_WORKER_MULTIPROC_METHOD: spawn
406+
shell: bash
363407
run: |
408+
set -o pipefail
364409
if [ "${{ inputs.continue_on_error }}" = "true" ]; then
365410
python3 .github/workflows/scripts/run_suite.py \
366411
--suite e2e-multicard-2-cards \
367412
--auto-partition-id "${{ matrix.part }}" \
368413
--auto-partition-size 1 \
369414
--auto-upgrade-estimated-times \
370-
--continue-on-error
415+
--continue-on-error \
416+
2>&1 | tee /tmp/e2e-2card-full-part${{ matrix.part }}.log
371417
else
372418
python3 .github/workflows/scripts/run_suite.py \
373419
--suite e2e-multicard-2-cards \
374420
--auto-partition-id "${{ matrix.part }}" \
375-
--auto-partition-size 1
421+
--auto-partition-size 1 \
422+
2>&1 | tee /tmp/e2e-2card-full-part${{ matrix.part }}.log
376423
fi
424+
exit ${PIPESTATUS[0]}
425+
426+
- name: Summarize multicard-2-full failure
427+
if: ${{ always() }}
428+
run: |
429+
python3 .github/workflows/scripts/ci_log_summary.py \
430+
--step-name "Run multicard-2-full test " \
431+
--log-file /tmp/e2e-2card-full-part${{ matrix.part }}.log \
432+
--output "$GITHUB_STEP_SUMMARY"
377433
378434
379435
- name: Upload timing data
@@ -389,9 +445,21 @@ jobs:
389445
if: ${{ inputs.type == 'full' && matrix.part == 0 }}
390446
env:
391447
VLLM_WORKER_MULTIPROC_METHOD: spawn
448+
shell: bash
392449
run: |
450+
set -o pipefail
393451
python3 -m pip uninstall -y triton-ascend
394-
pytest -sv --durations=0 tests/e2e/multicard/2-cards/test_aclgraph_capture_replay.py
452+
pytest -sv --durations=0 tests/e2e/multicard/2-cards/test_aclgraph_capture_replay.py \
453+
2>&1 | tee /tmp/e2e-non-triton.log
454+
exit ${PIPESTATUS[0]}
455+
456+
- name: Summarize non-triton failure
457+
if: ${{ always() && inputs.type == 'full' && matrix.part == 0 }}
458+
run: |
459+
python3 .github/workflows/scripts/ci_log_summary.py \
460+
--step-name "Run multicard-2-full test (non triton)" \
461+
--log-file /tmp/e2e-non-triton.log \
462+
--output "$GITHUB_STEP_SUMMARY"
395463
396464
e2e-4-cards-full:
397465
name: multicard-4-full
@@ -422,6 +490,7 @@ jobs:
422490
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
423491
apt-get update -y
424492
apt install git -y
493+
git config --global --add safe.directory /__w/vllm-ascend/vllm-ascend
425494
426495
- name: Install system dependencies
427496
run: |
@@ -457,20 +526,33 @@ jobs:
457526
- name: Run vllm-project/vllm-ascend test for V1 Engine
458527
env:
459528
VLLM_WORKER_MULTIPROC_METHOD: spawn
529+
shell: bash
460530
run: |
531+
set -o pipefail
461532
if [ "${{ inputs.continue_on_error }}" = "true" ]; then
462533
python3 .github/workflows/scripts/run_suite.py \
463534
--suite e2e-multicard-4-cards \
464535
--auto-partition-id "${{ matrix.part }}" \
465536
--auto-partition-size 1 \
466537
--auto-upgrade-estimated-times \
467-
--continue-on-error
538+
--continue-on-error \
539+
2>&1 | tee /tmp/e2e-4card-full-part${{ matrix.part }}.log
468540
else
469541
python3 .github/workflows/scripts/run_suite.py \
470542
--suite e2e-multicard-4-cards \
471543
--auto-partition-id "${{ matrix.part }}" \
472-
--auto-partition-size 1
544+
--auto-partition-size 1 \
545+
2>&1 | tee /tmp/e2e-4card-full-part${{ matrix.part }}.log
473546
fi
547+
exit ${PIPESTATUS[0]}
548+
549+
- name: Summarize multicard-4-full failure
550+
if: ${{ always() }}
551+
run: |
552+
python3 .github/workflows/scripts/ci_log_summary.py \
553+
--step-name "Run vllm-project/vllm-ascend test for V1 Engine" \
554+
--log-file /tmp/e2e-4card-full-part${{ matrix.part }}.log \
555+
--output "$GITHUB_STEP_SUMMARY"
474556
475557
476558
- name: Upload timing data
@@ -504,6 +586,7 @@ jobs:
504586
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
505587
apt-get update -y
506588
apt install git -y
589+
git config --global --add safe.directory /__w/vllm-ascend/vllm-ascend
507590
508591
- name: Checkout vllm-project/vllm-ascend repo
509592
uses: actions/checkout@v6
@@ -540,9 +623,21 @@ jobs:
540623
env:
541624
PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256
542625
VLLM_WORKER_MULTIPROC_METHOD: spawn
626+
shell: bash
543627
run: |
628+
set -o pipefail
544629
pytest -sv --durations=0 tests/e2e/310p/singlecard/test_dense_model_singlecard.py \
545-
tests/e2e/310p/singlecard/test_vl_model_singlecard.py
630+
tests/e2e/310p/singlecard/test_vl_model_singlecard.py \
631+
2>&1 | tee /tmp/e2e-310p-singlecard.log
632+
exit ${PIPESTATUS[0]}
633+
634+
- name: Summarize 310p singlecard failure
635+
if: ${{ always() && inputs.contains_310 }}
636+
run: |
637+
python3 .github/workflows/scripts/ci_log_summary.py \
638+
--step-name "Run vllm-project/vllm-ascend test" \
639+
--log-file /tmp/e2e-310p-singlecard.log \
640+
--output "$GITHUB_STEP_SUMMARY"
546641
547642
e2e_310p-4cards:
548643
name: 310p multicards 4cards
@@ -566,6 +661,7 @@ jobs:
566661
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
567662
apt-get update -y
568663
apt install git -y
664+
git config --global --add safe.directory /__w/vllm-ascend/vllm-ascend
569665
570666
- name: Checkout vllm-project/vllm-ascend repo
571667
uses: actions/checkout@v6
@@ -602,8 +698,20 @@ jobs:
602698
env:
603699
PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256
604700
VLLM_WORKER_MULTIPROC_METHOD: spawn
701+
shell: bash
605702
run: |
703+
set -o pipefail
606704
pytest -sv --durations=0 \
607705
tests/e2e/310p/multicard/test_dense_model_multicard.py \
608706
tests/e2e/310p/multicard/test_moe_model_multicard.py \
609-
tests/e2e/310p/multicard/test_vl_model_multicard.py
707+
tests/e2e/310p/multicard/test_vl_model_multicard.py \
708+
2>&1 | tee /tmp/e2e-310p-4cards.log
709+
exit ${PIPESTATUS[0]}
710+
711+
- name: Summarize 310p multicards failure
712+
if: ${{ always() && inputs.contains_310 }}
713+
run: |
714+
python3 .github/workflows/scripts/ci_log_summary.py \
715+
--step-name "Run vllm-project/vllm-ascend test" \
716+
--log-file /tmp/e2e-310p-4cards.log \
717+
--output "$GITHUB_STEP_SUMMARY"

.github/workflows/_schedule_image_build.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -70,14 +70,14 @@ jobs:
7070
password: ${{ secrets.QUAY_PASSWORD }}
7171

7272
- name: Set up Docker Buildx
73-
uses: docker/setup-buildx-action@v3
73+
uses: docker/setup-buildx-action@v4
7474
with:
7575
install: true
7676
driver: docker-container
7777
use: true
7878

7979
- name: Build and push
80-
uses: docker/build-push-action@v6
80+
uses: docker/build-push-action@v7
8181
id: build
8282
with:
8383
platforms: ${{ matrix.arch }}
@@ -168,7 +168,7 @@ jobs:
168168
password: ${{ secrets.QUAY_PASSWORD }}
169169

170170
- name: Set up Docker Buildx
171-
uses: docker/setup-buildx-action@v3
171+
uses: docker/setup-buildx-action@v4
172172

173173
- name: Merge and push multi-arch image
174174
env:

0 commit comments

Comments
 (0)