From 3ba0256ce63aab0af6e37eefbcd2a0c6c8b32be1 Mon Sep 17 00:00:00 2001 From: Icey <1790571317@qq.com> Date: Mon, 29 Sep 2025 08:41:05 +0000 Subject: [PATCH 1/8] Test eagle OOM Signed-off-by: Icey <1790571317@qq.com> --- .github/workflows/_e2e_test.yaml | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/.github/workflows/_e2e_test.yaml b/.github/workflows/_e2e_test.yaml index 1254f3a2ff..5872757060 100644 --- a/.github/workflows/_e2e_test.yaml +++ b/.github/workflows/_e2e_test.yaml @@ -83,6 +83,9 @@ jobs: VLLM_WORKER_MULTIPROC_METHOD: spawn VLLM_USE_MODELSCOPE: True PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256 + PYTORCH_NPU_ALLOC_CONF: expandable_segments:True + NPU_MEMORY_FRACTION: 0.96 + OMP_NUM_THREADS: 1 if: ${{ inputs.type == 'full' }} run: | # We found that if running aclgraph tests in batch, it will cause AclmdlRICaptureBegin error. So we run @@ -103,8 +106,7 @@ jobs: # ------------------------------------ v1 spec decode test ------------------------------------ # pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_correctness.py pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_torchair_correctness.py - # Fix me: OOM error - #pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py + pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py pytest -sv tests/e2e/singlecard/ops/ From 5467e96bb9afc9fb008923cbfc332079147ea3e2 Mon Sep 17 00:00:00 2001 From: Icey <1790571317@qq.com> Date: Mon, 29 Sep 2025 09:40:39 +0000 Subject: [PATCH 2/8] fix Signed-off-by: Icey <1790571317@qq.com> --- .github/workflows/vllm_ascend_test_full.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/vllm_ascend_test_full.yaml b/.github/workflows/vllm_ascend_test_full.yaml index 1c9f4d123d..f1ca245c90 100644 --- a/.github/workflows/vllm_ascend_test_full.yaml +++ b/.github/workflows/vllm_ascend_test_full.yaml @@ -51,6 +51,7 @@ jobs: filters: | e2e_tracker: - '.github/workflows/vllm_ascend_test.yaml' + - '.github/workflows/_e2e_test.yaml' - 'vllm_ascend/**' - 'csrc/**' - 'cmake/**' From 293bc9fdbbf5eacae1fbb7e607cd5ede4d046a2a Mon Sep 17 00:00:00 2001 From: Icey <1790571317@qq.com> Date: Mon, 29 Sep 2025 09:42:15 +0000 Subject: [PATCH 3/8] fix Signed-off-by: Icey <1790571317@qq.com> --- .github/workflows/vllm_ascend_test.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/vllm_ascend_test.yaml b/.github/workflows/vllm_ascend_test.yaml index 50527d1945..e676c13b68 100644 --- a/.github/workflows/vllm_ascend_test.yaml +++ b/.github/workflows/vllm_ascend_test.yaml @@ -56,6 +56,7 @@ jobs: with: filters: | e2e_tracker: + - '.github/workflows/vllm_ascend_test.yaml' - '.github/workflows/vllm_ascend_test.yaml' - 'vllm_ascend/**' - 'csrc/**' From 7baeb6d9cfb2a39a65fc1ddb3daa440afb29f3f5 Mon Sep 17 00:00:00 2001 From: Icey <1790571317@qq.com> Date: Mon, 29 Sep 2025 09:43:15 +0000 Subject: [PATCH 4/8] fix Signed-off-by: Icey <1790571317@qq.com> --- .github/workflows/vllm_ascend_test.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/vllm_ascend_test.yaml b/.github/workflows/vllm_ascend_test.yaml index e676c13b68..500cace8c0 100644 --- a/.github/workflows/vllm_ascend_test.yaml +++ b/.github/workflows/vllm_ascend_test.yaml @@ -56,8 +56,8 @@ jobs: with: filters: | e2e_tracker: - - '.github/workflows/vllm_ascend_test.yaml' - '.github/workflows/vllm_ascend_test.yaml' + - '.github/workflows/_e2e_test.yaml' - 'vllm_ascend/**' - 'csrc/**' - 'cmake/**' From eaf2f5e76e6f15eefa2dd40ea788f86102d88e6a Mon Sep 17 00:00:00 2001 From: Icey <1790571317@qq.com> Date: Mon, 29 Sep 2025 09:46:22 +0000 Subject: [PATCH 5/8] fix Signed-off-by: Icey <1790571317@qq.com> --- .github/workflows/vllm_ascend_test.yaml | 1 + .github/workflows/vllm_ascend_test_full.yaml | 1 + 2 files changed, 2 insertions(+) diff --git a/.github/workflows/vllm_ascend_test.yaml b/.github/workflows/vllm_ascend_test.yaml index 500cace8c0..48c31d924e 100644 --- a/.github/workflows/vllm_ascend_test.yaml +++ b/.github/workflows/vllm_ascend_test.yaml @@ -157,3 +157,4 @@ jobs: runner: linux-aarch64-a2 image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11 type: light + diff --git a/.github/workflows/vllm_ascend_test_full.yaml b/.github/workflows/vllm_ascend_test_full.yaml index f1ca245c90..c1117e70aa 100644 --- a/.github/workflows/vllm_ascend_test_full.yaml +++ b/.github/workflows/vllm_ascend_test_full.yaml @@ -78,3 +78,4 @@ jobs: runner: linux-aarch64-a2 image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11 type: full + From 0040e2a6518847c41a2667f2eee5afb9f38421df Mon Sep 17 00:00:00 2001 From: Icey <1790571317@qq.com> Date: Mon, 29 Sep 2025 09:54:39 +0000 Subject: [PATCH 6/8] fix Signed-off-by: Icey <1790571317@qq.com> --- .github/workflows/_e2e_test.yaml | 3 +-- .github/workflows/vllm_ascend_test.yaml | 4 +-- .github/workflows/vllm_ascend_test_full.yaml | 28 -------------------- 3 files changed, 2 insertions(+), 33 deletions(-) diff --git a/.github/workflows/_e2e_test.yaml b/.github/workflows/_e2e_test.yaml index 5872757060..b4a4c52d86 100644 --- a/.github/workflows/_e2e_test.yaml +++ b/.github/workflows/_e2e_test.yaml @@ -82,8 +82,7 @@ jobs: env: VLLM_WORKER_MULTIPROC_METHOD: spawn VLLM_USE_MODELSCOPE: True - PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256 - PYTORCH_NPU_ALLOC_CONF: expandable_segments:True + PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256,expandable_segments:True NPU_MEMORY_FRACTION: 0.96 OMP_NUM_THREADS: 1 if: ${{ inputs.type == 'full' }} diff --git a/.github/workflows/vllm_ascend_test.yaml b/.github/workflows/vllm_ascend_test.yaml index 48c31d924e..3077c2c477 100644 --- a/.github/workflows/vllm_ascend_test.yaml +++ b/.github/workflows/vllm_ascend_test.yaml @@ -57,7 +57,6 @@ jobs: filters: | e2e_tracker: - '.github/workflows/vllm_ascend_test.yaml' - - '.github/workflows/_e2e_test.yaml' - 'vllm_ascend/**' - 'csrc/**' - 'cmake/**' @@ -156,5 +155,4 @@ jobs: vllm: ${{ matrix.vllm_version }} runner: linux-aarch64-a2 image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11 - type: light - + type: light \ No newline at end of file diff --git a/.github/workflows/vllm_ascend_test_full.yaml b/.github/workflows/vllm_ascend_test_full.yaml index c1117e70aa..b17fdf16a1 100644 --- a/.github/workflows/vllm_ascend_test_full.yaml +++ b/.github/workflows/vllm_ascend_test_full.yaml @@ -37,34 +37,6 @@ concurrency: cancel-in-progress: true jobs: - changes: - runs-on: ubuntu-latest - if: ${{ contains(github.event.pull_request.labels.*.name, 'ready') && contains(github.event.pull_request.labels.*.name, 'ready-for-test') }} - outputs: - e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }} - ut_tracker: ${{ steps.filter.outputs.ut_tracker }} - steps: - - uses: actions/checkout@v4 - - uses: dorny/paths-filter@v3 - id: filter - with: - filters: | - e2e_tracker: - - '.github/workflows/vllm_ascend_test.yaml' - - '.github/workflows/_e2e_test.yaml' - - 'vllm_ascend/**' - - 'csrc/**' - - 'cmake/**' - - 'tests/e2e/**' - - 'CMakeLists.txt' - - 'setup.py' - - 'requirements.txt' - - 'requirements-dev.txt' - - 'requirements-lint.txt' - - 'packages.txt' - ut_tracker: - - 'tests/ut/**' - e2e-test: name: e2e-full strategy: From 9e1e43db7142fd3054047143c7f9d5e45754f955 Mon Sep 17 00:00:00 2001 From: Icey <1790571317@qq.com> Date: Thu, 9 Oct 2025 01:20:17 +0000 Subject: [PATCH 7/8] fix Signed-off-by: Icey <1790571317@qq.com> --- .github/workflows/_e2e_test.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/_e2e_test.yaml b/.github/workflows/_e2e_test.yaml index b4a4c52d86..62ac6f20ac 100644 --- a/.github/workflows/_e2e_test.yaml +++ b/.github/workflows/_e2e_test.yaml @@ -82,7 +82,7 @@ jobs: env: VLLM_WORKER_MULTIPROC_METHOD: spawn VLLM_USE_MODELSCOPE: True - PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256,expandable_segments:True + PYTORCH_NPU_ALLOC_CONF: expandable_segments:True NPU_MEMORY_FRACTION: 0.96 OMP_NUM_THREADS: 1 if: ${{ inputs.type == 'full' }} From 93df3f423a3998e7c4a44c24f95727bbbb405834 Mon Sep 17 00:00:00 2001 From: Icey <1790571317@qq.com> Date: Thu, 9 Oct 2025 02:05:36 +0000 Subject: [PATCH 8/8] fix Signed-off-by: Icey <1790571317@qq.com> --- .github/workflows/vllm_ascend_test_full.yaml | 2 -- 1 file changed, 2 deletions(-) diff --git a/.github/workflows/vllm_ascend_test_full.yaml b/.github/workflows/vllm_ascend_test_full.yaml index b17fdf16a1..c6a3260ed3 100644 --- a/.github/workflows/vllm_ascend_test_full.yaml +++ b/.github/workflows/vllm_ascend_test_full.yaml @@ -42,8 +42,6 @@ jobs: strategy: matrix: vllm_version: [releases/v0.11.0, v0.11.0rc3] - needs: [changes] - if: ${{ needs.changes.outputs.e2e_tracker == 'true' }} uses: ./.github/workflows/_e2e_test.yaml with: vllm: ${{ matrix.vllm_version }}