Skip to content

Commit 9131dcf

Browse files
author
Varun Sundar Rabindranath
committed
fix lint
Signed-off-by: Varun Sundar Rabindranath <[email protected]>
1 parent 1bed891 commit 9131dcf

File tree

3 files changed: +17 -3 lines changed

3 files changed: +17 -3 lines changed

.buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh renamed to .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -36,6 +36,11 @@ for BACK in "${BACKENDS[@]}"; do
3636
VLLM_ALL2ALL_BACKEND=$BACK \
3737
vllm serve "$MODEL" \
3838
--enforce-eager \
39+
--enable-eplb \
40+
--eplb-config '{"window_size":10, \
41+
"step_interval":100, \
42+
"num_redundant_experts":0, \
43+
"log_balancedness":true}' \
3944
--tensor-parallel-size 2 \
4045
--data-parallel-size 2 \
4146
--enable-expert-parallel \

.buildkite/test-amd.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1482,4 +1482,4 @@ steps:
14821482
num_gpus: 4
14831483
working_dir: "/vllm-workspace"
14841484
commands:
1485-
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh 0.8 200 8020
1485+
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020

.buildkite/test-pipeline.yaml

Lines changed: 11 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1339,11 +1339,20 @@ steps:
13391339
commands:
13401340
- bash .buildkite/scripts/scheduled_integration_test/deepseek_v2_lite_ep_eplb.sh 0.25 200 8010
13411341

1342-
- label: Qwen3-30B-A3B-FP8-block Accuracy
1342+
- label: Qwen3-30B-A3B-FP8-block Accuracy (H100)
13431343
timeout_in_minutes: 60
13441344
gpu: h100
13451345
optional: true
13461346
num_gpus: 4
13471347
working_dir: "/vllm-workspace"
13481348
commands:
1349-
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh 0.8 200 8020
1349+
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020
1350+
1351+
- label: Qwen3-30B-A3B-FP8-block Accuracy (B200)
1352+
timeout_in_minutes: 60
1353+
gpu: b200
1354+
optional: true
1355+
num_gpus: 4
1356+
working_dir: "/vllm-workspace"
1357+
commands:
1358+
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020

0 commit comments

Comments
 (0)