Skip to content

Commit 2f782bb

Browse files
author
Varun Sundar Rabindranath
committed
fix lint
Signed-off-by: Varun Sundar Rabindranath <[email protected]>
1 parent e4c3182 commit 2f782bb

File tree

3 files changed: +17 -3 lines changed

.buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh renamed to .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -36,6 +36,11 @@ for BACK in "${BACKENDS[@]}"; do
36 36
VLLM_ALL2ALL_BACKEND=$BACK \
37 37
vllm serve "$MODEL" \
38 38
--enforce-eager \
39+
--enable-eplb \
40+
--eplb-config '{"window_size":10, \
41+
"step_interval":100, \
42+
"num_redundant_experts":0, \
43+
"log_balancedness":true}' \
39 44
--tensor-parallel-size 2 \
40 45
--data-parallel-size 2 \
41 46
--enable-expert-parallel \

.buildkite/test-amd.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1482,4 +1482,4 @@ steps:
1482 1482
num_gpus: 4
1483 1483
working_dir: "/vllm-workspace"
1484 1484
commands:
1485-
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh 0.8 200 8020
1485+
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020

.buildkite/test-pipeline.yaml

Lines changed: 11 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1327,11 +1327,20 @@ steps:
1327 1327
commands:
1328 1328
- bash .buildkite/scripts/scheduled_integration_test/deepseek_v2_lite_ep_eplb.sh 0.25 200 8010
1329 1329

1330-
- label: Qwen3-30B-A3B-FP8-block Accuracy
1330+
- label: Qwen3-30B-A3B-FP8-block Accuracy (H100)
1331 1331
timeout_in_minutes: 60
1332 1332
gpu: h100
1333 1333
optional: true
1334 1334
num_gpus: 4
1335 1335
working_dir: "/vllm-workspace"
1336 1336
commands:
1337-
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh 0.8 200 8020
1337+
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020
1338+
1339+
- label: Qwen3-30B-A3B-FP8-block Accuracy (B200)
1340+
timeout_in_minutes: 60
1341+
gpu: b200
1342+
optional: true
1343+
num_gpus: 4
1344+
working_dir: "/vllm-workspace"
1345+
commands:
1346+
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020

0 commit comments

Comments
 (0)