File tree Expand file tree Collapse file tree 3 files changed +17
-3
lines changed
scripts/scheduled_integration_test Expand file tree Collapse file tree 3 files changed +17
-3
lines changed Original file line number Diff line number Diff line change @@ -36,6 +36,11 @@ for BACK in "${BACKENDS[@]}"; do
3636 VLLM_ALL2ALL_BACKEND=$BACK \
3737 vllm serve " $MODEL " \
3838 --enforce-eager \
39+ --enable-eplb \
40+ --eplb-config ' {"window_size":10, \
41+ "step_interval":100, \
42+ "num_redundant_experts":0, \
43+ "log_balancedness":true}' \
3944 --tensor-parallel-size 2 \
4045 --data-parallel-size 2 \
4146 --enable-expert-parallel \
Original file line number Diff line number Diff line change @@ -1482,4 +1482,4 @@ steps:
14821482 num_gpus : 4
14831483 working_dir : " /vllm-workspace"
14841484 commands :
1485- - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep .sh 0.8 200 8020
1485+ - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb .sh 0.8 200 8020
Original file line number Diff line number Diff line change @@ -1327,11 +1327,20 @@ steps:
13271327 commands :
13281328 - bash .buildkite/scripts/scheduled_integration_test/deepseek_v2_lite_ep_eplb.sh 0.25 200 8010
13291329
1330- - label : Qwen3-30B-A3B-FP8-block Accuracy
1330+ - label : Qwen3-30B-A3B-FP8-block Accuracy (H100)
13311331 timeout_in_minutes : 60
13321332 gpu : h100
13331333 optional : true
13341334 num_gpus : 4
13351335 working_dir : " /vllm-workspace"
13361336 commands :
1337- - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh 0.8 200 8020
1337+ - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020
1338+
1339+ - label : Qwen3-30B-A3B-FP8-block Accuracy (B200)
1340+ timeout_in_minutes : 60
1341+ gpu : b200
1342+ optional : true
1343+ num_gpus : 4
1344+ working_dir : " /vllm-workspace"
1345+ commands :
1346+ - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020
You can’t perform that action at this time.
0 commit comments