File tree Expand file tree Collapse file tree 3 files changed +17
-3
lines changed
scripts/scheduled_integration_test Expand file tree Collapse file tree 3 files changed +17
-3
lines changed Original file line number Diff line number Diff line change @@ -36,6 +36,11 @@ for BACK in "${BACKENDS[@]}"; do
3636 VLLM_ALL2ALL_BACKEND=$BACK \
3737 vllm serve " $MODEL " \
3838 --enforce-eager \
39+ --enable-eplb \
40+ --eplb-config ' {"window_size":10, \
41+ "step_interval":100, \
42+ "num_redundant_experts":0, \
43+ "log_balancedness":true}' \
3944 --tensor-parallel-size 2 \
4045 --data-parallel-size 2 \
4146 --enable-expert-parallel \
Original file line number Diff line number Diff line change @@ -1482,4 +1482,4 @@ steps:
14821482 num_gpus : 4
14831483 working_dir : " /vllm-workspace"
14841484 commands :
1485- - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep .sh 0.8 200 8020
1485+ - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb .sh 0.8 200 8020
Original file line number Diff line number Diff line change @@ -1339,11 +1339,20 @@ steps:
13391339 commands :
13401340 - bash .buildkite/scripts/scheduled_integration_test/deepseek_v2_lite_ep_eplb.sh 0.25 200 8010
13411341
1342- - label : Qwen3-30B-A3B-FP8-block Accuracy
1342+ - label : Qwen3-30B-A3B-FP8-block Accuracy (H100)
13431343 timeout_in_minutes : 60
13441344 gpu : h100
13451345 optional : true
13461346 num_gpus : 4
13471347 working_dir : " /vllm-workspace"
13481348 commands :
1349- - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh 0.8 200 8020
1349+ - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020
1350+
1351+ - label : Qwen3-30B-A3B-FP8-block Accuracy (B200)
1352+ timeout_in_minutes : 60
1353+ gpu : b200
1354+ optional : true
1355+ num_gpus : 4
1356+ working_dir : " /vllm-workspace"
1357+ commands :
1358+ - bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020
You can’t perform that action at this time.
0 commit comments