Skip to content

Commit 9a3101b

Browse files
authored
[ROCm][CI] Fix DeepSeek V2-Lite Accuracy CI (#29135)
Signed-off-by: charlifu <[email protected]>
1 parent d5dbdbf commit 9a3101b

File tree

2 files changed

+21
-2
lines changed

2 files changed

+21
-2
lines changed

.buildkite/scripts/scheduled_integration_test/deepseek_v2_lite_ep_eplb.sh

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,17 @@ wait_for_server() {
1717
}
1818

1919
MODEL="deepseek-ai/DeepSeek-V2-lite"
20-
BACKENDS=("deepep_high_throughput" "deepep_low_latency")
20+
21+
# Set BACKENDS based on platform
22+
if command -v rocm-smi &> /dev/null || [[ -d /opt/rocm ]] || [[ -n "${ROCM_PATH:-}" ]]; then
23+
# ROCm platform
24+
BACKENDS=("allgather_reducescatter")
25+
# Disable MoE padding on ROCm because it causes EPLB to fail
26+
export VLLM_ROCM_MOE_PADDING=0
27+
else
28+
# Non-ROCm platform (CUDA/other)
29+
BACKENDS=("deepep_high_throughput" "deepep_low_latency")
30+
fi
2131

2232
cleanup() {
2333
if [[ -n "${SERVER_PID:-}" ]] && kill -0 "${SERVER_PID}" 2>/dev/null; then

.buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep.sh

Lines changed: 10 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,16 @@ wait_for_server() {
1717
}
1818

1919
MODEL="QWen/Qwen3-30B-A3B-FP8"
20-
BACKENDS=("deepep_high_throughput" "deepep_low_latency")
20+
# Set BACKENDS based on platform
21+
if command -v rocm-smi &> /dev/null || [[ -d /opt/rocm ]] || [[ -n "${ROCM_PATH:-}" ]]; then
22+
# ROCm platform
23+
BACKENDS=("allgather_reducescatter")
24+
# Disable MoE padding on ROCm because it causes EPLB to fail
25+
export VLLM_ROCM_MOE_PADDING=0
26+
else
27+
# Non-ROCm platform (CUDA/other)
28+
BACKENDS=("deepep_high_throughput" "deepep_low_latency")
29+
fi
2130

2231
cleanup() {
2332
if [[ -n "${SERVER_PID:-}" ]] && kill -0 "${SERVER_PID}" 2>/dev/null; then

0 commit comments

Comments
 (0)