Skip to content

Commit 8a1d253

Browse files
Author: Varun Sundar Rabindranath
Commit message: add dp/tp inputs
Signed-off-by: Varun Sundar Rabindranath <[email protected]>
1 parent da3ba7c commit 8a1d253

File tree

2 files changed: 7 additions and 5 deletions.

.buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,10 +1,12 @@
11
#!/usr/bin/env bash
22
set -euxo pipefail
33

4-
# args: [THRESHOLD] [NUM_QUESTIONS] [START_PORT]
4+
# args: [THRESHOLD] [NUM_QUESTIONS] [START_PORT] [DATA_PARALLEL_SIZE] [TENSOR_PARALLEL_SIZE]
55
THRESHOLD=${1:-0.8}
66
NUM_Q=${2:-1319}
77
PORT=${3:-8020}
8+
DATA_PARALLEL_SIZE=${4:-2}
9+
TENSOR_PARALLEL_SIZE=${5:-2}
810
OUT_DIR=${OUT_DIR:-/tmp/vllm-scheduled}
911
mkdir -p "${OUT_DIR}"
1012

@@ -38,8 +40,8 @@ for BACK in "${BACKENDS[@]}"; do
3840
--enforce-eager \
3941
--enable-eplb \
4042
--eplb-config '{"window_size":10, "step_interval":100, "num_redundant_experts":0, "log_balancedness":true}' \
41-
--tensor-parallel-size 2 \
42-
--data-parallel-size 2 \
43+
--tensor-parallel-size ${TENSOR_PARALLEL_SIZE} \
44+
--data-parallel-size ${DATA_PARALLEL_SIZE} \
4345
--enable-expert-parallel \
4446
--trust-remote-code \
4547
--max-model-len 2048 \

.buildkite/test-pipeline.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1352,7 +1352,7 @@ steps:
13521352
timeout_in_minutes: 60
13531353
gpu: b200
13541354
optional: true
1355-
num_gpus: 4
1355+
num_gpus: 2
13561356
working_dir: "/vllm-workspace"
13571357
commands:
1358-
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020
1358+
- bash .buildkite/scripts/scheduled_integration_test/qwen30b_a3b_fp8_block_ep_eplb.sh 0.8 200 8020 2 1

0 commit comments

Comments
 (0)