Skip to content

Commit 95ee1df

Browse files
Add online (fixed request-rate) benchmark runs for disaggregated prefill/decode serving
1 parent: e1e26ad · commit: 95ee1df

File tree

5 files changed: 22 additions (+22) and 7 deletions (-7).

cases/hourly_disagg.csv

Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,2 +1,6 @@
1-
Device,Model,MaxNumSeqs,MaxNumBatchedTokens,TensorParallelSize,MaxModelLen,Dataset,InputLen,OutputLen,ExpectedETEL,NumPrompts
2-
v6e-8,meta-llama/Llama-3.1-8B-Instruct,128,1024,2,2048,sonnet,1800,128,,1000
1+
Device,Model,MaxNumSeqs,MaxNumBatchedTokens,TensorParallelSize,MaxModelLen,Dataset,InputLen,OutputLen,ExpectedETEL,NumPrompts,MODELTAG,PREFIX_LEN,RequestRate
2+
v6e-8,meta-llama/Llama-3.1-8B-Instruct,512,8192,4,2048,mlperf,1024,1024,,10000,,,inf
3+
v6e-8,meta-llama/Llama-3.1-8B-Instruct,512,8192,4,2048,mlperf,1024,1024,,10000,,,50
4+
v6e-8,meta-llama/Llama-3.1-8B-Instruct,512,8192,4,2048,mlperf,1024,1024,,10000,,,60
5+
v6e-8,Qwen/Qwen3-32B,128,8192,4,2048,mlperf,1024,1024,,5000,,,inf
6+
v6e-8,Qwen/Qwen3-32B,128,8192,4,2048,mlperf,1024,1024,,5000,,,20

database/vllm_bm_20251117.ddl

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,2 @@
1+
ALTER TABLE RunRecord ADD COLUMN RequestRate FLOAT64 DEFAULT(0);
2+
CREATE INDEX IDX_RunRecord_RequestRate ON RunRecord (RequestRate);

scripts/agent/run_bm.sh

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -215,6 +215,13 @@ run_benchmark(){
215215
echo "$throughput $p99_e2el"
216216
}
217217

218+
# If REQUEST_RATE is provided, run the benchmark once with it and exit.
219+
if [[ -n "${REQUEST_RATE:-}" ]]; then
220+
echo "REQUEST_RATE is set to '$REQUEST_RATE'. Running benchmark once."
221+
run_benchmark "$REQUEST_RATE"
222+
exit 0
223+
fi
224+
218225
read throughput p99_e2el < <(run_benchmark "inf" | tail -n 1)
219226

220227
echo "throughput:$throughput"

scripts/scheduler/hourly_run.sh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -131,6 +131,6 @@ fi
131131
# ./scripts/scheduler/create_job.sh ./cases/autotune_ali.csv "" $TAG AUTOTUNE
132132
# fi
133133

134-
echo LOCAL_PATCH=1 ./scripts/scheduler/create_job.sh ./cases/hourly_disagg.csv "" $TAG HOURLY_DISAGG TPU_INFERENCE "PREFILL_SLICES=2;DECODE_SLICES=2;TPU_BACKEND_TYPE=jax"
135-
LOCAL_PATCH=1 ./scripts/scheduler/create_job.sh ./cases/hourly_disagg.csv "" $TAG HOURLY_DISAGG TPU_INFERENCE "PREFILL_SLICES=2;DECODE_SLICES=2;TPU_BACKEND_TYPE=jax"
134+
echo LOCAL_PATCH=1 ./scripts/scheduler/create_job.sh ./cases/hourly_disagg.csv "" $TAG HOURLY_DISAGG TPU_INFERENCE "PREFILL_SLICES=4;DECODE_SLICES=4;TPU_BACKEND_TYPE=jax"
135+
LOCAL_PATCH=1 ./scripts/scheduler/create_job.sh ./cases/hourly_disagg.csv "" $TAG HOURLY_DISAGG TPU_INFERENCE "PREFILL_SLICES=4;DECODE_SLICES=4;TPU_BACKEND_TYPE=jax"
136136

scripts/scheduler/schedule_run.sh

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -58,7 +58,8 @@ tail -n +2 "$CSV_FILE" | while read -r line || [ -n "${line}" ]; do
5858
EXPECTED_ETEL \
5959
NUM_PROMPTS \
6060
MODELTAG \
61-
PREFIX_LEN <<< "$line"
61+
PREFIX_LEN \
62+
REQUEST_RATE <<< "$line"
6263

6364
RECORD_ID=$(uuidgen | tr 'A-Z' 'a-z')
6465

@@ -79,7 +80,7 @@ tail -n +2 "$CSV_FILE" | while read -r line || [ -n "${line}" ]; do
7980
--sql="INSERT INTO RunRecord (
8081
RecordId, Status, CreatedTime, Device, Model, RunType, CodeHash,
8182
MaxNumSeqs, MaxNumBatchedTokens, TensorParallelSize, MaxModelLen,
82-
Dataset, InputLen, OutputLen, LastUpdate, CreatedBy,JobReference, ExpectedETEL, NumPrompts, ModelTag, PrefixLen, ExtraEnvs
83+
Dataset, InputLen, OutputLen, LastUpdate, CreatedBy,JobReference, ExpectedETEL, NumPrompts, ModelTag, PrefixLen, ExtraEnvs, RequestRate
8384
) VALUES (
8485
'$RECORD_ID', 'CREATED', PENDING_COMMIT_TIMESTAMP(), '$DEVICE', '$MODEL', '$RUN_TYPE', '$CODEHASH',
8586
$MAX_NUM_SEQS,
@@ -96,7 +97,8 @@ tail -n +2 "$CSV_FILE" | while read -r line || [ -n "${line}" ]; do
9697
${NUM_PROMPTS:-1000},
9798
'${MODELTAG:-PROD}',
9899
${PREFIX_LEN:-0},
99-
'$EXTRA_ENVS'
100+
'$EXTRA_ENVS',
101+
'${REQUEST_RATE:-inf}'
100102
);"
101103

102104
# If insert failed, just continue without publishing

0 commit comments

Comments
 (0)