Skip to content

Commit 749393e

Browse files
authored
doc: Fix benchmark cmd in disagg scripts (NVIDIA#5515)
Signed-off-by: Kaiyu Xie <[email protected]>
1 parent ff2dd72 commit 749393e

File tree

1 file changed

+13
-7
lines changed

1 file changed

+13
-7
lines changed

docs/source/scripts/disaggregated/run_benchmark.sh

Lines changed: 13 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -70,13 +70,19 @@ for concurrency in ${concurrency_list}; do
70 | 70 |       mkdir -p ${log_path}/concurrency_${concurrency}
71 | 71 |       max_count=$((${concurrency} * ${multi_round}))
72 | 72 |       echo "Running benchmark with concurrency: ${concurrency}, max_count: ${max_count}"
73 |    | -     # run your benchmark here
74 |    | -     python run_benchmark.py --model_name ${model_name} \
75 |    | -         --isl ${isl} \
76 |    | -         --osl ${osl} \
77 |    | -         --concurrency ${concurrency} \
78 |    | -         --max_count ${max_count} \
79 |    | -         --log_path ${log_path}/concurrency_${concurrency}
   | 73 | +     python -m tensorrt_llm.serve.scripts.benchmark_serving \
   | 74 | +         --model ${model_name} \
   | 75 | +         --tokenizer ${model_name} \
   | 76 | +         --dataset-name random \
   | 77 | +         --random-ids \
   | 78 | +         --random-input-len ${isl} \
   | 79 | +         --random-output-len ${osl} \
   | 80 | +         --random-prefix-len 0 \
   | 81 | +         --num-prompts ${max_count} \
   | 82 | +         --max-concurrency ${concurrency} \
   | 83 | +         --host ${hostname} \
   | 84 | +         --port ${port} \
   | 85 | +         --ignore-eos
80 | 86 |       echo "done for ${concurrency} in folder ${log_path}/concurrency_${concurrency}"
81 | 87 |   done
82 | 88 |
0 commit comments

Comments
 (0)