Skip to content

Commit c872572

Browse files
committed
feat: add bench run script
1 parent 0f2ef2f commit c872572

File tree

1 file changed

+34
-0
lines changed

1 file changed

+34
-0
lines changed

bench/run_bench.sh

Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
#!/bin/bash
#
# bench/run_bench.sh
#
# Runs the reasoning benchmark against a router endpoint and a vLLM endpoint,
# then generates plots from the resulting summary files.
#
# The Python scripts are referenced by relative path (src/training/...), so
# run this from the directory that contains src/.
#
# Every setting exported below is only a default: a non-empty value already
# present in the environment is kept, so a run can be re-pointed without
# editing this file, e.g.
#   VLLM_MODELS="my-org/my-model" bash bench/run_bench.sh

# Strict mode:
#   -e           abort at the first failing command, so a later step never
#                runs after an earlier one has failed
#   -u           referencing an unset variable is an error
#   -o pipefail  a pipeline fails if any of its stages fails
set -euo pipefail

# Trace every command as it is executed.
# NOTE: the trace contains the expanded API keys. The defaults are dummy
# values; be careful where stderr ends up when real keys are supplied.
set -x

# Credentials.
export ROUTER_API_KEY="${ROUTER_API_KEY:-1234567890}"
export VLLM_API_KEY="${VLLM_API_KEY:-1234567890}"

# Base URLs of the two services under test.
export ROUTER_ENDPOINT="${ROUTER_ENDPOINT:-http://localhost:8801/v1}"
export VLLM_ENDPOINT="${VLLM_ENDPOINT:-http://localhost:8000/v1}"

# Model names requested from each service.
export ROUTER_MODELS="${ROUTER_MODELS:-auto}"
export VLLM_MODELS="${VLLM_MODELS:-openai/gpt-oss-20b}"
11+
# Run the benchmark
#
# A single invocation passes both --run-router and --run-vllm, each with its
# own endpoint, API key and model setting taken from the variables defined at
# the top of this script. Output goes to results/reasonbench, the same
# directory the plotting step reads its summary.json files from.
#
# NOTE(review): ROUTER_MODELS and VLLM_MODELS are each passed as ONE quoted
# argument, while the plotting step treats them as space-separated lists and
# keeps only the first entry. Confirm which form router_reason_bench.py
# expects before putting more than one model in either variable.
bench_cmd=(
  python src/training/model_eval/router_reason_bench.py

  # Router side
  --run-router
  --router-endpoint "$ROUTER_ENDPOINT"
  --router-api-key "$ROUTER_API_KEY"
  --router-models "$ROUTER_MODELS"

  # vLLM side
  --run-vllm
  --vllm-endpoint "$VLLM_ENDPOINT"
  --vllm-api-key "$VLLM_API_KEY"
  --vllm-models "$VLLM_MODELS"

  # Run parameters
  --samples-per-category 20
  --vllm-exec-modes NR XC
  --concurrent-requests 4
  --output-dir results/reasonbench
)
"${bench_cmd[@]}"
26+
# Generate plots
#
# Each summary path contains a directory named after a model. That name is
# derived in two steps:
#   1. keep only the text before the first space, i.e. the first entry of a
#      space-separated model list;
#   2. replace every "/" with "_" so the name is a single path component.
# NOTE(review): this presumes the benchmark writes
# results/reasonbench/<backend>::<model-with-underscores>/summary.json;
# verify against router_reason_bench.py.

# vLLM
VLLM_MODEL_FIRST="${VLLM_MODELS%% *}"
VLLM_MODELS_SAFE="${VLLM_MODEL_FIRST//\//_}"

# Router
ROUTER_MODEL_FIRST="${ROUTER_MODELS%% *}"
ROUTER_MODELS_SAFE="${ROUTER_MODEL_FIRST//\//_}"

plot_cmd=(
  python src/training/model_eval/bench_plot.py
  --summary "results/reasonbench/vllm::${VLLM_MODELS_SAFE}/summary.json"
  --router-summary "results/reasonbench/router::${ROUTER_MODELS_SAFE}/summary.json"
)
"${plot_cmd[@]}"

0 commit comments

Comments
 (0)