Skip to content

Commit ef4cf04

Browse files
committed
finally fixed the run scripts
1 parent 7a5977c commit ef4cf04

File tree

6 files changed

+29
-12
lines changed

6 files changed

+29
-12
lines changed

3-workloads/agentic/run_agentic.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -86,7 +86,7 @@ for interval in "${NEW_USER_INTERVALS[@]}"; do
8686
# Change to project root before running summarize.py
8787
cd "$PROJECT_ROOT"
8888
python3 "4-latest-results/post-processing/summarize.py" \
89-
"${output_file#../../}" \
89+
"4-latest-results/${output_file#../../}" \
9090
KEY="$KEY" \
9191
WORKLOAD="agentic" \
9292
NUM_USERS_WARMUP="$NUM_USERS_WARMUP" \

3-workloads/mooncake/run_mooncake.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -56,7 +56,7 @@ for qps in "${QPS_VALUES[@]}"; do
5656
# Change to project root before running summarize.py
5757
cd "$PROJECT_ROOT"
5858
python3 "4-latest-results/post-processing/summarize.py" \
59-
"${output_file#../../}" \
59+
"4-latest-results/${output_file#../../}" \
6060
KEY="$KEY" \
6161
WORKLOAD="mooncake" \
6262
NUM_ROUNDS="$NUM_ROUNDS" \

3-workloads/sharegpt/workload_execution/run-sharegpt.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -67,7 +67,7 @@ for qps in "${QPS_VALUES[@]}"; do
6767
# Change to project root before running summarize.py
6868
cd "$PROJECT_ROOT"
6969
python3 "4-latest-results/post-processing/summarize.py" \
70-
"${output_file#../../../}" \
70+
"4-latest-results/${output_file#../../../}" \
7171
KEY="$KEY" \
7272
WORKLOAD="sharegpt" \
7373
LIMIT="$LIMIT" \

3-workloads/synthetic/run_synthetic.sh

Lines changed: 16 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -84,8 +84,9 @@ for qps in "${QPS_VALUES[@]}"; do
8484

8585
# Change to project root before running summarize.py
8686
cd "$PROJECT_ROOT"
87+
8788
python3 "4-latest-results/post-processing/summarize.py" \
88-
"${KEY}_synthetic_output_${qps}.csv" \
89+
"4-latest-results/${KEY}_synthetic_output_${qps}.csv" \
8990
KEY="$KEY" \
9091
WORKLOAD="synthetic" \
9192
NUM_USERS_WARMUP="$NUM_USERS_WARMUP" \
@@ -100,3 +101,17 @@ for qps in "${QPS_VALUES[@]}"; do
100101
# Change back to script directory
101102
cd "$SCRIPT_DIR"
102103
done
104+
105+
# Debugging:
106+
# python3 "4-latest-results/post-processing/summarize.py" \
107+
# "4-latest-results/stack_synthetic_output_0.7.csv" \
108+
# KEY="stack" \
109+
# WORKLOAD="synthetic" \
110+
# NUM_USERS_WARMUP="750" \
111+
# NUM_USERS="350" \
112+
# NUM_ROUNDS="20" \
113+
# SYSTEM_PROMPT="0" \
114+
# CHAT_HISTORY="20000" \
115+
# ANSWER_LEN="1000" \
116+
# QPS="0.7" \
117+
# USE_SHAREGPT="false"

4-latest-results/post-processing/summarize.py

Lines changed: 8 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -22,12 +22,6 @@ def ProcessSummary(
2222
else:
2323
launched_queries = len(df)
2424

25-
print(
26-
f"Launched queries: {launched_queries}, "
27-
f"pending queries: {pending_queries}, "
28-
f"finished queries: {len(df)}"
29-
)
30-
3125
if qps is None:
3226
qps = 0.0
3327

@@ -55,6 +49,12 @@ def ProcessSummary(
5549
average_ratio = df['ratio'].mean()
5650

5751
print("\n==================== Performance summary ======================")
52+
print(
53+
f" Launched queries: {launched_queries}, "
54+
f"pending queries: {pending_queries}, "
55+
f"finished queries: {len(df)}"
56+
)
57+
5858
print(f" Processing speed: {finished_qps:.4f} reqs/s")
5959
print(f" Input tokens per second: {average_prefill_speed:.4f} tokens/s")
6060
print(f" Output tokens per second: {average_generation_speed:.4f} tokens/s")
@@ -103,13 +103,15 @@ def process_output(filename: str, **kwargs):
103103
print(f"Performance summary saved to {results_path}")
104104

105105
# Save a copy of the results file to ~/srv/runner-db/
106+
print(f"Saving results to ~/srv/runner-db/{filename_without_parent_or_ext}-{timestamp}.results")
106107
runner_db_path = os.path.expanduser("~/srv/runner-db/")
107108
os.makedirs(runner_db_path, exist_ok=True)
108109
runner_db_file = os.path.join(runner_db_path, f"{filename_without_parent_or_ext}-{timestamp}.results")
109110

110111
# Copy the contents to the new location
111112
with open(results_path, "r") as src, open(runner_db_file, "w") as dst:
112113
dst.write(src.read())
114+
print(f"Results saved to ~/srv/runner-db/{filename_without_parent_or_ext}-{timestamp}.results")
113115

114116
if __name__ == "__main__":
115117
if len(sys.argv) < 2:

bench-spec-TEMPLATE.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -31,7 +31,7 @@ Serving:
3131
numGPUs: 1 # PLEASE make sure that replicaCount x numGPUs <= numClusterGPUs
3232
numCPUs: 4 # PLEASE look at the vCPU limits in the comment above (try to keep 12 or below)
3333
tensorParallelSize: 1 # please make sure tensorParallelSize <= numGPUs (this is the number of GPUs per replica)
34-
hf_token: <YOUR_HF_TOKEN> # leave as <YOUR_HF_TOKEN> if running on LMCacheGKE
34+
hf_token: <YOUR_HF_TOKEN>
3535
maxModelLen: 16384
3636

3737
# Option 2: Latest-ProductionStack (Renders the latest k8s deployment directly from production-stack source code)
@@ -45,7 +45,7 @@ Serving:
4545
numGPUs: 2
4646
numCPUs: 4
4747
tensorParallelSize: 2
48-
hf_token: <YOUR_HF_TOKEN> # leave as <YOUR_HF_TOKEN> if running on LMCacheGKE
48+
hf_token: <YOUR_HF_TOKEN>
4949
maxModelLen: 16384
5050

5151
# Option 3: SGLang

0 commit comments

Comments
 (0)