Skip to content

Commit 89b9a5e

Browse files
ruodil authored and greg-kwasniewski1 committed
[None][test] store per user output and per gpu output metric in csv file (NVIDIA#10658)
Signed-off-by: Ruodi Lu <ruodil@users.noreply.github.com> Co-authored-by: Ruodi Lu <ruodil@users.noreply.github.com>
1 parent 7ea1838 commit 89b9a5e

File tree

2 files changed

+9
-0
lines changed

2 files changed

+9
-0
lines changed

tests/integration/defs/perf/test_perf.py

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -342,6 +342,11 @@ def import_allowed_perf_config():
342342
PerfMetricType.KV_CACHE_SIZE:
343343
re.compile(r".*(?:Allocated ([\d\.]+) GiB for max tokens in paged KV cache|"
344344
r"Final KV cache size after resize: ([\d\.]+) GiB).*"),
345+
PerfMetricType.PER_USER_OUTPUT_THROUGHPUT:
346+
re.compile(
347+
r"Per User Output Throughput \[w\/ ctx\] \(tps\/user\):\s+([\d\.]+)"),
348+
PerfMetricType.PER_GPU_OUTPUT_THROUGHPUT:
349+
re.compile(r"Per GPU Output Throughput \(tps\/gpu\):\s+([\d\.]+)"),
345350
}
346351

347352
AGGR_SERVER_PERF_METRIC_LOG_QUERIES = {
@@ -457,6 +462,8 @@ def import_allowed_perf_config():
457462
PerfMetricType.ENGINE_SIZE: "engine_size",
458463
PerfMetricType.CONTEXT_GPU_MEMORY: "context_gpu_memory",
459464
PerfMetricType.KV_CACHE_SIZE: "kv_cache_size",
465+
PerfMetricType.PER_USER_OUTPUT_THROUGHPUT: "per_user_output_throughput",
466+
PerfMetricType.PER_GPU_OUTPUT_THROUGHPUT: "per_gpu_output_throughput",
460467
}
461468

462469
BUILDER_METRICS = [

tests/integration/defs/perf/utils.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -114,6 +114,8 @@ class PerfMetricType(str, Enum):
114114
KV_CACHE_SIZE = "KV_CACHE_SIZE"
115115
DISAGG_SERVER_E2EL = "DISAGG_SERVER_E2EL"
116116
DISAGG_SERVER_TTFT = "DISAGG_SERVER_TTFT"
117+
PER_USER_OUTPUT_THROUGHPUT = "PER_USER_OUTPUT_THROUGHPUT"
118+
PER_GPU_OUTPUT_THROUGHPUT = "PER_GPU_OUTPUT_THROUGHPUT"
117119

118120

119121
@contextlib.contextmanager

0 commit comments

Comments
 (0)