Skip to content

Commit 22fff0b

Browse files
committed
Fix failed request count
Signed-off-by: Rashid Kaleem <230885705+arekay-nv@users.noreply.github.com>
1 parent 8a85041 commit 22fff0b

File tree

3 files changed: 7 additions and 1 deletion

3 files changed: 7 additions and 1 deletion

src/inference_endpoint/commands/benchmark.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -697,7 +697,7 @@ def signal_handler(signum, frame):
697697
"results": {
698698
"total": total,
699699
"successful": success_count,
700-
"failed": total - success_count,
700+
"failed": report.n_samples_failed,
701701
"elapsed_time": elapsed_time,
702702
"qps": estimated_qps,
703703
},

src/inference_endpoint/metrics/reporter.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -354,6 +354,7 @@ class Report:
354354
test_started_at: int
355355
n_samples_issued: int
356356
n_samples_completed: int
357+
n_samples_failed: int
357358
duration_ns: int
358359

359360
# For the following metrics, the key is a rollup statistic (i.e. mean, median, etc.)
@@ -495,6 +496,7 @@ def display(
495496
)
496497
fn(f"Total samples issued: {self.n_samples_issued}{newline}")
497498
fn(f"Total samples completed: {self.n_samples_completed}{newline}")
499+
fn(f"Total samples failed: {self.n_samples_failed}{newline}")
498500
if self.duration_ns is not None:
499501
fn(f"Duration: {self.duration_ns / 1e9:.2f} seconds{newline}")
500502
else:
@@ -1312,6 +1314,7 @@ def create_report(
13121314
test_started_at=test_started_at,
13131315
n_samples_issued=sample_statuses["total_sent"],
13141316
n_samples_completed=sample_statuses["completed"],
1317+
n_samples_failed=self.get_error_count(),
13151318
duration_ns=self.derive_duration(),
13161319
ttft=ttft_summary,
13171320
tpot=tpot_summary,

tests/unit/metrics/test_reporter.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -388,6 +388,7 @@ def test_reporter_create_report(events_db, fake_outputs, tokenizer):
388388

389389
assert report.n_samples_issued == 3
390390
assert report.n_samples_completed == 2
391+
assert report.n_samples_failed == 3 # 3 ERROR events for uuid3 in fixture
391392
assert report.duration_ns == (10300 - 5000)
392393

393394
for k, expected in ttft_rollup.summarize().items():
@@ -428,6 +429,7 @@ def test_reporter_json(events_db):
428429
"git_sha",
429430
"n_samples_issued",
430431
"n_samples_completed",
432+
"n_samples_failed",
431433
"duration_ns",
432434
"ttft",
433435
"tpot",
@@ -441,6 +443,7 @@ def test_reporter_json(events_db):
441443
assert set(json_dict.keys()) == set(expected_keys)
442444
assert json_dict["n_samples_issued"] == report.n_samples_issued
443445
assert json_dict["n_samples_completed"] == report.n_samples_completed
446+
assert json_dict["n_samples_failed"] == report.n_samples_failed
444447
assert json_dict["duration_ns"] == report.duration_ns
445448
assert json_dict["qps"] == report.qps
446449
assert json_dict["tps"] == report.tps

0 commit comments

Comments
 (0)