Skip to content
This repository was archived by the owner on Sep 10, 2025. It is now read-only.

Commit d7b681a

Browse files
authored
fix: do not print perf stat when NaN (#1375)
If the chat is exited or interrupted, the performance stats are still printed with NaN values, which is unnecessary. Signed-off-by: Sébastien Han <[email protected]>
1 parent 4697764 commit d7b681a

File tree

1 file changed

+20
-5
lines changed

1 file changed

+20
-5
lines changed

torchchat/generate.py

Lines changed: 20 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1189,12 +1189,27 @@ def callback(x, *, done_generating=False):
11891189
f"Mean Accepted: {sum([idx * i for idx, i in enumerate(counts_aggregated)])/sum(counts_aggregated)}"
11901190
)
11911191

1192-
print(
1193-
f"\n Average tokens/sec (total): {torch.mean(torch.tensor(aggregate_metrics['tokens_per_sec'])).item():.2f} \
1194-
\nAverage tokens/sec (first token): {torch.mean(torch.tensor(aggregate_metrics['first_token_per_sec'])).item():.2f} \
1195-
\nAverage tokens/sec (next tokens): {torch.mean(torch.tensor(aggregate_metrics['next_tokens_per_sec'])).item():.2f} \n\
1192+
avg_tokens_sec = torch.mean(
1193+
torch.tensor(aggregate_metrics["tokens_per_sec"])
1194+
).item()
1195+
avg_first_token_sec = torch.mean(
1196+
torch.tensor(aggregate_metrics["first_token_per_sec"])
1197+
).item()
1198+
avg_next_tokens_sec = torch.mean(
1199+
torch.tensor(aggregate_metrics["next_tokens_per_sec"])
1200+
).item()
1201+
1202+
if not (
1203+
torch.isnan(torch.tensor(avg_tokens_sec))
1204+
or torch.isnan(torch.tensor(avg_first_token_sec))
1205+
or torch.isnan(torch.tensor(avg_next_tokens_sec))
1206+
):
1207+
print(
1208+
f"\n Average tokens/sec (total): {avg_tokens_sec:.2f} \
1209+
\nAverage tokens/sec (first token): {avg_first_token_sec:.2f} \
1210+
\nAverage tokens/sec (next tokens): {avg_next_tokens_sec:.2f} \n\
11961211
"
1197-
)
1212+
)
11981213
if torch.cuda.is_available():
11991214
print(f"Memory used: {torch.cuda.max_memory_reserved() / 1e9:.02f} GB")
12001215

0 commit comments

Comments
 (0)