Skip to content

Commit 429820e

Browse files
committed
add draft acceptance rate to server console output
1 parent 41a8e85 commit 429820e

File tree

1 file changed

+9
-0
lines changed

1 file changed

+9
-0
lines changed

examples/server/server.cpp

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1453,6 +1453,15 @@ struct server_slot {
1453 1453
t_prompt_processing, n_prompt_tokens_processed, t_prompt, n_prompt_second,
1454 1454
t_token_generation, n_decoded, t_gen, n_gen_second,
1455 1455
t_prompt_processing + t_token_generation, n_prompt_tokens_processed + n_decoded);
1456+
1457+
if (n_draft_total > 0) {
1458+
const float draft_ratio = (float) n_draft_accepted / n_draft_total;
1459+
SLT_INF(*this,
1460+
"\n"
1461+
"draft acceptance rate = %0.5f (%5d accepted / %5d generated)\n",
1462+
draft_ratio, n_draft_accepted, n_draft_total
1463+
);
1464+
}
1456 1465
}
1457 1466

1458 1467
json to_json() const {

0 commit comments

Comments
 (0)