Skip to content

Commit d901d0a

Browse files
committed
bugfix _calc_engine_prefill_tps
Signed-off-by: chickeyton <[email protected]>
1 parent 99fa96c commit d901d0a

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

src/vllm_router/stats/request_stats.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -382,8 +382,10 @@ def _calc_engine_prefill_tps(self, current_time: float, engine_url: str) -> float:
382382
# print(f"skip 2 |{(url, request_id) not in self.first_token_time}|{(url, request_id) not in self.uncached_prefix_tokens}")
383383
continue
384384

385-
prefill_periods.union(start_time, self.first_token_time[(url, request_id)])
386-
all_uncached_prefix_tokens += self.uncached_prefix_tokens[(url, request_id)]
385+
uncached_prefix_tokens = self.uncached_prefix_tokens[(url, request_id)]
386+
if uncached_prefix_tokens > 0:
387+
prefill_periods.union(start_time, self.first_token_time[(url, request_id)])
388+
all_uncached_prefix_tokens += uncached_prefix_tokens
387389
#print(f"[[[[[[[[[[[[[[[[[[[[[[[[[ all_uncached_prefix_tokens:{all_uncached_prefix_tokens}")
388390

389391
length = prefill_periods.compute_length()

0 commit comments

Comments
 (0)