3838
3939from guidellm .backend import (
4040 GenerationRequest ,
41- GenerationRequestTimings ,
4241 GenerationResponse ,
4342)
4443from guidellm .benchmark .objects import (
4746 GenerativeRequestStats ,
4847)
4948from guidellm .scheduler import (
50- MeasuredRequestTimingsT ,
5149 RequestT ,
5250 ResponseT ,
5351 ScheduledRequestInfo ,
@@ -153,7 +151,7 @@ def get_metric(
153151
154152
155153@runtime_checkable
156- class Aggregator (Protocol [ResponseT , RequestT , MeasuredRequestTimingsT ]):
154+ class Aggregator (Protocol [ResponseT , RequestT ]):
157155 """
158156 Protocol for processing benchmark data updates during execution.
159157
@@ -167,7 +165,7 @@ def __call__(
167165 state : AggregatorState ,
168166 response : ResponseT | None ,
169167 request : RequestT ,
170- request_info : ScheduledRequestInfo [ MeasuredRequestTimingsT ] ,
168+ request_info : ScheduledRequestInfo ,
171169 scheduler_state : SchedulerState ,
172170 ) -> dict [str , Any ] | None :
173171 """
@@ -183,7 +181,7 @@ def __call__(
183181
184182
185183@runtime_checkable
186- class CompilableAggregator (Protocol [ResponseT , RequestT , MeasuredRequestTimingsT ]):
184+ class CompilableAggregator (Protocol [ResponseT , RequestT ]):
187185 """
188186 Protocol for aggregators that compile final results from aggregated state.
189187
@@ -196,7 +194,7 @@ def __call__(
196194 state : AggregatorState ,
197195 response : ResponseT | None ,
198196 request : RequestT ,
199- request_info : ScheduledRequestInfo [ MeasuredRequestTimingsT ] ,
197+ request_info : ScheduledRequestInfo ,
200198 scheduler_state : SchedulerState ,
201199 ) -> dict [str , Any ] | None :
202200 """
@@ -225,7 +223,7 @@ def compile(
225223class SerializableAggregator (
226224 PydanticClassRegistryMixin [type ["SerializableAggregator" ]],
227225 ABC ,
228- Generic [ResponseT , RequestT , MeasuredRequestTimingsT ],
226+ Generic [ResponseT , RequestT ],
229227):
230228 schema_discriminator : ClassVar [str ] = "type_"
231229
@@ -286,7 +284,7 @@ def __call__(
286284 state : AggregatorState ,
287285 response : ResponseT | None ,
288286 request : RequestT ,
289- request_info : ScheduledRequestInfo [ MeasuredRequestTimingsT ] ,
287+ request_info : ScheduledRequestInfo ,
290288 scheduler_state : SchedulerState ,
291289 ) -> dict [str , Any ] | None :
292290 """
@@ -314,9 +312,7 @@ def compile(
314312
315313
316314@SerializableAggregator .register ("inject_extras" )
317- class InjectExtrasAggregator (
318- SerializableAggregator [ResponseT , RequestT , MeasuredRequestTimingsT ], InfoMixin
319- ):
315+ class InjectExtrasAggregator (SerializableAggregator [ResponseT , RequestT ], InfoMixin ):
320316 """
321317 Aggregator for injecting extra metadata into the output.
322318 """
@@ -333,7 +329,7 @@ def __call__(
333329 state : AggregatorState ,
334330 response : ResponseT | None ,
335331 request : RequestT ,
336- request_info : ScheduledRequestInfo [ MeasuredRequestTimingsT ] ,
332+ request_info : ScheduledRequestInfo ,
337333 scheduler_state : SchedulerState ,
338334 ) -> dict [str , Any ] | None :
339335 """
@@ -355,9 +351,7 @@ def compile(
355351
356352
357353@SerializableAggregator .register ("scheduler_stats" )
358- class SchedulerStatsAggregator (
359- SerializableAggregator [ResponseT , RequestT , MeasuredRequestTimingsT ], InfoMixin
360- ):
354+ class SchedulerStatsAggregator (SerializableAggregator [ResponseT , RequestT ], InfoMixin ):
361355 """
362356 Aggregates scheduler timing and performance metrics.
363357
@@ -376,7 +370,7 @@ def __call__(
376370 state : AggregatorState ,
377371 response : ResponseT | None ,
378372 request : RequestT ,
379- request_info : ScheduledRequestInfo [ MeasuredRequestTimingsT ] ,
373+ request_info : ScheduledRequestInfo ,
380374 scheduler_state : SchedulerState ,
381375 ) -> dict [str , Any ] | None :
382376 """
@@ -499,9 +493,7 @@ def compile(
499493
500494@SerializableAggregator .register ("generative_stats_progress" )
501495class GenerativeStatsProgressAggregator (
502- SerializableAggregator [
503- GenerationResponse , GenerationRequest , GenerationRequestTimings
504- ]
496+ SerializableAggregator [GenerationResponse , GenerationRequest ]
505497):
506498 """
507499 Tracks generative model metrics during benchmark execution.
@@ -523,7 +515,7 @@ def __call__(
523515 state : AggregatorState ,
524516 response : GenerationResponse | None ,
525517 request : GenerationRequest ,
526- request_info : ScheduledRequestInfo [ GenerationRequestTimings ] ,
518+ request_info : ScheduledRequestInfo ,
527519 scheduler_state : SchedulerState ,
528520 ) -> dict [str , Any ] | None :
529521 """
@@ -667,9 +659,7 @@ def compile(
667659
668660@SerializableAggregator .register ("generative_requests" )
669661class GenerativeRequestsAggregator (
670- SerializableAggregator [
671- GenerationResponse , GenerationRequest , GenerationRequestTimings
672- ],
662+ SerializableAggregator [GenerationResponse , GenerationRequest ],
673663):
674664 """
675665 Compiles complete generative benchmark results with warmup/cooldown filtering.
@@ -712,7 +702,7 @@ def __call__(
712702 state : AggregatorState ,
713703 response : GenerationResponse | None ,
714704 request : GenerationRequest ,
715- request_info : ScheduledRequestInfo [ GenerationRequestTimings ] ,
705+ request_info : ScheduledRequestInfo ,
716706 scheduler_state : SchedulerState ,
717707 ) -> dict [str , Any ] | None :
718708 """
@@ -875,7 +865,7 @@ def compile(
875865
876866 def _is_in_warmup (
877867 self ,
878- request_info : ScheduledRequestInfo [ GenerationRequestTimings ] ,
868+ request_info : ScheduledRequestInfo ,
879869 scheduler_state : SchedulerState ,
880870 ) -> bool :
881871 """Check if the current request is within the warmup period."""
@@ -902,7 +892,7 @@ def _is_in_warmup(
902892
903893 def _is_in_cooldown (
904894 self ,
905- request_info : ScheduledRequestInfo [ GenerationRequestTimings ] ,
895+ request_info : ScheduledRequestInfo ,
906896 scheduler_state : SchedulerState ,
907897 ) -> bool :
908898 """Check if the current request is within the cooldown period."""
@@ -936,7 +926,7 @@ def _create_generative_request_stats(
936926 cls ,
937927 response : GenerationResponse ,
938928 request : GenerationRequest ,
939- request_info : ScheduledRequestInfo [ GenerationRequestTimings ] ,
929+ request_info : ScheduledRequestInfo ,
940930 ) -> GenerativeRequestStats :
941931 prompt_tokens = response .preferred_prompt_tokens (
942932 settings .preferred_prompt_tokens_source
0 commit comments