@@ -76,11 +76,6 @@ def __init__(self, labels: List[str], max_model_len: int):
7676 description = "Number of generation tokens processed." ,
7777 kind = pb_utils .MetricFamily .HISTOGRAM ,
7878 )
79- self .histogram_best_of_request_family = pb_utils .MetricFamily (
80- name = "vllm:request_params_best_of" ,
81- description = "Histogram of the best_of request parameter." ,
82- kind = pb_utils .MetricFamily .HISTOGRAM ,
83- )
8479 self .histogram_n_request_family = pb_utils .MetricFamily (
8580 name = "vllm:request_params_n" ,
8681 description = "Histogram of the n request parameter." ,
@@ -159,10 +154,6 @@ def __init__(self, labels: List[str], max_model_len: int):
159154 buckets = build_1_2_5_buckets (max_model_len ),
160155 )
161156 )
162- self .histogram_best_of_request = self .histogram_best_of_request_family .Metric (
163- labels = labels ,
164- buckets = [1 , 2 , 5 , 10 , 20 ],
165- )
166157 self .histogram_n_request = self .histogram_n_request_family .Metric (
167158 labels = labels ,
168159 buckets = [1 , 2 , 5 , 10 , 20 ],
@@ -247,7 +238,6 @@ def log(self, stats: VllmStats) -> None:
247238 self .metrics .histogram_num_generation_tokens_request ,
248239 stats .num_generation_tokens_requests ,
249240 ),
250- (self .metrics .histogram_best_of_request , stats .best_of_requests ),
251241 (self .metrics .histogram_n_request , stats .n_requests ),
252242 ]
253243
0 commit comments