|
34 | 34 | from vllm.engine.metrics import SupportsMetricsInfo, build_1_2_5_buckets |
35 | 35 | from vllm.version import __version__ as _VLLM_VERSION |
36 | 36 |
|
| 37 | + |
37 | 38 | class TritonMetrics: |
38 | 39 | def __init__(self, labels: List[str], max_model_len: int): |
39 | 40 | # Initialize metric families |
@@ -163,9 +164,11 @@ def __init__(self, labels: List[str], max_model_len: int): |
163 | 164 | ) |
164 | 165 | ) |
165 | 166 | if _VLLM_VERSION < "0.6.3": |
166 | | - self.histogram_best_of_request = self.histogram_best_of_request_family.Metric( |
167 | | - labels=labels, |
168 | | - buckets=[1, 2, 5, 10, 20], |
| 167 | + self.histogram_best_of_request = ( |
| 168 | + self.histogram_best_of_request_family.Metric( |
| 169 | + labels=labels, |
| 170 | + buckets=[1, 2, 5, 10, 20], |
| 171 | + ) |
169 | 172 | ) |
170 | 173 | self.histogram_n_request = self.histogram_n_request_family.Metric( |
171 | 174 | labels=labels, |
@@ -254,7 +257,9 @@ def log(self, stats: VllmStats) -> None: |
254 | 257 | (self.metrics.histogram_n_request, stats.n_requests), |
255 | 258 | ] |
256 | 259 | if _VLLM_VERSION < "0.6.3": |
257 | | - histogram_metrics.append((self.metrics.histogram_best_of_request, stats.best_of_requests)) |
| 260 | + histogram_metrics.append( |
| 261 | + (self.metrics.histogram_best_of_request, stats.best_of_requests) |
| 262 | + ) |
258 | 263 | for metric, data in counter_metrics: |
259 | 264 | self._log_counter(metric, data) |
260 | 265 | for metric, data in histogram_metrics: |
|
0 commit comments