@@ -132,6 +132,13 @@ class frontend_service:
132132 OPERATION_LABEL = "operation"
133133
134134
class kv_publisher:
    """Metric names for the KV publisher.

    The value defined here already carries the ``kv_publisher_`` component
    prefix inside the string itself.
    """

    # Running total of raw events that engines dropped before the events
    # reached the publisher. Drops are detected from gaps in event_id.
    ENGINES_DROPPED_EVENTS_TOTAL = "kv_publisher_engines_dropped_events_total"
140+
141+
135142class kvbm :
136143 """KVBM"""
137144
@@ -167,6 +174,21 @@ class kvbm:
167174 OBJECT_WRITE_FAILURES = "object_write_failures"
168175
169176
class kvindexer:
    """Metric names for the standalone KV indexer HTTP service.

    The values are bare names: no component prefix is embedded in the
    strings defined here.
    """

    # Latency of HTTP requests, in seconds.
    REQUEST_DURATION_SECONDS = "request_duration_seconds"

    # Total count of HTTP requests.
    REQUESTS_TOTAL = "requests_total"

    # Count of HTTP responses that were errors (4xx/5xx).
    ERRORS_TOTAL = "errors_total"

    # How many model+tenant indexers are currently active.
    MODELS = "models"

    # How many worker instances are currently registered.
    WORKERS = "workers"
190+
191+
170192class kvrouter :
171193 # Number of KV cache events applied to the index (including status)
172194 KV_CACHE_EVENTS_APPLIED = "kv_cache_events_applied"
@@ -225,6 +247,8 @@ class name_prefix:
225247 ROUTER = "dynamo_router"
226248 # Prefix for tokio runtime metrics
227249 TOKIO = "dynamo_tokio"
250+ # Prefix for standalone KV indexer metrics
251+ KVINDEXER = "dynamo_kvindexer"
228252
229253
230254class router :
@@ -265,25 +289,6 @@ class routing_overhead:
265289 TOTAL_MS = "overhead_total_ms"
266290
267291
268- class trtllm_additional :
269- """Additional TRT-LLM worker metrics beyond what the engine natively provides."""
270-
271- # Total number of aborted/cancelled requests
272- NUM_ABORTED_REQUESTS_TOTAL = "trtllm_num_aborted_requests_total"
273- # Total number of requests containing image content
274- REQUEST_TYPE_IMAGE_TOTAL = "trtllm_request_type_image_total"
275- # Total number of requests using guided/structured decoding
276- REQUEST_TYPE_STRUCTURED_OUTPUT_TOTAL = "trtllm_request_type_structured_output_total"
277- # Total number of successful KV cache transfers
278- KV_TRANSFER_SUCCESS_TOTAL = "trtllm_kv_transfer_success_total"
279- # KV cache transfer latency per request in seconds
280- KV_TRANSFER_LATENCY_SECONDS = "trtllm_kv_transfer_latency_seconds"
281- # KV cache transfer size per request in bytes
282- KV_TRANSFER_BYTES = "trtllm_kv_transfer_bytes"
283- # KV cache transfer speed per request in GB/s
284- KV_TRANSFER_SPEED_GB_S = "trtllm_kv_transfer_speed_gb_s"
285-
286-
287292class task_tracker :
288293 """Task tracker Prometheus metric name suffixes"""
289294
@@ -318,6 +323,25 @@ class tokio_perf:
318323 ALIVE_TASKS = "alive_tasks"
319324
320325
class trtllm_additional:
    """Names of extra TRT-LLM worker metrics.

    These supplement the metrics the engine natively provides. Every value
    defined here starts with the ``trtllm_`` prefix.
    """

    # Running total of requests that were aborted or cancelled.
    NUM_ABORTED_REQUESTS_TOTAL = "trtllm_num_aborted_requests_total"

    # Running total of requests that contained image content.
    REQUEST_TYPE_IMAGE_TOTAL = "trtllm_request_type_image_total"

    # Running total of requests that used guided/structured decoding.
    REQUEST_TYPE_STRUCTURED_OUTPUT_TOTAL = "trtllm_request_type_structured_output_total"

    # Running total of KV cache transfers that succeeded.
    KV_TRANSFER_SUCCESS_TOTAL = "trtllm_kv_transfer_success_total"

    # Per-request KV cache transfer latency, in seconds.
    KV_TRANSFER_LATENCY_SECONDS = "trtllm_kv_transfer_latency_seconds"

    # Per-request KV cache transfer size, in bytes.
    KV_TRANSFER_BYTES = "trtllm_kv_transfer_bytes"

    # Per-request KV cache transfer speed, in GB/s.
    KV_TRANSFER_SPEED_GB_S = "trtllm_kv_transfer_speed_gb_s"
343+
344+
321345class work_handler :
322346 """Work handler Prometheus metric names"""
323347
0 commit comments