@@ -154,6 +154,7 @@ class UserAPIKeyLabelNames(Enum):
154
154
155
155
DEFINED_PROMETHEUS_METRICS = Literal [
156
156
"litellm_llm_api_latency_metric" ,
157
+ "litellm_llm_api_time_to_first_token_metric" ,
157
158
"litellm_request_total_latency_metric" ,
158
159
"litellm_overhead_latency_metric" ,
159
160
"litellm_remaining_requests_metric" ,
@@ -173,9 +174,11 @@ class UserAPIKeyLabelNames(Enum):
173
174
"litellm_remaining_api_key_budget_metric" ,
174
175
"litellm_api_key_max_budget_metric" ,
175
176
"litellm_api_key_budget_remaining_hours_metric" ,
177
+ "litellm_deployment_state" ,
176
178
"litellm_deployment_failure_responses" ,
177
179
"litellm_deployment_total_requests" ,
178
180
"litellm_deployment_success_responses" ,
181
+ "litellm_deployment_cooled_down" ,
179
182
"litellm_pod_lock_manager_size" ,
180
183
"litellm_in_memory_daily_spend_update_queue_size" ,
181
184
"litellm_redis_daily_spend_update_queue_size" ,
@@ -191,9 +194,14 @@ class PrometheusMetricLabels:
191
194
UserAPIKeyLabelNames .API_KEY_ALIAS .value ,
192
195
UserAPIKeyLabelNames .TEAM .value ,
193
196
UserAPIKeyLabelNames .TEAM_ALIAS .value ,
194
- UserAPIKeyLabelNames .REQUESTED_MODEL .value ,
195
- UserAPIKeyLabelNames .END_USER .value ,
196
- UserAPIKeyLabelNames .USER .value ,
197
+ ]
198
+
199
+ litellm_llm_api_time_to_first_token_metric = [
200
+ UserAPIKeyLabelNames .v1_LITELLM_MODEL_NAME .value ,
201
+ UserAPIKeyLabelNames .API_KEY_HASH .value ,
202
+ UserAPIKeyLabelNames .API_KEY_ALIAS .value ,
203
+ UserAPIKeyLabelNames .TEAM .value ,
204
+ UserAPIKeyLabelNames .TEAM_ALIAS .value ,
197
205
]
198
206
199
207
litellm_request_total_latency_metric = [
@@ -315,6 +323,20 @@ class PrometheusMetricLabels:
315
323
UserAPIKeyLabelNames .REQUESTED_MODEL .value ,
316
324
]
317
325
326
+ litellm_deployment_state = [
327
+ UserAPIKeyLabelNames .v2_LITELLM_MODEL_NAME .value ,
328
+ UserAPIKeyLabelNames .MODEL_ID .value ,
329
+ UserAPIKeyLabelNames .API_BASE .value ,
330
+ UserAPIKeyLabelNames .API_PROVIDER .value ,
331
+ ]
332
+
333
+ litellm_deployment_cooled_down = [
334
+ UserAPIKeyLabelNames .v2_LITELLM_MODEL_NAME .value ,
335
+ UserAPIKeyLabelNames .MODEL_ID .value ,
336
+ UserAPIKeyLabelNames .API_BASE .value ,
337
+ UserAPIKeyLabelNames .API_PROVIDER .value ,
338
+ ]
339
+
318
340
litellm_deployment_successful_fallbacks = [
319
341
UserAPIKeyLabelNames .REQUESTED_MODEL .value ,
320
342
UserAPIKeyLabelNames .FALLBACK_MODEL .value ,
0 commit comments