@@ -154,6 +154,7 @@ class UserAPIKeyLabelNames(Enum):
154
154
155
155
DEFINED_PROMETHEUS_METRICS = Literal [
156
156
"litellm_llm_api_latency_metric" ,
157
+ "litellm_llm_api_time_to_first_token_metric" ,
157
158
"litellm_request_total_latency_metric" ,
158
159
"litellm_overhead_latency_metric" ,
159
160
"litellm_remaining_requests_metric" ,
@@ -162,6 +163,7 @@ class UserAPIKeyLabelNames(Enum):
162
163
"litellm_proxy_failed_requests_metric" ,
163
164
"litellm_deployment_latency_per_output_token" ,
164
165
"litellm_requests_metric" ,
166
+ "litellm_spend_metric" ,
165
167
"litellm_total_tokens_metric" ,
166
168
"litellm_input_tokens_metric" ,
167
169
"litellm_output_tokens_metric" ,
@@ -173,9 +175,11 @@ class UserAPIKeyLabelNames(Enum):
173
175
"litellm_remaining_api_key_budget_metric" ,
174
176
"litellm_api_key_max_budget_metric" ,
175
177
"litellm_api_key_budget_remaining_hours_metric" ,
178
+ "litellm_deployment_state" ,
176
179
"litellm_deployment_failure_responses" ,
177
180
"litellm_deployment_total_requests" ,
178
181
"litellm_deployment_success_responses" ,
182
+ "litellm_deployment_cooled_down" ,
179
183
"litellm_pod_lock_manager_size" ,
180
184
"litellm_in_memory_daily_spend_update_queue_size" ,
181
185
"litellm_redis_daily_spend_update_queue_size" ,
@@ -191,9 +195,14 @@ class PrometheusMetricLabels:
191
195
UserAPIKeyLabelNames .API_KEY_ALIAS .value ,
192
196
UserAPIKeyLabelNames .TEAM .value ,
193
197
UserAPIKeyLabelNames .TEAM_ALIAS .value ,
194
- UserAPIKeyLabelNames .REQUESTED_MODEL .value ,
195
- UserAPIKeyLabelNames .END_USER .value ,
196
- UserAPIKeyLabelNames .USER .value ,
198
+ ]
199
+
200
+ litellm_llm_api_time_to_first_token_metric = [
201
+ UserAPIKeyLabelNames .v1_LITELLM_MODEL_NAME .value ,
202
+ UserAPIKeyLabelNames .API_KEY_HASH .value ,
203
+ UserAPIKeyLabelNames .API_KEY_ALIAS .value ,
204
+ UserAPIKeyLabelNames .TEAM .value ,
205
+ UserAPIKeyLabelNames .TEAM_ALIAS .value ,
197
206
]
198
207
199
208
litellm_request_total_latency_metric = [
@@ -282,6 +291,16 @@ class PrometheusMetricLabels:
282
291
UserAPIKeyLabelNames .USER_EMAIL .value ,
283
292
]
284
293
294
+ litellm_spend_metric = [
295
+ UserAPIKeyLabelNames .END_USER .value ,
296
+ UserAPIKeyLabelNames .API_KEY_HASH .value ,
297
+ UserAPIKeyLabelNames .API_KEY_ALIAS .value ,
298
+ UserAPIKeyLabelNames .v1_LITELLM_MODEL_NAME .value ,
299
+ UserAPIKeyLabelNames .TEAM .value ,
300
+ UserAPIKeyLabelNames .TEAM_ALIAS .value ,
301
+ UserAPIKeyLabelNames .USER .value ,
302
+ ]
303
+
285
304
litellm_input_tokens_metric = [
286
305
UserAPIKeyLabelNames .END_USER .value ,
287
306
UserAPIKeyLabelNames .API_KEY_HASH .value ,
@@ -315,6 +334,20 @@ class PrometheusMetricLabels:
315
334
UserAPIKeyLabelNames .REQUESTED_MODEL .value ,
316
335
]
317
336
337
+ litellm_deployment_state = [
338
+ UserAPIKeyLabelNames .v2_LITELLM_MODEL_NAME .value ,
339
+ UserAPIKeyLabelNames .MODEL_ID .value ,
340
+ UserAPIKeyLabelNames .API_BASE .value ,
341
+ UserAPIKeyLabelNames .API_PROVIDER .value ,
342
+ ]
343
+
344
+ litellm_deployment_cooled_down = [
345
+ UserAPIKeyLabelNames .v2_LITELLM_MODEL_NAME .value ,
346
+ UserAPIKeyLabelNames .MODEL_ID .value ,
347
+ UserAPIKeyLabelNames .API_BASE .value ,
348
+ UserAPIKeyLabelNames .API_PROVIDER .value ,
349
+ ]
350
+
318
351
litellm_deployment_successful_fallbacks = [
319
352
UserAPIKeyLabelNames .REQUESTED_MODEL .value ,
320
353
UserAPIKeyLabelNames .FALLBACK_MODEL .value ,
0 commit comments