# prom-adapter.yaml
# Forked from vllm-project/production-stack.
# Adapter log verbosity. The key is camelCase `logLevel`, matching the
# prometheus-adapter Helm chart values; Helm value lookup is case-sensitive,
# so a lowercase `loglevel` key would not be picked up.
logLevel: 1

# Prometheus endpoint the adapter queries for metrics.
prometheus:
  # In-cluster service URL (service in the `monitoring` namespace).
  url: http://kube-prom-stack-kube-prome-prometheus.monitoring.svc
  port: 9090
# Metric discovery/exposure rules for the adapter.
rules:
  default: true
  # Custom rules; each entry selects Prometheus series, associates them with
  # a Kubernetes resource, renames them, and defines the query to evaluate.
  custom:
    # Example metric to export for HPA
    - seriesQuery: '{__name__=~"^vllm:num_requests_waiting$"}'
      resources:
        overrides:
          # The `namespace` label identifies the Kubernetes namespace.
          namespace:
            resource: "namespace"
      name:
        matches: ""
        # Name under which the metric is exposed.
        as: "vllm_num_requests_waiting"
      # Total waiting requests per namespace.
      metricsQuery: 'sum by(namespace) (vllm:num_requests_waiting)'

    # Export num_incoming_requests_total by model name
    - seriesQuery: '{__name__=~"^vllm:num_incoming_requests_total$"}'
      resources:
        overrides:
          # The `namespace` label identifies the Kubernetes namespace.
          namespace:
            resource: "namespace"
      name:
        matches: ""
        # Name under which the metric is exposed.
        as: "vllm_num_incoming_requests_total"
      # Summed per (namespace, model) pair.
      # NOTE(review): this can yield several series per namespace (one per
      # model), and the `_total` suffix suggests a cumulative counter --
      # confirm whether a rate() over a window is what the HPA should see.
      metricsQuery: 'sum by(namespace, model) (vllm:num_incoming_requests_total)'