45
45
"axisBorderShow": false,
46
46
"axisCenteredZero": false,
47
47
"axisColorMode": "text",
48
- "axisLabel": "Request Rate ",
48
+ "axisLabel": "Requests per minute ",
49
49
"axisPlacement": "auto",
50
- "axisWidth": 3 ,
50
+ "axisWidth": 50 ,
51
51
"barAlignment": 0,
52
52
"drawStyle": "line",
53
53
"fillOpacity": 0,
87
87
"value": 80
88
88
}
89
89
]
90
- },
91
- "unitScale": true
90
+ }
92
91
},
93
92
"overrides": []
94
93
},
@@ -125,7 +124,7 @@ data:
125
124
"refId": "A"
126
125
}
127
126
],
128
- "title": "API Requests",
127
+ "title": "API Requests per Minute ",
129
128
"type": "timeseries"
130
129
},
131
130
{
@@ -142,8 +141,9 @@ data:
142
141
"axisBorderShow": false,
143
142
"axisCenteredZero": false,
144
143
"axisColorMode": "text",
145
- "axisLabel": "Tokens / second ",
144
+ "axisLabel": "Number of requests per minute ",
146
145
"axisPlacement": "auto",
146
+ "axisWidth": 50,
147
147
"barAlignment": 0,
148
148
"drawStyle": "line",
149
149
"fillOpacity": 0,
@@ -183,16 +183,110 @@ data:
183
183
"value": 80
184
184
}
185
185
]
186
+ }
187
+ },
188
+ "overrides": []
189
+ },
190
+ "gridPos": {
191
+ "h": 12,
192
+ "w": 24,
193
+ "x": 0,
194
+ "y": 12
195
+ },
196
+ "id": 8,
197
+ "options": {
198
+ "legend": {
199
+ "calcs": [],
200
+ "displayMode": "list",
201
+ "placement": "bottom",
202
+ "showLegend": true
203
+ },
204
+ "tooltip": {
205
+ "mode": "single",
206
+ "sort": "none"
207
+ }
208
+ },
209
+ "targets": [
210
+ {
211
+ "datasource": {
212
+ "type": "prometheus",
213
+ "uid": "prometheus"
186
214
},
187
- "unitScale": true
215
+ "editorMode": "code",
216
+ "expr": "sum by (container, namespace, method, path) (vllm:request_success_total)",
217
+ "instant": false,
218
+ "legendFormat": "__auto",
219
+ "range": true,
220
+ "refId": "A"
221
+ }
222
+ ],
223
+ "title": "Total API Requests",
224
+ "type": "timeseries"
225
+ },
226
+ {
227
+ "datasource": {
228
+ "type": "prometheus",
229
+ "uid": "prometheus"
230
+ },
231
+ "fieldConfig": {
232
+ "defaults": {
233
+ "color": {
234
+ "mode": "palette-classic"
235
+ },
236
+ "custom": {
237
+ "axisBorderShow": false,
238
+ "axisCenteredZero": false,
239
+ "axisColorMode": "text",
240
+ "axisLabel": "Tokens / second",
241
+ "axisPlacement": "auto",
242
+ "barAlignment": 0,
243
+ "drawStyle": "line",
244
+ "fillOpacity": 0,
245
+ "gradientMode": "none",
246
+ "hideFrom": {
247
+ "legend": false,
248
+ "tooltip": false,
249
+ "viz": false
250
+ },
251
+ "insertNulls": false,
252
+ "lineInterpolation": "linear",
253
+ "lineWidth": 1,
254
+ "pointSize": 5,
255
+ "scaleDistribution": {
256
+ "type": "linear"
257
+ },
258
+ "showPoints": "auto",
259
+ "spanNulls": false,
260
+ "stacking": {
261
+ "group": "A",
262
+ "mode": "none"
263
+ },
264
+ "thresholdsStyle": {
265
+ "mode": "off"
266
+ }
267
+ },
268
+ "mappings": [],
269
+ "thresholds": {
270
+ "mode": "absolute",
271
+ "steps": [
272
+ {
273
+ "color": "green",
274
+ "value": null
275
+ },
276
+ {
277
+ "color": "red",
278
+ "value": 80
279
+ }
280
+ ]
281
+ }
188
282
},
189
283
"overrides": []
190
284
},
191
285
"gridPos": {
192
286
"h": 8,
193
287
"w": 12,
194
288
"x": 0,
195
- "y": 12
289
+ "y": 24
196
290
},
197
291
"id": 2,
198
292
"options": {
@@ -279,16 +373,15 @@ data:
279
373
"value": 80
280
374
}
281
375
]
282
- },
283
- "unitScale": true
376
+ }
284
377
},
285
378
"overrides": []
286
379
},
287
380
"gridPos": {
288
381
"h": 8,
289
382
"w": 12,
290
383
"x": 12,
291
- "y": 12
384
+ "y": 24
292
385
},
293
386
"id": 4,
294
387
"options": {
@@ -375,16 +468,15 @@ data:
375
468
"value": 80
376
469
}
377
470
]
378
- },
379
- "unitScale": true
471
+ }
380
472
},
381
473
"overrides": []
382
474
},
383
475
"gridPos": {
384
476
"h": 8,
385
477
"w": 12,
386
478
"x": 0,
387
- "y": 20
479
+ "y": 32
388
480
},
389
481
"id": 3,
390
482
"options": {
@@ -471,16 +563,15 @@ data:
471
563
"value": 80
472
564
}
473
565
]
474
- },
475
- "unitScale": true
566
+ }
476
567
},
477
568
"overrides": []
478
569
},
479
570
"gridPos": {
480
571
"h": 8,
481
572
"w": 12,
482
573
"x": 12,
483
- "y": 20
574
+ "y": 32
484
575
},
485
576
"id": 5,
486
577
"options": {
@@ -567,16 +658,15 @@ data:
567
658
"value": 80
568
659
}
569
660
]
570
- },
571
- "unitScale": true
661
+ }
572
662
},
573
663
"overrides": []
574
664
},
575
665
"gridPos": {
576
666
"h": 8,
577
667
"w": 12,
578
668
"x": 0,
579
- "y": 28
669
+ "y": 40
580
670
},
581
671
"id": 1,
582
672
"options": {
@@ -667,16 +757,15 @@ data:
667
757
"value": 80
668
758
}
669
759
]
670
- },
671
- "unitScale": true
760
+ }
672
761
},
673
762
"overrides": []
674
763
},
675
764
"gridPos": {
676
765
"h": 8,
677
766
"w": 12,
678
767
"x": 12,
679
- "y": 28
768
+ "y": 40
680
769
},
681
770
"id": 6,
682
771
"options": {
@@ -708,22 +797,6 @@ data:
708
797
"title": "GPU Power Draw",
709
798
"type": "timeseries"
710
799
}
711
- ],
712
- "refresh": "",
713
- "schemaVersion": 39,
714
- "tags": [],
715
- "templating": {
716
- "list": []
717
- },
718
- "time": {
719
- "from": "now-30m",
720
- "to": "now"
721
- },
722
- "timepicker": {},
723
- "timezone": "",
724
- "title": "LLM Dashboard",
725
- "uid": "c4114a95-8172-4a8b-99c8-963ba7d31385",
726
- "version": 1,
727
- "weekStart": ""
800
+ ]
728
801
}
729
802
{{- end -}}
0 commit comments