Skip to content

Commit 934d0ea

Browse files
authored
Merge pull request #18 from stackhpc/minor-fixes
Improve Grafana dashboard and other minor fixes
2 parents 3bea38b + b99fbe6 commit 934d0ea

File tree

4 files changed

+109
-10
lines changed

4 files changed

+109
-10
lines changed

chart/templates/api/config-map-grafana-dashboard.yml

Lines changed: 105 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,103 @@ data:
3131
"links": [],
3232
"liveNow": false,
3333
"panels": [
34+
{
35+
"datasource": {
36+
"type": "prometheus",
37+
"uid": "prometheus"
38+
},
39+
"fieldConfig": {
40+
"defaults": {
41+
"color": {
42+
"mode": "palette-classic"
43+
},
44+
"custom": {
45+
"axisBorderShow": false,
46+
"axisCenteredZero": false,
47+
"axisColorMode": "text",
48+
"axisLabel": "Request Rate",
49+
"axisPlacement": "auto",
50+
"axisWidth": 3,
51+
"barAlignment": 0,
52+
"drawStyle": "line",
53+
"fillOpacity": 0,
54+
"gradientMode": "none",
55+
"hideFrom": {
56+
"legend": false,
57+
"tooltip": false,
58+
"viz": false
59+
},
60+
"insertNulls": false,
61+
"lineInterpolation": "linear",
62+
"lineWidth": 1,
63+
"pointSize": 5,
64+
"scaleDistribution": {
65+
"type": "linear"
66+
},
67+
"showPoints": "auto",
68+
"spanNulls": false,
69+
"stacking": {
70+
"group": "A",
71+
"mode": "none"
72+
},
73+
"thresholdsStyle": {
74+
"mode": "off"
75+
}
76+
},
77+
"mappings": [],
78+
"thresholds": {
79+
"mode": "absolute",
80+
"steps": [
81+
{
82+
"color": "green",
83+
"value": null
84+
},
85+
{
86+
"color": "red",
87+
"value": 80
88+
}
89+
]
90+
},
91+
"unitScale": true
92+
},
93+
"overrides": []
94+
},
95+
"gridPos": {
96+
"h": 12,
97+
"w": 24,
98+
"x": 0,
99+
"y": 0
100+
},
101+
"id": 7,
102+
"options": {
103+
"legend": {
104+
"calcs": [],
105+
"displayMode": "list",
106+
"placement": "bottom",
107+
"showLegend": true
108+
},
109+
"tooltip": {
110+
"mode": "single",
111+
"sort": "none"
112+
}
113+
},
114+
"targets": [
115+
{
116+
"datasource": {
117+
"type": "prometheus",
118+
"uid": "prometheus"
119+
},
120+
"editorMode": "code",
121+
"expr": "sum by (container, namespace, method, path) (rate(requests_total_counter[1m]))",
122+
"instant": false,
123+
"legendFormat": "__auto",
124+
"range": true,
125+
"refId": "A"
126+
}
127+
],
128+
"title": "API Requests",
129+
"type": "timeseries"
130+
},
34131
{
35132
"datasource": {
36133
"type": "prometheus",
@@ -95,7 +192,7 @@ data:
95192
"h": 8,
96193
"w": 12,
97194
"x": 0,
98-
"y": 0
195+
"y": 12
99196
},
100197
"id": 2,
101198
"options": {
@@ -191,7 +288,7 @@ data:
191288
"h": 8,
192289
"w": 12,
193290
"x": 12,
194-
"y": 0
291+
"y": 12
195292
},
196293
"id": 4,
197294
"options": {
@@ -287,7 +384,7 @@ data:
287384
"h": 8,
288385
"w": 12,
289386
"x": 0,
290-
"y": 8
387+
"y": 20
291388
},
292389
"id": 3,
293390
"options": {
@@ -383,7 +480,7 @@ data:
383480
"h": 8,
384481
"w": 12,
385482
"x": 12,
386-
"y": 8
483+
"y": 20
387484
},
388485
"id": 5,
389486
"options": {
@@ -479,7 +576,7 @@ data:
479576
"h": 8,
480577
"w": 12,
481578
"x": 0,
482-
"y": 16
579+
"y": 28
483580
},
484581
"id": 1,
485582
"options": {
@@ -579,7 +676,7 @@ data:
579676
"h": 8,
580677
"w": 12,
581678
"x": 12,
582-
"y": 16
679+
"y": 28
583680
},
584681
"id": 6,
585682
"options": {
@@ -619,14 +716,14 @@ data:
619716
"list": []
620717
},
621718
"time": {
622-
"from": "now-24h",
719+
"from": "now-30m",
623720
"to": "now"
624721
},
625722
"timepicker": {},
626723
"timezone": "",
627724
"title": "LLM Dashboard",
628725
"uid": "c4114a95-8172-4a8b-99c8-963ba7d31385",
629-
"version": 4,
726+
"version": 1,
630727
"weekStart": ""
631728
}
632729
{{- end -}}

chart/templates/api/deployment.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,8 @@ spec:
3838
name: huggingface-token
3939
{{- else if .Values.huggingface.token }}
4040
env:
41+
- name: DO_NOT_TRACK
42+
value: "1"  # quoted: Kubernetes env var values must be strings, a bare 1 is parsed as an integer and rejected
4143
- name: HUGGING_FACE_HUB_TOKEN
4244
value: {{ quote .Values.huggingface.token }}
4345
{{- else if contains "Llama" .Values.huggingface.model -}}

chart/values.schema.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -67,7 +67,7 @@
6767
"llm_top_k": {
6868
"type": "integer",
6969
"title": "LLM Top K",
70-
"description": "The [top k](https://docs.vllm.ai/en/latest/dev/sampling_params.html) value to use when generating LLM responses (must be an integer).",
70+
"description": "The [top k](https://docs.vllm.ai/en/stable/dev/sampling_params.html) value to use when generating LLM responses (must be an integer).",
7171
"default": -1,
7272
"minimum": -1
7373
},

chart/web-app/app.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -122,7 +122,7 @@ def inference(latest_message, history):
122122
raise gr.Error("Unexpected error encountered - see logs for details.")
123123

124124

125-
# UI colour theming
125+
# UI theming
126126
theme = gr.themes.Default(**settings.theme_params)
127127
if settings.theme_background_colour:
128128
theme.body_background_fill = settings.theme_background_colour

0 commit comments

Comments
 (0)