1
1
apiVersion : v1
2
2
kind : Service
3
3
metadata :
4
- name : minio
4
+ name : minio-guardrails-guardian
5
5
spec :
6
6
ports :
7
7
- name : minio-client-port
8
8
port : 9000
9
9
protocol : TCP
10
10
targetPort : 9000
11
11
selector :
12
- app : minio
12
+ app : minio-guardrails-guardian
13
13
---
14
14
apiVersion : v1
15
15
kind : PersistentVolumeClaim
16
16
metadata :
17
- name : vllm-models-claim
17
+ name : guardrails-models-claim-guardian
18
18
spec :
19
19
accessModes :
20
20
- ReadWriteOnce
21
21
volumeMode : Filesystem
22
22
# storageClassName: gp3-csi
23
23
resources :
24
24
requests :
25
- storage : 300Gi
25
+ storage : 100Gi
26
26
---
27
27
apiVersion : apps/v1
28
28
kind : Deployment
29
29
metadata :
30
- name : llm-container-deployment # <--- change this
30
+ name : guardrails-container-deployment-guardian # <--- change this
31
31
labels :
32
- app : minio # <--- change this to match label on the pod
32
+ app : minio-guardrails-guardian # <--- change this to match label on the pod
33
33
spec :
34
34
replicas : 1
35
35
selector :
36
36
matchLabels :
37
- app : minio # <--- change this to match label on the pod
37
+ app : minio-guardrails-guardian # <--- change this to match label on the pod
38
38
template : # => from here down copy and paste the pods metadata: and spec: sections
39
39
metadata :
40
40
labels :
41
- app : minio
41
+ app : minio-guardrails-guardian
42
42
maistra.io/expose-route : 'true'
43
- name : minio
43
+ name : minio-guardrails-guardian
44
44
spec :
45
45
volumes :
46
46
- name : model-volume
47
47
persistentVolumeClaim :
48
- claimName : vllm-models-claim
48
+ claimName : guardrails-models-claim-guardian
49
49
initContainers :
50
50
- name : download-model
51
51
image : quay.io/rgeada/llm_downloader:latest
55
55
- bash
56
56
- -c
57
57
- |
58
- model="ibm-granite/granite-guardian-hap-38m"
58
+ # model="ibm-granite/granite-guardian-hap-38m"
59
+ # model="h2oai/deberta_finetuned_pii"
60
+ model="ibm-granite/granite-guardian-3.0-2b"
59
61
# model="microsoft/Phi-3-mini-4k-instruct"
60
62
echo "starting download"
61
63
/tmp/venv/bin/huggingface-cli download $model --local-dir /mnt/models/huggingface/$(basename $model)
92
94
apiVersion : v1
93
95
kind : Secret
94
96
metadata :
95
- name : aws-connection-minio-data-connection
97
+ name : aws-connection-minio-data-connection-guardrails-guardian
96
98
labels :
97
99
opendatahub.io/dashboard : 'true'
98
100
opendatahub.io/managed : 'true'
@@ -103,7 +105,7 @@ data:
103
105
AWS_ACCESS_KEY_ID : VEhFQUNDRVNTS0VZ
104
106
AWS_DEFAULT_REGION : dXMtc291dGg=
105
107
AWS_S3_BUCKET : aHVnZ2luZ2ZhY2U=
106
- AWS_S3_ENDPOINT : aHR0cDovL21pbmlvOjkwMDA=
108
+ AWS_S3_ENDPOINT : aHR0cDovL21pbmlvLWd1YXJkcmFpbHMtZ3VhcmRpYW46OTAwMA==
107
109
AWS_SECRET_ACCESS_KEY : VEhFU0VDUkVUS0VZ
108
110
type : Opaque
109
111
---
0 commit comments