Skip to content

Commit 64ea827

Browse files
committed
Fix coderabbit suggestions and rename secret
Signed-off-by: Jorge Garcia Oncins <[email protected]>
1 parent 09d70ea commit 64ea827

File tree

4 files changed

+36
-28
lines changed

4 files changed

+36
-28
lines changed

DEPLOYMENT.md

Lines changed: 16 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -44,19 +44,23 @@ oc patch secret hf-token-secret --type='merge' -p='{"data":{"HF_TOKEN":"'$(echo
4444

4545
#### Option D: setup using an inference model deployed remotely
4646

47-
Note: do not use VLLM_TLS_VERIFY=false in production environments
47+
4848
```bash
49-
# Create secret llama-stack-remote-inference-model-secret providing remote model info
50-
export INFERENCE_MODEL=llama-3-2-3b
51-
export VLLM_URL=https://llama-3-2-3b.apps.remote-cluster.com:443/v1
52-
export VLLM_TLS_VERIFY=false
53-
export VLLM_API_TOKEN=XXXXXXXXXXXXXXXXXXXXXXX
54-
55-
oc create secret generic llama-stack-remote-inference-model-secret \
56-
--from-literal INFERENCE_MODEL=$INFERENCE_MODEL \
57-
--from-literal VLLM_URL=$VLLM_URL \
58-
--from-literal VLLM_TLS_VERIFY=$VLLM_TLS_VERIFY \
59-
--from-literal VLLM_API_TOKEN=$VLLM_API_TOKEN
49+
# Create secret llama-stack-inference-model-secret providing model info
50+
# Important:
51+
# - Make sure that the value for INFERENCE_MODEL is correct (it should not contain dots, e.g. llama-3-2-3b)
52+
# - VLLM_URL can point to an internal or external endpoint for the model; it must end with /v1
53+
# - NEVER set VLLM_TLS_VERIFY=false in production
54+
export INFERENCE_MODEL="llama-3-2-3b"
55+
export VLLM_URL="https://llama-3-2-3b.apps.remote-cluster.com:443/v1"
56+
export VLLM_TLS_VERIFY="false"
57+
export VLLM_API_TOKEN="XXXXXXXXXXXXXXXXXXXXXXX"
58+
59+
oc create secret generic llama-stack-inference-model-secret \
60+
--from-literal INFERENCE_MODEL="$INFERENCE_MODEL" \
61+
--from-literal VLLM_URL="$VLLM_URL" \
62+
--from-literal VLLM_TLS_VERIFY="$VLLM_TLS_VERIFY" \
63+
--from-literal VLLM_API_TOKEN="$VLLM_API_TOKEN"
6064

6165
# Deploy the LlamaStackDistribution
6266
oc apply -k stack/overlays/vllm-remote-inference-model

stack/overlays/vllm-remote-inference-model/llama-stack-distribution.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -19,25 +19,25 @@ spec:
1919
valueFrom:
2020
secretKeyRef:
2121
key: INFERENCE_MODEL
22-
name: llama-stack-remote-inference-model-secret
22+
name: llama-stack-inference-model-secret
2323
optional: true
2424
- name: VLLM_URL
2525
valueFrom:
2626
secretKeyRef:
2727
key: VLLM_URL
28-
name: llama-stack-remote-inference-model-secret
28+
name: llama-stack-inference-model-secret
2929
optional: true
3030
- name: VLLM_TLS_VERIFY
3131
valueFrom:
3232
secretKeyRef:
3333
key: VLLM_TLS_VERIFY
34-
name: llama-stack-remote-inference-model-secret
34+
name: llama-stack-inference-model-secret
3535
optional: true
3636
- name: VLLM_API_TOKEN
3737
valueFrom:
3838
secretKeyRef:
3939
key: VLLM_API_TOKEN
40-
name: llama-stack-remote-inference-model-secret
40+
name: llama-stack-inference-model-secret
4141
optional: true
4242
- name: MILVUS_DB_PATH
4343
value: ~/.llama/milvus.db
Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,16 @@
1+
# This Secret is provided as an example. Create it manually with the correct values via
2+
# oc create secret generic ... before creating the llama-stack-distribution
3+
# Important:
4+
# - Make sure that the value for INFERENCE_MODEL is correct (it should not contain dots)
5+
# - VLLM_URL can point to an internal or external endpoint for the model; it must end with /v1
6+
# - NEVER set VLLM_TLS_VERIFY=false in production
7+
apiVersion: v1
8+
kind: Secret
9+
metadata:
10+
name: llama-stack-inference-model-secret
11+
type: Opaque
12+
stringData:
13+
INFERENCE_MODEL: "<your-model-id>"
14+
VLLM_API_TOKEN: "<paste-api-token>"
15+
VLLM_TLS_VERIFY: "true" # or "false"
16+
VLLM_URL: "https://your-model-id.example.com/v1"

stack/overlays/vllm-remote-inference-model/llama-stack-remote-inference-model-secret.yaml

Lines changed: 0 additions & 12 deletions
This file was deleted.

0 commit comments

Comments
 (0)