File tree Expand file tree Collapse file tree 3 files changed +135
-0
lines changed Expand file tree Collapse file tree 3 files changed +135
-0
# Container image for the LiteLLM proxy, built on the Chainguard Python dev image.
# NOTE(review): `latest-dev` is a floating tag; pin a version or digest for
# reproducible builds.
FROM cgr.dev/chainguard/python:latest-dev

# Root is used for `apk add` and for creating the virtualenv below.
# NOTE(review): no later USER instruction drops privileges, so the container
# also runs as root; confirm that is intended.
USER root
WORKDIR /app

# Put the virtualenv first on PATH so `pip` and `litellm` resolve to it.
ENV HOME=/home/litellm
ENV PATH="${HOME}/venv/bin:$PATH"

# Compiler and headers for building Python packages, plus OpenSSL.
# `--no-cache` fetches a fresh package index on its own and leaves nothing in
# /var/cache/apk, so a separate `apk update` (which would persist the index in
# the image layer) is not needed.
RUN apk add --no-cache gcc python3-dev openssl openssl-dev

RUN python -m venv ${HOME}/venv
RUN ${HOME}/venv/bin/pip install --no-cache-dir --upgrade pip

COPY requirements.txt .
# `--mount=type=cache` requires BuildKit; it keeps pip's download cache out of
# the image layers while reusing it across builds.
RUN --mount=type=cache,target=${HOME}/.cache/pip \
    ${HOME}/venv/bin/pip install -r requirements.txt

EXPOSE 4000/tcp

# Arguments passed at run time (e.g. Kubernetes `args`) replace CMD but keep
# ENTRYPOINT, so they must repeat `--port` if they still want it.
ENTRYPOINT ["litellm"]
CMD ["--port", "4000"]
# Kubernetes manifests for the LiteLLM proxy.
---
apiVersion: v1
kind: ConfigMap
metadata:
  name: litellm-config-file
data:
  # LiteLLM proxy configuration file.
  #
  # Both backends are custom OpenAI-compatible servers, so each `model` carries
  # the `openai/` provider prefix; LiteLLM strips it before calling upstream.
  # `api_base` must stop at the API root (`/v1`): the client appends
  # `/chat/completions` itself, so including the route would double it.
  #
  # `os.environ/NAME` values are resolved from environment variables at runtime.
  # NOTE(review): both upstreams are plain HTTP on public addresses; confirm
  # that sending the API key unencrypted is acceptable.
  config.yaml: |
    model_list:
      - model_name: DeepSeek-R1-Distill-Qwen-7B-GGUF
        litellm_params:
          model: openai/unsloth/DeepSeek-R1-Distill-Qwen-7B-GGUF
          api_base: http://llama-cpp-cpu-lb-2137543273.us-west-2.elb.amazonaws.com/v1
          api_key: os.environ/OPENAI_API_KEY
      - model_name: QwQ-32B
        litellm_params:
          model: openai/Qwen/QwQ-32B
          api_base: http://54.159.11.218:8080/v1
          api_key: os.environ/OPENAI_API_KEY
    general_settings:
      master_key: os.environ/LITELLM_MASTER_KEY
---
# Credentials for the LiteLLM proxy.
apiVersion: v1
kind: Secret
metadata:
  name: litellm-secrets
type: Opaque
# Entries under `data` are base64-encoded.
data:
  # Your API key, in base64.
  OPENAI_API_KEY: c2stMTIzNA==
  # Master key, in base64.
  LITELLM_MASTER_KEY: c2stMTIzNA==
# Entries under `stringData` are given in plain text.
stringData:
  # Placeholder: fill in the real connection details before applying.
  DATABASE_URL: 'postgresql://<user>:<password>@<host>:<port>/<dbname>'
---
# Runs the LiteLLM proxy container on arm64 nodes.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: litellm-deployment
  labels:
    app: litellm
spec:
  selector:
    matchLabels:
      app: litellm
  template:
    metadata:
      labels:
        app: litellm
    spec:
      # Schedule only onto arm64 nodes. A required nodeAffinity on the same
      # label with the same single value adds nothing, so only the selector
      # is kept.
      nodeSelector:
        kubernetes.io/arch: arm64
      containers:
        - name: litellm
          # NOTE(review): `:latest` is a floating tag; pinning a specific
          # version is recommended.
          image: 412381761882.dkr.ecr.us-west-2.amazonaws.com/litellm-proxy:latest
          # `args` replaces the image's default arguments, so the port is
          # repeated here alongside `--config`. Without `--config` the file
          # mounted below is never loaded by the proxy.
          args:
            - "--config"
            - "/app/proxy_server_config.yaml"
            - "--port"
            - "4000"
          ports:
            - containerPort: 4000
          volumeMounts:
            # Mount only the `config.yaml` key, as a single file.
            - name: config-volume
              mountPath: /app/proxy_server_config.yaml
              subPath: config.yaml
          # Expose every key of the Secret as an environment variable.
          envFrom:
            - secretRef:
                name: litellm-secrets
      volumes:
        - name: config-volume
          configMap:
            name: litellm-config-file
---
# Cluster-internal Service: port 80 forwards to port 4000 on pods labelled
# `app: litellm`.
apiVersion: v1
kind: Service
metadata:
  name: litellm-service
  labels:
    app: litellm
spec:
  type: ClusterIP
  selector:
    app: litellm
  ports:
    - protocol: TCP
      port: 80
      targetPort: 4000
---
# Routes all HTTP paths to litellm-service on port 80.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: litellm-ingress
  annotations:
    # The class name must be exactly `alb`; a value with surrounding
    # whitespace does not match the class.
    # NOTE(review): this annotation is deprecated in favour of
    # `spec.ingressClassName`; switch once an `alb` IngressClass is confirmed
    # to exist in the cluster (the two must not be set together).
    kubernetes.io/ingress.class: "alb"
    # NOTE(review): internet-facing with no TLS configured here; confirm that
    # exposing the proxy over plain HTTP is intended.
    alb.ingress.kubernetes.io/scheme: internet-facing
    alb.ingress.kubernetes.io/target-type: ip
spec:
  rules:
    - http:
        paths:
          - path: /
            pathType: Prefix
            backend:
              service:
                name: litellm-service
                port:
                  number: 80
# Python dependencies for the LiteLLM proxy image.
# Specify the litellm version you want to use.
litellm[proxy]==1.57.3
prometheus_client
langfuse
prisma
You can’t perform that action at this time.
0 commit comments