Skip to content

Commit ad201f4

Browse files
committed
add more
1 parent 40b5326 commit ad201f4

File tree

3 files changed

+135
-0
lines changed

3 files changed

+135
-0
lines changed

oss/litellm/Dockerfile

Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
# Builds the LiteLLM proxy image: installs the Python requirements into a
# virtualenv and starts `litellm` listening on port 4000.
# NOTE(review): `latest-dev` is a moving tag; pin a version or digest if
# reproducible builds matter.
FROM cgr.dev/chainguard/python:latest-dev

# Package installation below runs as root.
# NOTE(review): the image never switches back to an unprivileged user, so the
# proxy process also runs as root - confirm this is intended.
USER root
WORKDIR /app

# The virtualenv lives under $HOME and is put first on PATH so the `litellm`
# console script used by ENTRYPOINT resolves without an absolute path.
ENV HOME=/home/litellm
ENV PATH="${HOME}/venv/bin:$PATH"

# Install build/runtime dependencies.
# `--no-cache` already fetches a fresh package index and keeps it out of the
# layer, so a separate `apk update` is unnecessary.
RUN apk add --no-cache gcc python3-dev openssl openssl-dev

RUN python -m venv ${HOME}/venv
RUN ${HOME}/venv/bin/pip install --no-cache-dir --upgrade pip

COPY requirements.txt .
# The cache mount requires BuildKit; it keeps pip's download cache between
# builds without storing it in an image layer.
RUN --mount=type=cache,target=${HOME}/.cache/pip \
    ${HOME}/venv/bin/pip install -r requirements.txt

EXPOSE 4000/tcp

# CMD supplies default arguments only; a Kubernetes `args` list replaces it.
ENTRYPOINT ["litellm"]
CMD ["--port", "4000"]

oss/litellm/combined.yaml

Lines changed: 108 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,108 @@
# LiteLLM proxy configuration. The `config.yaml` key is mounted into the proxy
# container as a single file by the Deployment in this manifest.
apiVersion: v1
kind: ConfigMap
metadata:
  name: litellm-config-file
data:
  config.yaml: |
    model_list:
      # The `openai/` prefix selects LiteLLM's OpenAI-compatible client; the
      # remainder of `model` is the model name sent to the backend.
      # NOTE(review): assumes both backends expose an OpenAI-compatible API.
      - model_name: DeepSeek-R1-Distill-Qwen-7B-GGUF
        litellm_params:
          model: openai/unsloth/DeepSeek-R1-Distill-Qwen-7B-GGUF
          # Base URL only: the client appends `/chat/completions` itself.
          api_base: http://llama-cpp-cpu-lb-2137543273.us-west-2.elb.amazonaws.com/v1
          api_key: os.environ/OPENAI_API_KEY
      - model_name: QwQ-32B
        litellm_params:
          model: openai/Qwen/QwQ-32B
          # NOTE(review): plain HTTP to a raw IP; the API key is sent
          # unencrypted - confirm this is acceptable.
          api_base: http://54.159.11.218:8080/v1
          api_key: os.environ/OPENAI_API_KEY
    general_settings:
      # Resolved from the environment at startup (see the litellm-secrets Secret).
      master_key: os.environ/LITELLM_MASTER_KEY
---
# Credentials exposed to the proxy container as environment variables.
# Entries under `data` are base64-encoded; entries under `stringData` are
# written as plain text.
# NOTE(review): the values below look like sample/placeholder credentials;
# replace them before applying and avoid committing real secrets.
apiVersion: v1
kind: Secret
metadata:
  name: litellm-secrets
type: Opaque
data:
  OPENAI_API_KEY: c2stMTIzNA==  # your api key in base64
  LITELLM_MASTER_KEY: c2stMTIzNA==  # master key in base64
stringData:
  # Placeholder connection string - fill in every <...> field.
  DATABASE_URL: 'postgresql://<user>:<password>@<host>:<port>/<dbname>'
---
# Runs the LiteLLM proxy with its configuration mounted from the
# litellm-config-file ConfigMap and credentials taken from litellm-secrets.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: litellm-deployment
  labels:
    app: litellm
spec:
  selector:
    matchLabels:
      app: litellm
  template:
    metadata:
      labels:
        app: litellm
    spec:
      # Schedule on arm64 nodes only. The nodeSelector is sufficient on its
      # own; an identical required nodeAffinity term would be redundant.
      nodeSelector:
        kubernetes.io/arch: arm64
      containers:
        - name: litellm
          image: 412381761882.dkr.ecr.us-west-2.amazonaws.com/litellm-proxy:latest  # it is recommended to fix a version generally
          # `args` replaces the image's CMD, so the port is repeated here.
          # Without `--config` the mounted file below is never loaded.
          args:
            - "--port"
            - "4000"
            - "--config"
            - "/app/proxy_server_config.yaml"
          ports:
            - containerPort: 4000
          volumeMounts:
            # subPath mounts just the one key as a file, not a directory.
            - name: config-volume
              mountPath: /app/proxy_server_config.yaml
              subPath: config.yaml
          envFrom:
            # Every key of the Secret becomes an environment variable.
            - secretRef:
                name: litellm-secrets
      volumes:
        - name: config-volume
          configMap:
            name: litellm-config-file
---
# Cluster-internal Service: forwards port 80 to port 4000 on pods labelled
# `app: litellm`.
apiVersion: v1
kind: Service
metadata:
  name: litellm-service
  labels:
    app: litellm
spec:
  type: ClusterIP
  selector:
    app: litellm
  ports:
    - protocol: TCP
      port: 80
      targetPort: 4000
---
# Routes all HTTP paths to litellm-service on port 80 through an
# internet-facing ALB that targets pod IPs directly.
# NOTE(review): the `kubernetes.io/ingress.class` annotation is deprecated in
# favour of `spec.ingressClassName`; consider migrating once an `alb`
# IngressClass is confirmed to exist in the cluster.
# NOTE(review): no TLS/listener annotations are set, so the proxy appears to be
# exposed publicly over plain HTTP - confirm this is intended.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: litellm-ingress
  annotations:
    kubernetes.io/ingress.class: alb
    alb.ingress.kubernetes.io/scheme: internet-facing
    alb.ingress.kubernetes.io/target-type: ip
spec:
  rules:
    - http:
        paths:
          - pathType: Prefix
            path: /
            backend:
              service:
                name: litellm-service
                port:
                  number: 80

oss/litellm/requirements.txt

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,4 @@
# Python packages installed into the image's virtualenv by the Dockerfile.

# Specify the litellm version you want to use
litellm[proxy]==1.57.3

# NOTE(review): the packages below are unpinned, so each image build may pick
# up different versions - consider pinning them.
prometheus_client
langfuse
prisma

0 commit comments

Comments
 (0)