forked from yachty66/demo-stablecode-instruct-alpha-3b-gptq
-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathDockerfile
More file actions
27 lines (18 loc) · 690 Bytes
/
Dockerfile
File metadata and controls
27 lines (18 loc) · 690 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# Base image: must provide a CUDA 11+ runtime.
FROM pytorch/pytorch:1.11.0-cuda11.3-cudnn8-runtime
WORKDIR /

# Install git and wget. wget is used further down to fetch the AutoGPTQ wheel;
# git is presumably needed by pip for VCS-style requirements (confirm against
# requirements.txt). ca-certificates is listed explicitly because
# --no-install-recommends no longer pulls it in implicitly and HTTPS downloads
# depend on it. The apt package lists are removed in the same layer so they do
# not end up in the image.
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        ca-certificates \
        git \
        wget && \
    rm -rf /var/lib/apt/lists/*

# Upgrade pip; --no-cache-dir keeps pip's download cache out of the layer.
RUN pip install --no-cache-dir --upgrade pip
# Download and install a specific AutoGPTQ release wheel (v0.3.2) from GitHub.
# NOTE(review): the wheel filename is tagged cu117/cp38 while the base image
# tag says cuda11.3 -- confirm the two are compatible.
# GITHUB_ACTIONS=true is set only for the pip invocation (kept from the
# original; presumably read by the package's installer -- verify it is needed).
# The wheel file is deleted in the same layer so it is not shipped in the image.
RUN whl="auto_gptq-0.3.2+cu117-cp38-cp38-linux_x86_64.whl" && \
    wget "https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.3.2/${whl}" && \
    GITHUB_ACTIONS=true pip3 install --no-cache-dir "${whl}" && \
    rm "${whl}"

# Copy only the dependency manifest before installing, so this layer stays
# cached until requirements.txt itself changes. COPY is used instead of ADD
# because this is a plain local file copy.
COPY requirements.txt requirements.txt
RUN pip3 install --no-cache-dir -r requirements.txt
# Add your model weight files: download.py is run at build time (it is expected
# to fetch the weights so they are baked into the image -- confirm in the
# script). It is copied on its own so this layer is reused until the script
# changes.
COPY download.py .
RUN python3 download.py

# Copy the rest of the build context into the working directory.
# COPY is used instead of ADD because these are plain local copies.
COPY . .

# Documents the port the container is expected to serve on; EXPOSE does not
# publish the port by itself.
EXPOSE 8000

# Exec (JSON-array) form: python3 is started directly rather than as a child
# of `/bin/sh -c`, so it receives stop signals itself. -u keeps stdout/stderr
# unbuffered so logs appear immediately.
CMD ["python3", "-u", "app.py"]