File tree Expand file tree Collapse file tree 3 files changed +78
-0
lines changed Expand file tree Collapse file tree 3 files changed +78
-0
lines changed Original file line number Diff line number Diff line change
# Repository and editor metadata
.git
.github
.gitignore
.vscode

# Docker build files and top-level README
.dockerignore
Dockerfile
docker-compose.yaml
README.md

# Directories specific to distributed-llama that are kept out of the build context
report
docs
examples
models
Original file line number Diff line number Diff line change
# Image that compiles the dllama and dllama-api targets from the repository
# sources on top of a slim Debian base.
FROM debian:bookworm-slim

# Build toolchain and utilities.
# --no-install-recommends keeps optional packages out of the layer;
# ca-certificates is listed explicitly because it would otherwise only arrive
# as a recommended package of git. The apt package lists are removed in the
# same RUN so they do not persist in the image layer.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential ca-certificates dnsutils git \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /app

# Copy the build context (filtered by .dockerignore) and compile both targets.
COPY . /app
RUN make dllama && make dllama-api

# Default ports for root node + worker node
EXPOSE 5000
EXPOSE 9999

# Default command; docker-compose.yaml overrides it per service.
CMD ["./dllama"]
Original file line number Diff line number Diff line change
# One root node running dllama-api plus three worker nodes. Every service is
# built from the Dockerfile in this directory and attached to the llama-net
# bridge network.
services:
  root:
    build: .
    networks:
      - llama-net
    volumes:
      # The model and tokenizer paths passed below live under this mount.
      - ./models:/models
    # depends_on only orders container start-up.
    # NOTE(review): restart: on-failure presumably covers the case where the
    # workers are not yet accepting connections when root starts - confirm.
    depends_on:
      - worker1
      - worker2
      - worker3
    ports:
      # Only the API port is published on the host.
      - "5000:5000"
    restart: on-failure
    command: >-
      ./dllama-api
      --model /models/dllama_model_llama3.2-1b-instruct_q40.m
      --tokenizer /models/dllama_tokenizer_llama3_2.t
      --buffer-float-type q80 --nthreads 2 --port 5000
      --workers worker1:9999 worker2:9999 worker3:9999

  # Workers are addressed by the root as <service>:9999 over llama-net, so no
  # host port is published for them.
  worker1:
    build: .
    networks:
      - llama-net
    command: >-
      ./dllama worker --port 9999 --nthreads 2

  worker2:
    build: .
    networks:
      - llama-net
    command: >-
      ./dllama worker --port 9999 --nthreads 2

  worker3:
    build: .
    networks:
      - llama-net
    command: >-
      ./dllama worker --port 9999 --nthreads 2

networks:
  llama-net:
    driver: bridge
You can’t perform that action at this time.
0 commit comments