File tree Expand file tree Collapse file tree 3 files changed +78
-0
lines changed
Expand file tree Collapse file tree 3 files changed +78
-0
# Paths listed here are excluded from the Docker build context, so
# `COPY . /app` in the Dockerfile never sees them.

# General Ignore
.git
.github
.vscode
.dockerignore
.gitignore
README.md
Dockerfile
docker-compose.yaml

# Unique to distributed-llama
report
docs
examples
# Model files are supplied at runtime through the ./models:/models bind mount
# in docker-compose.yaml rather than being copied into the image.
models
# Image that compiles the `dllama` and `dllama-api` binaries from the
# repository sources and runs `./dllama` by default.
FROM debian:bookworm-slim

# Build toolchain for `make`.
# --no-install-recommends keeps the layer small; ca-certificates is listed
# explicitly because it would otherwise only arrive as a recommended package,
# and git needs it to talk to HTTPS remotes.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        git \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /app

# Copy the build context (minus whatever .dockerignore excludes) and compile
# both targets.
COPY . /app
RUN make dllama && make dllama-api

# Default ports for root node + worker node
EXPOSE 5000
EXPOSE 9999

# Exec form; compose services override this with their own `command`.
CMD ["./dllama"]
# Local distributed-llama cluster: one root node (./dllama-api) and three
# worker nodes (./dllama worker), all attached to the same bridge network.

# Shared worker definition, reused by each worker service through a YAML
# anchor and merge key. Top-level keys starting with `x-` are ignored by
# Compose itself.
x-worker: &worker
  build: .
  networks:
    - llama-net
  command: ./dllama worker --port 9999 --nthreads 2

services:
  root:
    build: .
    networks:
      - llama-net
    volumes:
      # Model and tokenizer files referenced by --model / --tokenizer below.
      - ./models:/models
    # depends_on only orders container start-up; it does not wait for the
    # workers to be listening.
    depends_on:
      - worker1
      - worker2
      - worker3
    ports:
      - "5000:5000"
    # NOTE(review): presumably here so the root retries when it starts before
    # the workers accept connections - confirm.
    restart: on-failure
    command: >-
      ./dllama-api
      --model /models/dllama_model_llama3.2-1b-instruct_q40.m
      --tokenizer /models/dllama_tokenizer_llama3_2.t
      --buffer-float-type q80 --nthreads 2 --port 5000
      --workers worker1:9999 worker2:9999 worker3:9999

  worker1:
    <<: *worker
    # NOTE(review): only worker1 publishes its port to the host; the root
    # reaches workers by service name on llama-net, so this looks optional -
    # confirm whether external access to worker1 is intended.
    ports:
      - "9999:9999"

  worker2:
    <<: *worker

  worker3:
    <<: *worker

networks:
  llama-net:
    driver: bridge
You can’t perform that action at this time.
0 commit comments