# docker-compose.yaml
---
# Jlama cluster: one coordinator plus a replicated pool of workers, all running
# the same `jlama` image against the same model identifier.
#
# The top-level `version` key is intentionally omitted. Current Docker Compose
# ignores it (and warns that it is obsolete), and the legacy v3 schema it named
# did not accept the long-form `depends_on: condition:` syntax used by the
# worker service below.

services:
  # Coordinator: publishes port 8080 on the host and is the address the workers
  # are pointed at through their `--coordinator` argument.
  jlama-coordinator:
    image: jlama
    restart: always
    container_name: jlama-coordinator
    ports:
      - "8080:8080"
    environment:
      JLAMA_JVM_ARGS_EXTRA: "-Xmx1g -Djava.net.preferIPv4Stack=true"
    deploy:
      resources:
        limits:
          # NOTE(review): the JVM max heap (-Xmx1g) equals this container
          # limit, leaving no headroom for non-heap JVM memory; consider
          # raising the limit or lowering -Xmx.
          memory: 1g
          cpus: "1"
    command:
      - cluster-coordinator
      - "--threads=2"
      # Presumably must match `deploy.replicas` of jlama-worker (8) - confirm.
      - "--worker-count=8"
      - tjake/Mistral-7B-Instruct-v0.3-jlama-Q4
    volumes:
      - "./models:/models"
    # Gates worker start-up (workers wait for `service_healthy`).
    # The probe runs `curl` inside the container, so the image must ship it.
    healthcheck:
      test: ["CMD", "curl", "-f", "http://localhost:8080/ui/index.html"]
      interval: 5s
      timeout: 5s
      retries: 5
      # Failures during the start period do not count towards `retries`, so a
      # slow first start is not reported as unhealthy; the service still turns
      # healthy as soon as one probe succeeds.
      # NOTE(review): 5m is a guess sized for a slow model load - tune.
      start_period: 5m

  # Workers: eight replicas, started only once the coordinator is healthy.
  # No `container_name` is set, which is required for a replicated service.
  jlama-worker:
    image: jlama
    restart: always
    depends_on:
      jlama-coordinator:
        condition: service_healthy
    environment:
      JLAMA_JVM_ARGS_EXTRA: "-Xmx500M -Djava.net.preferIPv4Stack=true -Djlama.use_hostname_as_workerid=true"
    deploy:
      mode: replicated
      replicas: 8
      resources:
        limits:
          cpus: "1"
          # NOTE(review): the JVM max heap (-Xmx500M) equals this container
          # limit, leaving no headroom for non-heap JVM memory; consider
          # raising the limit or lowering -Xmx.
          memory: 500m
    command:
      - cluster-worker
      - "--threads=1"
      # Resolved through the Compose network by service name.
      - "--coordinator=jlama-coordinator"
      - tjake/Mistral-7B-Instruct-v0.3-jlama-Q4
    volumes:
      - "./models:/models"