# docker-compose.yml
---
# Local development stack: two Ollama servers (embedding + chat), a
# Postgres instance built from the pgvecto.rs image, and the application
# container, which starts only after all three report healthy.

services:
  # Ollama server used for embeddings. Configured identically to
  # `ollama-chat` below and sharing the same model/config volumes.
  # NOTE(review): presumably split into two services so each keeps its
  # own model resident - confirm.
  ollama-embedding:
    image: ollama/ollama:0.1.32-rocm
    # image: ollama/ollama:0.1.32  # for nvidia
    environment:
      # Quoted so YAML keeps these as strings.
      OLLAMA_HOST: "0.0.0.0:11434"
      OLLAMA_MODELS: /var/lib/ollama/models
      OLLAMA_KEEP_ALIVE: "-1"  # do not unload models
    volumes:
      - ollama-models:/var/lib/ollama/models
      - ollama-config:/root/.ollama  # stores private key
    # GPU access for ROCm (AMD)
    devices:
      - /dev/dri:/dev/dri
      - /dev/kfd:/dev/kfd
    # GPU access for CUDA (NVIDIA) - untested
    # deploy:
    #   resources:
    #     reservations:
    #       devices:
    #         - driver: nvidia
    #           count: 1
    #           capabilities: [gpu]
    #
    # ports:
    #   - "11434:11434"
    healthcheck:
      # `ollama list` queries the API server, so the check passes only
      # once the server is answering requests. `ollama --version` merely
      # prints a warning when the server is unreachable, which would let
      # dependants start too early.
      test: "ollama list || exit 1"
      interval: 5s
      timeout: 1s
      retries: 10
      start_period: 10s

  # Ollama server used for chat. Keep in sync with `ollama-embedding`.
  ollama-chat:
    image: ollama/ollama:0.1.32-rocm
    # image: ollama/ollama:0.1.32  # for nvidia
    environment:
      # Quoted so YAML keeps these as strings.
      OLLAMA_HOST: "0.0.0.0:11434"
      OLLAMA_MODELS: /var/lib/ollama/models
      OLLAMA_KEEP_ALIVE: "-1"  # do not unload models
    volumes:
      - ollama-models:/var/lib/ollama/models
      - ollama-config:/root/.ollama  # stores private key
    # GPU access for ROCm (AMD)
    devices:
      - /dev/dri:/dev/dri
      - /dev/kfd:/dev/kfd
    # GPU access for CUDA (NVIDIA) - untested
    # deploy:
    #   resources:
    #     reservations:
    #       devices:
    #         - driver: nvidia
    #           count: 1
    #           capabilities: [gpu]
    #
    # ports:
    #   - "11434:11434"
    healthcheck:
      # See `ollama-embedding`: `ollama list` needs a responding server.
      test: "ollama list || exit 1"
      interval: 5s
      timeout: 1s
      retries: 10
      start_period: 10s

  # Postgres 16 with the pgvecto.rs extension image.
  postgres:
    image: tensorchord/pgvecto-rs:pg16-v0.2.1
    environment:
      # Development-only credentials committed in plain text; do not
      # reuse them outside a local environment.
      POSTGRES_DB: mydb
      POSTGRES_USER: myuser
      POSTGRES_PASSWORD: mypassword
    volumes:
      - postgres-data:/var/lib/postgresql/data
    ports:
      # Always quote HOST:CONTAINER mappings so YAML never reads them as
      # a number.
      - "5432:5432"
    healthcheck:
      # User and database must match POSTGRES_USER / POSTGRES_DB above.
      test: "pg_isready -U myuser -d mydb"
      interval: 5s
      timeout: 1s
      retries: 10
      start_period: 10s

  # Application container, built from the Dockerfile in this directory
  # with the working tree bind-mounted at /workspace.
  app:
    build: .
    volumes:
      - .:/workspace
    # Start only after every backing service passes its healthcheck.
    depends_on:
      ollama-embedding:
        condition: service_healthy
      ollama-chat:
        condition: service_healthy
      postgres:
        condition: service_healthy

# Named volumes with default driver settings.
volumes:
  ollama-models: {}
  ollama-config: {}
  postgres-data: {}