-
Notifications
You must be signed in to change notification settings - Fork 0
/
docker-compose.cuda.yaml
52 lines (48 loc) · 1.18 KB
/
docker-compose.cuda.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
---
# Docker Compose definition (docker-compose.cuda.yaml) running the Open WebUI
# image and the Open WebUI Pipelines image, both with CUDA tags and a GPU
# device reservation.

services:
  open-webui:
    image: ghcr.io/open-webui/open-webui:v0.3.5-cuda
    environment:
      - ENV=PROD
      - ENABLE_COMMUNITY_SHARING=False
      - USE_CUDA_DOCKER=True
      - GLOBAL_LOG_LEVEL=INFO
    ports:
      # Host port 3030 -> container port 8080.
      - "3030:8080"
    extra_hosts:
      # Lets the container reach the Docker host as host.docker.internal.
      - "host.docker.internal:host-gateway"
    volumes:
      # Named volume (declared at the bottom of this file).
      - open-webui:/app/backend/data
    # Quoted on purpose: a bare `no` is read as boolean false by YAML 1.1
    # loaders, while the restart policy must be the string "no".
    restart: "no"
    deploy:
      resources:
        reservations:
          devices:
            # Reserve every device that offers the `gpu` capability.
            - capabilities: [gpu]
              count: all

  pipelines:
    # NOTE(review): `cuda` looks like a floating tag, unlike the pinned
    # v0.3.5-cuda tag used for open-webui; consider pinning a version.
    image: ghcr.io/open-webui/pipelines:cuda
    environment:
      # Refers to the same in-container path as the first bind mount below.
      - PIPELINES_URLS=file:///app/pipelines/llama_index_retrieval_pipeline.py
    ports:
      - "9099:9099"
    extra_hosts:
      # Lets the container reach the Docker host as host.docker.internal.
      - "host.docker.internal:host-gateway"
    volumes:
      - type: bind
        source: ./pipelines/llama_index_retrieval_pipeline.py
        target: /app/pipelines/llama_index_retrieval_pipeline.py
      - type: bind
        source: ./persist
        target: /app/persist
      # NOTE(review): this named volume is mounted at the parent directory of
      # the bind-mounted pipeline file above; confirm both mounts resolve as
      # intended.
      - pipelines:/app/pipelines
    # Quoted on purpose: a bare `no` is read as boolean false by YAML 1.1
    # loaders, while the restart policy must be the string "no".
    restart: "no"
    deploy:
      resources:
        reservations:
          devices:
            # Reserve every device that offers the `gpu` capability.
            - capabilities: [gpu]
              count: all

volumes:
  open-webui:
  pipelines:
  # NOTE(review): no service in this file mounts `datastore`; confirm whether
  # another compose file relies on it before removing.
  datastore: