# docker-compose-multigpu.yaml
version: '3.7'
# Settings and configurations that are common for all containers
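# Interpolated variables (cudaversion, llmport, DATADIR, CONFIG, MODELS) must
# be supplied via the shell environment or an .env file next to this file.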
services:
  everythingdata:
    container_name: everythingdata
    user: root
    image: dansknaw/everythingdata:devel-${cudaversion}
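    # Pin this service to a specific NVIDIA GPU. device_ids: ['1'] selects the
    # second GPU (IDs are zero-indexed); this requires the NVIDIA Container
    # Toolkit on the host.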
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              capabilities: [gpu]
              device_ids: ['1']
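    # Variables listed without a value (e.g. "TOKEN") are passed through from
    # the shell environment or .env file at `docker compose up` time.
    # PYTORCH_CUDA_ALLOC_CONF caps the CUDA allocator's split-block size to
    # reduce memory fragmentation on long-running inference workloads.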
    environment:
      - "TEST"
      - "TOKEN"
      - "DATAPATH"
      - "MIN_SENTENCE_SIZE"
      - "CONFIG"
      - "CONFIGFILE"
      - "MODEL"
      - "LLAMAMODEL"
      - "DIDAPI"
      - "NERAPI"
      - "LLMRAMAPI"
      - "LLMAPI"
      - "GRAPHDIR"
      - "TRANSLATOR"
      - "MAX_WORKERS"
      - "WEB_CONCURRENCY"
      - "--n_samples=1" # looks like a CLI flag rather than a valid shell env var name
      - PYTORCH_CUDA_ALLOC_CONF=max_split_size_mb:512
      - "OLLAMA_API"
      - "DEBUG=1234567801"
    ports:
      - "${llmport}:8000"
    command: uvicorn main:app --host 0.0.0.0 --port 8000
    volumes:
      - ${DATADIR}:/data
      - ${CONFIG}:/app/config/prompts.ini
      - ${MODELS}:/root/.cache/huggingface
      - ./app/app.py:/app/main.py
      - ./app/llmframe.py:/app/llmframe.py
      - ./app/localconfig.py:/app/localconfig.py
      # - ./config/prompts.ini:/app/config/prompts.ini
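  # Ollama backend for local LLM inference; model blobs persist on the host
  # under ./ollama-docker/ollama/ollama, and 11434 is Ollama's default API port.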
  llama:
    volumes:
      - ./ollama-docker/ollama/ollama:/root/.ollama
    container_name: ollama
    pull_policy: always
    tty: true
    restart: unless-stopped
    image: ollama/ollama:latest
    ports:
      - 11434:11434
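    # Note: this reserves the same GPU ('1') as everythingdata; change
    # device_ids here if you want each service on its own GPU.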
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              capabilities: [gpu]
              device_ids: ['1']
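# Example invocation (a sketch, assuming the interpolated variables above are
# set):
#   docker compose -f docker-compose-multigpu.yaml up -d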