-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdocker-compose.yml
108 lines (104 loc) · 2.8 KB
/
docker-compose.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
version: '3.8'
services:
vllm-openai:
container_name: waifuassistant_vllm
image: vllm/vllm-openai:v0.5.5
runtime: nvidia
environment:
- NVIDIA_VISIBLE_DEVICES=1
- OMP_NUM_THREADS=8
volumes:
- /data2/model_weights/LLM/:/app/models_zoo/
- /data/huggingface_cache/huggingface:/root/.cache/huggingface
ipc: host
ports:
- "8200:8200"
command: [
"--model", "/app/models_zoo/spow12/ChatWaifu_v1.5_stock",
"--dtype", "bfloat16",
"--api-key", "token-abc123",
"--max-seq-len-to-capture", "128000",
"--max_model_len", "32768",
"--tensor-parallel-size", "1",
"--disable-frontend-multiprocessing",
"--served-model-name", "chat_model",
"--port", "8200"
]
backend:
container_name: waifuassistant_backend
build:
context: ./backend-api
dockerfile: Dockerfile
ports:
- "8201:8201"
volumes:
- ./backend-api:/app
environment:
- PYTHONUNBUFFERED=1
- NVIDIA_VISIBLE_DEVICES=1
command: ["uvicorn", "WaifuChat.app:app", "--host", "0.0.0.0", "--port", "8201"]
tts:
container_name: waifuassistant_tts
build:
context: ./tts-api
dockerfile: Dockerfile
volumes:
- ./tts-api:/app
ports:
- "7860:7860"
environment:
- NVIDIA_VISIBLE_DEVICES=0
deploy:
resources:
reservations:
devices:
- driver: nvidia
count: 0
capabilities: [gpu]
command: ["python", "server_editor.py", "--line_length", "200", "--line_count", "6", "--skip_static_files", "--skip_default_models", "--port", "7860"]
asr:
image: fedirz/faster-whisper-server:latest-cuda
container_name: waifuassistant_asr
runtime: nvidia
environment:
- NVIDIA_VISIBLE_DEVICES=0
- OPENAI_API_KEY=token-abc123
deploy:
resources:
reservations:
devices:
- driver: nvidia
count: 0
capabilities: [gpu]
ports:
- "8202:8000"
expose:
- 8202
volumes:
- /data/huggingface_cache/huggingface:/root/.cache/huggingface
mongodb:
image: mongo:5.0.14
container_name: waifuassistant_mongodb
restart: always
ports:
- 27017:27017
expose:
- 27017
volumes:
- /data2/datas/db/visual_novel/mongodb:/data/db
environment:
- MONGO_INITDB_ROOT_USERNAME=root
- MONGO_INITDB_ROOT_PASSWORD=1234
- MONGO_INITDB_DATABASE=visual_novel_db
mongo-express:
image: mongo-express:latest
container_name: waifuassistant_mongo-express
restart: always
ports:
- 8081:8081
expose:
- 8081
environment:
ME_CONFIG_MONGODB_ADMINUSERNAME: root
ME_CONFIG_MONGODB_ADMINPASSWORD: 1234
ME_CONFIG_MONGODB_URL: mongodb://root:1234@mongodb:27017