-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdocker-compose.yaml
More file actions
33 lines (32 loc) · 1005 Bytes
/
docker-compose.yaml
File metadata and controls
33 lines (32 loc) · 1005 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
# Single-service stack: runs the ktransformers web server with NVIDIA GPU access.
services:
  ktransformers:
    image: registry.cn-hangzhou.aliyuncs.com/joybo/ktransformers:v2025.04.13-action-web
    container_name: ktransformers
    hostname: ktransformers
    environment:
      - TZ=Asia/Shanghai
      # In list form Compose keeps any quotes written after `=` as part of the
      # value, so the entry as a whole is quoted and the value is left bare.
      - "COMMANDLINE_ARGS=--share --listen"
      # - NVIDIA_VISIBLE_DEVICES=0
    volumes:
      # Host directories next to this file, mounted at the paths that
      # --gguf_path and --model_path in the entrypoint point to.
      - ./DeepSeek-V2-Lite-Chat-GGUF:/model/DeepSeek-V2-Lite-Chat-GGUF
      - ./DeepSeek-V2-Lite-Chat:/model/DeepSeek-V2-Lite-Chat
    ports:
      # Publishes the port given to --port in the entrypoint.
      - "8080:8080"
    runtime: nvidia
    deploy:
      resources:
        reservations:
          devices:
            # Neither `count` nor `device_ids` is set, which per the Compose
            # GPU docs reserves every GPU on the host; uncomment `device_ids`
            # to pin specific GPUs.
            - driver: nvidia
              # device_ids: ['0']
              capabilities: [gpu]
    stdin_open: true
    tty: true
    # Quoted on purpose: a bare `no` is a YAML 1.1 boolean, while Compose
    # expects the string "no" (never restart automatically).
    restart: "no"
    networks:
      - ktransformers
    # Replaces the image's entrypoint; one argv element per line.
    entrypoint:
      - "ktransformers"
      - "--model_path=/model/DeepSeek-V2-Lite-Chat"
      - "--gguf_path=/model/DeepSeek-V2-Lite-Chat-GGUF"
      - "--port=8080"
      - "--web=True"
      - "--host=0.0.0.0"
      - "--force_think"
# Project network that the ktransformers service attaches to.
networks:
  ktransformers:
    # Explicit name, so the network is not prefixed with the project name.
    name: ktransformers
    driver: bridge