Files
llamacpp-qwen3.5-0.8b/docker-compose.yml
Luca Sacchi Ricciardi f20f6571c2 project refactored
2026-03-27 14:27:12 +00:00

21 lines
476 B
YAML

# Compose definition for a single model-server container.
# The image is built from the Dockerfile in this directory. `command` below
# supplies only arguments, so the image presumably sets the server binary as
# its ENTRYPOINT — confirm against the Dockerfile.
services:
  qwen-08b:
    build: .
    container_name: qwen_08b_server
    ports:
      # host:container; kept quoted so YAML always reads it as a string
      - "8000:8000"
    devices:
      # GPU device nodes passed through from the host
      - /dev/kfd:/dev/kfd
      - /dev/dri:/dev/dri
    volumes:
      # Host model directory, mounted at /models inside the container
      - /opt/models:/models
    # -ngl 99 offloads all layers to the AMD GPU
    # --host 0.0.0.0 makes the server reachable from outside the container
    # --port 8000 must match the container side of the port mapping above
    # NOTE(review): the model filename says qwen1_5 — confirm it matches the
    # file actually present under /opt/models on the host.
    # `>-` folds the lines below into one space-separated argument string
    # without a trailing newline.
    command: >-
      -m /models/qwen1_5-0_8b-chat-q8_0.gguf
      --host 0.0.0.0
      --port 8000
      -ngl 99
      -c 4096
    restart: unless-stopped