From 56077b6fe019377be72897cd6f138c26c7318f92 Mon Sep 17 00:00:00 2001
From: Luca Sacchi Ricciardi
Date: Fri, 27 Mar 2026 14:54:17 +0000
Subject: [PATCH] added .env env-example, refactored docker-compose

---

Notes:
    Review notes only; this section is not part of the commit message.
    - .env and env-example are added with identical contents (same blob
      e70911e): SERVER_PORT=8000 and MODEL_FILENAME.
    - docker-compose.yml: the service qwen-08b is renamed to llamacpp-server,
      and the hard-coded port and model file name are replaced by
      ${SERVER_PORT} and ${MODEL_FILENAME}.
    - The models volume source moves from /opt/models to ./models.
    - The two comments explaining -ngl 99 and --host 0.0.0.0 are removed.

 .env               |  5 +++++
 docker-compose.yml | 14 ++++++--------
 env-example        |  5 +++++
 3 files changed, 16 insertions(+), 8 deletions(-)
 create mode 100644 .env
 create mode 100644 env-example

diff --git a/.env b/.env
new file mode 100644
index 0000000..e70911e
--- /dev/null
+++ b/.env
@@ -0,0 +1,5 @@
+# Porta esposta sull'host e usata internamente dal server
+SERVER_PORT=8000
+
+# Nome esatto del file GGUF presente nella cartella ./models
+MODEL_FILENAME=Qwen3.5-0.8B-UD-Q8_K_XL.gguf
diff --git a/docker-compose.yml b/docker-compose.yml
index 98d16b9..40f0be6 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -1,20 +1,18 @@
 services:
-  qwen-08b:
+  llamacpp-server:
     build: .
-    container_name: qwen_08b_server
+    container_name: llamacpp_${SERVER_PORT}
     ports:
-      - "8000:8000"
+      - "${SERVER_PORT}:${SERVER_PORT}"
     devices:
       - /dev/kfd:/dev/kfd
       - /dev/dri:/dev/dri
     volumes:
-      - /opt/models:/models
-    # -ngl 99 offloada tutti i layer sulla GPU AMD
-    # --host 0.0.0.0 lo rende accessibile fuori dal container
+      - ./models:/models
     command: >
-      -m /models/Qwen3.5-0.8B-UD-Q8_K_XL.gguf
+      -m /models/${MODEL_FILENAME}
       --host 0.0.0.0
-      --port 8000
+      --port ${SERVER_PORT}
       -ngl 99
       -c 4096
     restart: unless-stopped
diff --git a/env-example b/env-example
new file mode 100644
index 0000000..e70911e
--- /dev/null
+++ b/env-example
@@ -0,0 +1,5 @@
+# Porta esposta sull'host e usata internamente dal server
+SERVER_PORT=8000
+
+# Nome esatto del file GGUF presente nella cartella ./models
+MODEL_FILENAME=Qwen3.5-0.8B-UD-Q8_K_XL.gguf