first commit

2026-03-27 13:05:47 +00:00
commit 549f70b97a
4 changed files with 82 additions and 0 deletions
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -0,0 +1,27 @@
+services:
+  vllm-qwen:  # vLLM server for a local Qwen GGUF model, with AMD GPU devices passed through
+    build:
+      context: .
+      dockerfile: Dockerfile
+    container_name: vllm_qwen_08b
+    ports:
+      - "8000:8000"  # host:container
+    ipc: host  # share the host IPC namespace with the container
+    devices:
+      - "/dev/kfd:/dev/kfd"  # AMD GPU compute device node
+      - "/dev/dri:/dev/dri"  # GPU render device nodes
+    group_add:
+      - video
+      - render
+    volumes:
+      # Read-only mount of the model directory
+      - /opt/models:/app/models:ro
+    environment:
+      - HSA_OVERRIDE_GFX_VERSION=11.0.0  # presumably targets gfx1100; confirm for your GPU
+      - HIP_VISIBLE_DEVICES=0  # restrict HIP to GPU index 0
+    command: >-  # folded into one line of flags; executable presumably set by the image ENTRYPOINT
+      --model /app/models/Qwen3.5-0.8B-UD-Q8_K_XL.gguf
+      --quantization gguf
+      --gpu-memory-utilization 0.50
+      --max-model-len 4096
+    restart: unless-stopped