added README
This commit is contained in:
@@ -22,6 +22,6 @@ services:
|
||||
command: >
|
||||
--model /app/models/Qwen3.5-0.8B-UD-Q8_K_XL.gguf
|
||||
--quantization gguf
|
||||
--gpu-memory-utilization 0.50
|
||||
--max-model-len 4096
|
||||
--gpu-memory-utilization 0.06
|
||||
--max-model-len 32768
|
||||
restart: unless-stopped
|
||||
|
||||
Reference in New Issue
Block a user