# Patch for docker-compose.yml (service whose container_name is llama-cpp-qwen).
#
# What this patch changes:
#   * `command` moves from a YAML list (one argument per item) to a single
#     folded block scalar that holds the whole argument string.
#   * The model and mmproj paths move from /models/qwen-3.5-0.8b/ to
#     /models/qwen/, and the model file changes from
#     Qwen3.5-0.8B-UD-Q2_K_XL.gguf to Qwen3.5-0.8B-UD-Q8_K_XL.gguf.
#   * Sampling flags: --temp 0.7 -> 0.6 and --top-p 0.8 -> 1.00.
#     --host, --port, --ctx-size, --top-k and --min-p keep their values.
#   * New flags: --presence-penalty 2.0, --repeat-penalty 1.0 and
#     --chat-template-kwargs '{"enable_thinking":false}'.
#
# Review notes:
#   * The port mapping is deliberately left as the quoted string "8000:8000"
#     (now a context line). Compose port mappings should stay quoted so a YAML
#     parser can never re-type them.
#   * The folded scalar uses `>-` so the argument string does not end with a
#     trailing newline.
#   * NOTE(review): leading whitespace inside the hunk was reconstructed
#     assuming 4-space service keys and 6-space list items; confirm against
#     the target file before applying.
#   * NOTE(review): the post-image blob id on the index line predates this
#     revision of the patch; regenerate it with `git diff` if it matters.
diff --git a/docker-compose.yml b/docker-compose.yml
index 938f9fe..f84046d 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -4,26 +4,18 @@ services:
     container_name: llama-cpp-qwen
     restart: unless-stopped
     ports:
       - "8000:8000"
     volumes:
       - ./models:/models
-    command:
-      - -m
-      - /models/qwen-3.5-0.8b/Qwen3.5-0.8B-UD-Q2_K_XL.gguf
-      - --mmproj
-      - /models/qwen-3.5-0.8b/mmproj-F16.gguf
-      - --host
-      - 0.0.0.0
-      - --port
-      - "8000"
-      - --ctx-size
-      - "16384"
-      - --temp
-      - "0.7"
-      - --top-p
-      - "0.8"
-      - --top-k
-      - "20"
-      - --min-p
-      - "0.00"
-
+    command: >-
+      -m /models/qwen/Qwen3.5-0.8B-UD-Q8_K_XL.gguf
+      --mmproj /models/qwen/mmproj-F16.gguf
+      --host 0.0.0.0 --port "8000"
+      --ctx-size "16384"
+      --temp "0.6"
+      --top-p "1.00"
+      --top-k "20"
+      --min-p "0.00"
+      --presence-penalty 2.0
+      --repeat-penalty 1.0
+      --chat-template-kwargs '{"enable_thinking":false}'