Switch the served model from qwen2.5-0.5b-instruct-q4_k_m to qwen3.5-9B-Q5.

docker-compose.yml: point -m at the new model file, raise --ctx-size from
4096 to 16384, drop the explicit --threads setting, and pass --temp, --top-p,
--top-k and --min-p on the command line.

download-model.sh: fetch Qwen3.5-9B-Q5_K_M.gguf and save it as
./models/qwen3.5-9B-Q5.gguf, which is the file name the compose command loads
through the ./models:/models mount. curl runs with -f so that an HTTP error
aborts the download instead of being written to disk as the model file.

NOTE(review): the leading whitespace of the YAML lines was reconstructed
assuming 2-space nesting, and the blob ids on the "index" lines were carried
over unchanged; regenerate this patch with `git diff` before applying it.

diff --git a/docker-compose.yml b/docker-compose.yml
index c3ddd56..3ebe067 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -9,12 +9,18 @@ services:
       - ./models:/models
     command:
       - -m
-      - /models/qwen2.5-0.5b-instruct-q4_k_m.gguf
+      - /models/qwen3.5-9B-Q5.gguf
       - --host
       - 0.0.0.0
       - --port
       - "8000"
       - --ctx-size
-      - "4096"
-      - --threads
-      - "4"
\ No newline at end of file
+      - "16384"
+      - --temp
+      - "0.7"
+      - --top-p
+      - "0.8"
+      - --top-k
+      - "20"
+      - --min-p
+      - "0.00"
diff --git a/download-model.sh b/download-model.sh
index 7234332..69d14c4 100644
--- a/download-model.sh
+++ b/download-model.sh
@@ -1,2 +1,2 @@
 mkdir -p models
-curl -L -o ./models/qwen2.5-0.5b-instruct-q4_k_m.gguf https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct-GGUF/resolve/main/qwen2.5-0.5b-instruct-q4_k_m.gguf
\ No newline at end of file
+curl -fL -o ./models/qwen3.5-9B-Q5.gguf https://huggingface.co/unsloth/Qwen3.5-9B-GGUF/resolve/main/Qwen3.5-9B-Q5_K_M.gguf