From 100445ee54cd4a739ccfa0b66329c914ac27aa80 Mon Sep 17 00:00:00 2001
From: Lenoctambule <106790775+lenoctambule@users.noreply.github.com>
Date: Mon, 9 Mar 2026 21:56:05 +0100
Subject: [PATCH] init: first commit

---
Review note: file contents were revised after the original commit (trailing
newlines, explanatory comments, shebang, `set -eu`, `curl --fail`). The blob
ids on the `index` lines below were carried over and not recomputed.

 .gitignore         |  1 +
 docker-compose.yml | 23 +++++++++++++++++++++++
 download-model.sh  |  7 +++++++
 3 files changed, 31 insertions(+)
 create mode 100644 .gitignore
 create mode 100644 docker-compose.yml
 create mode 100644 download-model.sh

diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..d6d95cf
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1 @@
+models
diff --git a/docker-compose.yml b/docker-compose.yml
new file mode 100644
index 0000000..c3ddd56
--- /dev/null
+++ b/docker-compose.yml
@@ -0,0 +1,23 @@
+# Runs the llama.cpp server image against the model fetched by download-model.sh.
+services:
+  llama-cpp:
+    image: ghcr.io/ggml-org/llama.cpp:server
+    container_name: llama-cpp-qwen
+    restart: unless-stopped
+    ports:
+      # host:container; the container side must match --port below.
+      - "8000:8000"
+    volumes:
+      # ./models is created and filled by download-model.sh.
+      - ./models:/models
+    command:
+      - -m
+      - /models/qwen2.5-0.5b-instruct-q4_k_m.gguf
+      - --host
+      - 0.0.0.0
+      - --port
+      - "8000"
+      - --ctx-size
+      - "4096"
+      - --threads
+      - "4"
diff --git a/download-model.sh b/download-model.sh
new file mode 100644
index 0000000..7234332
--- /dev/null
+++ b/download-model.sh
@@ -0,0 +1,7 @@
+#!/bin/sh
+# Downloads the model file that docker-compose.yml expects under ./models.
+set -eu
+mkdir -p models
+# --fail makes curl exit non-zero on an HTTP error instead of saving the
+# server's error page as the .gguf file; -L follows redirects.
+curl --fail -L -o ./models/qwen2.5-0.5b-instruct-q4_k_m.gguf https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct-GGUF/resolve/main/qwen2.5-0.5b-instruct-q4_k_m.gguf