init: first commit
This commit is contained in:
1
.gitignore
vendored
Normal file
1
.gitignore
vendored
Normal file
@@ -0,0 +1 @@
|
|||||||
|
models
|
||||||
20
docker-compose.yml
Normal file
20
docker-compose.yml
Normal file
@@ -0,0 +1,20 @@
|
|||||||
|
# Compose stack that runs a single llama.cpp HTTP server container.
services:
  llama-cpp:
    image: ghcr.io/ggml-org/llama.cpp:server
    container_name: llama-cpp-qwen
    restart: unless-stopped

    # Host port 8000 -> container port 8000; must match the --port argument
    # passed in `command` below.
    ports:
      - "8000:8000"

    # The host ./models directory is mounted at /models in the container;
    # the -m argument below points at a file inside that mount.
    volumes:
      - ./models:/models

    # Arguments passed to the image, one list item per argument.
    # Numeric values are quoted so they stay strings.
    command:
      # Model file to load.
      - -m
      - /models/qwen2.5-0.5b-instruct-q4_k_m.gguf
      # Listen address and port inside the container.
      - --host
      - 0.0.0.0
      - --port
      - "8000"
      # Context size.
      - --ctx-size
      - "4096"
      # Thread count.
      - --threads
      - "4"
|
||||||
2
download-model.sh
Normal file
2
download-model.sh
Normal file
@@ -0,0 +1,2 @@
|
|||||||
|
#!/bin/sh
# Download the Qwen2.5-0.5B-Instruct GGUF model file into ./models
# (relative to the current working directory), which is the path
# docker-compose.yml mounts at /models.
#
# Exits non-zero if the directory cannot be created or the download fails.

# Abort on the first failing command and on use of an unset variable.
set -eu

MODEL_DIR=./models
MODEL_FILE=qwen2.5-0.5b-instruct-q4_k_m.gguf
MODEL_URL="https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct-GGUF/resolve/main/${MODEL_FILE}"

mkdir -p "$MODEL_DIR"

# --fail: treat HTTP errors (4xx/5xx) as failures instead of saving the
#         error page as if it were the model.
# --location: follow redirects from the download URL.
# The transfer goes to a ".part" file first, so an interrupted download never
# leaves a truncated file at the path the server loads.
curl --fail --location --output "${MODEL_DIR}/${MODEL_FILE}.part" "$MODEL_URL"

# Only a complete download reaches the final name.
mv "${MODEL_DIR}/${MODEL_FILE}.part" "${MODEL_DIR}/${MODEL_FILE}"
|
||||||
Reference in New Issue
Block a user