init: first commit
This commit is contained in:
1
.gitignore
vendored
Normal file
1
.gitignore
vendored
Normal file
@@ -0,0 +1 @@
|
||||
# Local model weights: download-model.sh writes the GGUF file here and
# docker-compose.yml bind-mounts the directory into the container.
models
|
||||
20
docker-compose.yml
Normal file
20
docker-compose.yml
Normal file
@@ -0,0 +1,20 @@
|
||||
# Runs the llama.cpp HTTP server with the Qwen2.5-0.5B-Instruct (Q4_K_M)
# model, published on host port 8000.
services:
  llama-cpp:
    image: ghcr.io/ggml-org/llama.cpp:server
    container_name: llama-cpp-qwen
    restart: unless-stopped
    ports:
      # Quoted so the mapping is always read as a string.
      - "8000:8000"
    volumes:
      # The server only reads the model file, so mount the directory
      # read-only.
      - ./models:/models:ro
    # Arguments passed to the image's entrypoint.
    command:
      - -m
      - /models/qwen2.5-0.5b-instruct-q4_k_m.gguf
      - --host
      - 0.0.0.0
      - --port
      - "8000"
      - --ctx-size
      - "4096"
      - --threads
      - "4"
    # The server listens on 8000 here, so probe that port explicitly.
    # NOTE(review): the upstream image is believed to ship a HEALTHCHECK
    # that probes port 8080 with curl, which would report this container
    # as unhealthy -- confirm against the image's Dockerfile.
    healthcheck:
      test: ["CMD", "curl", "-f", "http://127.0.0.1:8000/health"]
      interval: 30s
      timeout: 5s
      retries: 3
      start_period: 30s
|
||||
2
download-model.sh
Normal file
2
download-model.sh
Normal file
@@ -0,0 +1,2 @@
|
||||
#!/bin/sh
# Download the Qwen2.5-0.5B-Instruct Q4_K_M GGUF weights into ./models
# (relative to the current working directory).
#
# Exits non-zero if the directory cannot be created or the download fails.
set -eu

MODEL_FILE="qwen2.5-0.5b-instruct-q4_k_m.gguf"
MODEL_URL="https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct-GGUF/resolve/main/${MODEL_FILE}"
DEST="./models/${MODEL_FILE}"

mkdir -p models

# --fail makes curl exit non-zero on HTTP errors instead of saving the
# error page as the model file. Downloading to a ".part" file and renaming
# on success means an interrupted transfer never leaves a truncated file
# at the final path.
if ! curl --fail --location --output "${DEST}.part" "${MODEL_URL}"; then
    rm -f "${DEST}.part"
    echo "error: failed to download ${MODEL_URL}" >&2
    exit 1
fi

mv "${DEST}.part" "${DEST}"
|
||||
Reference in New Issue
Block a user