Files
klaster/apps/llama/configs/config.yaml
2025-07-23 22:56:52 +02:00

21 lines
541 B
YAML

# Model definitions: each key under `models` is a model name, and its `cmd`
# is the llama-server command line used to serve that model.
#
# `cmd` uses a literal block scalar (`|`), so the line breaks between the
# arguments are part of the value. Comments must stay outside the scalar;
# anything written inside it becomes part of the command text.
#
# NOTE(review): ${PORT} is not defined anywhere in this file; presumably the
# consumer of this config (looks like llama-swap) substitutes it at launch.
# Confirm against the consumer's documentation.
models:
  # DeepSeek-R1 distill, Q4_K_M quantization, fetched via `-hf`.
  "DeepSeek-R1-0528-Qwen3-8B-GGUF":
    cmd: |
      /app/llama-server
      -hf unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF:Q4_K_M
      -ngl 37 -c 16384
      --port ${PORT}

  # Qwen3-8B, Q4_K_M quantization, same -ngl / -c settings as above.
  "Qwen3-8B-GGUF":
    cmd: |
      /app/llama-server
      -hf unsloth/Qwen3-8B-GGUF:Q4_K_M
      -ngl 37 -c 16384
      --port ${PORT}

  # Same model and settings as "Qwen3-8B-GGUF", plus `--jinja` and a custom
  # chat template file. Judging by the file name, the template is meant to
  # disable thinking output. TODO: confirm against the template itself.
  "Qwen3-8B-GGUF-no-thinking":
    cmd: |
      /app/llama-server
      -hf unsloth/Qwen3-8B-GGUF:Q4_K_M
      -ngl 37 -c 16384
      --jinja --chat-template-file /config/qwen_nothink_chat_template.jinja
      --port ${PORT}