# File listing metadata: 21 lines, 541 B, YAML
# Model definitions, keyed by model name. Each entry's `cmd` is a literal
# block scalar holding the llama-server command line for that model, split
# across lines for readability.
# NOTE(review): `${PORT}` is written unexpanded in every command; it is
# presumably substituted by the tool that consumes this file — confirm.
models:
  # Q4_K_M build referenced as unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF.
  "DeepSeek-R1-0528-Qwen3-8B-GGUF":
    cmd: |
      /app/llama-server
      -hf unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF:Q4_K_M
      -ngl 37 -c 16384
      --port ${PORT}

  # Q4_K_M build referenced as unsloth/Qwen3-8B-GGUF.
  "Qwen3-8B-GGUF":
    cmd: |
      /app/llama-server
      -hf unsloth/Qwen3-8B-GGUF:Q4_K_M
      -ngl 37 -c 16384
      --port ${PORT}

  # Same model reference and flags as "Qwen3-8B-GGUF", plus `--jinja` and a
  # chat template file loaded from /config.
  # NOTE(review): judging by the entry and template names, the template is
  # meant to suppress the model's thinking output — verify against the
  # template file itself.
  "Qwen3-8B-GGUF-no-thinking":
    cmd: |
      /app/llama-server
      -hf unsloth/Qwen3-8B-GGUF:Q4_K_M
      -ngl 37 -c 16384
      --jinja --chat-template-file /config/qwen_nothink_chat_template.jinja
      --port ${PORT}