Add Qwen3-8B model entries (Q4_K_M and Q6_K)

This commit is contained in:
2025-07-23 20:13:10 +02:00
parent 5813db75dc
commit 869cc79898
2 changed files with 15 additions and 1 deletion

View File

@@ -64,7 +64,9 @@ spec:
baseURL: "http://llama.llama.svc.cluster.local:11434/v1/chat/completions"
models:
default: [
"DeepSeek-R1-0528-Qwen3-8B-GGUF"
"DeepSeek-R1-0528-Qwen3-8B-GGUF",
"Qwen3-8B-GGUF",
"Qwen3-8B-GGUF-Q6_K"
]
titleConvo: true
titleModel: "current_model"

View File

@@ -12,3 +12,15 @@ data:
-hf unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF:Q4_K_M
-ngl 37
--port ${PORT}
"Qwen3-8B-GGUF":
cmd: |
/app/llama-server
-hf unsloth/Qwen3-8B-GGUF:Q4_K_M
-ngl 37
--port ${PORT}
"Qwen3-8B-GGUF-Q6_K":
cmd: |
/app/llama-server
-hf unsloth/Qwen3-8B-GGUF:Q6_K
-ngl 37
--port ${PORT}