add qwen3
This commit is contained in:
@@ -64,7 +64,9 @@ spec:
|
|||||||
baseURL: "http://llama.llama.svc.cluster.local:11434/v1/chat/completions"
|
baseURL: "http://llama.llama.svc.cluster.local:11434/v1/chat/completions"
|
||||||
models:
|
models:
|
||||||
default: [
|
default: [
|
||||||
"DeepSeek-R1-0528-Qwen3-8B-GGUF"
|
"DeepSeek-R1-0528-Qwen3-8B-GGUF",
|
||||||
|
"Qwen3-8B-GGUF",
|
||||||
|
"Qwen3-8B-GGUF-Q6_K"
|
||||||
]
|
]
|
||||||
titleConvo: true
|
titleConvo: true
|
||||||
titleModel: "current_model"
|
titleModel: "current_model"
|
||||||
|
|||||||
@@ -12,3 +12,15 @@ data:
|
|||||||
-hf unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF:Q4_K_M
|
-hf unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF:Q4_K_M
|
||||||
-ngl 37
|
-ngl 37
|
||||||
--port ${PORT}
|
--port ${PORT}
|
||||||
|
"Qwen3-8B-GGUF":
|
||||||
|
cmd: |
|
||||||
|
/app/llama-server
|
||||||
|
-hf unsloth/Qwen3-8B-GGUF:Q4_K_M
|
||||||
|
-ngl 37
|
||||||
|
--port ${PORT}
|
||||||
|
"Qwen3-8B-GGUF-Q6_K":
|
||||||
|
cmd: |
|
||||||
|
/app/llama-server
|
||||||
|
-hf unsloth/Qwen3-8B-GGUF:Q6_K
|
||||||
|
-ngl 37
|
||||||
|
--port ${PORT}
|
||||||
|
|||||||
Reference in New Issue
Block a user