From 869cc798988004d04b8573a97bd16dd30b086add Mon Sep 17 00:00:00 2001
From: Lumpiasty
Date: Wed, 23 Jul 2025 20:13:10 +0200
Subject: [PATCH] add qwen3

---
Review note (not part of the commit; text between the "---" separator and
the first "diff --git" line is ignored when the patch is applied):

  * Purpose, as far as the hunks show: register two more models,
    "Qwen3-8B-GGUF" (unsloth/Qwen3-8B-GGUF:Q4_K_M) and "Qwen3-8B-GGUF-Q6_K"
    (unsloth/Qwen3-8B-GGUF:Q6_K), in apps/llama/configmap.yaml and list the
    same two names under models.default in apps/librechat/release.yaml.
    The names in both files must stay in sync.
  * The line structure of this patch was restored from a copy in which every
    newline and indentation run had been collapsed. Line counts match the
    hunk headers (-64,7 +64,9 and -12,3 +12,15), but the leading indentation
    of the hunk lines below is RECONSTRUCTED, not verified.
    TODO confirm against the target files, or regenerate the patch with
    `git format-patch -1 869cc798988004d04b8573a97bd16dd30b086add`.
    Indentation is significant in YAML, so do not rely on
    `git apply --ignore-whitespace` alone: the added lines would still carry
    the reconstructed indentation.

 apps/librechat/release.yaml |  4 +++-
 apps/llama/configmap.yaml   | 12 ++++++++++++
 2 files changed, 15 insertions(+), 1 deletion(-)

diff --git a/apps/librechat/release.yaml b/apps/librechat/release.yaml
index 40ccdc4..640aceb 100644
--- a/apps/librechat/release.yaml
+++ b/apps/librechat/release.yaml
@@ -64,7 +64,9 @@ spec:
               baseURL: "http://llama.llama.svc.cluster.local:11434/v1/chat/completions"
               models:
                 default: [
-                  "DeepSeek-R1-0528-Qwen3-8B-GGUF"
+                  "DeepSeek-R1-0528-Qwen3-8B-GGUF",
+                  "Qwen3-8B-GGUF",
+                  "Qwen3-8B-GGUF-Q6_K"
                 ]
               titleConvo: true
               titleModel: "current_model"
diff --git a/apps/llama/configmap.yaml b/apps/llama/configmap.yaml
index e8cd84b..85e6849 100644
--- a/apps/llama/configmap.yaml
+++ b/apps/llama/configmap.yaml
@@ -12,3 +12,15 @@ data:
           -hf unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF:Q4_K_M
           -ngl 37
           --port ${PORT}
+      "Qwen3-8B-GGUF":
+        cmd: |
+          /app/llama-server
+          -hf unsloth/Qwen3-8B-GGUF:Q4_K_M
+          -ngl 37
+          --port ${PORT}
+      "Qwen3-8B-GGUF-Q6_K":
+        cmd: |
+          /app/llama-server
+          -hf unsloth/Qwen3-8B-GGUF:Q6_K
+          -ngl 37
+          --port ${PORT}