From 9765f1cf865cc0eb2a30269d1275578e2af6cd65 Mon Sep 17 00:00:00 2001
From: Lumpiasty
Date: Wed, 23 Jul 2025 23:07:46 +0200
Subject: [PATCH] add gemma3n

---
NOTE(review): this patch was recovered from a copy in which every line break
and all leading whitespace had been collapsed onto one line. Line boundaries
were restored from the hunk headers and the diffstat, which agree with each
other. The indentation inside the hunks is a reconstruction, not the original
bytes -- confirm it against apps/librechat/release.yaml and
apps/llama/configs/config.yaml before running `git am` / `git apply`.
The From: header carried no e-mail address in the recovered copy.

Summary of the change:
  * release.yaml: adds "gemma3n" to the endpoint's default model list (and the
    comma the previous last entry now needs).
  * config.yaml: adds a "gemma3n" model entry whose cmd starts
    /app/llama-server with the unsloth gemma-3n-E4B-it GGUF (UD-Q4_K_XL),
    a 16384-token context and explicit sampling flags.

 apps/librechat/release.yaml    |  3 ++-
 apps/llama/configs/config.yaml | 14 ++++++++++++++
 2 files changed, 16 insertions(+), 1 deletion(-)

diff --git a/apps/librechat/release.yaml b/apps/librechat/release.yaml
index 65eade1..0e89e09 100644
--- a/apps/librechat/release.yaml
+++ b/apps/librechat/release.yaml
@@ -66,7 +66,8 @@ spec:
               default: [
                 "DeepSeek-R1-0528-Qwen3-8B-GGUF",
                 "Qwen3-8B-GGUF",
-                "Qwen3-8B-GGUF-no-thinking"
+                "Qwen3-8B-GGUF-no-thinking",
+                "gemma3n"
               ]
             titleConvo: true
             titleModel: "current_model"
diff --git a/apps/llama/configs/config.yaml b/apps/llama/configs/config.yaml
index 6a4ff68..a71f216 100644
--- a/apps/llama/configs/config.yaml
+++ b/apps/llama/configs/config.yaml
@@ -18,3 +18,17 @@ models:
       -ngl 37 -c 16384
       --jinja --chat-template-file /config/qwen_nothink_chat_template.jinja
       --port ${PORT}
+  "gemma3n":
+    cmd: |
+      /app/llama-server
+      -hf unsloth/gemma-3n-E4B-it-GGUF:UD-Q4_K_XL
+      --ctx-size 16384
+      --n-gpu-layers 99
+      --seed 3407
+      --prio 2
+      --temp 1.0
+      --repeat-penalty 1.0
+      --min-p 0.00
+      --top-k 64
+      --top-p 0.95
+      --port ${PORT}