add Qwen3-Coder-Next model

This commit is contained in:
2026-02-26 00:10:53 +01:00
parent 1ddef7951a
commit 63a8e2f7ac

View File

@@ -465,4 +465,19 @@ models:
--frequency-penalty 0.5 --frequency-penalty 0.5
--presence-penalty 0.4 --presence-penalty 0.4
--no-warmup --no-warmup
--port ${PORT} --port ${PORT}
# Model entry for Qwen3-Coder-Next at the Q4_K_M quantization.
# Launches /app/llama-server and passes the unsloth/Qwen3-Coder-Next-GGUF:Q4_K_M
# repository/quant tag via -hf.
#
# Settings passed on the command line:
#   --ctx-size 32768, --predict 8192
#   sampling: --temp 1.0, --min-p 0.01, --top-p 0.95, --top-k 40
#   --repeat-penalty 1.0
#   --no-warmup
#
# NOTE(review): ttl is presumably an idle timeout in seconds (600 = 10 min)
#   enforced by whatever loads this file -- confirm against its config docs.
# NOTE(review): --repeat-penalty 1.0 looks like the neutral "no penalty"
#   value -- confirm against the llama-server argument reference.
# NOTE(review): ${PORT} is presumably substituted by the loader before the
#   command is run; the substitution is not visible in this file.
# Keep comments out of the `cmd: |` body unless the loader is known to strip
# them: inside a literal block scalar they are part of the command string.
"Qwen3-Coder-Next-GGUF:Q4_K_M":
ttl: 600
cmd: |
/app/llama-server
-hf unsloth/Qwen3-Coder-Next-GGUF:Q4_K_M
--ctx-size 32768
--predict 8192
--temp 1.0
--min-p 0.01
--top-p 0.95
--top-k 40
--repeat-penalty 1.0
--no-warmup
--port ${PORT}