From b379c181f23f0133faca9e72a589f7fbed1dd96e Mon Sep 17 00:00:00 2001
From: Lumpiasty
Date: Wed, 23 Jul 2025 22:06:45 +0200
Subject: [PATCH] increase context size

---
NOTE(review): line breaks were restored from a whitespace-collapsed copy of
this patch. Hunk line counts match the "@@ -10,17 +10,17 @@" header, but the
leading indentation of the YAML lines below is a best-guess reconstruction
(2-space nesting) -- confirm against apps/llama/configmap.yaml, or apply with
`git apply --ignore-whitespace`.

Each hunk change appends `-c 16384` to the `-ngl 37` argument line of a
llama-server command.

 apps/llama/configmap.yaml | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/apps/llama/configmap.yaml b/apps/llama/configmap.yaml
index 85e6849..4dd8b0d 100644
--- a/apps/llama/configmap.yaml
+++ b/apps/llama/configmap.yaml
@@ -10,17 +10,17 @@ data:
         cmd: |
           /app/llama-server
           -hf unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF:Q4_K_M
-          -ngl 37
+          -ngl 37 -c 16384
           --port ${PORT}
       "Qwen3-8B-GGUF":
         cmd: |
           /app/llama-server
           -hf unsloth/Qwen3-8B-GGUF:Q4_K_M
-          -ngl 37
+          -ngl 37 -c 16384
           --port ${PORT}
       "Qwen3-8B-GGUF-Q6_K":
         cmd: |
           /app/llama-server
           -hf unsloth/Qwen3-8B-GGUF:Q6_K
-          -ngl 37
+          -ngl 37 -c 16384
           --port ${PORT}