chore(deps): update renovate/renovate docker tag to v43.83.1

change kv cache quant to q8_0
Merge pull request 'chore(deps): update ghcr.io/mostlygeek/llama-swap docker tag to v198-vulkan-b8400' (#167) from renovate/ghcr.io-mostlygeek-llama-swap-198.x into fresh-start
2026-03-20 00:00:54 +00:00 · 2026-03-20 00:57:39 +01:00 · 2026-03-19 00:00:38 +00:00 · 2026-03-19 00:00:34 +00:00
3 changed files with 5 additions and 5 deletions
--- a/apps/llama/configs/config.yaml
+++ b/apps/llama/configs/config.yaml
@@ -8,8 +8,8 @@ macros:
  gemma3_ctx_128k: "--ctx-size 131072"
  qwen35_ctx_256k: "--ctx-size 262144"
  gemma_sampling: "--prio 2 --temp 1.0 --repeat-penalty 1.0 --min-p 0.00 --top-k 64 --top-p 0.95"
-  qwen35_sampling: "--temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.00 -ctk q4_0 -ctv q4_0"
-  qwen35_35b_args: "--temp 1.0 --min-p 0.00 --top-p 0.95 --top-k 20 -ctk q4_0 -ctv q4_0"
+  qwen35_sampling: "--temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.00 -ctk q8_0 -ctv q8_0"
+  qwen35_35b_args: "--temp 1.0 --min-p 0.00 --top-p 0.95 --top-k 20 -ctk q8_0 -ctv q8_0"
  qwen35_35b_heretic_mmproj: "--mmproj-url https://huggingface.co/unsloth/Qwen3.5-35B-A3B-GGUF/resolve/main/mmproj-F16.gguf --mmproj /root/.cache/llama.cpp/unsloth_Qwen3.5-35B-A3B-GGUF_mmproj-F16.gguf"
  qwen35_4b_heretic_mmproj: "--mmproj-url https://huggingface.co/unsloth/Qwen3.5-4B-GGUF/resolve/main/mmproj-F16.gguf --mmproj /root/.cache/llama.cpp/unsloth_Qwen3.5-4B-GGUF_mmproj-F16.gguf"
  glm47_flash_args: "--temp 0.7 --top-p 1.0 --min-p 0.01 --repeat-penalty 1.0"
@@ -82,7 +82,7 @@ models:
        --top-p 0.95
        --top-k 40
        --repeat-penalty 1.0
-        -ctk q4_0 -ctv q4_0
+        -ctk q8_0 -ctv q8_0
        ${common_args}

  "Qwen3.5-35B-A3B-GGUF:Q4_K_M":
--- a/apps/llama/deployment.yaml
+++ b/apps/llama/deployment.yaml
@@ -18,7 +18,7 @@ spec:
    spec:
      containers:
        - name: llama-swap
-          image: ghcr.io/mostlygeek/llama-swap:v198-vulkan-b8390
+          image: ghcr.io/mostlygeek/llama-swap:v198-vulkan-b8400
          imagePullPolicy: IfNotPresent
          command:
            - /app/llama-swap
--- a/apps/renovate/cronjob.yaml
+++ b/apps/renovate/cronjob.yaml
@@ -15,7 +15,7 @@ spec:
            - name: renovate
              # Update this to the latest available and then enable Renovate on
              # the manifest
-              image: renovate/renovate:43.76.1-full
+              image: renovate/renovate:43.83.1-full
              envFrom:
                - secretRef:
                    name: renovate-gitea-token
Author	SHA1	Message	Date
Renovate Bot	af9b5b82f9	chore(deps): update renovate/renovate docker tag to v43.83.1	2026-03-20 00:00:54 +00:00
Lumpiasty	ce0b13ebb3	change kv cache quant to q8_0	2026-03-20 00:57:39 +01:00
Renovate	516e157d39	Merge pull request 'chore(deps): update ghcr.io/mostlygeek/llama-swap docker tag to v198-vulkan-b8400' (#167) from renovate/ghcr.io-mostlygeek-llama-swap-198.x into fresh-start	2026-03-19 00:00:38 +00:00
Renovate Bot	73d6d1f15a	chore(deps): update ghcr.io/mostlygeek/llama-swap docker tag to v198-vulkan-b8400	2026-03-19 00:00:34 +00:00