From 55ac337a6346b13589962b31768f4c0733f426ab Mon Sep 17 00:00:00 2001 From: Lumpiasty Date: Mon, 18 May 2026 20:18:18 +0200 Subject: [PATCH] enable MTP on MTP models --- apps/llama/configs/config.yaml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/apps/llama/configs/config.yaml b/apps/llama/configs/config.yaml index 61ab86a..533cd56 100644 --- a/apps/llama/configs/config.yaml +++ b/apps/llama/configs/config.yaml @@ -190,6 +190,8 @@ models: -hf unsloth/Qwen3.6-35B-A3B-MTP-GGUF:Q4_K_M ${ctx_256k} ${qwen35_think_args} + --spec-type draft-mtp --spec-draft-n-max 1 + --parallel 1 ${common_args} "unsloth/Qwen3.6-35B-A3B-MTP-GGUF-nothink:Q4_K_M": @@ -198,4 +200,6 @@ models: -hf unsloth/Qwen3.6-35B-A3B-MTP-GGUF:Q4_K_M ${ctx_256k} ${qwen35_nothink_args} + --spec-type draft-mtp --spec-draft-n-max 1 + --parallel 1 ${common_args}