From 67e9f49ee66a056abc69ba9350030542b89e2894 Mon Sep 17 00:00:00 2001 From: Lumpiasty Date: Mon, 18 May 2026 20:18:18 +0200 Subject: [PATCH] enable MTP on MTP models --- apps/llama/configs/config.yaml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/apps/llama/configs/config.yaml b/apps/llama/configs/config.yaml index 61ab86a..1cd6b98 100644 --- a/apps/llama/configs/config.yaml +++ b/apps/llama/configs/config.yaml @@ -190,6 +190,8 @@ models: -hf unsloth/Qwen3.6-35B-A3B-MTP-GGUF:Q4_K_M ${ctx_256k} ${qwen35_think_args} + --spec-type draft-mtp --spec-draft-n-max 6 + --parallel 1 ${common_args} "unsloth/Qwen3.6-35B-A3B-MTP-GGUF-nothink:Q4_K_M": @@ -198,4 +200,6 @@ models: -hf unsloth/Qwen3.6-35B-A3B-MTP-GGUF:Q4_K_M ${ctx_256k} ${qwen35_nothink_args} + --spec-type draft-mtp --spec-draft-n-max 6 + --parallel 1 ${common_args}