From 9dc536c07a95c19f0b4e0583f04e4331f73ae836 Mon Sep 17 00:00:00 2001 From: Lumpiasty Date: Mon, 18 May 2026 20:18:18 +0200 Subject: [PATCH] enable MTP on MTP models --- apps/llama/configs/config.yaml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/apps/llama/configs/config.yaml b/apps/llama/configs/config.yaml index 61ab86a..85f510c 100644 --- a/apps/llama/configs/config.yaml +++ b/apps/llama/configs/config.yaml @@ -190,6 +190,8 @@ models: -hf unsloth/Qwen3.6-35B-A3B-MTP-GGUF:Q4_K_M ${ctx_256k} ${qwen35_think_args} + --spec-type draft-mtp --spec-draft-n-max 2 + --parallel 1 ${common_args} "unsloth/Qwen3.6-35B-A3B-MTP-GGUF-nothink:Q4_K_M": @@ -198,4 +200,6 @@ models: -hf unsloth/Qwen3.6-35B-A3B-MTP-GGUF:Q4_K_M ${ctx_256k} ${qwen35_nothink_args} + --spec-type draft-mtp --spec-draft-n-max 2 + --parallel 1 ${common_args}