From 31e491e3148cc1143393acfef5e8c9ce2b90e87e Mon Sep 17 00:00:00 2001 From: Harald Hoyer Date: Wed, 20 May 2026 07:05:27 +0200 Subject: [PATCH] Revert "fix(halo): 27 only" This reverts commit 72e7bf613fa119dc17e8fa79756888f20e937380. --- systems/x86_64-linux/halo/models.ini | 10 +++++++++- 1 file changed, 9 insertions(+), 1 deletion(-) diff --git a/systems/x86_64-linux/halo/models.ini b/systems/x86_64-linux/halo/models.ini index 1f77d61..9d23606 100644 --- a/systems/x86_64-linux/halo/models.ini +++ b/systems/x86_64-linux/halo/models.ini @@ -1,6 +1,6 @@ version = 1 -[Qwen3.6-27B] +[*] flash-attn = on jinja = true n-gpu-layers = 99 @@ -17,6 +17,14 @@ no-context-shift = true chat-template-kwargs = {"preserve_thinking": true} fit = on spec-type = draft-mtp + +[Qwen3.6-35B-A3B] +hf = unsloth/Qwen3.6-35B-A3B-MTP-GGUF:UD-Q8_K_XL +spec-draft-n-max = 3 +parallel = 1 +c = 262144 + +[Qwen3.6-27B] hf = unsloth/Qwen3.6-27B-MTP-GGUF:Q6_K spec-draft-n-max = 6 parallel = 2