fix(halo): 27 only

This commit is contained in:
Harald Hoyer 2026-05-20 02:14:08 +02:00
parent 807a3d0d8e
commit 72e7bf613f

View file

@@ -1,6 +1,6 @@
version = 1 version = 1
[*] [Qwen3.6-27B]
flash-attn = on flash-attn = on
jinja = true jinja = true
n-gpu-layers = 99 n-gpu-layers = 99
@@ -17,14 +17,6 @@ no-context-shift = true
chat-template-kwargs = {"preserve_thinking": true} chat-template-kwargs = {"preserve_thinking": true}
fit = on fit = on
spec-type = draft-mtp spec-type = draft-mtp
[Qwen3.6-35B-A3B]
hf = unsloth/Qwen3.6-35B-A3B-MTP-GGUF:UD-Q8_K_XL
spec-draft-n-max = 3
parallel = 1
c = 262144
[Qwen3.6-27B]
hf = unsloth/Qwen3.6-27B-MTP-GGUF:Q6_K hf = unsloth/Qwen3.6-27B-MTP-GGUF:Q6_K
spec-draft-n-max = 6 spec-draft-n-max = 6
parallel = 2 parallel = 2