feat(halo): use unsloth/Qwen3.6-27B-GGUF:UD-Q8_K_XL
This commit is contained in:
parent
c9c7f6916a
commit
a95417da8b
2 changed files with 4 additions and 4 deletions
|
|
@@ -9,7 +9,7 @@
|
||||||
"baseURL": "http://halo.fritz.box:8000/v1"
|
"baseURL": "http://halo.fritz.box:8000/v1"
|
||||||
},
|
},
|
||||||
"models": {
|
"models": {
|
||||||
"unsloth/Qwen3.6-35B-A3B-GGUF:UD-Q8_K_XL": { "name" : "qwen3.6-35B-A3B" }
|
"unsloth/Qwen3.6-27B-GGUF:UD-Q8_K_XL": { "name" : "qwen3.6-27B" }
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"halo-8001": {
|
"halo-8001": {
|
||||||
|
|
|
||||||
|
|
@@ -35,11 +35,11 @@
|
||||||
"--port 8000"
|
"--port 8000"
|
||||||
"--no-mmap"
|
"--no-mmap"
|
||||||
"--n-gpu-layers 99"
|
"--n-gpu-layers 99"
|
||||||
"-hf unsloth/Qwen3.6-35B-A3B-GGUF:UD-Q8_K_XL"
|
"-hf unsloth/Qwen3.6-27B-GGUF:UD-Q8_K_XL"
|
||||||
"--alias qwen3.6-35b-a3b"
|
"--alias qwen3.6-27b"
|
||||||
"--threads 8"
|
"--threads 8"
|
||||||
"--ubatch-size 256"
|
"--ubatch-size 256"
|
||||||
"-ctk q8_0 -ctv q8_0"
|
"-ctk bf16 -ctv bf16"
|
||||||
"--temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.00"
|
"--temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.00"
|
||||||
"--no-context-shift"
|
"--no-context-shift"
|
||||||
''--chat-template-kwargs '{"preserve_thinking": true}' ''
|
''--chat-template-kwargs '{"preserve_thinking": true}' ''
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue