From dadfb07914c87e6f806224ac17cc344ceba34a60 Mon Sep 17 00:00:00 2001 From: Harald Hoyer Date: Wed, 13 May 2026 14:52:49 +0200 Subject: [PATCH] fix(halo): set `--alias halo-8000` --- systems/x86_64-linux/halo/llama-server-27B-MTP.nix | 2 +- systems/x86_64-linux/halo/llama-server-27B.nix | 2 +- systems/x86_64-linux/halo/llama-server-coder-next.nix | 2 +- systems/x86_64-linux/halo/llama-server.nix | 2 +- 4 files changed, 4 insertions(+), 4 deletions(-) diff --git a/systems/x86_64-linux/halo/llama-server-27B-MTP.nix b/systems/x86_64-linux/halo/llama-server-27B-MTP.nix index 2b8283d..9a722b9 100644 --- a/systems/x86_64-linux/halo/llama-server-27B-MTP.nix +++ b/systems/x86_64-linux/halo/llama-server-27B-MTP.nix @@ -36,7 +36,7 @@ "--no-mmap" "--n-gpu-layers 99" "-hf am17an/Qwen3.6-27B-MTP-GGUF:Q8_0" - "--alias qwen3.6-27b" + "--alias halo-8000" "--threads 8" "--ubatch-size 256" "-ctk bf16 -ctv bf16" diff --git a/systems/x86_64-linux/halo/llama-server-27B.nix b/systems/x86_64-linux/halo/llama-server-27B.nix index d86cee9..94f0cdc 100644 --- a/systems/x86_64-linux/halo/llama-server-27B.nix +++ b/systems/x86_64-linux/halo/llama-server-27B.nix @@ -36,7 +36,7 @@ "--no-mmap" "--n-gpu-layers 99" "-hf unsloth/Qwen3.6-27B-GGUF:UD-Q8_K_XL" - "--alias qwen3.6-27b" + "--alias halo-8000" "--threads 8" "--ubatch-size 256" "-ctk bf16 -ctv bf16" diff --git a/systems/x86_64-linux/halo/llama-server-coder-next.nix b/systems/x86_64-linux/halo/llama-server-coder-next.nix index 075ed57..7f34a3c 100644 --- a/systems/x86_64-linux/halo/llama-server-coder-next.nix +++ b/systems/x86_64-linux/halo/llama-server-coder-next.nix @@ -41,7 +41,7 @@ "--fit on" "--no-context-shift" "-hf unsloth/Qwen3-Coder-Next-GGUF:UD-Q8_K_XL" - "--alias qwen3-coder-next" + "--alias halo-8000" "--temp 1.0 --top-p 0.95 --min-p 0.01 --top-k 40" "--slot-save-path %C/llama-server/kv-slots-coder-next" ]; diff --git a/systems/x86_64-linux/halo/llama-server.nix b/systems/x86_64-linux/halo/llama-server.nix index 340b775..683286b 100644 --- a/systems/x86_64-linux/halo/llama-server.nix +++ b/systems/x86_64-linux/halo/llama-server.nix @@ -36,7 +36,7 @@ "--no-mmap" "--n-gpu-layers 99" "-hf unsloth/Qwen3.6-35B-A3B-GGUF:UD-Q8_K_XL" - "--alias qwen3.6-35b-a3b" + "--alias halo-8000" "--threads 8" "--ubatch-size 256" "-ctk bf16 -ctv bf16"