diff --git a/systems/x86_64-linux/halo/default.nix b/systems/x86_64-linux/halo/default.nix index c25e491..afece0e 100644 --- a/systems/x86_64-linux/halo/default.nix +++ b/systems/x86_64-linux/halo/default.nix @@ -10,7 +10,7 @@ with lib.metacfg; ./hardware-configuration.nix #./xremap.nix ./wyoming.nix - ./llama-server-27B.nix + ./llama-server-coder-next.nix ]; boot.lanzaboote.pkiBundle = "/var/lib/sbctl"; diff --git a/systems/x86_64-linux/halo/llama-server-coder-next.nix b/systems/x86_64-linux/halo/llama-server-coder-next.nix index d384f7c..075ed57 100644 --- a/systems/x86_64-linux/halo/llama-server-coder-next.nix +++ b/systems/x86_64-linux/halo/llama-server-coder-next.nix @@ -28,7 +28,7 @@ ExecStartPre = "${pkgs.coreutils}/bin/mkdir -p %C/llama-server/kv-slots-coder-next"; ExecStart = lib.concatStringsSep " " [ "${pkgs.llama-cpp-rocm}/bin/llama-server" - "--flash-attn on" + "--flash-attn on" "--parallel 1" "--jinja" "--host 0.0.0.0"