diff --git a/systems/x86_64-linux/halo/llama-server-27B.nix b/systems/x86_64-linux/halo/llama-server-27B.nix index 1a2faa3..ab25831 100644 --- a/systems/x86_64-linux/halo/llama-server-27B.nix +++ b/systems/x86_64-linux/halo/llama-server-27B.nix @@ -25,7 +25,7 @@ StateDirectory = "llama-server"; CacheDirectory = "llama-server"; WorkingDirectory = "%S/llama-server"; - ExecStartPre = "${pkgs.coreutils}/bin/mkdir -p %C/llama-server/kv-slots"; + ExecStartPre = "${pkgs.coreutils}/bin/mkdir -p %C/llama-server/kv-slots-27B"; ExecStart = lib.concatStringsSep " " [ "${pkgs.llama-cpp-rocm}/bin/llama-server" "--flash-attn on"