feat(halo): activate qwen 27b
This commit is contained in:
parent
bef528e26a
commit
689cdec28d
2 changed files with 3 additions and 3 deletions
|
|
@@ -10,7 +10,7 @@ with lib.metacfg;
|
||||||
./hardware-configuration.nix
|
./hardware-configuration.nix
|
||||||
#./xremap.nix
|
#./xremap.nix
|
||||||
./wyoming.nix
|
./wyoming.nix
|
||||||
./llama-server.nix
|
./llama-server-27B.nix
|
||||||
];
|
];
|
||||||
|
|
||||||
boot.lanzaboote.pkiBundle = "/var/lib/sbctl";
|
boot.lanzaboote.pkiBundle = "/var/lib/sbctl";
|
||||||
|
|
|
||||||
|
|
@@ -29,7 +29,7 @@
|
||||||
ExecStart = lib.concatStringsSep " " [
|
ExecStart = lib.concatStringsSep " " [
|
||||||
"${pkgs.llama-cpp-rocm}/bin/llama-server"
|
"${pkgs.llama-cpp-rocm}/bin/llama-server"
|
||||||
"--flash-attn on"
|
"--flash-attn on"
|
||||||
"--parallel 2"
|
"--parallel 1"
|
||||||
"--jinja"
|
"--jinja"
|
||||||
"--host 0.0.0.0"
|
"--host 0.0.0.0"
|
||||||
"--port 8000"
|
"--port 8000"
|
||||||
|
|
@@ -43,7 +43,7 @@
|
||||||
"--temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.00"
|
"--temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.00"
|
||||||
"--no-context-shift"
|
"--no-context-shift"
|
||||||
''--chat-template-kwargs '{"preserve_thinking": true}' ''
|
''--chat-template-kwargs '{"preserve_thinking": true}' ''
|
||||||
"-c 524288"
|
"-c 262144"
|
||||||
"--fit on"
|
"--fit on"
|
||||||
"--slot-save-path %C/llama-server/kv-slots"
|
"--slot-save-path %C/llama-server/kv-slots"
|
||||||
];
|
];
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue