fix(halo): only one model

This commit is contained in:
Harald Hoyer 2026-05-20 14:23:20 +02:00
parent 5ee2f65337
commit 6c5ce8742c
2 changed files with 2 additions and 2 deletions

View file

@@ -29,7 +29,7 @@
"--host 0.0.0.0"
"--port 8000"
"--models-preset ${./models.ini}"
-"--models-max 2"
+"--models-max 1"
];
Restart = "on-failure";
RestartSec = 10;

View file

@@ -11,7 +11,6 @@ cache-type-k = bf16
cache-type-v = bf16
mmap = false
no-context-shift = true
-chat-template-kwargs = {"preserve_thinking": true}
fit = on
c = 131072
@@ -27,3 +26,4 @@ min-p = 0.0
parallel = 2
c = 524288
load-on-startup = true
+chat-template-kwargs = {"preserve_thinking": true}