fix(halo): only one model
This commit is contained in:
parent
5ee2f65337
commit
6c5ce8742c
2 changed files with 2 additions and 2 deletions
|
|
@ -29,7 +29,7 @@
|
||||||
"--host 0.0.0.0"
|
"--host 0.0.0.0"
|
||||||
"--port 8000"
|
"--port 8000"
|
||||||
"--models-preset ${./models.ini}"
|
"--models-preset ${./models.ini}"
|
||||||
"--models-max 2"
|
"--models-max 1"
|
||||||
];
|
];
|
||||||
Restart = "on-failure";
|
Restart = "on-failure";
|
||||||
RestartSec = 10;
|
RestartSec = 10;
|
||||||
|
|
|
||||||
|
|
@ -11,7 +11,6 @@ cache-type-k = bf16
|
||||||
cache-type-v = bf16
|
cache-type-v = bf16
|
||||||
mmap = false
|
mmap = false
|
||||||
no-context-shift = true
|
no-context-shift = true
|
||||||
chat-template-kwargs = {"preserve_thinking": true}
|
|
||||||
fit = on
|
fit = on
|
||||||
c = 131072
|
c = 131072
|
||||||
|
|
||||||
|
|
@ -27,3 +26,4 @@ min-p = 0.0
|
||||||
parallel = 2
|
parallel = 2
|
||||||
c = 524288
|
c = 524288
|
||||||
load-on-startup = true
|
load-on-startup = true
|
||||||
|
chat-template-kwargs = {"preserve_thinking": true}
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue