fix(halo): only one model
This commit is contained in:
parent
5ee2f65337
commit
6c5ce8742c
2 changed files with 2 additions and 2 deletions
|
|
@@ -29,7 +29,7 @@
|
|||
"--host 0.0.0.0"
|
||||
"--port 8000"
|
||||
"--models-preset ${./models.ini}"
|
||||
-"--models-max 2"
|
||||
+"--models-max 1"
|
||||
];
|
||||
Restart = "on-failure";
|
||||
RestartSec = 10;
|
||||
|
|
|
|||
|
|
@@ -11,7 +11,6 @@ cache-type-k = bf16
|
|||
cache-type-v = bf16
|
||||
mmap = false
|
||||
no-context-shift = true
|
||||
-chat-template-kwargs = {"preserve_thinking": true}
|
||||
fit = on
|
||||
c = 131072
|
||||
|
||||
|
|
@@ -27,3 +26,4 @@ min-p = 0.0
|
|||
parallel = 2
|
||||
c = 524288
|
||||
load-on-startup = true
|
||||
+chat-template-kwargs = {"preserve_thinking": true}
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue