Patch for systems/x86_64-linux/halo/models.ini (single hunk at line 23).
Doubles both `parallel` (2 -> 4) and `c` (524288 -> 1048576), so the ratio
c / parallel is unchanged at 262144.
NOTE(review): presumably `c` is a total shared across `parallel` slots; confirm
against the consuming server's documentation before relying on that.

diff --git a/systems/x86_64-linux/halo/models.ini b/systems/x86_64-linux/halo/models.ini
index 7c46654..dce6edf 100644
--- a/systems/x86_64-linux/halo/models.ini
+++ b/systems/x86_64-linux/halo/models.ini
@@ -23,7 +23,7 @@ temp = 0.6
 top-p = 0.95
 top-k = 20
 min-p = 0.0
-parallel = 2
-c = 524288
+parallel = 4
+c = 1048576
 load-on-startup = true
 chat-template-kwargs = {"preserve_thinking": true}