chore(halo): reduce ubatch size

This commit is contained in:
Harald Hoyer 2026-05-21 08:47:39 +02:00
parent 6c5ce8742c
commit 1376ab0ba0

View file

@@ -6,7 +6,7 @@ parallel = 1
jinja = true
n-gpu-layers = 99
threads = 8
-ubatch-size = 512
+ubatch-size = 256
cache-type-k = bf16
cache-type-v = bf16
mmap = false