From 1376ab0ba0a58d5c8fe97cef9cd3647ca3046aa8 Mon Sep 17 00:00:00 2001 From: Harald Hoyer Date: Thu, 21 May 2026 08:47:39 +0200 Subject: [PATCH] chore(halo): reduce ubatch size --- systems/x86_64-linux/halo/models.ini | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/systems/x86_64-linux/halo/models.ini b/systems/x86_64-linux/halo/models.ini index 6632557..d2ec173 100644 --- a/systems/x86_64-linux/halo/models.ini +++ b/systems/x86_64-linux/halo/models.ini @@ -6,7 +6,7 @@ parallel = 1 jinja = true n-gpu-layers = 99 threads = 8 -ubatch-size = 512 +ubatch-size = 256 cache-type-k = bf16 cache-type-v = bf16 mmap = false