From d2ee599dcf9746a3af0433463f9ce7dbc8cbc693 Mon Sep 17 00:00:00 2001 From: Devon Rifkin Date: Sun, 27 Apr 2025 13:45:13 -0700 Subject: [PATCH] load arrays with up to 1024 elements when estimating This mirrors the old behavior before #10382 --- server/sched.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/server/sched.go b/server/sched.go index d5b19fbfd..9c13f6cf5 100644 --- a/server/sched.go +++ b/server/sched.go @@ -201,7 +201,7 @@ func (s *Scheduler) processPending(ctx context.Context) { } // Load model for fitting - ggml, err := llm.LoadModel(pending.model.ModelPath, 0) + ggml, err := llm.LoadModel(pending.model.ModelPath, 1024) if err != nil { pending.errCh <- err break