load arrays with up to 1024 elements when estimating

This mirrors the behavior from before #10382.
2025-09-07 07:31:47 +02:00 · 2025-04-27 13:45:13 -07:00
parent 6ed8898590
commit d2ee599dcf
1 changed file with 1 addition and 1 deletion
--- a/server/sched.go
+++ b/server/sched.go
@@ -201,7 +201,7 @@ func (s *Scheduler) processPending(ctx context.Context) {
 					}
 					// Load model for fitting
-					ggml, err := llm.LoadModel(pending.model.ModelPath, 0)
+					ggml, err := llm.LoadModel(pending.model.ModelPath, 1024)
 					if err != nil {
 						pending.errCh <- err
 						break