mirror of
https://github.com/ollama/ollama.git
synced 2025-08-27 00:31:41 +02:00
load arrays with up to 1024 elements when estimating
This mirrors the old behavior before #10382
This commit is contained in:
@@ -201,7 +201,7 @@ func (s *Scheduler) processPending(ctx context.Context) {
|
||||
}
|
||||
|
||||
// Load model for fitting
|
||||
-ggml, err := llm.LoadModel(pending.model.ModelPath, 0)
|
||||
+ggml, err := llm.LoadModel(pending.model.ModelPath, 1024)
|
||||
if err != nil {
|
||||
pending.errCh <- err
|
||||
break
|
||||
|
Reference in New Issue
Block a user