mirror of
https://github.com/ollama/ollama.git
synced 2025-09-07 07:31:47 +02:00
load arrays with up to 1024 elements when estimating
This mirrors the old behavior before #10382
This commit is contained in:
@@ -201,7 +201,7 @@ func (s *Scheduler) processPending(ctx context.Context) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Load model for fitting
|
// Load model for fitting
|
||||||
ggml, err := llm.LoadModel(pending.model.ModelPath, 0)
|
ggml, err := llm.LoadModel(pending.model.ModelPath, 1024)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
pending.errCh <- err
|
pending.errCh <- err
|
||||||
break
|
break
|
||||||
|
Reference in New Issue
Block a user