mirror of
https://github.com/ollama/ollama.git
synced 2025-09-27 21:26:59 +02:00
lower batch size to 512
This commit is contained in:
@@ -190,7 +190,7 @@ func DefaultOptions() Options {
|
||||
UseNUMA: false,
|
||||
|
||||
NumCtx: 2048,
|
||||
-NumBatch: 1024,
|
||||
+NumBatch: 512,
|
||||
NumGPU: 1,
|
||||
NumGQA: 1,
|
||||
LowVRAM: false,
|
||||
|
Reference in New Issue
Block a user