mirror of
https://github.com/ollama/ollama.git
synced 2026-03-27 02:58:43 +07:00
lower batch size to 512
This commit is contained in:
@@ -190,7 +190,7 @@ func DefaultOptions() Options {
 UseNUMA: false,
 
 NumCtx: 2048,
-NumBatch: 1024,
+NumBatch: 512,
 NumGPU: 1,
 NumGQA: 1,
 LowVRAM: false,
Reference in New Issue
Block a user