lower batch size to 512

This commit is contained in:
Jeffrey Morgan 2023-07-28 10:56:21 -04:00
parent 18b6b601ad
commit 822a0e36eb

View file

@@ -190,7 +190,7 @@ func DefaultOptions() Options {
UseNUMA: false,
NumCtx: 2048,
-NumBatch: 1024,
+NumBatch: 512,
NumGPU: 1,
NumGQA: 1,
LowVRAM: false,