Only enable numa on CPUs (#6484)

The NUMA flag may degrade performance on multi-socket systems when the model is running on GPUs, so only enable it for CPU-only inference.
This commit is contained in:
Daniel Hiltgen 2024-08-24 17:24:50 -07:00 committed by GitHub
parent 69be940bf6
commit 0f92b19bec
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -258,7 +258,7 @@ func NewLlamaServer(gpus gpu.GpuInfoList, model string, ggml *GGML, adapters, pr
params = append(params, "--mlock")
}
-if gpu.IsNUMA() {
+if gpu.IsNUMA() && gpus[0].Library == "cpu" {
numaMode := "distribute"
if runtime.GOOS == "linux" {
if _, err := exec.LookPath("numactl"); err == nil {