Only enable numa on CPUs (#6484)

The NUMA flag may hurt performance on multi-socket systems running GPU workloads, so only enable it when inference runs on the CPU.
2025-06-07 03:35:21 +00:00 · 2024-08-24 17:24:50 -07:00 · 2024-08-24 17:24:50 -07:00 · 0f92b19bec
commit 0f92b19bec
parent 69be940bf6
1 changed files with 1 additions and 1 deletions
--- a/llm/server.go
+++ b/llm/server.go
@@ -258,7 +258,7 @@ func NewLlamaServer(gpus gpu.GpuInfoList, model string, ggml *GGML, adapters, pr
 		params = append(params, "--mlock")
 	}
-	if gpu.IsNUMA() {
+	if gpu.IsNUMA() && gpus[0].Library == "cpu" {
 		numaMode := "distribute"
 		if runtime.GOOS == "linux" {
 			if _, err := exec.LookPath("numactl"); err == nil {