Revert "Limit GPU lib search for now (#4777)"

This reverts commit 476fb8e892.
2024-06-03 08:31:48 -07:00 · 2024-06-03 08:31:48 -07:00 · efac488675
commit efac488675
parent 4dc7fb9525
1 changed files with 31 additions and 1 deletions
--- a/gpu/gpu.go
+++ b/gpu/gpu.go
@ -16,12 +16,13 @@ import (
 	"os"
 	"path/filepath"
 	"runtime"
 	"strconv"
 	"strings"
 	"sync"
 	"unsafe"
 	"github.com/ollama/ollama/envconfig"
 	"github.com/ollama/ollama/format"
 	"github.com/ollama/ollama/envconfig"
 )
 type handles struct {
@ -104,6 +105,8 @@ func initGPUHandles() *handles {
 	var cudartMgmtPatterns []string
 	var nvcudaMgmtName string
 	var nvcudaMgmtPatterns []string
 	var oneapiMgmtName string
 	var oneapiMgmtPatterns []string
 	tmpDir, _ := PayloadsDir()
 	switch runtime.GOOS {
@ -115,6 +118,8 @@ func initGPUHandles() *handles {
 		// Aligned with driver, we can't carry as payloads
 		nvcudaMgmtName = "nvcuda.dll"
 		nvcudaMgmtPatterns = NvcudaWindowsGlobs
 		oneapiMgmtName = "ze_intel_gpu64.dll"
 		oneapiMgmtPatterns = OneapiWindowsGlobs
 	case "linux":
 		cudartMgmtName = "libcudart.so*"
 		if tmpDir != "" {
@ -125,6 +130,8 @@ func initGPUHandles() *handles {
 		// Aligned with driver, we can't carry as payloads
 		nvcudaMgmtName = "libcuda.so*"
 		nvcudaMgmtPatterns = NvcudaLinuxGlobs
 		oneapiMgmtName = "libze_intel_gpu.so"
 		oneapiMgmtPatterns = OneapiLinuxGlobs
 	default:
 		return gpuHandles
 	}
@ -152,6 +159,17 @@ func initGPUHandles() *handles {
 		}
 	}
 	oneapiLibPaths := FindGPULibs(oneapiMgmtName, oneapiMgmtPatterns)
 	if len(oneapiLibPaths) > 0 {
 		deviceCount, oneapi, libPath := LoadOneapiMgmt(oneapiLibPaths)
 		if oneapi != nil {
 			slog.Debug("detected Intel GPUs", "library", libPath, "count", deviceCount)
 			gpuHandles.oneapi = oneapi
 			gpuHandles.deviceCount = deviceCount
 			return gpuHandles
 		}
 	}
 	return gpuHandles
 }
@ -227,6 +245,18 @@ func GetGPUInfo() GpuInfoList {
 			// TODO potentially sort on our own algorithm instead of what the underlying GPU library does...
 			resp = append(resp, gpuInfo)
 		}
 		if gpuHandles.oneapi != nil {
 			gpuInfo := GpuInfo{
 				Library: "oneapi",
 			}
 			C.oneapi_check_vram(*gpuHandles.oneapi, &memInfo)
 			var totalFreeMem float64 = float64(memInfo.free) * 0.95 // work-around: leave some reserve vram for mkl lib used in ggml-sycl backend.
 			memInfo.free = C.uint64_t(totalFreeMem)
 			gpuInfo.TotalMemory = uint64(memInfo.total)
 			gpuInfo.FreeMemory = uint64(memInfo.free)
 			gpuInfo.ID = strconv.Itoa(i)
 			resp = append(resp, gpuInfo)
 		}
 	}
 	// Then AMD