2024-06-05 19:07:20 +00:00
|
|
|
package gpu
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bufio"
|
|
|
|
"fmt"
|
|
|
|
"os"
|
2024-10-15 18:36:08 +00:00
|
|
|
"reflect"
|
|
|
|
"regexp"
|
2024-06-05 19:07:20 +00:00
|
|
|
"strings"
|
|
|
|
|
|
|
|
"github.com/ollama/ollama/format"
|
|
|
|
)
|
|
|
|
|
|
|
|
var CudartGlobs = []string{
|
|
|
|
"/usr/local/cuda/lib64/libcudart.so*",
|
|
|
|
"/usr/lib/x86_64-linux-gnu/nvidia/current/libcudart.so*",
|
|
|
|
"/usr/lib/x86_64-linux-gnu/libcudart.so*",
|
|
|
|
"/usr/lib/wsl/lib/libcudart.so*",
|
|
|
|
"/usr/lib/wsl/drivers/*/libcudart.so*",
|
|
|
|
"/opt/cuda/lib64/libcudart.so*",
|
|
|
|
"/usr/local/cuda*/targets/aarch64-linux/lib/libcudart.so*",
|
|
|
|
"/usr/lib/aarch64-linux-gnu/nvidia/current/libcudart.so*",
|
|
|
|
"/usr/lib/aarch64-linux-gnu/libcudart.so*",
|
|
|
|
"/usr/local/cuda/lib*/libcudart.so*",
|
|
|
|
"/usr/lib*/libcudart.so*",
|
|
|
|
"/usr/local/lib*/libcudart.so*",
|
|
|
|
}
|
|
|
|
|
|
|
|
var NvmlGlobs = []string{}
|
|
|
|
|
|
|
|
var NvcudaGlobs = []string{
|
|
|
|
"/usr/local/cuda*/targets/*/lib/libcuda.so*",
|
|
|
|
"/usr/lib/*-linux-gnu/nvidia/current/libcuda.so*",
|
|
|
|
"/usr/lib/*-linux-gnu/libcuda.so*",
|
|
|
|
"/usr/lib/wsl/lib/libcuda.so*",
|
|
|
|
"/usr/lib/wsl/drivers/*/libcuda.so*",
|
|
|
|
"/opt/cuda/lib*/libcuda.so*",
|
|
|
|
"/usr/local/cuda/lib*/libcuda.so*",
|
|
|
|
"/usr/lib*/libcuda.so*",
|
|
|
|
"/usr/local/lib*/libcuda.so*",
|
|
|
|
}
|
|
|
|
|
|
|
|
var OneapiGlobs = []string{
|
|
|
|
"/usr/lib/x86_64-linux-gnu/libze_intel_gpu.so*",
|
|
|
|
"/usr/lib*/libze_intel_gpu.so*",
|
|
|
|
}
|
|
|
|
|
2024-08-01 21:52:15 +00:00
|
|
|
var (
|
|
|
|
CudartMgmtName = "libcudart.so*"
|
|
|
|
NvcudaMgmtName = "libcuda.so*"
|
|
|
|
NvmlMgmtName = "" // not currently wired on linux
|
2024-07-08 19:50:11 +00:00
|
|
|
OneapiMgmtName = "libze_intel_gpu.so*"
|
2024-08-01 21:52:15 +00:00
|
|
|
)
|
2024-06-05 19:07:20 +00:00
|
|
|
|
|
|
|
func GetCPUMem() (memInfo, error) {
|
|
|
|
var mem memInfo
|
2024-07-11 23:42:57 +00:00
|
|
|
var total, available, free, buffers, cached, freeSwap uint64
|
2024-06-05 19:07:20 +00:00
|
|
|
f, err := os.Open("/proc/meminfo")
|
|
|
|
if err != nil {
|
|
|
|
return mem, err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
|
|
|
s := bufio.NewScanner(f)
|
|
|
|
for s.Scan() {
|
|
|
|
line := s.Text()
|
|
|
|
switch {
|
|
|
|
case strings.HasPrefix(line, "MemTotal:"):
|
|
|
|
_, err = fmt.Sscanf(line, "MemTotal:%d", &total)
|
|
|
|
case strings.HasPrefix(line, "MemAvailable:"):
|
|
|
|
_, err = fmt.Sscanf(line, "MemAvailable:%d", &available)
|
|
|
|
case strings.HasPrefix(line, "MemFree:"):
|
|
|
|
_, err = fmt.Sscanf(line, "MemFree:%d", &free)
|
|
|
|
case strings.HasPrefix(line, "Buffers:"):
|
|
|
|
_, err = fmt.Sscanf(line, "Buffers:%d", &buffers)
|
|
|
|
case strings.HasPrefix(line, "Cached:"):
|
|
|
|
_, err = fmt.Sscanf(line, "Cached:%d", &cached)
|
2024-07-11 23:42:57 +00:00
|
|
|
case strings.HasPrefix(line, "SwapFree:"):
|
|
|
|
_, err = fmt.Sscanf(line, "SwapFree:%d", &freeSwap)
|
2024-06-05 19:07:20 +00:00
|
|
|
default:
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return mem, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
mem.TotalMemory = total * format.KibiByte
|
2024-07-11 23:42:57 +00:00
|
|
|
mem.FreeSwap = freeSwap * format.KibiByte
|
|
|
|
if available > 0 {
|
|
|
|
mem.FreeMemory = available * format.KibiByte
|
|
|
|
} else {
|
|
|
|
mem.FreeMemory = (free + buffers + cached) * format.KibiByte
|
|
|
|
}
|
2024-06-05 19:07:20 +00:00
|
|
|
return mem, nil
|
|
|
|
}
|
2024-10-15 18:36:08 +00:00
|
|
|
|
|
|
|
const CpuInfoFilename = "/proc/cpuinfo"
|
|
|
|
|
|
|
|
type linuxCpuInfo struct {
|
|
|
|
ID string `cpuinfo:"processor"`
|
|
|
|
VendorID string `cpuinfo:"vendor_id"`
|
|
|
|
ModelName string `cpuinfo:"model name"`
|
|
|
|
PhysicalID string `cpuinfo:"physical id"`
|
|
|
|
Siblings string `cpuinfo:"siblings"`
|
|
|
|
CoreID string `cpuinfo:"core id"`
|
|
|
|
}
|
|
|
|
|
|
|
|
func GetCPUDetails() ([]CPU, error) {
|
|
|
|
file, err := os.Open(CpuInfoFilename)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
reColumns := regexp.MustCompile("\t+: ")
|
|
|
|
scanner := bufio.NewScanner(file)
|
|
|
|
cpuInfos := []linuxCpuInfo{}
|
|
|
|
cpu := &linuxCpuInfo{}
|
|
|
|
for scanner.Scan() {
|
|
|
|
line := scanner.Text()
|
|
|
|
if sl := reColumns.Split(line, 2); len(sl) > 1 {
|
|
|
|
t := reflect.TypeOf(cpu).Elem()
|
|
|
|
s := reflect.ValueOf(cpu).Elem()
|
|
|
|
for i := range t.NumField() {
|
|
|
|
field := t.Field(i)
|
|
|
|
tag := field.Tag.Get("cpuinfo")
|
|
|
|
if tag == sl[0] {
|
|
|
|
s.FieldByName(field.Name).SetString(sl[1])
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else if strings.TrimSpace(line) == "" && cpu.ID != "" {
|
|
|
|
cpuInfos = append(cpuInfos, *cpu)
|
|
|
|
cpu = &linuxCpuInfo{}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Process the sockets/cores/threads
|
|
|
|
socketByID := map[string]*CPU{}
|
|
|
|
coreBySocket := map[string]map[string]struct{}{}
|
|
|
|
threadsByCoreBySocket := map[string]map[string]int{}
|
|
|
|
for _, c := range cpuInfos {
|
|
|
|
if _, found := socketByID[c.PhysicalID]; !found {
|
|
|
|
socketByID[c.PhysicalID] = &CPU{
|
|
|
|
ID: c.PhysicalID,
|
|
|
|
VendorID: c.VendorID,
|
|
|
|
ModelName: c.ModelName,
|
|
|
|
}
|
|
|
|
coreBySocket[c.PhysicalID] = map[string]struct{}{}
|
|
|
|
threadsByCoreBySocket[c.PhysicalID] = map[string]int{}
|
|
|
|
}
|
|
|
|
if c.CoreID != "" {
|
|
|
|
coreBySocket[c.PhysicalID][c.PhysicalID+":"+c.CoreID] = struct{}{}
|
|
|
|
threadsByCoreBySocket[c.PhysicalID][c.PhysicalID+":"+c.CoreID]++
|
|
|
|
} else {
|
|
|
|
coreBySocket[c.PhysicalID][c.PhysicalID+":"+c.ID] = struct{}{}
|
|
|
|
threadsByCoreBySocket[c.PhysicalID][c.PhysicalID+":"+c.ID]++
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Tally up the values from the tracking maps
|
|
|
|
for id, s := range socketByID {
|
|
|
|
s.CoreCount = len(coreBySocket[id])
|
|
|
|
s.ThreadCount = 0
|
|
|
|
for _, tc := range threadsByCoreBySocket[id] {
|
|
|
|
s.ThreadCount += tc
|
|
|
|
}
|
|
|
|
|
|
|
|
// This only works if HT is enabled, consider a more reliable model, maybe cache size comparisons?
|
|
|
|
efficiencyCoreCount := 0
|
|
|
|
for _, threads := range threadsByCoreBySocket[id] {
|
|
|
|
if threads == 1 {
|
|
|
|
efficiencyCoreCount++
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if efficiencyCoreCount == s.CoreCount {
|
|
|
|
// 1:1 mapping means they're not actually efficiency cores, but regular cores
|
|
|
|
s.EfficiencyCoreCount = 0
|
|
|
|
} else {
|
|
|
|
s.EfficiencyCoreCount = efficiencyCoreCount
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
result := []CPU{}
|
|
|
|
for _, c := range socketByID {
|
|
|
|
result = append(result, *c)
|
|
|
|
}
|
|
|
|
return result, nil
|
|
|
|
}
|