gpu_linux.go 5.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186
  1. package discover
  2. import (
  3. "bufio"
  4. "fmt"
  5. "os"
  6. "reflect"
  7. "regexp"
  8. "strings"
  9. "github.com/ollama/ollama/format"
  10. )
  11. var CudartGlobs = []string{
  12. "/usr/local/cuda/lib64/libcudart.so*",
  13. "/usr/lib/x86_64-linux-gnu/nvidia/current/libcudart.so*",
  14. "/usr/lib/x86_64-linux-gnu/libcudart.so*",
  15. "/usr/lib/wsl/lib/libcudart.so*",
  16. "/usr/lib/wsl/drivers/*/libcudart.so*",
  17. "/opt/cuda/lib64/libcudart.so*",
  18. "/usr/local/cuda*/targets/aarch64-linux/lib/libcudart.so*",
  19. "/usr/lib/aarch64-linux-gnu/nvidia/current/libcudart.so*",
  20. "/usr/lib/aarch64-linux-gnu/libcudart.so*",
  21. "/usr/local/cuda/lib*/libcudart.so*",
  22. "/usr/lib*/libcudart.so*",
  23. "/usr/local/lib*/libcudart.so*",
  24. }
  25. var NvmlGlobs = []string{}
  26. var NvcudaGlobs = []string{
  27. "/usr/local/cuda*/targets/*/lib/libcuda.so*",
  28. "/usr/lib/*-linux-gnu/nvidia/current/libcuda.so*",
  29. "/usr/lib/*-linux-gnu/libcuda.so*",
  30. "/usr/lib/wsl/lib/libcuda.so*",
  31. "/usr/lib/wsl/drivers/*/libcuda.so*",
  32. "/opt/cuda/lib*/libcuda.so*",
  33. "/usr/local/cuda/lib*/libcuda.so*",
  34. "/usr/lib*/libcuda.so*",
  35. "/usr/local/lib*/libcuda.so*",
  36. }
  37. var OneapiGlobs = []string{
  38. "/usr/lib/x86_64-linux-gnu/libze_intel_gpu.so*",
  39. "/usr/lib*/libze_intel_gpu.so*",
  40. }
  41. var (
  42. CudartMgmtName = "libcudart.so*"
  43. NvcudaMgmtName = "libcuda.so*"
  44. NvmlMgmtName = "" // not currently wired on linux
  45. OneapiMgmtName = "libze_intel_gpu.so*"
  46. )
  47. func GetCPUMem() (memInfo, error) {
  48. var mem memInfo
  49. var total, available, free, buffers, cached, freeSwap uint64
  50. f, err := os.Open("/proc/meminfo")
  51. if err != nil {
  52. return mem, err
  53. }
  54. defer f.Close()
  55. s := bufio.NewScanner(f)
  56. for s.Scan() {
  57. line := s.Text()
  58. switch {
  59. case strings.HasPrefix(line, "MemTotal:"):
  60. _, err = fmt.Sscanf(line, "MemTotal:%d", &total)
  61. case strings.HasPrefix(line, "MemAvailable:"):
  62. _, err = fmt.Sscanf(line, "MemAvailable:%d", &available)
  63. case strings.HasPrefix(line, "MemFree:"):
  64. _, err = fmt.Sscanf(line, "MemFree:%d", &free)
  65. case strings.HasPrefix(line, "Buffers:"):
  66. _, err = fmt.Sscanf(line, "Buffers:%d", &buffers)
  67. case strings.HasPrefix(line, "Cached:"):
  68. _, err = fmt.Sscanf(line, "Cached:%d", &cached)
  69. case strings.HasPrefix(line, "SwapFree:"):
  70. _, err = fmt.Sscanf(line, "SwapFree:%d", &freeSwap)
  71. default:
  72. continue
  73. }
  74. if err != nil {
  75. return mem, err
  76. }
  77. }
  78. mem.TotalMemory = total * format.KibiByte
  79. mem.FreeSwap = freeSwap * format.KibiByte
  80. if available > 0 {
  81. mem.FreeMemory = available * format.KibiByte
  82. } else {
  83. mem.FreeMemory = (free + buffers + cached) * format.KibiByte
  84. }
  85. return mem, nil
  86. }
  87. const CpuInfoFilename = "/proc/cpuinfo"
  88. type linuxCpuInfo struct {
  89. ID string `cpuinfo:"processor"`
  90. VendorID string `cpuinfo:"vendor_id"`
  91. ModelName string `cpuinfo:"model name"`
  92. PhysicalID string `cpuinfo:"physical id"`
  93. Siblings string `cpuinfo:"siblings"`
  94. CoreID string `cpuinfo:"core id"`
  95. }
  96. func GetCPUDetails() ([]CPU, error) {
  97. file, err := os.Open(CpuInfoFilename)
  98. if err != nil {
  99. return nil, err
  100. }
  101. reColumns := regexp.MustCompile("\t+: ")
  102. scanner := bufio.NewScanner(file)
  103. cpuInfos := []linuxCpuInfo{}
  104. cpu := &linuxCpuInfo{}
  105. for scanner.Scan() {
  106. line := scanner.Text()
  107. if sl := reColumns.Split(line, 2); len(sl) > 1 {
  108. t := reflect.TypeOf(cpu).Elem()
  109. s := reflect.ValueOf(cpu).Elem()
  110. for i := range t.NumField() {
  111. field := t.Field(i)
  112. tag := field.Tag.Get("cpuinfo")
  113. if tag == sl[0] {
  114. s.FieldByName(field.Name).SetString(sl[1])
  115. break
  116. }
  117. }
  118. } else if strings.TrimSpace(line) == "" && cpu.ID != "" {
  119. cpuInfos = append(cpuInfos, *cpu)
  120. cpu = &linuxCpuInfo{}
  121. }
  122. }
  123. // Process the sockets/cores/threads
  124. socketByID := map[string]*CPU{}
  125. coreBySocket := map[string]map[string]struct{}{}
  126. threadsByCoreBySocket := map[string]map[string]int{}
  127. for _, c := range cpuInfos {
  128. if _, found := socketByID[c.PhysicalID]; !found {
  129. socketByID[c.PhysicalID] = &CPU{
  130. ID: c.PhysicalID,
  131. VendorID: c.VendorID,
  132. ModelName: c.ModelName,
  133. }
  134. coreBySocket[c.PhysicalID] = map[string]struct{}{}
  135. threadsByCoreBySocket[c.PhysicalID] = map[string]int{}
  136. }
  137. if c.CoreID != "" {
  138. coreBySocket[c.PhysicalID][c.PhysicalID+":"+c.CoreID] = struct{}{}
  139. threadsByCoreBySocket[c.PhysicalID][c.PhysicalID+":"+c.CoreID]++
  140. } else {
  141. coreBySocket[c.PhysicalID][c.PhysicalID+":"+c.ID] = struct{}{}
  142. threadsByCoreBySocket[c.PhysicalID][c.PhysicalID+":"+c.ID]++
  143. }
  144. }
  145. // Tally up the values from the tracking maps
  146. for id, s := range socketByID {
  147. s.CoreCount = len(coreBySocket[id])
  148. s.ThreadCount = 0
  149. for _, tc := range threadsByCoreBySocket[id] {
  150. s.ThreadCount += tc
  151. }
  152. // This only works if HT is enabled, consider a more reliable model, maybe cache size comparisons?
  153. efficiencyCoreCount := 0
  154. for _, threads := range threadsByCoreBySocket[id] {
  155. if threads == 1 {
  156. efficiencyCoreCount++
  157. }
  158. }
  159. if efficiencyCoreCount == s.CoreCount {
  160. // 1:1 mapping means they're not actually efficiency cores, but regular cores
  161. s.EfficiencyCoreCount = 0
  162. } else {
  163. s.EfficiencyCoreCount = efficiencyCoreCount
  164. }
  165. }
  166. result := []CPU{}
  167. for _, c := range socketByID {
  168. result = append(result, *c)
  169. }
  170. return result, nil
  171. }