mirror of
https://github.com/ClusterCockpit/cc-metric-collector.git
synced 2024-11-10 12:37:25 +01:00
391 lines
10 KiB
Go
391 lines
10 KiB
Go
package ccTopology
|
|
|
|
import (
|
|
"bufio"
|
|
"fmt"
|
|
"log"
|
|
"os"
|
|
"path/filepath"
|
|
"regexp"
|
|
"strconv"
|
|
"strings"
|
|
|
|
cclogger "github.com/ClusterCockpit/cc-metric-collector/pkg/ccLogger"
|
|
"golang.org/x/exp/slices"
|
|
)
|
|
|
|
const (
|
|
SYSFS_NUMABASE = `/sys/devices/system/node`
|
|
SYSFS_CPUBASE = `/sys/devices/system/cpu`
|
|
PROCFS_CPUINFO = `/proc/cpuinfo`
|
|
)
|
|
|
|
// Structure holding all information about a hardware thread
|
|
type HwthreadEntry struct {
|
|
CpuID int // CPU hardware threads
|
|
SMT int // symmetric hyper threading ID
|
|
Core int // CPU core ID
|
|
Socket int // CPU sockets (physical) ID
|
|
Die int // CPU Die ID
|
|
NumaDomain int // NUMA Domain
|
|
}
|
|
|
|
var cache struct {
|
|
HwthreadList, uniqHwthreadList []int // List of CPU hardware threads
|
|
SMTList, uniqSMTList []int // List of symmetric hyper threading IDs
|
|
CoreList, uniqCoreList []int // List of CPU core IDs
|
|
SocketList, uniqSocketList []int // List of CPU sockets (physical) IDs
|
|
DieList, uniqDieList []int // List of CPU Die IDs
|
|
NumaDomainList, uniqNumaDomainList []int // List of NUMA Domains
|
|
|
|
CpuData []HwthreadEntry
|
|
}
|
|
|
|
// init initializes the cache structure
|
|
func init() {
|
|
file, err := os.Open(PROCFS_CPUINFO)
|
|
if err != nil {
|
|
log.Print(err)
|
|
return
|
|
}
|
|
defer file.Close()
|
|
|
|
scanner := bufio.NewScanner(file)
|
|
for scanner.Scan() {
|
|
lineSplit := strings.Split(scanner.Text(), ":")
|
|
if len(lineSplit) == 2 {
|
|
key := strings.TrimSpace(lineSplit[0])
|
|
value := strings.TrimSpace(lineSplit[1])
|
|
switch key {
|
|
case "physical id":
|
|
id, err := strconv.Atoi(value)
|
|
if err != nil {
|
|
log.Print(err)
|
|
return
|
|
}
|
|
cache.SocketList = append(cache.SocketList, id)
|
|
case "processor":
|
|
id, err := strconv.Atoi(value)
|
|
if err != nil {
|
|
log.Print(err)
|
|
return
|
|
}
|
|
cache.HwthreadList = append(cache.HwthreadList, id)
|
|
}
|
|
}
|
|
}
|
|
|
|
getSMT :=
|
|
func(cpuID int, basePath string) int {
|
|
// Read thread sibling list
|
|
buffer, err := os.ReadFile(filepath.Join(basePath, "thread_siblings_list"))
|
|
if err != nil {
|
|
cclogger.ComponentError("CCTopology", "init", err.Error())
|
|
}
|
|
|
|
// Create thread sibling list
|
|
threadList := make([]int, 0)
|
|
stringBuffer := strings.TrimSpace(string(buffer))
|
|
for _, x := range strings.Split(stringBuffer, ",") {
|
|
id, err := strconv.Atoi(x)
|
|
if err != nil {
|
|
cclogger.ComponentError("CCTopology", "init", err.Error())
|
|
}
|
|
threadList = append(threadList, id)
|
|
}
|
|
|
|
// Find index of CPU ID in thread sibling list
|
|
// if not found return -1
|
|
return slices.Index(threadList, cpuID)
|
|
}
|
|
|
|
getNumaDomain :=
|
|
func(basePath string) int {
|
|
globPath := filepath.Join(basePath, "node*")
|
|
regexPath := filepath.Join(basePath, "node([[:digit:]]+)")
|
|
regex := regexp.MustCompile(regexPath)
|
|
|
|
// File globbing for NUMA node
|
|
files, err := filepath.Glob(globPath)
|
|
if err != nil {
|
|
cclogger.ComponentError("CCTopology", "CpuData:getNumaDomain", err.Error())
|
|
}
|
|
if len(files) != 1 {
|
|
return -1
|
|
}
|
|
|
|
// Extract NUMA node ID
|
|
matches := regex.FindStringSubmatch(files[0])
|
|
if len(matches) != 2 {
|
|
return -1
|
|
}
|
|
id, err := strconv.Atoi(matches[1])
|
|
if err != nil {
|
|
return -1
|
|
}
|
|
|
|
return id
|
|
}
|
|
|
|
cache.CoreList = make([]int, len(cache.HwthreadList))
|
|
cache.DieList = make([]int, len(cache.HwthreadList))
|
|
cache.SMTList = make([]int, len(cache.HwthreadList))
|
|
cache.NumaDomainList = make([]int, len(cache.HwthreadList))
|
|
for i, c := range cache.HwthreadList {
|
|
// Set base directory for topology lookup
|
|
base :=
|
|
filepath.Join(
|
|
"/sys/devices/system/cpu",
|
|
fmt.Sprintf("cpu%d", c),
|
|
)
|
|
topoBase := filepath.Join(base, "topology")
|
|
|
|
// Lookup Core ID
|
|
cache.CoreList[i] = fileToInt(filepath.Join(topoBase, "core_id"))
|
|
|
|
// Lookup CPU die id
|
|
cache.DieList[i] = fileToInt(filepath.Join(topoBase, "die_id"))
|
|
if cache.DieList[i] < 0 {
|
|
cache.DieList[i] = cache.SocketList[i]
|
|
}
|
|
|
|
// Lookup SMT thread id
|
|
cache.SMTList[i] = getSMT(c, topoBase)
|
|
|
|
// Lookup NUMA domain id
|
|
cache.NumaDomainList[i] = getNumaDomain(base)
|
|
}
|
|
|
|
cache.uniqHwthreadList = slices.Clone(cache.HwthreadList)
|
|
slices.Sort(cache.uniqHwthreadList)
|
|
cache.uniqHwthreadList = slices.Compact(cache.uniqHwthreadList)
|
|
|
|
cache.uniqSMTList = slices.Clone(cache.SMTList)
|
|
slices.Sort(cache.uniqSMTList)
|
|
cache.uniqSMTList = slices.Compact(cache.uniqSMTList)
|
|
|
|
cache.uniqCoreList = slices.Clone(cache.CoreList)
|
|
slices.Sort(cache.uniqCoreList)
|
|
cache.uniqCoreList = slices.Compact(cache.uniqCoreList)
|
|
|
|
cache.uniqSocketList = slices.Clone(cache.SocketList)
|
|
slices.Sort(cache.uniqSocketList)
|
|
cache.uniqSocketList = slices.Compact(cache.uniqSocketList)
|
|
|
|
cache.uniqDieList = slices.Clone(cache.DieList)
|
|
slices.Sort(cache.uniqDieList)
|
|
cache.uniqDieList = slices.Compact(cache.uniqDieList)
|
|
|
|
cache.uniqNumaDomainList = slices.Clone(cache.NumaDomainList)
|
|
slices.Sort(cache.uniqNumaDomainList)
|
|
cache.uniqNumaDomainList = slices.Compact(cache.uniqNumaDomainList)
|
|
|
|
cache.CpuData = make([]HwthreadEntry, len(cache.HwthreadList))
|
|
for i := range cache.HwthreadList {
|
|
cache.CpuData[i] =
|
|
HwthreadEntry{
|
|
CpuID: cache.HwthreadList[i],
|
|
SMT: cache.SMTList[i],
|
|
Socket: cache.SocketList[i],
|
|
NumaDomain: cache.NumaDomainList[i],
|
|
Die: cache.DieList[i],
|
|
Core: cache.CoreList[i],
|
|
}
|
|
}
|
|
}
|
|
|
|
// fileToInt reads an integer value from a file
|
|
// In case of an error -1 is returned
|
|
// Used internally for sysfs file reads
|
|
func fileToInt(path string) int {
|
|
buffer, err := os.ReadFile(path)
|
|
if err != nil {
|
|
log.Print(err)
|
|
cclogger.ComponentError("ccTopology", "Reading", path, ":", err.Error())
|
|
return -1
|
|
}
|
|
stringBuffer := strings.TrimSpace(string(buffer))
|
|
id, err := strconv.Atoi(stringBuffer)
|
|
if err != nil {
|
|
cclogger.ComponentError("ccTopology", "Parsing", path, ":", stringBuffer, err.Error())
|
|
return -1
|
|
}
|
|
return id
|
|
}
|
|
|
|
// SocketList gets the list of CPU socket IDs
|
|
func SocketList() []int {
|
|
return slices.Clone(cache.uniqSocketList)
|
|
}
|
|
|
|
// HwthreadList gets the list of hardware thread IDs in the order of listing in /proc/cpuinfo
|
|
func HwthreadList() []int {
|
|
return slices.Clone(cache.uniqHwthreadList)
|
|
}
|
|
|
|
// Get list of hardware thread IDs in the order of listing in /proc/cpuinfo
|
|
// Deprecated! Use HwthreadList()
|
|
func CpuList() []int {
|
|
return HwthreadList()
|
|
}
|
|
|
|
// CoreList gets the list of CPU core IDs in the order of listing in /proc/cpuinfo
|
|
func CoreList() []int {
|
|
return slices.Clone(cache.uniqCoreList)
|
|
}
|
|
|
|
// Get list of NUMA node IDs
|
|
func NumaNodeList() []int {
|
|
return slices.Clone(cache.uniqNumaDomainList)
|
|
}
|
|
|
|
// DieList gets the list of CPU die IDs
|
|
func DieList() []int {
|
|
if len(cache.uniqDieList) > 0 {
|
|
return slices.Clone(cache.uniqDieList)
|
|
}
|
|
return SocketList()
|
|
}
|
|
|
|
// GetTypeList gets the list of specified type using the naming format inside ClusterCockpit
|
|
func GetTypeList(topology_type string) []int {
|
|
switch topology_type {
|
|
case "node":
|
|
return []int{0}
|
|
case "socket":
|
|
return SocketList()
|
|
case "die":
|
|
return DieList()
|
|
case "memoryDomain":
|
|
return NumaNodeList()
|
|
case "core":
|
|
return CoreList()
|
|
case "hwthread":
|
|
return HwthreadList()
|
|
}
|
|
return []int{}
|
|
}
|
|
|
|
// CpuData returns CPU data for each hardware thread
|
|
func CpuData() []HwthreadEntry {
|
|
return slices.Clone(cache.CpuData)
|
|
}
|
|
|
|
// Structure holding basic information about a CPU
|
|
type CpuInformation struct {
|
|
NumHWthreads int
|
|
SMTWidth int
|
|
NumSockets int
|
|
NumDies int
|
|
NumCores int
|
|
NumNumaDomains int
|
|
}
|
|
|
|
// CpuInformation reports basic information about the CPU
|
|
func CpuInfo() CpuInformation {
|
|
return CpuInformation{
|
|
NumNumaDomains: len(cache.uniqNumaDomainList),
|
|
SMTWidth: len(cache.uniqSMTList),
|
|
NumDies: len(cache.uniqDieList),
|
|
NumCores: len(cache.uniqCoreList),
|
|
NumSockets: len(cache.uniqSocketList),
|
|
NumHWthreads: len(cache.uniqHwthreadList),
|
|
}
|
|
}
|
|
|
|
// GetHwthreadSocket gets the CPU socket ID for a given hardware thread ID
|
|
// In case hardware thread ID is not found -1 is returned
|
|
func GetHwthreadSocket(cpuID int) int {
|
|
for i := range cache.CpuData {
|
|
d := &cache.CpuData[i]
|
|
if d.CpuID == cpuID {
|
|
return d.Socket
|
|
}
|
|
}
|
|
return -1
|
|
}
|
|
|
|
// GetHwthreadNumaDomain gets the NUMA domain ID for a given hardware thread ID
|
|
// In case hardware thread ID is not found -1 is returned
|
|
func GetHwthreadNumaDomain(cpuID int) int {
|
|
for i := range cache.CpuData {
|
|
d := &cache.CpuData[i]
|
|
if d.CpuID == cpuID {
|
|
return d.NumaDomain
|
|
}
|
|
}
|
|
return -1
|
|
}
|
|
|
|
// GetHwthreadDie gets the CPU die ID for a given hardware thread ID
|
|
// In case hardware thread ID is not found -1 is returned
|
|
func GetHwthreadDie(cpuID int) int {
|
|
for i := range cache.CpuData {
|
|
d := &cache.CpuData[i]
|
|
if d.CpuID == cpuID {
|
|
return d.Die
|
|
}
|
|
}
|
|
return -1
|
|
}
|
|
|
|
// GetHwthreadCore gets the CPU core ID for a given hardware thread ID
|
|
// In case hardware thread ID is not found -1 is returned
|
|
func GetHwthreadCore(cpuID int) int {
|
|
for i := range cache.CpuData {
|
|
d := &cache.CpuData[i]
|
|
if d.CpuID == cpuID {
|
|
return d.Core
|
|
}
|
|
}
|
|
return -1
|
|
}
|
|
|
|
// GetSocketHwthreads gets all hardware thread IDs associated with a CPU socket
|
|
func GetSocketHwthreads(socket int) []int {
|
|
cpuList := make([]int, 0)
|
|
for i := range cache.CpuData {
|
|
d := &cache.CpuData[i]
|
|
if d.Socket == socket {
|
|
cpuList = append(cpuList, d.CpuID)
|
|
}
|
|
}
|
|
return cpuList
|
|
}
|
|
|
|
// GetNumaDomainHwthreads gets the all hardware thread IDs associated with a NUMA domain
|
|
func GetNumaDomainHwthreads(numaDomain int) []int {
|
|
cpuList := make([]int, 0)
|
|
for i := range cache.CpuData {
|
|
d := &cache.CpuData[i]
|
|
if d.NumaDomain == numaDomain {
|
|
cpuList = append(cpuList, d.CpuID)
|
|
}
|
|
}
|
|
return cpuList
|
|
}
|
|
|
|
// GetDieHwthreads gets all hardware thread IDs associated with a CPU die
|
|
func GetDieHwthreads(die int) []int {
|
|
cpuList := make([]int, 0)
|
|
for i := range cache.CpuData {
|
|
d := &cache.CpuData[i]
|
|
if d.Die == die {
|
|
cpuList = append(cpuList, d.CpuID)
|
|
}
|
|
}
|
|
return cpuList
|
|
}
|
|
|
|
// GetCoreHwthreads get all hardware thread IDs associated with a CPU core
|
|
func GetCoreHwthreads(core int) []int {
|
|
cpuList := make([]int, 0)
|
|
for i := range cache.CpuData {
|
|
d := &cache.CpuData[i]
|
|
if d.Core == core {
|
|
cpuList = append(cpuList, d.CpuID)
|
|
}
|
|
}
|
|
return cpuList
|
|
}
|