mirror of
https://github.com/kubernetes-sigs/node-feature-discovery.git
synced 2024-12-14 11:57:51 +00:00
source/cpu: better error reporting
Drop confusing errors in the log when intel pstate or cstate driver is not enabled in the system. However, we still log an error if sysfs is not available at all, in which case we're not able to detect these correctly.
This commit is contained in:
parent
73704e2e11
commit
43e0f83940
3 changed files with 49 additions and 19 deletions
|
@ -147,10 +147,10 @@ func (s *Source) Discover() (source.Features, error) {
|
||||||
}
|
}
|
||||||
|
|
||||||
// Detect cstate configuration
|
// Detect cstate configuration
|
||||||
cstate, err := detectCstate()
|
cstate, ok, err := detectCstate()
|
||||||
if err != nil {
|
if err != nil {
|
||||||
klog.Errorf("failed to detect cstate: %v", err)
|
klog.Error(err)
|
||||||
} else {
|
} else if ok {
|
||||||
features["cstate.enabled"] = cstate
|
features["cstate.enabled"] = cstate
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -19,33 +19,49 @@ package cpu
|
||||||
import (
|
import (
|
||||||
"fmt"
|
"fmt"
|
||||||
"io/ioutil"
|
"io/ioutil"
|
||||||
|
"os"
|
||||||
|
"path/filepath"
|
||||||
"strconv"
|
"strconv"
|
||||||
"strings"
|
"strings"
|
||||||
|
|
||||||
|
"k8s.io/klog/v2"
|
||||||
|
|
||||||
"sigs.k8s.io/node-feature-discovery/source"
|
"sigs.k8s.io/node-feature-discovery/source"
|
||||||
)
|
)
|
||||||
|
|
||||||
// Discover if c-states are enabled
|
// Discover if c-states are enabled
|
||||||
func detectCstate() (bool, error) {
|
func detectCstate() (bool, bool, error) {
|
||||||
// When the intel_idle driver is in use (default), check setting of max_cstates
|
// Check that sysfs is available
|
||||||
driver, err := ioutil.ReadFile(source.SysfsDir.Path("devices/system/cpu/cpuidle/current_driver"))
|
sysfsBase := source.SysfsDir.Path("devices/system/cpu")
|
||||||
if err != nil {
|
if _, err := os.Stat(sysfsBase); err != nil {
|
||||||
return false, fmt.Errorf("cannot get driver for cpuidle: %s", err.Error())
|
return false, false, fmt.Errorf("unable to detect cstate status: %w", err)
|
||||||
|
}
|
||||||
|
cpuidleDir := filepath.Join(sysfsBase, "cpuidle")
|
||||||
|
if _, err := os.Stat(cpuidleDir); os.IsNotExist(err) {
|
||||||
|
klog.V(1).Info("cpuidle disabled in the kernel")
|
||||||
|
return false, false, nil
|
||||||
}
|
}
|
||||||
|
|
||||||
if strings.TrimSpace(string(driver)) != "intel_idle" {
|
// When the intel_idle driver is in use (default), check setting of max_cstates
|
||||||
|
driver, err := ioutil.ReadFile(filepath.Join(cpuidleDir, "current_driver"))
|
||||||
|
if err != nil {
|
||||||
|
return false, false, fmt.Errorf("cannot get driver for cpuidle: %w", err)
|
||||||
|
}
|
||||||
|
|
||||||
|
if d := strings.TrimSpace(string(driver)); d != "intel_idle" {
|
||||||
// Currently only checking intel_idle driver for cstates
|
// Currently only checking intel_idle driver for cstates
|
||||||
return false, fmt.Errorf("intel_idle driver is not in use: %s", string(driver))
|
klog.V(1).Infof("intel_idle driver is not in use (%s is active)", d)
|
||||||
|
return false, false, nil
|
||||||
}
|
}
|
||||||
|
|
||||||
data, err := ioutil.ReadFile(source.SysfsDir.Path("module/intel_idle/parameters/max_cstate"))
|
data, err := ioutil.ReadFile(source.SysfsDir.Path("module/intel_idle/parameters/max_cstate"))
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return false, fmt.Errorf("cannot determine cstate from max_cstates: %s", err.Error())
|
return false, false, fmt.Errorf("cannot determine cstate from max_cstates: %w", err)
|
||||||
}
|
}
|
||||||
cstates, err := strconv.Atoi(strings.TrimSpace(string(data)))
|
cstates, err := strconv.Atoi(strings.TrimSpace(string(data)))
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return false, fmt.Errorf("non-integer value of cstates: %s", err.Error())
|
return false, false, fmt.Errorf("non-integer value of cstates: %w", err)
|
||||||
}
|
}
|
||||||
|
|
||||||
return cstates > 0, nil
|
return cstates > 0, true, nil
|
||||||
}
|
}
|
||||||
|
|
|
@ -19,6 +19,8 @@ package cpu
|
||||||
import (
|
import (
|
||||||
"fmt"
|
"fmt"
|
||||||
"io/ioutil"
|
"io/ioutil"
|
||||||
|
"os"
|
||||||
|
"path/filepath"
|
||||||
"runtime"
|
"runtime"
|
||||||
"strings"
|
"strings"
|
||||||
|
|
||||||
|
@ -35,10 +37,21 @@ func detectPstate() (map[string]string, error) {
|
||||||
return nil, nil
|
return nil, nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Check that sysfs is available
|
||||||
|
sysfsBase := source.SysfsDir.Path("devices/system/cpu")
|
||||||
|
if _, err := os.Stat(sysfsBase); err != nil {
|
||||||
|
return nil, fmt.Errorf("unable to detect pstate status: %w", err)
|
||||||
|
}
|
||||||
|
pstateDir := filepath.Join(sysfsBase, "intel_pstate")
|
||||||
|
if _, err := os.Stat(pstateDir); os.IsNotExist(err) {
|
||||||
|
klog.V(1).Info("intel pstate driver not enabled")
|
||||||
|
return nil, nil
|
||||||
|
}
|
||||||
|
|
||||||
// Get global pstate status
|
// Get global pstate status
|
||||||
data, err := ioutil.ReadFile(source.SysfsDir.Path("devices/system/cpu/intel_pstate/status"))
|
data, err := ioutil.ReadFile(filepath.Join(pstateDir, "status"))
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return nil, fmt.Errorf("could not read pstate status: %s", err.Error())
|
return nil, fmt.Errorf("could not read pstate status: %w", err)
|
||||||
}
|
}
|
||||||
status := strings.TrimSpace(string(data))
|
status := strings.TrimSpace(string(data))
|
||||||
if status == "off" {
|
if status == "off" {
|
||||||
|
@ -49,7 +62,7 @@ func detectPstate() (map[string]string, error) {
|
||||||
features := map[string]string{"status": status}
|
features := map[string]string{"status": status}
|
||||||
|
|
||||||
// Check turbo boost
|
// Check turbo boost
|
||||||
bytes, err := ioutil.ReadFile(source.SysfsDir.Path("devices/system/cpu/intel_pstate/no_turbo"))
|
bytes, err := ioutil.ReadFile(filepath.Join(pstateDir, "no_turbo"))
|
||||||
if err != nil {
|
if err != nil {
|
||||||
klog.Errorf("can't detect whether turbo boost is enabled: %s", err.Error())
|
klog.Errorf("can't detect whether turbo boost is enabled: %s", err.Error())
|
||||||
} else {
|
} else {
|
||||||
|
@ -65,7 +78,8 @@ func detectPstate() (map[string]string, error) {
|
||||||
}
|
}
|
||||||
|
|
||||||
// Determine scaling governor that is being used
|
// Determine scaling governor that is being used
|
||||||
policies, err := ioutil.ReadDir(source.SysfsDir.Path("devices/system/cpu/cpufreq"))
|
cpufreqDir := filepath.Join(sysfsBase, "cpufreq")
|
||||||
|
policies, err := ioutil.ReadDir(cpufreqDir)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
klog.Errorf("failed to read cpufreq directory: %s", err.Error())
|
klog.Errorf("failed to read cpufreq directory: %s", err.Error())
|
||||||
return features, nil
|
return features, nil
|
||||||
|
@ -74,7 +88,7 @@ func detectPstate() (map[string]string, error) {
|
||||||
scaling := ""
|
scaling := ""
|
||||||
for _, policy := range policies {
|
for _, policy := range policies {
|
||||||
// Ensure at least one cpu is using this policy
|
// Ensure at least one cpu is using this policy
|
||||||
cpus, err := ioutil.ReadFile(source.SysfsDir.Path("devices/system/cpu/cpufreq", policy.Name(), "affected_cpus"))
|
cpus, err := ioutil.ReadFile(filepath.Join(cpufreqDir, policy.Name(), "affected_cpus"))
|
||||||
if err != nil {
|
if err != nil {
|
||||||
klog.Errorf("could not read cpufreq policy %s affected_cpus", policy.Name())
|
klog.Errorf("could not read cpufreq policy %s affected_cpus", policy.Name())
|
||||||
continue
|
continue
|
||||||
|
@ -84,7 +98,7 @@ func detectPstate() (map[string]string, error) {
|
||||||
continue
|
continue
|
||||||
}
|
}
|
||||||
|
|
||||||
data, err := ioutil.ReadFile(source.SysfsDir.Path("devices/system/cpu/cpufreq", policy.Name(), "scaling_governor"))
|
data, err := ioutil.ReadFile(filepath.Join(cpufreqDir, policy.Name(), "scaling_governor"))
|
||||||
if err != nil {
|
if err != nil {
|
||||||
klog.Errorf("could not read cpufreq policy %s scaling_governor", policy.Name())
|
klog.Errorf("could not read cpufreq policy %s scaling_governor", policy.Name())
|
||||||
continue
|
continue
|
||||||
|
|
Loading…
Reference in a new issue