|
|
@ -17,7 +17,6 @@ package collector
|
|
|
|
|
|
|
|
|
|
|
|
import (
|
|
|
|
import (
|
|
|
|
"errors"
|
|
|
|
"errors"
|
|
|
|
"os"
|
|
|
|
|
|
|
|
"strconv"
|
|
|
|
"strconv"
|
|
|
|
"unsafe"
|
|
|
|
"unsafe"
|
|
|
|
|
|
|
|
|
|
|
@ -25,9 +24,8 @@ import (
|
|
|
|
)
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
/*
|
|
|
|
#cgo LDFLAGS: -lkvm
|
|
|
|
#cgo LDFLAGS:
|
|
|
|
#include <fcntl.h>
|
|
|
|
#include <fcntl.h>
|
|
|
|
#include <kvm.h>
|
|
|
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <sys/param.h>
|
|
|
|
#include <sys/param.h>
|
|
|
|
#include <sys/pcpu.h>
|
|
|
|
#include <sys/pcpu.h>
|
|
|
@ -35,17 +33,71 @@ import (
|
|
|
|
#include <sys/sysctl.h>
|
|
|
|
#include <sys/sysctl.h>
|
|
|
|
#include <sys/time.h>
|
|
|
|
#include <sys/time.h>
|
|
|
|
|
|
|
|
|
|
|
|
long _clockrate() {
|
|
|
|
static int mibs_set_up = 0;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
static int mib_kern_cp_times[2];
|
|
|
|
|
|
|
|
static size_t mib_kern_cp_times_len = 2;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
static const int mib_hw_ncpu[] = {CTL_HW, HW_NCPU};
|
|
|
|
|
|
|
|
static const size_t mib_hw_ncpu_len = 2;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
static const int mib_kern_clockrate[] = {CTL_KERN, KERN_CLOCKRATE};
|
|
|
|
|
|
|
|
static size_t mib_kern_clockrate_len = 2;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// Setup method for MIBs not available as constants.
|
|
|
|
|
|
|
|
// Calls to this method must be synchronized externally.
|
|
|
|
|
|
|
|
int setupSysctlMIBs() {
|
|
|
|
|
|
|
|
int ret = sysctlnametomib("kern.cp_times", mib_kern_cp_times, &mib_kern_cp_times_len);
|
|
|
|
|
|
|
|
if (ret == 0) mibs_set_up = 1;
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
int getCPUTimes(int *ncpu, double **cpu_times, size_t *cp_times_length) {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// Assert that mibs are set up through setupSysctlMIBs
|
|
|
|
|
|
|
|
if (!mibs_set_up) {
|
|
|
|
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// Retrieve number of cpu cores
|
|
|
|
|
|
|
|
size_t ncpu_size = sizeof(*ncpu);
|
|
|
|
|
|
|
|
if (sysctl(mib_hw_ncpu, mib_hw_ncpu_len, ncpu, &ncpu_size, NULL, 0) == -1 ||
|
|
|
|
|
|
|
|
sizeof(*ncpu) != ncpu_size) {
|
|
|
|
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// Retrieve clockrate
|
|
|
|
struct clockinfo clockrate;
|
|
|
|
struct clockinfo clockrate;
|
|
|
|
size_t size = sizeof(clockrate);
|
|
|
|
size_t clockrate_size = sizeof(clockrate);
|
|
|
|
int res = sysctlbyname("kern.clockrate", &clockrate, &size, NULL, 0);
|
|
|
|
if (sysctl(mib_kern_clockrate, mib_kern_clockrate_len, &clockrate, &clockrate_size, NULL, 0) == -1 ||
|
|
|
|
if (res == -1) {
|
|
|
|
sizeof(clockrate) != clockrate_size) {
|
|
|
|
return -1;
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (size != sizeof(clockrate)) {
|
|
|
|
|
|
|
|
return -2;
|
|
|
|
// Retrieve cp_times values
|
|
|
|
|
|
|
|
*cp_times_length = (*ncpu) * CPUSTATES;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
long cp_times[*cp_times_length];
|
|
|
|
|
|
|
|
size_t cp_times_size = sizeof(cp_times);
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if (sysctl(mib_kern_cp_times, mib_kern_cp_times_len, &cp_times, &cp_times_size, NULL, 0) == -1 ||
|
|
|
|
|
|
|
|
sizeof(cp_times) != cp_times_size) {
|
|
|
|
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return clockrate.stathz > 0 ? clockrate.stathz : clockrate.hz;
|
|
|
|
|
|
|
|
|
|
|
|
// Compute absolute time for different CPU states
|
|
|
|
|
|
|
|
long cpufreq = clockrate.stathz > 0 ? clockrate.stathz : clockrate.hz;
|
|
|
|
|
|
|
|
*cpu_times = (double *) malloc(sizeof(double)*(*cp_times_length));
|
|
|
|
|
|
|
|
for (int i = 0; i < (*cp_times_length); i++) {
|
|
|
|
|
|
|
|
(*cpu_times)[i] = ((double) cp_times[i]) / cpufreq;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
void freeCPUTimes(double *cpu_times) {
|
|
|
|
|
|
|
|
free(cpu_times);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
*/
|
|
|
|
*/
|
|
|
@ -62,6 +114,9 @@ func init() {
|
|
|
|
// Takes a prometheus registry and returns a new Collector exposing
|
|
|
|
// Takes a prometheus registry and returns a new Collector exposing
|
|
|
|
// CPU stats.
|
|
|
|
// CPU stats.
|
|
|
|
func NewStatCollector() (Collector, error) {
|
|
|
|
func NewStatCollector() (Collector, error) {
|
|
|
|
|
|
|
|
if C.setupSysctlMIBs() == -1 {
|
|
|
|
|
|
|
|
return nil, errors.New("could not initialize sysctl MIBs")
|
|
|
|
|
|
|
|
}
|
|
|
|
return &statCollector{
|
|
|
|
return &statCollector{
|
|
|
|
cpu: prometheus.NewCounterVec(
|
|
|
|
cpu: prometheus.NewCounterVec(
|
|
|
|
prometheus.CounterOpts{
|
|
|
|
prometheus.CounterOpts{
|
|
|
@ -74,50 +129,40 @@ func NewStatCollector() (Collector, error) {
|
|
|
|
}, nil
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// Expose CPU stats using KVM.
|
|
|
|
// Expose CPU stats using sysctl.
|
|
|
|
func (c *statCollector) Update(ch chan<- prometheus.Metric) (err error) {
|
|
|
|
func (c *statCollector) Update(ch chan<- prometheus.Metric) (err error) {
|
|
|
|
if os.Geteuid() != 0 && os.Getegid() != 2 {
|
|
|
|
|
|
|
|
return errors.New("caller should be either root user or kmem group to access /dev/mem")
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
var errbuf *C.char
|
|
|
|
// We want time spent per-cpu per CPUSTATE.
|
|
|
|
kd := C.kvm_open(nil, nil, nil, C.O_RDONLY, errbuf)
|
|
|
|
// CPUSTATES (number of CPUSTATES) is defined as 5U.
|
|
|
|
if errbuf != nil {
|
|
|
|
// Order: CP_USER | CP_NICE | CP_SYS | CP_IDLE | CP_INTR
|
|
|
|
return errors.New("failed to call kvm_open()")
|
|
|
|
// sysctl kern.cp_times provides hw.ncpu * CPUSTATES long integers:
|
|
|
|
}
|
|
|
|
// hw.ncpu * (space-separated list of the above variables)
|
|
|
|
defer C.kvm_close(kd)
|
|
|
|
//
|
|
|
|
|
|
|
|
// Each value is a counter incremented at frequency
|
|
|
|
// The cp_time variable is an array of CPUSTATES long integers -- in
|
|
|
|
// kern.clockrate.(stathz | hz)
|
|
|
|
// the same format as the kern.cp_time sysctl. According to the
|
|
|
|
//
|
|
|
|
// comments in sys/kern/kern_clock.c, the frequency of this timer will
|
|
|
|
// Look into sys/kern/kern_clock.c for details.
|
|
|
|
// be stathz (or hz, if stathz is zero).
|
|
|
|
|
|
|
|
clockrate, err := getClockRate()
|
|
|
|
var ncpu C.int
|
|
|
|
if err != nil {
|
|
|
|
var cpuTimesC *C.double
|
|
|
|
return err
|
|
|
|
var cpuTimesLength C.size_t
|
|
|
|
|
|
|
|
if C.getCPUTimes(&ncpu, &cpuTimesC, &cpuTimesLength) == -1 {
|
|
|
|
|
|
|
|
return errors.New("could not retrieve CPU times")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
defer C.freeCPUTimes(cpuTimesC)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// Convert C.double array to Go array (https://github.com/golang/go/wiki/cgo#turning-c-arrays-into-go-slices).
|
|
|
|
|
|
|
|
cpuTimes := (*[1 << 30]C.double)(unsafe.Pointer(cpuTimesC))[:cpuTimesLength:cpuTimesLength]
|
|
|
|
|
|
|
|
|
|
|
|
ncpus := C.kvm_getncpus(kd)
|
|
|
|
for cpu := 0; cpu < int(ncpu); cpu++ {
|
|
|
|
for i := 0; i < int(ncpus); i++ {
|
|
|
|
base_idx := C.CPUSTATES * cpu
|
|
|
|
pcpu := C.kvm_getpcpu(kd, C.int(i))
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(cpu), "mode": "user"}).Set(float64(cpuTimes[base_idx+C.CP_USER]))
|
|
|
|
cp_time := ((*C.struct_pcpu)(unsafe.Pointer(pcpu))).pc_cp_time
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(cpu), "mode": "nice"}).Set(float64(cpuTimes[base_idx+C.CP_NICE]))
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(i), "mode": "user"}).Set(float64(cp_time[C.CP_USER]) / clockrate)
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(cpu), "mode": "system"}).Set(float64(cpuTimes[base_idx+C.CP_SYS]))
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(i), "mode": "nice"}).Set(float64(cp_time[C.CP_NICE]) / clockrate)
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(cpu), "mode": "interrupt"}).Set(float64(cpuTimes[base_idx+C.CP_INTR]))
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(i), "mode": "system"}).Set(float64(cp_time[C.CP_SYS]) / clockrate)
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(cpu), "mode": "idle"}).Set(float64(cpuTimes[base_idx+C.CP_IDLE]))
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(i), "mode": "interrupt"}).Set(float64(cp_time[C.CP_INTR]) / clockrate)
|
|
|
|
|
|
|
|
c.cpu.With(prometheus.Labels{"cpu": strconv.Itoa(i), "mode": "idle"}).Set(float64(cp_time[C.CP_IDLE]) / clockrate)
|
|
|
|
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
c.cpu.Collect(ch)
|
|
|
|
c.cpu.Collect(ch)
|
|
|
|
return err
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
func getClockRate() (float64, error) {
|
|
|
|
|
|
|
|
clockrate := C._clockrate()
|
|
|
|
|
|
|
|
if clockrate == -1 {
|
|
|
|
|
|
|
|
return 0, errors.New("sysctl(kern.clockrate) failed")
|
|
|
|
|
|
|
|
} else if clockrate == -2 {
|
|
|
|
|
|
|
|
return 0, errors.New("sysctl(kern.clockrate) failed, wrong buffer size")
|
|
|
|
|
|
|
|
} else if clockrate <= 0 {
|
|
|
|
|
|
|
|
return 0, errors.New("sysctl(kern.clockrate) bad clocktime")
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
return float64(clockrate), nil
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|