Move stat_linux to cpu_linux and add cpufreq stats (#548)
parent
798950d25b
commit
2e9f1913b8
|
@ -23,7 +23,7 @@ Name | Description | OS
|
||||||
---------|-------------|----
|
---------|-------------|----
|
||||||
arp | Exposes ARP statistics from `/proc/net/arp`. | Linux
|
arp | Exposes ARP statistics from `/proc/net/arp`. | Linux
|
||||||
conntrack | Shows conntrack statistics (does nothing if no `/proc/sys/net/netfilter/` present). | Linux
|
conntrack | Shows conntrack statistics (does nothing if no `/proc/sys/net/netfilter/` present). | Linux
|
||||||
cpu | Exposes CPU statistics | Darwin, Dragonfly, FreeBSD
|
cpu | Exposes CPU statistics | Darwin, Dragonfly, FreeBSD, Linux
|
||||||
diskstats | Exposes disk I/O statistics from `/proc/diskstats`. | Linux
|
diskstats | Exposes disk I/O statistics from `/proc/diskstats`. | Linux
|
||||||
edac | Exposes error detection and correction statistics. | Linux
|
edac | Exposes error detection and correction statistics. | Linux
|
||||||
entropy | Exposes available entropy. | Linux
|
entropy | Exposes available entropy. | Linux
|
||||||
|
@ -38,7 +38,7 @@ meminfo | Exposes memory statistics. | Darwin, Dragonfly, FreeBSD, Linux
|
||||||
netdev | Exposes network interface statistics such as bytes transferred. | Darwin, Dragonfly, FreeBSD, Linux, OpenBSD
|
netdev | Exposes network interface statistics such as bytes transferred. | Darwin, Dragonfly, FreeBSD, Linux, OpenBSD
|
||||||
netstat | Exposes network statistics from `/proc/net/netstat`. This is the same information as `netstat -s`. | Linux
|
netstat | Exposes network statistics from `/proc/net/netstat`. This is the same information as `netstat -s`. | Linux
|
||||||
sockstat | Exposes various statistics from `/proc/net/sockstat`. | Linux
|
sockstat | Exposes various statistics from `/proc/net/sockstat`. | Linux
|
||||||
stat | Exposes various statistics from `/proc/stat`. This includes CPU usage, boot time, forks and interrupts. | Linux
|
stat | Exposes various statistics from `/proc/stat`. This includes boot time, forks and interrupts. | Linux
|
||||||
textfile | Exposes statistics read from local disk. The `--collector.textfile.directory` flag must be set. | _any_
|
textfile | Exposes statistics read from local disk. The `--collector.textfile.directory` flag must be set. | _any_
|
||||||
time | Exposes the current system time. | _any_
|
time | Exposes the current system time. | _any_
|
||||||
uname | Exposes system information as provided by the uname system call. | Linux
|
uname | Exposes system information as provided by the uname system call. | Linux
|
||||||
|
|
|
@ -0,0 +1,157 @@
|
||||||
|
// Copyright 2015 The Prometheus Authors
|
||||||
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
// you may not use this file except in compliance with the License.
|
||||||
|
// You may obtain a copy of the License at
|
||||||
|
//
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
//
|
||||||
|
// Unless required by applicable law or agreed to in writing, software
|
||||||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
// See the License for the specific language governing permissions and
|
||||||
|
// limitations under the License.
|
||||||
|
|
||||||
|
// +build !nocpu
|
||||||
|
|
||||||
|
package collector
|
||||||
|
|
||||||
|
import (
|
||||||
|
"fmt"
|
||||||
|
"path/filepath"
|
||||||
|
|
||||||
|
"github.com/prometheus/client_golang/prometheus"
|
||||||
|
"github.com/prometheus/procfs"
|
||||||
|
)
|
||||||
|
|
||||||
|
const (
|
||||||
|
cpuCollectorNamespace = "cpu"
|
||||||
|
)
|
||||||
|
|
||||||
|
type cpuCollector struct {
|
||||||
|
cpu *prometheus.Desc
|
||||||
|
cpuFreq *prometheus.Desc
|
||||||
|
cpuFreqMin *prometheus.Desc
|
||||||
|
cpuFreqMax *prometheus.Desc
|
||||||
|
cpuCoreThrottle *prometheus.Desc
|
||||||
|
cpuPackageThrottle *prometheus.Desc
|
||||||
|
}
|
||||||
|
|
||||||
|
func init() {
|
||||||
|
Factories["cpu"] = NewCPUCollector
|
||||||
|
}
|
||||||
|
|
||||||
|
// NewCPUCollector returns a new Collector exposing kernel/system statistics.
|
||||||
|
func NewCPUCollector() (Collector, error) {
|
||||||
|
return &cpuCollector{
|
||||||
|
cpu: prometheus.NewDesc(
|
||||||
|
prometheus.BuildFQName(Namespace, "", cpuCollectorNamespace),
|
||||||
|
"Seconds the cpus spent in each mode.",
|
||||||
|
[]string{"cpu", "mode"}, nil,
|
||||||
|
),
|
||||||
|
cpuFreq: prometheus.NewDesc(
|
||||||
|
prometheus.BuildFQName(Namespace, cpuCollectorNamespace, "frequency_hertz"),
|
||||||
|
"Current cpu thread frequency in hertz.",
|
||||||
|
[]string{"cpu"}, nil,
|
||||||
|
),
|
||||||
|
cpuFreqMin: prometheus.NewDesc(
|
||||||
|
prometheus.BuildFQName(Namespace, cpuCollectorNamespace, "frequency_min_hertz"),
|
||||||
|
"Minimum cpu thread frequency in hertz.",
|
||||||
|
[]string{"cpu"}, nil,
|
||||||
|
),
|
||||||
|
cpuFreqMax: prometheus.NewDesc(
|
||||||
|
prometheus.BuildFQName(Namespace, cpuCollectorNamespace, "frequency_max_hertz"),
|
||||||
|
"Maximum cpu thread frequency in hertz.",
|
||||||
|
[]string{"cpu"}, nil,
|
||||||
|
),
|
||||||
|
cpuCoreThrottle: prometheus.NewDesc(
|
||||||
|
prometheus.BuildFQName(Namespace, cpuCollectorNamespace, "core_throttles_total"),
|
||||||
|
"Number of times this cpu core has been throttled.",
|
||||||
|
[]string{"cpu"}, nil,
|
||||||
|
),
|
||||||
|
cpuPackageThrottle: prometheus.NewDesc(
|
||||||
|
prometheus.BuildFQName(Namespace, cpuCollectorNamespace, "package_throttles_total"),
|
||||||
|
"Number of times this cpu package has been throttled.",
|
||||||
|
[]string{"cpu"}, nil,
|
||||||
|
),
|
||||||
|
}, nil
|
||||||
|
}
|
||||||
|
|
||||||
|
// Update implements Collector and exposes cpu related metrics from /proc/stat and /sys/.../cpu/.
|
||||||
|
func (c *cpuCollector) Update(ch chan<- prometheus.Metric) error {
|
||||||
|
if err := c.updateStat(ch); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
if err := c.updateCPUfreq(ch); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
// updateCPUfreq reads /sys/bus/cpu/devices/cpu* and expose cpu frequency statistics.
|
||||||
|
func (c *cpuCollector) updateCPUfreq(ch chan<- prometheus.Metric) error {
|
||||||
|
cpus, err := filepath.Glob(sysFilePath("bus/cpu/devices/cpu[0-9]*"))
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
var value uint64
|
||||||
|
|
||||||
|
for _, cpu := range cpus {
|
||||||
|
_, cpuname := filepath.Split(cpu)
|
||||||
|
|
||||||
|
if value, err = readUintFromFile(filepath.Join(cpu, "cpufreq/scaling_cur_freq")); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpuFreq, prometheus.GaugeValue, float64(value), cpuname)
|
||||||
|
|
||||||
|
if value, err = readUintFromFile(filepath.Join(cpu, "cpufreq/scaling_min_freq")); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpuFreqMin, prometheus.GaugeValue, float64(value), cpuname)
|
||||||
|
|
||||||
|
if value, err = readUintFromFile(filepath.Join(cpu, "cpufreq/scaling_max_freq")); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpuFreqMax, prometheus.GaugeValue, float64(value), cpuname)
|
||||||
|
|
||||||
|
if value, err = readUintFromFile(filepath.Join(cpu, "thermal_throttle/core_throttle_count")); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpuCoreThrottle, prometheus.CounterValue, float64(value), cpuname)
|
||||||
|
|
||||||
|
if value, err = readUintFromFile(filepath.Join(cpu, "thermal_throttle/package_throttle_count")); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpuPackageThrottle, prometheus.CounterValue, float64(value), cpuname)
|
||||||
|
}
|
||||||
|
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
// updateStat reads /proc/stat through procfs and exports cpu related metrics.
|
||||||
|
func (c *cpuCollector) updateStat(ch chan<- prometheus.Metric) error {
|
||||||
|
fs, err := procfs.NewFS(*procPath)
|
||||||
|
if err != nil {
|
||||||
|
return fmt.Errorf("failed to open procfs: %v", err)
|
||||||
|
}
|
||||||
|
stats, err := fs.NewStat()
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
for cpuID, cpuStat := range stats.CPU {
|
||||||
|
cpuName := fmt.Sprintf("cpu%d", cpuID)
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.User, cpuName, "user")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.Nice, cpuName, "nice")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.System, cpuName, "system")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.Idle, cpuName, "idle")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.Iowait, cpuName, "iowait")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.IRQ, cpuName, "irq")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.SoftIRQ, cpuName, "softirq")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.Steal, cpuName, "steal")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.Guest, cpuName, "guest")
|
||||||
|
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, cpuStat.GuestNice, cpuName, "guest_nice")
|
||||||
|
}
|
||||||
|
|
||||||
|
return nil
|
||||||
|
}
|
|
@ -208,6 +208,26 @@ node_cpu{cpu="cpu7",mode="softirq"} 0.31
|
||||||
node_cpu{cpu="cpu7",mode="steal"} 0
|
node_cpu{cpu="cpu7",mode="steal"} 0
|
||||||
node_cpu{cpu="cpu7",mode="system"} 101.64
|
node_cpu{cpu="cpu7",mode="system"} 101.64
|
||||||
node_cpu{cpu="cpu7",mode="user"} 290.98
|
node_cpu{cpu="cpu7",mode="user"} 290.98
|
||||||
|
# HELP node_cpu_core_throttles_total Number of times this cpu core has been throttled.
|
||||||
|
# TYPE node_cpu_core_throttles_total counter
|
||||||
|
node_cpu_core_throttles_total{cpu="cpu0"} 5
|
||||||
|
node_cpu_core_throttles_total{cpu="cpu1"} 0
|
||||||
|
# HELP node_cpu_frequency_hertz Current cpu thread frequency in hertz.
|
||||||
|
# TYPE node_cpu_frequency_hertz gauge
|
||||||
|
node_cpu_frequency_hertz{cpu="cpu0"} 1.699981e+06
|
||||||
|
node_cpu_frequency_hertz{cpu="cpu1"} 1.699981e+06
|
||||||
|
# HELP node_cpu_frequency_max_hertz Maximum cpu thread frequency in hertz.
|
||||||
|
# TYPE node_cpu_frequency_max_hertz gauge
|
||||||
|
node_cpu_frequency_max_hertz{cpu="cpu0"} 3.7e+06
|
||||||
|
node_cpu_frequency_max_hertz{cpu="cpu1"} 3.7e+06
|
||||||
|
# HELP node_cpu_frequency_min_hertz Minimum cpu thread frequency in hertz.
|
||||||
|
# TYPE node_cpu_frequency_min_hertz gauge
|
||||||
|
node_cpu_frequency_min_hertz{cpu="cpu0"} 800000
|
||||||
|
node_cpu_frequency_min_hertz{cpu="cpu1"} 800000
|
||||||
|
# HELP node_cpu_package_throttles_total Number of times this cpu package has been throttled.
|
||||||
|
# TYPE node_cpu_package_throttles_total counter
|
||||||
|
node_cpu_package_throttles_total{cpu="cpu0"} 30
|
||||||
|
node_cpu_package_throttles_total{cpu="cpu1"} 30
|
||||||
# HELP node_disk_bytes_read The total number of bytes read successfully.
|
# HELP node_disk_bytes_read The total number of bytes read successfully.
|
||||||
# TYPE node_disk_bytes_read counter
|
# TYPE node_disk_bytes_read counter
|
||||||
node_disk_bytes_read{device="dm-0"} 5.13708655616e+11
|
node_disk_bytes_read{device="dm-0"} 5.13708655616e+11
|
||||||
|
@ -2142,6 +2162,7 @@ node_scrape_collector_success{collector="arp"} 1
|
||||||
node_scrape_collector_success{collector="bonding"} 1
|
node_scrape_collector_success{collector="bonding"} 1
|
||||||
node_scrape_collector_success{collector="buddyinfo"} 1
|
node_scrape_collector_success{collector="buddyinfo"} 1
|
||||||
node_scrape_collector_success{collector="conntrack"} 1
|
node_scrape_collector_success{collector="conntrack"} 1
|
||||||
|
node_scrape_collector_success{collector="cpu"} 1
|
||||||
node_scrape_collector_success{collector="diskstats"} 1
|
node_scrape_collector_success{collector="diskstats"} 1
|
||||||
node_scrape_collector_success{collector="drbd"} 1
|
node_scrape_collector_success{collector="drbd"} 1
|
||||||
node_scrape_collector_success{collector="edac"} 1
|
node_scrape_collector_success{collector="edac"} 1
|
||||||
|
|
|
@ -0,0 +1 @@
|
||||||
|
1699981
|
|
@ -0,0 +1 @@
|
||||||
|
3700000
|
|
@ -0,0 +1 @@
|
||||||
|
800000
|
|
@ -0,0 +1 @@
|
||||||
|
5
|
|
@ -0,0 +1 @@
|
||||||
|
30
|
|
@ -0,0 +1 @@
|
||||||
|
1699981
|
|
@ -0,0 +1 @@
|
||||||
|
3700000
|
|
@ -0,0 +1 @@
|
||||||
|
800000
|
|
@ -0,0 +1 @@
|
||||||
|
0
|
|
@ -0,0 +1 @@
|
||||||
|
30
|
|
@ -16,18 +16,13 @@
|
||||||
package collector
|
package collector
|
||||||
|
|
||||||
import (
|
import (
|
||||||
"bufio"
|
"fmt"
|
||||||
"os"
|
|
||||||
"strconv"
|
"github.com/prometheus/procfs"
|
||||||
"strings"
|
|
||||||
|
|
||||||
"github.com/prometheus/client_golang/prometheus"
|
"github.com/prometheus/client_golang/prometheus"
|
||||||
)
|
)
|
||||||
|
|
||||||
const (
|
|
||||||
userHz = 100
|
|
||||||
)
|
|
||||||
|
|
||||||
type statCollector struct {
|
type statCollector struct {
|
||||||
cpu *prometheus.Desc
|
cpu *prometheus.Desc
|
||||||
intr *prometheus.Desc
|
intr *prometheus.Desc
|
||||||
|
@ -83,80 +78,25 @@ func NewStatCollector() (Collector, error) {
|
||||||
}, nil
|
}, nil
|
||||||
}
|
}
|
||||||
|
|
||||||
// Expose kernel and system statistics.
|
// Update implements Collector and exposes kernel and system statistics.
|
||||||
func (c *statCollector) Update(ch chan<- prometheus.Metric) error {
|
func (c *statCollector) Update(ch chan<- prometheus.Metric) error {
|
||||||
file, err := os.Open(procFilePath("stat"))
|
fs, err := procfs.NewFS(*procPath)
|
||||||
|
if err != nil {
|
||||||
|
return fmt.Errorf("failed to open procfs: %v", err)
|
||||||
|
}
|
||||||
|
stats, err := fs.NewStat()
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
defer file.Close()
|
|
||||||
|
|
||||||
scanner := bufio.NewScanner(file)
|
ch <- prometheus.MustNewConstMetric(c.intr, prometheus.CounterValue, float64(stats.IRQTotal))
|
||||||
for scanner.Scan() {
|
ch <- prometheus.MustNewConstMetric(c.ctxt, prometheus.CounterValue, float64(stats.ContextSwitches))
|
||||||
parts := strings.Fields(scanner.Text())
|
ch <- prometheus.MustNewConstMetric(c.forks, prometheus.CounterValue, float64(stats.ProcessCreated))
|
||||||
if len(parts) == 0 {
|
|
||||||
continue
|
ch <- prometheus.MustNewConstMetric(c.btime, prometheus.GaugeValue, float64(stats.BootTime))
|
||||||
}
|
|
||||||
switch {
|
ch <- prometheus.MustNewConstMetric(c.procsRunning, prometheus.GaugeValue, float64(stats.ProcessesRunning))
|
||||||
case strings.HasPrefix(parts[0], "cpu"):
|
ch <- prometheus.MustNewConstMetric(c.procsBlocked, prometheus.GaugeValue, float64(stats.ProcessesBlocked))
|
||||||
// Export only per-cpu stats, it can be aggregated up in prometheus.
|
|
||||||
if parts[0] == "cpu" {
|
return nil
|
||||||
break
|
|
||||||
}
|
|
||||||
// Only some of these may be present, depending on kernel version.
|
|
||||||
cpuFields := []string{"user", "nice", "system", "idle", "iowait", "irq", "softirq", "steal", "guest", "guest_nice"}
|
|
||||||
// OpenVZ guests lack the "guest" CPU field, which needs to be ignored.
|
|
||||||
expectedFieldNum := len(cpuFields) + 1
|
|
||||||
if expectedFieldNum > len(parts) {
|
|
||||||
expectedFieldNum = len(parts)
|
|
||||||
}
|
|
||||||
for i, v := range parts[1:expectedFieldNum] {
|
|
||||||
value, err := strconv.ParseFloat(v, 64)
|
|
||||||
if err != nil {
|
|
||||||
return err
|
|
||||||
}
|
|
||||||
// Convert from ticks to seconds
|
|
||||||
value /= userHz
|
|
||||||
ch <- prometheus.MustNewConstMetric(c.cpu, prometheus.CounterValue, value, parts[0], cpuFields[i])
|
|
||||||
}
|
|
||||||
case parts[0] == "intr":
|
|
||||||
// Only expose the overall number, use the 'interrupts' collector for more detail.
|
|
||||||
value, err := strconv.ParseFloat(parts[1], 64)
|
|
||||||
if err != nil {
|
|
||||||
return err
|
|
||||||
}
|
|
||||||
ch <- prometheus.MustNewConstMetric(c.intr, prometheus.CounterValue, value)
|
|
||||||
case parts[0] == "ctxt":
|
|
||||||
value, err := strconv.ParseFloat(parts[1], 64)
|
|
||||||
if err != nil {
|
|
||||||
return err
|
|
||||||
}
|
|
||||||
ch <- prometheus.MustNewConstMetric(c.ctxt, prometheus.CounterValue, value)
|
|
||||||
case parts[0] == "processes":
|
|
||||||
value, err := strconv.ParseFloat(parts[1], 64)
|
|
||||||
if err != nil {
|
|
||||||
return err
|
|
||||||
}
|
|
||||||
ch <- prometheus.MustNewConstMetric(c.forks, prometheus.CounterValue, value)
|
|
||||||
case parts[0] == "btime":
|
|
||||||
value, err := strconv.ParseFloat(parts[1], 64)
|
|
||||||
if err != nil {
|
|
||||||
return err
|
|
||||||
}
|
|
||||||
ch <- prometheus.MustNewConstMetric(c.btime, prometheus.GaugeValue, value)
|
|
||||||
case parts[0] == "procs_running":
|
|
||||||
value, err := strconv.ParseFloat(parts[1], 64)
|
|
||||||
if err != nil {
|
|
||||||
return err
|
|
||||||
}
|
|
||||||
ch <- prometheus.MustNewConstMetric(c.procsRunning, prometheus.GaugeValue, value)
|
|
||||||
case parts[0] == "procs_blocked":
|
|
||||||
value, err := strconv.ParseFloat(parts[1], 64)
|
|
||||||
if err != nil {
|
|
||||||
return err
|
|
||||||
}
|
|
||||||
ch <- prometheus.MustNewConstMetric(c.procsBlocked, prometheus.GaugeValue, value)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
return scanner.Err()
|
|
||||||
}
|
}
|
||||||
|
|
|
@ -6,6 +6,7 @@ collectors=$(cat << COLLECTORS
|
||||||
arp
|
arp
|
||||||
buddyinfo
|
buddyinfo
|
||||||
conntrack
|
conntrack
|
||||||
|
cpu
|
||||||
diskstats
|
diskstats
|
||||||
drbd
|
drbd
|
||||||
edac
|
edac
|
||||||
|
|
Loading…
Reference in New Issue