mirror of https://github.com/k3s-io/k3s
218 lines
7.8 KiB
Go
218 lines
7.8 KiB
Go
/*
|
|
Copyright 2016 The Kubernetes Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package prometheus
|
|
|
|
import (
|
|
"k8s.io/client-go/util/workqueue"
|
|
"k8s.io/klog"
|
|
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
)
|
|
|
|
// Package prometheus sets the workqueue DefaultMetricsFactory to produce
|
|
// prometheus metrics. To use this package, you just have to import it.
|
|
|
|
// Metrics subsystem and keys used by the workqueue.
|
|
const (
|
|
WorkQueueSubsystem = "workqueue"
|
|
DepthKey = "depth"
|
|
AddsKey = "adds_total"
|
|
QueueLatencyKey = "queue_latency_seconds"
|
|
WorkDurationKey = "work_duration_seconds"
|
|
UnfinishedWorkKey = "unfinished_work_seconds"
|
|
LongestRunningProcessorKey = "longest_running_processor_seconds"
|
|
RetriesKey = "retries_total"
|
|
)
|
|
|
|
func init() {
|
|
workqueue.SetProvider(prometheusMetricsProvider{})
|
|
}
|
|
|
|
type prometheusMetricsProvider struct{}
|
|
|
|
func (prometheusMetricsProvider) NewDepthMetric(name string) workqueue.GaugeMetric {
|
|
depth := prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Subsystem: WorkQueueSubsystem,
|
|
Name: DepthKey,
|
|
Help: "Current depth of workqueue",
|
|
ConstLabels: prometheus.Labels{"name": name},
|
|
})
|
|
prometheus.Register(depth)
|
|
return depth
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewAddsMetric(name string) workqueue.CounterMetric {
|
|
adds := prometheus.NewCounter(prometheus.CounterOpts{
|
|
Subsystem: WorkQueueSubsystem,
|
|
Name: AddsKey,
|
|
Help: "Total number of adds handled by workqueue",
|
|
ConstLabels: prometheus.Labels{"name": name},
|
|
})
|
|
prometheus.Register(adds)
|
|
return adds
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewLatencyMetric(name string) workqueue.HistogramMetric {
|
|
latency := prometheus.NewHistogram(prometheus.HistogramOpts{
|
|
Subsystem: WorkQueueSubsystem,
|
|
Name: QueueLatencyKey,
|
|
Help: "How long in seconds an item stays in workqueue before being requested.",
|
|
ConstLabels: prometheus.Labels{"name": name},
|
|
Buckets: prometheus.ExponentialBuckets(10e-9, 10, 10),
|
|
})
|
|
prometheus.Register(latency)
|
|
return latency
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewWorkDurationMetric(name string) workqueue.HistogramMetric {
|
|
workDuration := prometheus.NewHistogram(prometheus.HistogramOpts{
|
|
Subsystem: WorkQueueSubsystem,
|
|
Name: WorkDurationKey,
|
|
Help: "How long in seconds processing an item from workqueue takes.",
|
|
ConstLabels: prometheus.Labels{"name": name},
|
|
Buckets: prometheus.ExponentialBuckets(10e-9, 10, 10),
|
|
})
|
|
prometheus.Register(workDuration)
|
|
return workDuration
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewUnfinishedWorkSecondsMetric(name string) workqueue.SettableGaugeMetric {
|
|
unfinished := prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Subsystem: WorkQueueSubsystem,
|
|
Name: UnfinishedWorkKey,
|
|
Help: "How many seconds of work has done that " +
|
|
"is in progress and hasn't been observed by work_duration. Large " +
|
|
"values indicate stuck threads. One can deduce the number of stuck " +
|
|
"threads by observing the rate at which this increases.",
|
|
ConstLabels: prometheus.Labels{"name": name},
|
|
})
|
|
prometheus.Register(unfinished)
|
|
return unfinished
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewLongestRunningProcessorSecondsMetric(name string) workqueue.SettableGaugeMetric {
|
|
unfinished := prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Subsystem: WorkQueueSubsystem,
|
|
Name: LongestRunningProcessorKey,
|
|
Help: "How many seconds has the longest running " +
|
|
"processor for workqueue been running.",
|
|
ConstLabels: prometheus.Labels{"name": name},
|
|
})
|
|
prometheus.Register(unfinished)
|
|
return unfinished
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewRetriesMetric(name string) workqueue.CounterMetric {
|
|
retries := prometheus.NewCounter(prometheus.CounterOpts{
|
|
Subsystem: WorkQueueSubsystem,
|
|
Name: RetriesKey,
|
|
Help: "Total number of retries handled by workqueue",
|
|
ConstLabels: prometheus.Labels{"name": name},
|
|
})
|
|
prometheus.Register(retries)
|
|
return retries
|
|
}
|
|
|
|
// TODO(danielqsj): Remove the following metrics, they are deprecated
|
|
func (prometheusMetricsProvider) NewDeprecatedDepthMetric(name string) workqueue.GaugeMetric {
|
|
depth := prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Subsystem: name,
|
|
Name: "depth",
|
|
Help: "(Deprecated) Current depth of workqueue: " + name,
|
|
})
|
|
if err := prometheus.Register(depth); err != nil {
|
|
klog.Errorf("failed to register depth metric %v: %v", name, err)
|
|
}
|
|
return depth
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewDeprecatedAddsMetric(name string) workqueue.CounterMetric {
|
|
adds := prometheus.NewCounter(prometheus.CounterOpts{
|
|
Subsystem: name,
|
|
Name: "adds",
|
|
Help: "(Deprecated) Total number of adds handled by workqueue: " + name,
|
|
})
|
|
if err := prometheus.Register(adds); err != nil {
|
|
klog.Errorf("failed to register adds metric %v: %v", name, err)
|
|
}
|
|
return adds
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewDeprecatedLatencyMetric(name string) workqueue.SummaryMetric {
|
|
latency := prometheus.NewSummary(prometheus.SummaryOpts{
|
|
Subsystem: name,
|
|
Name: "queue_latency",
|
|
Help: "(Deprecated) How long an item stays in workqueue" + name + " before being requested.",
|
|
})
|
|
if err := prometheus.Register(latency); err != nil {
|
|
klog.Errorf("failed to register latency metric %v: %v", name, err)
|
|
}
|
|
return latency
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewDeprecatedWorkDurationMetric(name string) workqueue.SummaryMetric {
|
|
workDuration := prometheus.NewSummary(prometheus.SummaryOpts{
|
|
Subsystem: name,
|
|
Name: "work_duration",
|
|
Help: "(Deprecated) How long processing an item from workqueue" + name + " takes.",
|
|
})
|
|
if err := prometheus.Register(workDuration); err != nil {
|
|
klog.Errorf("failed to register work_duration metric %v: %v", name, err)
|
|
}
|
|
return workDuration
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewDeprecatedUnfinishedWorkSecondsMetric(name string) workqueue.SettableGaugeMetric {
|
|
unfinished := prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Subsystem: name,
|
|
Name: "unfinished_work_seconds",
|
|
Help: "(Deprecated) How many seconds of work " + name + " has done that " +
|
|
"is in progress and hasn't been observed by work_duration. Large " +
|
|
"values indicate stuck threads. One can deduce the number of stuck " +
|
|
"threads by observing the rate at which this increases.",
|
|
})
|
|
if err := prometheus.Register(unfinished); err != nil {
|
|
klog.Errorf("failed to register unfinished_work_seconds metric %v: %v", name, err)
|
|
}
|
|
return unfinished
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewDeprecatedLongestRunningProcessorMicrosecondsMetric(name string) workqueue.SettableGaugeMetric {
|
|
unfinished := prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Subsystem: name,
|
|
Name: "longest_running_processor_microseconds",
|
|
Help: "(Deprecated) How many microseconds has the longest running " +
|
|
"processor for " + name + " been running.",
|
|
})
|
|
if err := prometheus.Register(unfinished); err != nil {
|
|
klog.Errorf("failed to register longest_running_processor_microseconds metric %v: %v", name, err)
|
|
}
|
|
return unfinished
|
|
}
|
|
|
|
func (prometheusMetricsProvider) NewDeprecatedRetriesMetric(name string) workqueue.CounterMetric {
|
|
retries := prometheus.NewCounter(prometheus.CounterOpts{
|
|
Subsystem: name,
|
|
Name: "retries",
|
|
Help: "(Deprecated) Total number of retries handled by workqueue: " + name,
|
|
})
|
|
if err := prometheus.Register(retries); err != nil {
|
|
klog.Errorf("failed to register retries metric %v: %v", name, err)
|
|
}
|
|
return retries
|
|
}
|