mirror of https://github.com/prometheus/prometheus
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
345 lines
9.8 KiB
345 lines
9.8 KiB
// Copyright 2016 The Prometheus Authors |
|
// Licensed under the Apache License, Version 2.0 (the "License"); |
|
// you may not use this file except in compliance with the License. |
|
// You may obtain a copy of the License at |
|
// |
|
// http://www.apache.org/licenses/LICENSE-2.0 |
|
// |
|
// Unless required by applicable law or agreed to in writing, software |
|
// distributed under the License is distributed on an "AS IS" BASIS, |
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
|
// See the License for the specific language governing permissions and |
|
// limitations under the License. |
|
|
|
package kubernetes |
|
|
|
import ( |
|
"context" |
|
"errors" |
|
"fmt" |
|
"log/slog" |
|
"net" |
|
"strconv" |
|
"strings" |
|
|
|
"github.com/prometheus/client_golang/prometheus" |
|
"github.com/prometheus/common/model" |
|
"github.com/prometheus/common/promslog" |
|
apiv1 "k8s.io/api/core/v1" |
|
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" |
|
"k8s.io/client-go/tools/cache" |
|
"k8s.io/client-go/util/workqueue" |
|
|
|
"github.com/prometheus/prometheus/discovery/targetgroup" |
|
) |
|
|
|
// Names of the informer indexes referenced by the pod discovery.
const (
	// podIndex is not referenced in the visible part of this file.
	// NOTE(review): presumably the name of an index keyed by pod; confirm
	// where the indexers are registered.
	podIndex = "pod"

	// nodeIndex is the index that enqueuePodsForNode queries with a node
	// name to obtain the pods associated with that node.
	nodeIndex = "node"
)
|
|
|
// Pod discovers new pod targets. |
|
type Pod struct { |
|
podInf cache.SharedIndexInformer |
|
nodeInf cache.SharedInformer |
|
withNodeMetadata bool |
|
store cache.Store |
|
logger *slog.Logger |
|
queue *workqueue.Type |
|
} |
|
|
|
// NewPod creates a new pod discovery. |
|
func NewPod(l *slog.Logger, pods cache.SharedIndexInformer, nodes cache.SharedInformer, eventCount *prometheus.CounterVec) *Pod { |
|
if l == nil { |
|
l = promslog.NewNopLogger() |
|
} |
|
|
|
podAddCount := eventCount.WithLabelValues(RolePod.String(), MetricLabelRoleAdd) |
|
podDeleteCount := eventCount.WithLabelValues(RolePod.String(), MetricLabelRoleDelete) |
|
podUpdateCount := eventCount.WithLabelValues(RolePod.String(), MetricLabelRoleUpdate) |
|
|
|
p := &Pod{ |
|
podInf: pods, |
|
nodeInf: nodes, |
|
withNodeMetadata: nodes != nil, |
|
store: pods.GetStore(), |
|
logger: l, |
|
queue: workqueue.NewNamed(RolePod.String()), |
|
} |
|
_, err := p.podInf.AddEventHandler(cache.ResourceEventHandlerFuncs{ |
|
AddFunc: func(o interface{}) { |
|
podAddCount.Inc() |
|
p.enqueue(o) |
|
}, |
|
DeleteFunc: func(o interface{}) { |
|
podDeleteCount.Inc() |
|
p.enqueue(o) |
|
}, |
|
UpdateFunc: func(_, o interface{}) { |
|
podUpdateCount.Inc() |
|
p.enqueue(o) |
|
}, |
|
}) |
|
if err != nil { |
|
l.Error("Error adding pods event handler.", "err", err) |
|
} |
|
|
|
if p.withNodeMetadata { |
|
_, err = p.nodeInf.AddEventHandler(cache.ResourceEventHandlerFuncs{ |
|
AddFunc: func(o interface{}) { |
|
node := o.(*apiv1.Node) |
|
p.enqueuePodsForNode(node.Name) |
|
}, |
|
UpdateFunc: func(_, o interface{}) { |
|
node := o.(*apiv1.Node) |
|
p.enqueuePodsForNode(node.Name) |
|
}, |
|
DeleteFunc: func(o interface{}) { |
|
nodeName, err := nodeName(o) |
|
if err != nil { |
|
l.Error("Error getting Node name", "err", err) |
|
} |
|
p.enqueuePodsForNode(nodeName) |
|
}, |
|
}) |
|
if err != nil { |
|
l.Error("Error adding pods event handler.", "err", err) |
|
} |
|
} |
|
|
|
return p |
|
} |
|
|
|
func (p *Pod) enqueue(obj interface{}) { |
|
key, err := cache.DeletionHandlingMetaNamespaceKeyFunc(obj) |
|
if err != nil { |
|
return |
|
} |
|
|
|
p.queue.Add(key) |
|
} |
|
|
|
// Run implements the Discoverer interface. |
|
func (p *Pod) Run(ctx context.Context, ch chan<- []*targetgroup.Group) { |
|
defer p.queue.ShutDown() |
|
|
|
cacheSyncs := []cache.InformerSynced{p.podInf.HasSynced} |
|
if p.withNodeMetadata { |
|
cacheSyncs = append(cacheSyncs, p.nodeInf.HasSynced) |
|
} |
|
|
|
if !cache.WaitForCacheSync(ctx.Done(), cacheSyncs...) { |
|
if !errors.Is(ctx.Err(), context.Canceled) { |
|
p.logger.Error("pod informer unable to sync cache") |
|
} |
|
return |
|
} |
|
|
|
go func() { |
|
for p.process(ctx, ch) { |
|
} |
|
}() |
|
|
|
// Block until the target provider is explicitly canceled. |
|
<-ctx.Done() |
|
} |
|
|
|
func (p *Pod) process(ctx context.Context, ch chan<- []*targetgroup.Group) bool { |
|
keyObj, quit := p.queue.Get() |
|
if quit { |
|
return false |
|
} |
|
defer p.queue.Done(keyObj) |
|
key := keyObj.(string) |
|
|
|
namespace, name, err := cache.SplitMetaNamespaceKey(key) |
|
if err != nil { |
|
return true |
|
} |
|
|
|
o, exists, err := p.store.GetByKey(key) |
|
if err != nil { |
|
return true |
|
} |
|
if !exists { |
|
send(ctx, ch, &targetgroup.Group{Source: podSourceFromNamespaceAndName(namespace, name)}) |
|
return true |
|
} |
|
pod, err := convertToPod(o) |
|
if err != nil { |
|
p.logger.Error("converting to Pod object failed", "err", err) |
|
return true |
|
} |
|
send(ctx, ch, p.buildPod(pod)) |
|
return true |
|
} |
|
|
|
func convertToPod(o interface{}) (*apiv1.Pod, error) { |
|
pod, ok := o.(*apiv1.Pod) |
|
if ok { |
|
return pod, nil |
|
} |
|
|
|
return nil, fmt.Errorf("received unexpected object: %v", o) |
|
} |
|
|
|
const ( |
|
podIPLabel = metaLabelPrefix + "pod_ip" |
|
podContainerNameLabel = metaLabelPrefix + "pod_container_name" |
|
podContainerIDLabel = metaLabelPrefix + "pod_container_id" |
|
podContainerImageLabel = metaLabelPrefix + "pod_container_image" |
|
podContainerPortNameLabel = metaLabelPrefix + "pod_container_port_name" |
|
podContainerPortNumberLabel = metaLabelPrefix + "pod_container_port_number" |
|
podContainerPortProtocolLabel = metaLabelPrefix + "pod_container_port_protocol" |
|
podContainerIsInit = metaLabelPrefix + "pod_container_init" |
|
podReadyLabel = metaLabelPrefix + "pod_ready" |
|
podPhaseLabel = metaLabelPrefix + "pod_phase" |
|
podNodeNameLabel = metaLabelPrefix + "pod_node_name" |
|
podHostIPLabel = metaLabelPrefix + "pod_host_ip" |
|
podUID = metaLabelPrefix + "pod_uid" |
|
podControllerKind = metaLabelPrefix + "pod_controller_kind" |
|
podControllerName = metaLabelPrefix + "pod_controller_name" |
|
) |
|
|
|
// GetControllerOf returns a pointer to a copy of the controllerRef if controllee has a controller |
|
// https://github.com/kubernetes/apimachinery/blob/cd2cae2b39fa57e8063fa1f5f13cfe9862db3d41/pkg/apis/meta/v1/controller_ref.go |
|
func GetControllerOf(controllee metav1.Object) *metav1.OwnerReference { |
|
for _, ref := range controllee.GetOwnerReferences() { |
|
if ref.Controller != nil && *ref.Controller { |
|
return &ref |
|
} |
|
} |
|
return nil |
|
} |
|
|
|
func podLabels(pod *apiv1.Pod) model.LabelSet { |
|
ls := model.LabelSet{ |
|
podIPLabel: lv(pod.Status.PodIP), |
|
podReadyLabel: podReady(pod), |
|
podPhaseLabel: lv(string(pod.Status.Phase)), |
|
podNodeNameLabel: lv(pod.Spec.NodeName), |
|
podHostIPLabel: lv(pod.Status.HostIP), |
|
podUID: lv(string(pod.ObjectMeta.UID)), |
|
} |
|
|
|
addObjectMetaLabels(ls, pod.ObjectMeta, RolePod) |
|
|
|
createdBy := GetControllerOf(pod) |
|
if createdBy != nil { |
|
if createdBy.Kind != "" { |
|
ls[podControllerKind] = lv(createdBy.Kind) |
|
} |
|
if createdBy.Name != "" { |
|
ls[podControllerName] = lv(createdBy.Name) |
|
} |
|
} |
|
|
|
return ls |
|
} |
|
|
|
func (p *Pod) findPodContainerStatus(statuses *[]apiv1.ContainerStatus, containerName string) (*apiv1.ContainerStatus, error) { |
|
for _, s := range *statuses { |
|
if s.Name == containerName { |
|
return &s, nil |
|
} |
|
} |
|
return nil, fmt.Errorf("cannot find container with name %v", containerName) |
|
} |
|
|
|
func (p *Pod) findPodContainerID(statuses *[]apiv1.ContainerStatus, containerName string) string { |
|
cStatus, err := p.findPodContainerStatus(statuses, containerName) |
|
if err != nil { |
|
p.logger.Debug("cannot find container ID", "err", err) |
|
return "" |
|
} |
|
return cStatus.ContainerID |
|
} |
|
|
|
func (p *Pod) buildPod(pod *apiv1.Pod) *targetgroup.Group { |
|
tg := &targetgroup.Group{ |
|
Source: podSource(pod), |
|
} |
|
// PodIP can be empty when a pod is starting or has been evicted. |
|
if len(pod.Status.PodIP) == 0 { |
|
return tg |
|
} |
|
|
|
tg.Labels = podLabels(pod) |
|
tg.Labels[namespaceLabel] = lv(pod.Namespace) |
|
if p.withNodeMetadata { |
|
tg.Labels = addNodeLabels(tg.Labels, p.nodeInf, p.logger, &pod.Spec.NodeName) |
|
} |
|
|
|
containers := append(pod.Spec.Containers, pod.Spec.InitContainers...) |
|
for i, c := range containers { |
|
isInit := i >= len(pod.Spec.Containers) |
|
|
|
cStatuses := &pod.Status.ContainerStatuses |
|
if isInit { |
|
cStatuses = &pod.Status.InitContainerStatuses |
|
} |
|
cID := p.findPodContainerID(cStatuses, c.Name) |
|
|
|
// If no ports are defined for the container, create an anonymous |
|
// target per container. |
|
if len(c.Ports) == 0 { |
|
// We don't have a port so we just set the address label to the pod IP. |
|
// The user has to add a port manually. |
|
tg.Targets = append(tg.Targets, model.LabelSet{ |
|
model.AddressLabel: lv(pod.Status.PodIP), |
|
podContainerNameLabel: lv(c.Name), |
|
podContainerIDLabel: lv(cID), |
|
podContainerImageLabel: lv(c.Image), |
|
podContainerIsInit: lv(strconv.FormatBool(isInit)), |
|
}) |
|
continue |
|
} |
|
// Otherwise create one target for each container/port combination. |
|
for _, port := range c.Ports { |
|
ports := strconv.FormatUint(uint64(port.ContainerPort), 10) |
|
addr := net.JoinHostPort(pod.Status.PodIP, ports) |
|
|
|
tg.Targets = append(tg.Targets, model.LabelSet{ |
|
model.AddressLabel: lv(addr), |
|
podContainerNameLabel: lv(c.Name), |
|
podContainerIDLabel: lv(cID), |
|
podContainerImageLabel: lv(c.Image), |
|
podContainerPortNumberLabel: lv(ports), |
|
podContainerPortNameLabel: lv(port.Name), |
|
podContainerPortProtocolLabel: lv(string(port.Protocol)), |
|
podContainerIsInit: lv(strconv.FormatBool(isInit)), |
|
}) |
|
} |
|
} |
|
|
|
return tg |
|
} |
|
|
|
func (p *Pod) enqueuePodsForNode(nodeName string) { |
|
pods, err := p.podInf.GetIndexer().ByIndex(nodeIndex, nodeName) |
|
if err != nil { |
|
p.logger.Error("Error getting pods for node", "node", nodeName, "err", err) |
|
return |
|
} |
|
|
|
for _, pod := range pods { |
|
p.enqueue(pod.(*apiv1.Pod)) |
|
} |
|
} |
|
|
|
func podSource(pod *apiv1.Pod) string { |
|
return podSourceFromNamespaceAndName(pod.Namespace, pod.Name) |
|
} |
|
|
|
func podSourceFromNamespaceAndName(namespace, name string) string { |
|
return "pod/" + namespacedName(namespace, name) |
|
} |
|
|
|
func podReady(pod *apiv1.Pod) model.LabelValue { |
|
for _, cond := range pod.Status.Conditions { |
|
if cond.Type == apiv1.PodReady { |
|
return lv(strings.ToLower(string(cond.Status))) |
|
} |
|
} |
|
return lv(strings.ToLower(string(apiv1.ConditionUnknown))) |
|
}
|
|
|