mirror of https://github.com/k3s-io/k3s
366 lines
13 KiB
Go
366 lines
13 KiB
Go
|
/*
|
||
|
Copyright 2015 The Kubernetes Authors.
|
||
|
|
||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
you may not use this file except in compliance with the License.
|
||
|
You may obtain a copy of the License at
|
||
|
|
||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||
|
|
||
|
Unless required by applicable law or agreed to in writing, software
|
||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
See the License for the specific language governing permissions and
|
||
|
limitations under the License.
|
||
|
*/
|
||
|
|
||
|
package pod
|
||
|
|
||
|
import (
|
||
|
"sync"
|
||
|
|
||
|
"k8s.io/klog"
|
||
|
|
||
|
"k8s.io/api/core/v1"
|
||
|
"k8s.io/apimachinery/pkg/types"
|
||
|
"k8s.io/kubernetes/pkg/kubelet/checkpoint"
|
||
|
"k8s.io/kubernetes/pkg/kubelet/checkpointmanager"
|
||
|
"k8s.io/kubernetes/pkg/kubelet/configmap"
|
||
|
kubecontainer "k8s.io/kubernetes/pkg/kubelet/container"
|
||
|
"k8s.io/kubernetes/pkg/kubelet/secret"
|
||
|
kubetypes "k8s.io/kubernetes/pkg/kubelet/types"
|
||
|
)
|
||
|
|
||
|
// Manager stores and manages access to pods, maintaining the mappings
|
||
|
// between static pods and mirror pods.
|
||
|
//
|
||
|
// The kubelet discovers pod updates from 3 sources: file, http, and
|
||
|
// apiserver. Pods from non-apiserver sources are called static pods, and API
|
||
|
// server is not aware of the existence of static pods. In order to monitor
|
||
|
// the status of such pods, the kubelet creates a mirror pod for each static
|
||
|
// pod via the API server.
|
||
|
//
|
||
|
// A mirror pod has the same pod full name (name and namespace) as its static
|
||
|
// counterpart (albeit different metadata such as UID, etc). By leveraging the
|
||
|
// fact that the kubelet reports the pod status using the pod full name, the
|
||
|
// status of the mirror pod always reflects the actual status of the static
|
||
|
// pod. When a static pod gets deleted, the associated orphaned mirror pod
|
||
|
// will also be removed.
|
||
|
type Manager interface {
|
||
|
// GetPods returns the regular pods bound to the kubelet and their spec.
|
||
|
GetPods() []*v1.Pod
|
||
|
// GetPodByFullName returns the (non-mirror) pod that matches full name, as well as
|
||
|
// whether the pod was found.
|
||
|
GetPodByFullName(podFullName string) (*v1.Pod, bool)
|
||
|
// GetPodByName provides the (non-mirror) pod that matches namespace and
|
||
|
// name, as well as whether the pod was found.
|
||
|
GetPodByName(namespace, name string) (*v1.Pod, bool)
|
||
|
// GetPodByUID provides the (non-mirror) pod that matches pod UID, as well as
|
||
|
// whether the pod is found.
|
||
|
GetPodByUID(types.UID) (*v1.Pod, bool)
|
||
|
// GetPodByMirrorPod returns the static pod for the given mirror pod and
|
||
|
// whether it was known to the pod manger.
|
||
|
GetPodByMirrorPod(*v1.Pod) (*v1.Pod, bool)
|
||
|
// GetMirrorPodByPod returns the mirror pod for the given static pod and
|
||
|
// whether it was known to the pod manager.
|
||
|
GetMirrorPodByPod(*v1.Pod) (*v1.Pod, bool)
|
||
|
// GetPodsAndMirrorPods returns the both regular and mirror pods.
|
||
|
GetPodsAndMirrorPods() ([]*v1.Pod, []*v1.Pod)
|
||
|
// SetPods replaces the internal pods with the new pods.
|
||
|
// It is currently only used for testing.
|
||
|
SetPods(pods []*v1.Pod)
|
||
|
// AddPod adds the given pod to the manager.
|
||
|
AddPod(pod *v1.Pod)
|
||
|
// UpdatePod updates the given pod in the manager.
|
||
|
UpdatePod(pod *v1.Pod)
|
||
|
// DeletePod deletes the given pod from the manager. For mirror pods,
|
||
|
// this means deleting the mappings related to mirror pods. For non-
|
||
|
// mirror pods, this means deleting from indexes for all non-mirror pods.
|
||
|
DeletePod(pod *v1.Pod)
|
||
|
// DeleteOrphanedMirrorPods deletes all mirror pods which do not have
|
||
|
// associated static pods. This method sends deletion requests to the API
|
||
|
// server, but does NOT modify the internal pod storage in basicManager.
|
||
|
DeleteOrphanedMirrorPods()
|
||
|
// TranslatePodUID returns the actual UID of a pod. If the UID belongs to
|
||
|
// a mirror pod, returns the UID of its static pod. Otherwise, returns the
|
||
|
// original UID.
|
||
|
//
|
||
|
// All public-facing functions should perform this translation for UIDs
|
||
|
// because user may provide a mirror pod UID, which is not recognized by
|
||
|
// internal Kubelet functions.
|
||
|
TranslatePodUID(uid types.UID) kubetypes.ResolvedPodUID
|
||
|
// GetUIDTranslations returns the mappings of static pod UIDs to mirror pod
|
||
|
// UIDs and mirror pod UIDs to static pod UIDs.
|
||
|
GetUIDTranslations() (podToMirror map[kubetypes.ResolvedPodUID]kubetypes.MirrorPodUID, mirrorToPod map[kubetypes.MirrorPodUID]kubetypes.ResolvedPodUID)
|
||
|
// IsMirrorPodOf returns true if mirrorPod is a correct representation of
|
||
|
// pod; false otherwise.
|
||
|
IsMirrorPodOf(mirrorPod, pod *v1.Pod) bool
|
||
|
|
||
|
MirrorClient
|
||
|
}
|
||
|
|
||
|
// basicManager is a functional Manager.
|
||
|
//
|
||
|
// All fields in basicManager are read-only and are updated calling SetPods,
|
||
|
// AddPod, UpdatePod, or DeletePod.
|
||
|
type basicManager struct {
|
||
|
// Protects all internal maps.
|
||
|
lock sync.RWMutex
|
||
|
|
||
|
// Regular pods indexed by UID.
|
||
|
podByUID map[kubetypes.ResolvedPodUID]*v1.Pod
|
||
|
// Mirror pods indexed by UID.
|
||
|
mirrorPodByUID map[kubetypes.MirrorPodUID]*v1.Pod
|
||
|
|
||
|
// Pods indexed by full name for easy access.
|
||
|
podByFullName map[string]*v1.Pod
|
||
|
mirrorPodByFullName map[string]*v1.Pod
|
||
|
|
||
|
// Mirror pod UID to pod UID map.
|
||
|
translationByUID map[kubetypes.MirrorPodUID]kubetypes.ResolvedPodUID
|
||
|
|
||
|
// basicManager is keeping secretManager and configMapManager up-to-date.
|
||
|
secretManager secret.Manager
|
||
|
configMapManager configmap.Manager
|
||
|
checkpointManager checkpointmanager.CheckpointManager
|
||
|
|
||
|
// A mirror pod client to create/delete mirror pods.
|
||
|
MirrorClient
|
||
|
}
|
||
|
|
||
|
// NewBasicPodManager returns a functional Manager.
|
||
|
func NewBasicPodManager(client MirrorClient, secretManager secret.Manager, configMapManager configmap.Manager, cpm checkpointmanager.CheckpointManager) Manager {
|
||
|
pm := &basicManager{}
|
||
|
pm.secretManager = secretManager
|
||
|
pm.configMapManager = configMapManager
|
||
|
pm.checkpointManager = cpm
|
||
|
pm.MirrorClient = client
|
||
|
pm.SetPods(nil)
|
||
|
return pm
|
||
|
}
|
||
|
|
||
|
// Set the internal pods based on the new pods.
|
||
|
func (pm *basicManager) SetPods(newPods []*v1.Pod) {
|
||
|
pm.lock.Lock()
|
||
|
defer pm.lock.Unlock()
|
||
|
|
||
|
pm.podByUID = make(map[kubetypes.ResolvedPodUID]*v1.Pod)
|
||
|
pm.podByFullName = make(map[string]*v1.Pod)
|
||
|
pm.mirrorPodByUID = make(map[kubetypes.MirrorPodUID]*v1.Pod)
|
||
|
pm.mirrorPodByFullName = make(map[string]*v1.Pod)
|
||
|
pm.translationByUID = make(map[kubetypes.MirrorPodUID]kubetypes.ResolvedPodUID)
|
||
|
|
||
|
pm.updatePodsInternal(newPods...)
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) AddPod(pod *v1.Pod) {
|
||
|
pm.UpdatePod(pod)
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) UpdatePod(pod *v1.Pod) {
|
||
|
pm.lock.Lock()
|
||
|
defer pm.lock.Unlock()
|
||
|
pm.updatePodsInternal(pod)
|
||
|
if pm.checkpointManager != nil {
|
||
|
if err := checkpoint.WritePod(pm.checkpointManager, pod); err != nil {
|
||
|
klog.Errorf("Error writing checkpoint for pod: %v", pod.GetName())
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// updatePodsInternal replaces the given pods in the current state of the
|
||
|
// manager, updating the various indices. The caller is assumed to hold the
|
||
|
// lock.
|
||
|
func (pm *basicManager) updatePodsInternal(pods ...*v1.Pod) {
|
||
|
for _, pod := range pods {
|
||
|
if pm.secretManager != nil {
|
||
|
// TODO: Consider detecting only status update and in such case do
|
||
|
// not register pod, as it doesn't really matter.
|
||
|
pm.secretManager.RegisterPod(pod)
|
||
|
}
|
||
|
if pm.configMapManager != nil {
|
||
|
// TODO: Consider detecting only status update and in such case do
|
||
|
// not register pod, as it doesn't really matter.
|
||
|
pm.configMapManager.RegisterPod(pod)
|
||
|
}
|
||
|
podFullName := kubecontainer.GetPodFullName(pod)
|
||
|
// This logic relies on a static pod and its mirror to have the same name.
|
||
|
// It is safe to type convert here due to the IsMirrorPod guard.
|
||
|
if IsMirrorPod(pod) {
|
||
|
mirrorPodUID := kubetypes.MirrorPodUID(pod.UID)
|
||
|
pm.mirrorPodByUID[mirrorPodUID] = pod
|
||
|
pm.mirrorPodByFullName[podFullName] = pod
|
||
|
if p, ok := pm.podByFullName[podFullName]; ok {
|
||
|
pm.translationByUID[mirrorPodUID] = kubetypes.ResolvedPodUID(p.UID)
|
||
|
}
|
||
|
} else {
|
||
|
resolvedPodUID := kubetypes.ResolvedPodUID(pod.UID)
|
||
|
pm.podByUID[resolvedPodUID] = pod
|
||
|
pm.podByFullName[podFullName] = pod
|
||
|
if mirror, ok := pm.mirrorPodByFullName[podFullName]; ok {
|
||
|
pm.translationByUID[kubetypes.MirrorPodUID(mirror.UID)] = resolvedPodUID
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) DeletePod(pod *v1.Pod) {
|
||
|
pm.lock.Lock()
|
||
|
defer pm.lock.Unlock()
|
||
|
if pm.secretManager != nil {
|
||
|
pm.secretManager.UnregisterPod(pod)
|
||
|
}
|
||
|
if pm.configMapManager != nil {
|
||
|
pm.configMapManager.UnregisterPod(pod)
|
||
|
}
|
||
|
podFullName := kubecontainer.GetPodFullName(pod)
|
||
|
// It is safe to type convert here due to the IsMirrorPod guard.
|
||
|
if IsMirrorPod(pod) {
|
||
|
mirrorPodUID := kubetypes.MirrorPodUID(pod.UID)
|
||
|
delete(pm.mirrorPodByUID, mirrorPodUID)
|
||
|
delete(pm.mirrorPodByFullName, podFullName)
|
||
|
delete(pm.translationByUID, mirrorPodUID)
|
||
|
} else {
|
||
|
delete(pm.podByUID, kubetypes.ResolvedPodUID(pod.UID))
|
||
|
delete(pm.podByFullName, podFullName)
|
||
|
}
|
||
|
if pm.checkpointManager != nil {
|
||
|
if err := checkpoint.DeletePod(pm.checkpointManager, pod); err != nil {
|
||
|
klog.Errorf("Error deleting checkpoint for pod: %v", pod.GetName())
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) GetPods() []*v1.Pod {
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
return podsMapToPods(pm.podByUID)
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) GetPodsAndMirrorPods() ([]*v1.Pod, []*v1.Pod) {
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
pods := podsMapToPods(pm.podByUID)
|
||
|
mirrorPods := mirrorPodsMapToMirrorPods(pm.mirrorPodByUID)
|
||
|
return pods, mirrorPods
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) GetPodByUID(uid types.UID) (*v1.Pod, bool) {
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
pod, ok := pm.podByUID[kubetypes.ResolvedPodUID(uid)] // Safe conversion, map only holds non-mirrors.
|
||
|
return pod, ok
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) GetPodByName(namespace, name string) (*v1.Pod, bool) {
|
||
|
podFullName := kubecontainer.BuildPodFullName(name, namespace)
|
||
|
return pm.GetPodByFullName(podFullName)
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) GetPodByFullName(podFullName string) (*v1.Pod, bool) {
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
pod, ok := pm.podByFullName[podFullName]
|
||
|
return pod, ok
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) TranslatePodUID(uid types.UID) kubetypes.ResolvedPodUID {
|
||
|
// It is safe to type convert to a resolved UID because type conversion is idempotent.
|
||
|
if uid == "" {
|
||
|
return kubetypes.ResolvedPodUID(uid)
|
||
|
}
|
||
|
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
if translated, ok := pm.translationByUID[kubetypes.MirrorPodUID(uid)]; ok {
|
||
|
return translated
|
||
|
}
|
||
|
return kubetypes.ResolvedPodUID(uid)
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) GetUIDTranslations() (podToMirror map[kubetypes.ResolvedPodUID]kubetypes.MirrorPodUID,
|
||
|
mirrorToPod map[kubetypes.MirrorPodUID]kubetypes.ResolvedPodUID) {
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
|
||
|
podToMirror = make(map[kubetypes.ResolvedPodUID]kubetypes.MirrorPodUID, len(pm.translationByUID))
|
||
|
mirrorToPod = make(map[kubetypes.MirrorPodUID]kubetypes.ResolvedPodUID, len(pm.translationByUID))
|
||
|
// Insert empty translation mapping for all static pods.
|
||
|
for uid, pod := range pm.podByUID {
|
||
|
if !IsStaticPod(pod) {
|
||
|
continue
|
||
|
}
|
||
|
podToMirror[uid] = ""
|
||
|
}
|
||
|
// Fill in translations. Notice that if there is no mirror pod for a
|
||
|
// static pod, its uid will be translated into empty string "". This
|
||
|
// is WAI, from the caller side we can know that the static pod doesn't
|
||
|
// have a corresponding mirror pod instead of using static pod uid directly.
|
||
|
for k, v := range pm.translationByUID {
|
||
|
mirrorToPod[k] = v
|
||
|
podToMirror[v] = k
|
||
|
}
|
||
|
return podToMirror, mirrorToPod
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) getOrphanedMirrorPodNames() []string {
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
var podFullNames []string
|
||
|
for podFullName := range pm.mirrorPodByFullName {
|
||
|
if _, ok := pm.podByFullName[podFullName]; !ok {
|
||
|
podFullNames = append(podFullNames, podFullName)
|
||
|
}
|
||
|
}
|
||
|
return podFullNames
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) DeleteOrphanedMirrorPods() {
|
||
|
podFullNames := pm.getOrphanedMirrorPodNames()
|
||
|
for _, podFullName := range podFullNames {
|
||
|
pm.MirrorClient.DeleteMirrorPod(podFullName)
|
||
|
}
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) IsMirrorPodOf(mirrorPod, pod *v1.Pod) bool {
|
||
|
// Check name and namespace first.
|
||
|
if pod.Name != mirrorPod.Name || pod.Namespace != mirrorPod.Namespace {
|
||
|
return false
|
||
|
}
|
||
|
hash, ok := getHashFromMirrorPod(mirrorPod)
|
||
|
if !ok {
|
||
|
return false
|
||
|
}
|
||
|
return hash == getPodHash(pod)
|
||
|
}
|
||
|
|
||
|
func podsMapToPods(UIDMap map[kubetypes.ResolvedPodUID]*v1.Pod) []*v1.Pod {
|
||
|
pods := make([]*v1.Pod, 0, len(UIDMap))
|
||
|
for _, pod := range UIDMap {
|
||
|
pods = append(pods, pod)
|
||
|
}
|
||
|
return pods
|
||
|
}
|
||
|
|
||
|
func mirrorPodsMapToMirrorPods(UIDMap map[kubetypes.MirrorPodUID]*v1.Pod) []*v1.Pod {
|
||
|
pods := make([]*v1.Pod, 0, len(UIDMap))
|
||
|
for _, pod := range UIDMap {
|
||
|
pods = append(pods, pod)
|
||
|
}
|
||
|
return pods
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) GetMirrorPodByPod(pod *v1.Pod) (*v1.Pod, bool) {
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
mirrorPod, ok := pm.mirrorPodByFullName[kubecontainer.GetPodFullName(pod)]
|
||
|
return mirrorPod, ok
|
||
|
}
|
||
|
|
||
|
func (pm *basicManager) GetPodByMirrorPod(mirrorPod *v1.Pod) (*v1.Pod, bool) {
|
||
|
pm.lock.RLock()
|
||
|
defer pm.lock.RUnlock()
|
||
|
pod, ok := pm.podByFullName[kubecontainer.GetPodFullName(mirrorPod)]
|
||
|
return pod, ok
|
||
|
}
|