2019-01-12 04:58:27 +00:00
/ *
Copyright 2018 The Kubernetes Authors .
Licensed under the Apache License , Version 2.0 ( the "License" ) ;
you may not use this file except in compliance with the License .
You may obtain a copy of the License at
http : //www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing , software
distributed under the License is distributed on an "AS IS" BASIS ,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND , either express or implied .
See the License for the specific language governing permissions and
limitations under the License .
* /
package nodestatus
import (
"fmt"
"math"
"net"
goruntime "runtime"
"strings"
"time"
cadvisorapiv1 "github.com/google/cadvisor/info/v1"
2021-03-18 22:40:29 +00:00
v1 "k8s.io/api/core/v1"
2019-01-12 04:58:27 +00:00
"k8s.io/apimachinery/pkg/api/resource"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
2019-04-07 17:07:55 +00:00
"k8s.io/apimachinery/pkg/util/errors"
2019-01-12 04:58:27 +00:00
utilnet "k8s.io/apimachinery/pkg/util/net"
utilfeature "k8s.io/apiserver/pkg/util/feature"
2019-08-30 18:33:25 +00:00
cloudprovider "k8s.io/cloud-provider"
2020-08-10 17:43:49 +00:00
cloudproviderapi "k8s.io/cloud-provider/api"
2019-12-12 01:27:03 +00:00
"k8s.io/component-base/version"
2019-01-12 04:58:27 +00:00
v1helper "k8s.io/kubernetes/pkg/apis/core/v1/helper"
"k8s.io/kubernetes/pkg/features"
"k8s.io/kubernetes/pkg/kubelet/cadvisor"
"k8s.io/kubernetes/pkg/kubelet/cm"
kubecontainer "k8s.io/kubernetes/pkg/kubelet/container"
"k8s.io/kubernetes/pkg/kubelet/events"
"k8s.io/kubernetes/pkg/volume"
2020-08-10 17:43:49 +00:00
"k8s.io/klog/v2"
2019-01-12 04:58:27 +00:00
)
const (
// MaxNamesPerImageInNodeStatus is max number of names
// per image stored in the node status.
MaxNamesPerImageInNodeStatus = 5
)
// Setter modifies the node in-place, and returns an error if the modification failed.
// Setters may partially mutate the node before returning an error.
type Setter func ( node * v1 . Node ) error
// NodeAddress returns a Setter that updates address-related information on the node.
2020-12-01 01:06:26 +00:00
func NodeAddress ( nodeIPs [ ] net . IP , // typically Kubelet.nodeIPs
2019-01-12 04:58:27 +00:00
validateNodeIPFunc func ( net . IP ) error , // typically Kubelet.nodeIPValidator
hostname string , // typically Kubelet.hostname
2019-04-07 17:07:55 +00:00
hostnameOverridden bool , // was the hostname force set?
externalCloudProvider bool , // typically Kubelet.externalCloudProvider
2019-08-30 18:33:25 +00:00
cloud cloudprovider . Interface , // typically Kubelet.cloud
2019-04-07 17:07:55 +00:00
nodeAddressesFunc func ( ) ( [ ] v1 . NodeAddress , error ) , // typically Kubelet.cloudResourceSyncManager.NodeAddresses
2019-01-12 04:58:27 +00:00
) Setter {
2020-12-01 01:06:26 +00:00
var nodeIP , secondaryNodeIP net . IP
if len ( nodeIPs ) > 0 {
nodeIP = nodeIPs [ 0 ]
}
2020-03-26 21:07:15 +00:00
preferIPv4 := nodeIP == nil || nodeIP . To4 ( ) != nil
isPreferredIPFamily := func ( ip net . IP ) bool { return ( ip . To4 ( ) != nil ) == preferIPv4 }
nodeIPSpecified := nodeIP != nil && ! nodeIP . IsUnspecified ( )
2020-12-01 01:06:26 +00:00
if len ( nodeIPs ) > 1 {
secondaryNodeIP = nodeIPs [ 1 ]
}
secondaryNodeIPSpecified := secondaryNodeIP != nil && ! secondaryNodeIP . IsUnspecified ( )
2019-01-12 04:58:27 +00:00
return func ( node * v1 . Node ) error {
2020-03-26 21:07:15 +00:00
if nodeIPSpecified {
2019-01-12 04:58:27 +00:00
if err := validateNodeIPFunc ( nodeIP ) ; err != nil {
return fmt . Errorf ( "failed to validate nodeIP: %v" , err )
}
2021-03-18 22:40:29 +00:00
klog . V ( 4 ) . InfoS ( "Using node IP" , "IP" , nodeIP . String ( ) )
2019-01-12 04:58:27 +00:00
}
2020-12-01 01:06:26 +00:00
if secondaryNodeIPSpecified {
if err := validateNodeIPFunc ( secondaryNodeIP ) ; err != nil {
return fmt . Errorf ( "failed to validate secondaryNodeIP: %v" , err )
}
2021-03-18 22:40:29 +00:00
klog . V ( 4 ) . InfoS ( "Using secondary node IP" , "IP" , secondaryNodeIP . String ( ) )
2020-12-01 01:06:26 +00:00
}
2019-01-12 04:58:27 +00:00
2019-04-07 17:07:55 +00:00
if externalCloudProvider {
2020-03-26 21:07:15 +00:00
if nodeIPSpecified {
2019-04-07 17:07:55 +00:00
if node . ObjectMeta . Annotations == nil {
node . ObjectMeta . Annotations = make ( map [ string ] string )
2019-01-12 04:58:27 +00:00
}
2020-08-10 17:43:49 +00:00
node . ObjectMeta . Annotations [ cloudproviderapi . AnnotationAlphaProvidedIPAddr ] = nodeIP . String ( )
2019-04-07 17:07:55 +00:00
}
2019-09-27 21:51:53 +00:00
// If --cloud-provider=external and node address is already set,
// then we return early because provider set addresses should take precedence.
// Otherwise, we try to look up the node IP and let the cloud provider override it later
// This should alleviate a lot of the bootstrapping issues with out-of-tree providers
if len ( node . Status . Addresses ) > 0 {
return nil
}
2019-04-07 17:07:55 +00:00
}
2019-08-30 18:33:25 +00:00
if cloud != nil {
2019-09-27 21:51:53 +00:00
cloudNodeAddresses , err := nodeAddressesFunc ( )
2019-08-30 18:33:25 +00:00
if err != nil {
return err
}
2019-09-27 21:51:53 +00:00
var nodeAddresses [ ] v1 . NodeAddress
// For every address supplied by the cloud provider that matches nodeIP, nodeIP is the enforced node address for
// that address Type (like InternalIP and ExternalIP), meaning other addresses of the same Type are discarded.
// See #61921 for more information: some cloud providers may supply secondary IPs, so nodeIP serves as a way to
// ensure that the correct IPs show up on a Node object.
2020-03-26 21:07:15 +00:00
if nodeIPSpecified {
2019-08-30 18:33:25 +00:00
enforcedNodeAddresses := [ ] v1 . NodeAddress { }
2019-04-07 17:07:55 +00:00
2019-08-30 18:33:25 +00:00
nodeIPTypes := make ( map [ v1 . NodeAddressType ] bool )
2019-09-27 21:51:53 +00:00
for _ , nodeAddress := range cloudNodeAddresses {
2019-08-30 18:33:25 +00:00
if nodeAddress . Address == nodeIP . String ( ) {
enforcedNodeAddresses = append ( enforcedNodeAddresses , v1 . NodeAddress { Type : nodeAddress . Type , Address : nodeAddress . Address } )
nodeIPTypes [ nodeAddress . Type ] = true
}
}
2019-01-12 04:58:27 +00:00
2019-09-27 21:51:53 +00:00
// nodeIP must be among the addresses supplied by the cloud provider
if len ( enforcedNodeAddresses ) == 0 {
return fmt . Errorf ( "failed to get node address from cloud provider that matches ip: %v" , nodeIP )
}
// nodeIP was found, now use all other addresses supplied by the cloud provider NOT of the same Type as nodeIP.
for _ , nodeAddress := range cloudNodeAddresses {
if ! nodeIPTypes [ nodeAddress . Type ] {
enforcedNodeAddresses = append ( enforcedNodeAddresses , v1 . NodeAddress { Type : nodeAddress . Type , Address : nodeAddress . Address } )
}
2019-08-30 18:33:25 +00:00
}
2019-09-27 21:51:53 +00:00
nodeAddresses = enforcedNodeAddresses
2020-03-26 21:07:15 +00:00
} else if nodeIP != nil {
// nodeIP is "0.0.0.0" or "::"; sort cloudNodeAddresses to
// prefer addresses of the matching family
sortedAddresses := make ( [ ] v1 . NodeAddress , 0 , len ( cloudNodeAddresses ) )
for _ , nodeAddress := range cloudNodeAddresses {
ip := net . ParseIP ( nodeAddress . Address )
if ip == nil || isPreferredIPFamily ( ip ) {
sortedAddresses = append ( sortedAddresses , nodeAddress )
}
}
for _ , nodeAddress := range cloudNodeAddresses {
ip := net . ParseIP ( nodeAddress . Address )
if ip != nil && ! isPreferredIPFamily ( ip ) {
sortedAddresses = append ( sortedAddresses , nodeAddress )
}
}
nodeAddresses = sortedAddresses
2019-09-27 21:51:53 +00:00
} else {
// If nodeIP is unset, just use the addresses provided by the cloud provider as-is
nodeAddresses = cloudNodeAddresses
2019-08-30 18:33:25 +00:00
}
switch {
2019-09-27 21:51:53 +00:00
case len ( cloudNodeAddresses ) == 0 :
2019-08-30 18:33:25 +00:00
// the cloud provider didn't specify any addresses
nodeAddresses = append ( nodeAddresses , v1 . NodeAddress { Type : v1 . NodeHostName , Address : hostname } )
2019-09-27 21:51:53 +00:00
case ! hasAddressType ( cloudNodeAddresses , v1 . NodeHostName ) && hasAddressValue ( cloudNodeAddresses , hostname ) :
2019-08-30 18:33:25 +00:00
// the cloud provider didn't specify an address of type Hostname,
// but the auto-detected hostname matched an address reported by the cloud provider,
// so we can add it and count on the value being verifiable via cloud provider metadata
nodeAddresses = append ( nodeAddresses , v1 . NodeAddress { Type : v1 . NodeHostName , Address : hostname } )
case hostnameOverridden :
// the hostname was force-set via flag/config.
// this means the hostname might not be able to be validated via cloud provider metadata,
// but was a choice by the kubelet deployer we should honor
var existingHostnameAddress * v1 . NodeAddress
for i := range nodeAddresses {
if nodeAddresses [ i ] . Type == v1 . NodeHostName {
existingHostnameAddress = & nodeAddresses [ i ]
2019-04-07 17:07:55 +00:00
break
}
2019-08-30 18:33:25 +00:00
}
if existingHostnameAddress == nil {
// no existing Hostname address found, add it
2021-03-18 22:40:29 +00:00
klog . InfoS ( "Adding overridden hostname to cloudprovider-reported addresses" , "hostname" , hostname )
2019-08-30 18:33:25 +00:00
nodeAddresses = append ( nodeAddresses , v1 . NodeAddress { Type : v1 . NodeHostName , Address : hostname } )
} else if existingHostnameAddress . Address != hostname {
// override the Hostname address reported by the cloud provider
2021-03-18 22:40:29 +00:00
klog . InfoS ( "Replacing cloudprovider-reported hostname with overridden hostname" , "cloudProviderHostname" , existingHostnameAddress . Address , "overriddenHostname" , hostname )
2019-08-30 18:33:25 +00:00
existingHostnameAddress . Address = hostname
}
}
node . Status . Addresses = nodeAddresses
2020-12-01 01:06:26 +00:00
} else if nodeIPSpecified && secondaryNodeIPSpecified {
node . Status . Addresses = [ ] v1 . NodeAddress {
{ Type : v1 . NodeInternalIP , Address : nodeIP . String ( ) } ,
{ Type : v1 . NodeInternalIP , Address : secondaryNodeIP . String ( ) } ,
{ Type : v1 . NodeHostName , Address : hostname } ,
}
2019-08-30 18:33:25 +00:00
} else {
var ipAddr net . IP
var err error
2020-03-26 21:07:15 +00:00
// 1) Use nodeIP if set (and not "0.0.0.0"/"::")
2019-08-30 18:33:25 +00:00
// 2) If the user has specified an IP to HostnameOverride, use it
2020-03-26 21:07:15 +00:00
// 3) Lookup the IP from node name by DNS
2019-08-30 18:33:25 +00:00
// 4) Try to get the IP from the network interface used as default gateway
2020-03-26 21:07:15 +00:00
//
// For steps 3 and 4, IPv4 addresses are preferred to IPv6 addresses
// unless nodeIP is "::", in which case it is reversed.
if nodeIPSpecified {
2019-08-30 18:33:25 +00:00
ipAddr = nodeIP
} else if addr := net . ParseIP ( hostname ) ; addr != nil {
ipAddr = addr
} else {
var addrs [ ] net . IP
addrs , _ = net . LookupIP ( node . Name )
for _ , addr := range addrs {
if err = validateNodeIPFunc ( addr ) ; err == nil {
2020-03-26 21:07:15 +00:00
if isPreferredIPFamily ( addr ) {
2019-08-30 18:33:25 +00:00
ipAddr = addr
break
2020-03-26 21:07:15 +00:00
} else if ipAddr == nil {
2019-08-30 18:33:25 +00:00
ipAddr = addr
}
2019-04-07 17:07:55 +00:00
}
2019-01-12 04:58:27 +00:00
}
2019-08-30 18:33:25 +00:00
if ipAddr == nil {
2020-03-26 21:07:15 +00:00
ipAddr , err = utilnet . ResolveBindAddress ( nodeIP )
2019-08-30 18:33:25 +00:00
}
2019-01-12 04:58:27 +00:00
}
if ipAddr == nil {
2019-08-30 18:33:25 +00:00
// We tried everything we could, but the IP address wasn't fetchable; error out
return fmt . Errorf ( "can't get ip address of node %s. error: %v" , node . Name , err )
}
node . Status . Addresses = [ ] v1 . NodeAddress {
{ Type : v1 . NodeInternalIP , Address : ipAddr . String ( ) } ,
{ Type : v1 . NodeHostName , Address : hostname } ,
2019-01-12 04:58:27 +00:00
}
2019-04-07 17:07:55 +00:00
}
2019-01-12 04:58:27 +00:00
return nil
}
}
2019-04-07 17:07:55 +00:00
func hasAddressType ( addresses [ ] v1 . NodeAddress , addressType v1 . NodeAddressType ) bool {
for _ , address := range addresses {
if address . Type == addressType {
return true
}
}
return false
}
func hasAddressValue ( addresses [ ] v1 . NodeAddress , addressValue string ) bool {
for _ , address := range addresses {
if address . Address == addressValue {
return true
}
}
return false
}
2019-01-12 04:58:27 +00:00
// MachineInfo returns a Setter that updates machine-related information on the node.
func MachineInfo ( nodeName string ,
maxPods int ,
podsPerCore int ,
machineInfoFunc func ( ) ( * cadvisorapiv1 . MachineInfo , error ) , // typically Kubelet.GetCachedMachineInfo
capacityFunc func ( ) v1 . ResourceList , // typically Kubelet.containerManager.GetCapacity
devicePluginResourceCapacityFunc func ( ) ( v1 . ResourceList , v1 . ResourceList , [ ] string ) , // typically Kubelet.containerManager.GetDevicePluginResourceCapacity
nodeAllocatableReservationFunc func ( ) v1 . ResourceList , // typically Kubelet.containerManager.GetNodeAllocatableReservation
recordEventFunc func ( eventType , event , message string ) , // typically Kubelet.recordEvent
) Setter {
return func ( node * v1 . Node ) error {
// Note: avoid blindly overwriting the capacity in case opaque
// resources are being advertised.
if node . Status . Capacity == nil {
node . Status . Capacity = v1 . ResourceList { }
}
var devicePluginAllocatable v1 . ResourceList
var devicePluginCapacity v1 . ResourceList
var removedDevicePlugins [ ] string
// TODO: Post NotReady if we cannot get MachineInfo from cAdvisor. This needs to start
// cAdvisor locally, e.g. for test-cmd.sh, and in integration test.
info , err := machineInfoFunc ( )
if err != nil {
// TODO(roberthbailey): This is required for test-cmd.sh to pass.
// See if the test should be updated instead.
node . Status . Capacity [ v1 . ResourceCPU ] = * resource . NewMilliQuantity ( 0 , resource . DecimalSI )
node . Status . Capacity [ v1 . ResourceMemory ] = resource . MustParse ( "0Gi" )
node . Status . Capacity [ v1 . ResourcePods ] = * resource . NewQuantity ( int64 ( maxPods ) , resource . DecimalSI )
2021-03-18 22:40:29 +00:00
klog . ErrorS ( err , "Error getting machine info" )
2019-01-12 04:58:27 +00:00
} else {
node . Status . NodeInfo . MachineID = info . MachineID
node . Status . NodeInfo . SystemUUID = info . SystemUUID
for rName , rCap := range cadvisor . CapacityFromMachineInfo ( info ) {
node . Status . Capacity [ rName ] = rCap
}
if podsPerCore > 0 {
node . Status . Capacity [ v1 . ResourcePods ] = * resource . NewQuantity (
int64 ( math . Min ( float64 ( info . NumCores * podsPerCore ) , float64 ( maxPods ) ) ) , resource . DecimalSI )
} else {
node . Status . Capacity [ v1 . ResourcePods ] = * resource . NewQuantity (
int64 ( maxPods ) , resource . DecimalSI )
}
if node . Status . NodeInfo . BootID != "" &&
node . Status . NodeInfo . BootID != info . BootID {
// TODO: This requires a transaction, either both node status is updated
// and event is recorded or neither should happen, see issue #6055.
recordEventFunc ( v1 . EventTypeWarning , events . NodeRebooted ,
fmt . Sprintf ( "Node %s has been rebooted, boot id: %s" , nodeName , info . BootID ) )
}
node . Status . NodeInfo . BootID = info . BootID
if utilfeature . DefaultFeatureGate . Enabled ( features . LocalStorageCapacityIsolation ) {
// TODO: all the node resources should use ContainerManager.GetCapacity instead of deriving the
// capacity for every node status request
initialCapacity := capacityFunc ( )
if initialCapacity != nil {
2019-04-07 17:07:55 +00:00
if v , exists := initialCapacity [ v1 . ResourceEphemeralStorage ] ; exists {
node . Status . Capacity [ v1 . ResourceEphemeralStorage ] = v
}
2019-01-12 04:58:27 +00:00
}
}
devicePluginCapacity , devicePluginAllocatable , removedDevicePlugins = devicePluginResourceCapacityFunc ( )
2020-08-10 17:43:49 +00:00
for k , v := range devicePluginCapacity {
if old , ok := node . Status . Capacity [ k ] ; ! ok || old . Value ( ) != v . Value ( ) {
2021-03-18 22:40:29 +00:00
klog . V ( 2 ) . InfoS ( "Updated capacity for device plugin" , "plugin" , k , "capacity" , v . Value ( ) )
2019-01-12 04:58:27 +00:00
}
2020-08-10 17:43:49 +00:00
node . Status . Capacity [ k ] = v
2019-01-12 04:58:27 +00:00
}
for _ , removedResource := range removedDevicePlugins {
2021-03-18 22:40:29 +00:00
klog . V ( 2 ) . InfoS ( "Set capacity for removed resource to 0 on device removal" , "device" , removedResource )
2019-01-12 04:58:27 +00:00
// Set the capacity of the removed resource to 0 instead of
// removing the resource from the node status. This is to indicate
// that the resource is managed by device plugin and had been
// registered before.
//
// This is required to differentiate the device plugin managed
// resources and the cluster-level resources, which are absent in
// node status.
node . Status . Capacity [ v1 . ResourceName ( removedResource ) ] = * resource . NewQuantity ( int64 ( 0 ) , resource . DecimalSI )
}
}
// Set Allocatable.
if node . Status . Allocatable == nil {
node . Status . Allocatable = make ( v1 . ResourceList )
}
// Remove extended resources from allocatable that are no longer
// present in capacity.
for k := range node . Status . Allocatable {
_ , found := node . Status . Capacity [ k ]
if ! found && v1helper . IsExtendedResourceName ( k ) {
delete ( node . Status . Allocatable , k )
}
}
allocatableReservation := nodeAllocatableReservationFunc ( )
for k , v := range node . Status . Capacity {
2019-09-27 21:51:53 +00:00
value := v . DeepCopy ( )
2019-01-12 04:58:27 +00:00
if res , exists := allocatableReservation [ k ] ; exists {
value . Sub ( res )
}
if value . Sign ( ) < 0 {
// Negative Allocatable resources don't make sense.
value . Set ( 0 )
}
node . Status . Allocatable [ k ] = value
}
2020-08-10 17:43:49 +00:00
for k , v := range devicePluginAllocatable {
if old , ok := node . Status . Allocatable [ k ] ; ! ok || old . Value ( ) != v . Value ( ) {
2021-03-18 22:40:29 +00:00
klog . V ( 2 ) . InfoS ( "Updated allocatable" , "device" , k , "allocatable" , v . Value ( ) )
2019-01-12 04:58:27 +00:00
}
2020-08-10 17:43:49 +00:00
node . Status . Allocatable [ k ] = v
2019-01-12 04:58:27 +00:00
}
// for every huge page reservation, we need to remove it from allocatable memory
for k , v := range node . Status . Capacity {
if v1helper . IsHugePageResourceName ( k ) {
allocatableMemory := node . Status . Allocatable [ v1 . ResourceMemory ]
2019-09-27 21:51:53 +00:00
value := v . DeepCopy ( )
2019-01-12 04:58:27 +00:00
allocatableMemory . Sub ( value )
if allocatableMemory . Sign ( ) < 0 {
// Negative Allocatable resources don't make sense.
allocatableMemory . Set ( 0 )
}
node . Status . Allocatable [ v1 . ResourceMemory ] = allocatableMemory
}
}
return nil
}
}
// VersionInfo returns a Setter that updates version-related information on the node.
func VersionInfo ( versionInfoFunc func ( ) ( * cadvisorapiv1 . VersionInfo , error ) , // typically Kubelet.cadvisor.VersionInfo
runtimeTypeFunc func ( ) string , // typically Kubelet.containerRuntime.Type
runtimeVersionFunc func ( ) ( kubecontainer . Version , error ) , // typically Kubelet.containerRuntime.Version
) Setter {
return func ( node * v1 . Node ) error {
verinfo , err := versionInfoFunc ( )
if err != nil {
return fmt . Errorf ( "error getting version info: %v" , err )
}
node . Status . NodeInfo . KernelVersion = verinfo . KernelVersion
node . Status . NodeInfo . OSImage = verinfo . ContainerOsVersion
runtimeVersion := "Unknown"
if runtimeVer , err := runtimeVersionFunc ( ) ; err == nil {
runtimeVersion = runtimeVer . String ( )
}
node . Status . NodeInfo . ContainerRuntimeVersion = fmt . Sprintf ( "%s://%s" , runtimeTypeFunc ( ) , runtimeVersion )
node . Status . NodeInfo . KubeletVersion = version . Get ( ) . String ( )
// TODO: kube-proxy might be different version from kubelet in the future
node . Status . NodeInfo . KubeProxyVersion = version . Get ( ) . String ( )
return nil
}
}
// DaemonEndpoints returns a Setter that updates the daemon endpoints on the node.
func DaemonEndpoints ( daemonEndpoints * v1 . NodeDaemonEndpoints ) Setter {
return func ( node * v1 . Node ) error {
node . Status . DaemonEndpoints = * daemonEndpoints
return nil
}
}
// Images returns a Setter that updates the images on the node.
// imageListFunc is expected to return a list of images sorted in descending order by image size.
// nodeStatusMaxImages is ignored if set to -1.
func Images ( nodeStatusMaxImages int32 ,
imageListFunc func ( ) ( [ ] kubecontainer . Image , error ) , // typically Kubelet.imageManager.GetImageList
) Setter {
return func ( node * v1 . Node ) error {
// Update image list of this node
var imagesOnNode [ ] v1 . ContainerImage
containerImages , err := imageListFunc ( )
if err != nil {
node . Status . Images = imagesOnNode
return fmt . Errorf ( "error getting image list: %v" , err )
}
// we expect imageListFunc to return a sorted list, so we just need to truncate
if int ( nodeStatusMaxImages ) > - 1 &&
int ( nodeStatusMaxImages ) < len ( containerImages ) {
containerImages = containerImages [ 0 : nodeStatusMaxImages ]
}
for _ , image := range containerImages {
2020-03-26 21:07:15 +00:00
// make a copy to avoid modifying slice members of the image items in the list
names := append ( [ ] string { } , image . RepoDigests ... )
names = append ( names , image . RepoTags ... )
2019-01-12 04:58:27 +00:00
// Report up to MaxNamesPerImageInNodeStatus names per image.
if len ( names ) > MaxNamesPerImageInNodeStatus {
names = names [ 0 : MaxNamesPerImageInNodeStatus ]
}
imagesOnNode = append ( imagesOnNode , v1 . ContainerImage {
Names : names ,
SizeBytes : image . Size ,
} )
}
node . Status . Images = imagesOnNode
return nil
}
}
// GoRuntime returns a Setter that sets GOOS and GOARCH on the node.
func GoRuntime ( ) Setter {
return func ( node * v1 . Node ) error {
node . Status . NodeInfo . OperatingSystem = goruntime . GOOS
node . Status . NodeInfo . Architecture = goruntime . GOARCH
return nil
}
}
// ReadyCondition returns a Setter that updates the v1.NodeReady condition on the node.
func ReadyCondition (
nowFunc func ( ) time . Time , // typically Kubelet.clock.Now
2019-04-07 17:07:55 +00:00
runtimeErrorsFunc func ( ) error , // typically Kubelet.runtimeState.runtimeErrors
networkErrorsFunc func ( ) error , // typically Kubelet.runtimeState.networkErrors
storageErrorsFunc func ( ) error , // typically Kubelet.runtimeState.storageErrors
2019-01-12 04:58:27 +00:00
appArmorValidateHostFunc func ( ) error , // typically Kubelet.appArmorValidator.ValidateHost, might be nil depending on whether there was an appArmorValidator
cmStatusFunc func ( ) cm . Status , // typically Kubelet.containerManager.Status
2020-12-01 01:06:26 +00:00
nodeShutdownManagerErrorsFunc func ( ) error , // typically kubelet.shutdownManager.errors.
2019-01-12 04:58:27 +00:00
recordEventFunc func ( eventType , event string ) , // typically Kubelet.recordNodeStatusEvent
) Setter {
return func ( node * v1 . Node ) error {
// NOTE(aaronlevy): NodeReady condition needs to be the last in the list of node conditions.
// This is due to an issue with version skewed kubelet and master components.
// ref: https://github.com/kubernetes/kubernetes/issues/16961
currentTime := metav1 . NewTime ( nowFunc ( ) )
newNodeReadyCondition := v1 . NodeCondition {
Type : v1 . NodeReady ,
Status : v1 . ConditionTrue ,
Reason : "KubeletReady" ,
Message : "kubelet is posting ready status" ,
LastHeartbeatTime : currentTime ,
}
2020-12-01 01:06:26 +00:00
errs := [ ] error { runtimeErrorsFunc ( ) , networkErrorsFunc ( ) , storageErrorsFunc ( ) , nodeShutdownManagerErrorsFunc ( ) }
2019-01-12 04:58:27 +00:00
requiredCapacities := [ ] v1 . ResourceName { v1 . ResourceCPU , v1 . ResourceMemory , v1 . ResourcePods }
if utilfeature . DefaultFeatureGate . Enabled ( features . LocalStorageCapacityIsolation ) {
requiredCapacities = append ( requiredCapacities , v1 . ResourceEphemeralStorage )
}
missingCapacities := [ ] string { }
for _ , resource := range requiredCapacities {
if _ , found := node . Status . Capacity [ resource ] ; ! found {
missingCapacities = append ( missingCapacities , string ( resource ) )
}
}
if len ( missingCapacities ) > 0 {
2019-09-27 21:51:53 +00:00
errs = append ( errs , fmt . Errorf ( "missing node capacity for resources: %s" , strings . Join ( missingCapacities , ", " ) ) )
2019-01-12 04:58:27 +00:00
}
2019-04-07 17:07:55 +00:00
if aggregatedErr := errors . NewAggregate ( errs ) ; aggregatedErr != nil {
2019-01-12 04:58:27 +00:00
newNodeReadyCondition = v1 . NodeCondition {
Type : v1 . NodeReady ,
Status : v1 . ConditionFalse ,
Reason : "KubeletNotReady" ,
2019-04-07 17:07:55 +00:00
Message : aggregatedErr . Error ( ) ,
2019-01-12 04:58:27 +00:00
LastHeartbeatTime : currentTime ,
}
}
// Append AppArmor status if it's enabled.
// TODO(tallclair): This is a temporary message until node feature reporting is added.
if appArmorValidateHostFunc != nil && newNodeReadyCondition . Status == v1 . ConditionTrue {
if err := appArmorValidateHostFunc ( ) ; err == nil {
newNodeReadyCondition . Message = fmt . Sprintf ( "%s. AppArmor enabled" , newNodeReadyCondition . Message )
}
}
// Record any soft requirements that were not met in the container manager.
status := cmStatusFunc ( )
if status . SoftRequirements != nil {
newNodeReadyCondition . Message = fmt . Sprintf ( "%s. WARNING: %s" , newNodeReadyCondition . Message , status . SoftRequirements . Error ( ) )
}
readyConditionUpdated := false
needToRecordEvent := false
for i := range node . Status . Conditions {
if node . Status . Conditions [ i ] . Type == v1 . NodeReady {
if node . Status . Conditions [ i ] . Status == newNodeReadyCondition . Status {
newNodeReadyCondition . LastTransitionTime = node . Status . Conditions [ i ] . LastTransitionTime
} else {
newNodeReadyCondition . LastTransitionTime = currentTime
needToRecordEvent = true
}
node . Status . Conditions [ i ] = newNodeReadyCondition
readyConditionUpdated = true
break
}
}
if ! readyConditionUpdated {
newNodeReadyCondition . LastTransitionTime = currentTime
node . Status . Conditions = append ( node . Status . Conditions , newNodeReadyCondition )
}
if needToRecordEvent {
if newNodeReadyCondition . Status == v1 . ConditionTrue {
recordEventFunc ( v1 . EventTypeNormal , events . NodeReady )
} else {
recordEventFunc ( v1 . EventTypeNormal , events . NodeNotReady )
2021-03-18 22:40:29 +00:00
klog . InfoS ( "Node became not ready" , "node" , klog . KObj ( node ) , "condition" , newNodeReadyCondition )
2019-01-12 04:58:27 +00:00
}
}
return nil
}
}
// MemoryPressureCondition returns a Setter that updates the v1.NodeMemoryPressure condition on the node.
func MemoryPressureCondition ( nowFunc func ( ) time . Time , // typically Kubelet.clock.Now
pressureFunc func ( ) bool , // typically Kubelet.evictionManager.IsUnderMemoryPressure
recordEventFunc func ( eventType , event string ) , // typically Kubelet.recordNodeStatusEvent
) Setter {
return func ( node * v1 . Node ) error {
currentTime := metav1 . NewTime ( nowFunc ( ) )
var condition * v1 . NodeCondition
// Check if NodeMemoryPressure condition already exists and if it does, just pick it up for update.
for i := range node . Status . Conditions {
if node . Status . Conditions [ i ] . Type == v1 . NodeMemoryPressure {
condition = & node . Status . Conditions [ i ]
}
}
newCondition := false
// If the NodeMemoryPressure condition doesn't exist, create one
if condition == nil {
condition = & v1 . NodeCondition {
Type : v1 . NodeMemoryPressure ,
Status : v1 . ConditionUnknown ,
}
// cannot be appended to node.Status.Conditions here because it gets
// copied to the slice. So if we append to the slice here none of the
// updates we make below are reflected in the slice.
newCondition = true
}
// Update the heartbeat time
condition . LastHeartbeatTime = currentTime
// Note: The conditions below take care of the case when a new NodeMemoryPressure condition is
// created and as well as the case when the condition already exists. When a new condition
// is created its status is set to v1.ConditionUnknown which matches either
// condition.Status != v1.ConditionTrue or
// condition.Status != v1.ConditionFalse in the conditions below depending on whether
// the kubelet is under memory pressure or not.
if pressureFunc ( ) {
if condition . Status != v1 . ConditionTrue {
condition . Status = v1 . ConditionTrue
condition . Reason = "KubeletHasInsufficientMemory"
condition . Message = "kubelet has insufficient memory available"
condition . LastTransitionTime = currentTime
recordEventFunc ( v1 . EventTypeNormal , "NodeHasInsufficientMemory" )
}
} else if condition . Status != v1 . ConditionFalse {
condition . Status = v1 . ConditionFalse
condition . Reason = "KubeletHasSufficientMemory"
condition . Message = "kubelet has sufficient memory available"
condition . LastTransitionTime = currentTime
recordEventFunc ( v1 . EventTypeNormal , "NodeHasSufficientMemory" )
}
if newCondition {
node . Status . Conditions = append ( node . Status . Conditions , * condition )
}
return nil
}
}
// PIDPressureCondition returns a Setter that updates the v1.NodePIDPressure condition on the node.
func PIDPressureCondition ( nowFunc func ( ) time . Time , // typically Kubelet.clock.Now
pressureFunc func ( ) bool , // typically Kubelet.evictionManager.IsUnderPIDPressure
recordEventFunc func ( eventType , event string ) , // typically Kubelet.recordNodeStatusEvent
) Setter {
return func ( node * v1 . Node ) error {
currentTime := metav1 . NewTime ( nowFunc ( ) )
var condition * v1 . NodeCondition
// Check if NodePIDPressure condition already exists and if it does, just pick it up for update.
for i := range node . Status . Conditions {
if node . Status . Conditions [ i ] . Type == v1 . NodePIDPressure {
condition = & node . Status . Conditions [ i ]
}
}
newCondition := false
// If the NodePIDPressure condition doesn't exist, create one
if condition == nil {
condition = & v1 . NodeCondition {
Type : v1 . NodePIDPressure ,
Status : v1 . ConditionUnknown ,
}
// cannot be appended to node.Status.Conditions here because it gets
// copied to the slice. So if we append to the slice here none of the
// updates we make below are reflected in the slice.
newCondition = true
}
// Update the heartbeat time
condition . LastHeartbeatTime = currentTime
// Note: The conditions below take care of the case when a new NodePIDPressure condition is
// created and as well as the case when the condition already exists. When a new condition
// is created its status is set to v1.ConditionUnknown which matches either
// condition.Status != v1.ConditionTrue or
// condition.Status != v1.ConditionFalse in the conditions below depending on whether
// the kubelet is under PID pressure or not.
if pressureFunc ( ) {
if condition . Status != v1 . ConditionTrue {
condition . Status = v1 . ConditionTrue
condition . Reason = "KubeletHasInsufficientPID"
condition . Message = "kubelet has insufficient PID available"
condition . LastTransitionTime = currentTime
recordEventFunc ( v1 . EventTypeNormal , "NodeHasInsufficientPID" )
}
} else if condition . Status != v1 . ConditionFalse {
condition . Status = v1 . ConditionFalse
condition . Reason = "KubeletHasSufficientPID"
condition . Message = "kubelet has sufficient PID available"
condition . LastTransitionTime = currentTime
recordEventFunc ( v1 . EventTypeNormal , "NodeHasSufficientPID" )
}
if newCondition {
node . Status . Conditions = append ( node . Status . Conditions , * condition )
}
return nil
}
}
// DiskPressureCondition returns a Setter that updates the v1.NodeDiskPressure condition on the node.
func DiskPressureCondition ( nowFunc func ( ) time . Time , // typically Kubelet.clock.Now
pressureFunc func ( ) bool , // typically Kubelet.evictionManager.IsUnderDiskPressure
recordEventFunc func ( eventType , event string ) , // typically Kubelet.recordNodeStatusEvent
) Setter {
return func ( node * v1 . Node ) error {
currentTime := metav1 . NewTime ( nowFunc ( ) )
var condition * v1 . NodeCondition
// Check if NodeDiskPressure condition already exists and if it does, just pick it up for update.
for i := range node . Status . Conditions {
if node . Status . Conditions [ i ] . Type == v1 . NodeDiskPressure {
condition = & node . Status . Conditions [ i ]
}
}
newCondition := false
// If the NodeDiskPressure condition doesn't exist, create one
if condition == nil {
condition = & v1 . NodeCondition {
Type : v1 . NodeDiskPressure ,
Status : v1 . ConditionUnknown ,
}
// cannot be appended to node.Status.Conditions here because it gets
// copied to the slice. So if we append to the slice here none of the
// updates we make below are reflected in the slice.
newCondition = true
}
// Update the heartbeat time
condition . LastHeartbeatTime = currentTime
// Note: The conditions below take care of the case when a new NodeDiskPressure condition is
// created and as well as the case when the condition already exists. When a new condition
// is created its status is set to v1.ConditionUnknown which matches either
// condition.Status != v1.ConditionTrue or
// condition.Status != v1.ConditionFalse in the conditions below depending on whether
// the kubelet is under disk pressure or not.
if pressureFunc ( ) {
if condition . Status != v1 . ConditionTrue {
condition . Status = v1 . ConditionTrue
condition . Reason = "KubeletHasDiskPressure"
condition . Message = "kubelet has disk pressure"
condition . LastTransitionTime = currentTime
recordEventFunc ( v1 . EventTypeNormal , "NodeHasDiskPressure" )
}
} else if condition . Status != v1 . ConditionFalse {
condition . Status = v1 . ConditionFalse
condition . Reason = "KubeletHasNoDiskPressure"
condition . Message = "kubelet has no disk pressure"
condition . LastTransitionTime = currentTime
recordEventFunc ( v1 . EventTypeNormal , "NodeHasNoDiskPressure" )
}
if newCondition {
node . Status . Conditions = append ( node . Status . Conditions , * condition )
}
return nil
}
}
// VolumesInUse returns a Setter that updates the volumes in use on the node.
func VolumesInUse ( syncedFunc func ( ) bool , // typically Kubelet.volumeManager.ReconcilerStatesHasBeenSynced
volumesInUseFunc func ( ) [ ] v1 . UniqueVolumeName , // typically Kubelet.volumeManager.GetVolumesInUse
) Setter {
return func ( node * v1 . Node ) error {
// Make sure to only update node status after reconciler starts syncing up states
if syncedFunc ( ) {
node . Status . VolumesInUse = volumesInUseFunc ( )
}
return nil
}
}
// VolumeLimits returns a Setter that updates the volume limits on the node.
func VolumeLimits ( volumePluginListFunc func ( ) [ ] volume . VolumePluginWithAttachLimits , // typically Kubelet.volumePluginMgr.ListVolumePluginWithLimits
) Setter {
return func ( node * v1 . Node ) error {
if node . Status . Capacity == nil {
node . Status . Capacity = v1 . ResourceList { }
}
if node . Status . Allocatable == nil {
node . Status . Allocatable = v1 . ResourceList { }
}
pluginWithLimits := volumePluginListFunc ( )
for _ , volumePlugin := range pluginWithLimits {
attachLimits , err := volumePlugin . GetVolumeLimits ( )
if err != nil {
2021-07-02 08:43:15 +00:00
klog . V ( 4 ) . InfoS ( "Skipping volume limits for volume plugin" , "plugin" , volumePlugin . GetPluginName ( ) )
2019-01-12 04:58:27 +00:00
continue
}
for limitKey , value := range attachLimits {
node . Status . Capacity [ v1 . ResourceName ( limitKey ) ] = * resource . NewQuantity ( value , resource . DecimalSI )
node . Status . Allocatable [ v1 . ResourceName ( limitKey ) ] = * resource . NewQuantity ( value , resource . DecimalSI )
}
}
return nil
}
}