2019-09-27 21:51:53 +00:00
/ *
Copyright 2019 The Kubernetes Authors .
Licensed under the Apache License , Version 2.0 ( the "License" ) ;
you may not use this file except in compliance with the License .
You may obtain a copy of the License at
http : //www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing , software
distributed under the License is distributed on an "AS IS" BASIS ,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND , either express or implied .
See the License for the specific language governing permissions and
limitations under the License .
* /
package endpointslice
import (
"fmt"
"time"
corev1 "k8s.io/api/core/v1"
2020-12-01 01:06:26 +00:00
v1 "k8s.io/api/core/v1"
2021-03-18 22:40:29 +00:00
discovery "k8s.io/api/discovery/v1"
2019-09-27 21:51:53 +00:00
apiequality "k8s.io/apimachinery/pkg/api/equality"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
"k8s.io/apimachinery/pkg/runtime/schema"
2020-02-14 00:18:16 +00:00
utilruntime "k8s.io/apimachinery/pkg/util/runtime"
2021-03-18 22:40:29 +00:00
"k8s.io/apimachinery/pkg/util/sets"
2020-12-01 01:06:26 +00:00
utilfeature "k8s.io/apiserver/pkg/util/feature"
2020-02-14 00:18:16 +00:00
"k8s.io/client-go/tools/cache"
2020-08-10 17:43:49 +00:00
"k8s.io/klog/v2"
2019-09-27 21:51:53 +00:00
podutil "k8s.io/kubernetes/pkg/api/v1/pod"
api "k8s.io/kubernetes/pkg/apis/core"
2020-12-01 01:06:26 +00:00
helper "k8s.io/kubernetes/pkg/apis/core/v1/helper"
2019-09-27 21:51:53 +00:00
"k8s.io/kubernetes/pkg/apis/discovery/validation"
2019-12-12 01:27:03 +00:00
endpointutil "k8s.io/kubernetes/pkg/controller/util/endpoint"
2020-12-01 01:06:26 +00:00
"k8s.io/kubernetes/pkg/features"
2019-12-12 01:27:03 +00:00
utilnet "k8s.io/utils/net"
2019-09-27 21:51:53 +00:00
)
2020-12-01 01:06:26 +00:00
// podToEndpoint returns an Endpoint object generated from a Pod, a Node, and a Service for a particular addressType.
func podToEndpoint ( pod * corev1 . Pod , node * corev1 . Node , service * corev1 . Service , addressType discovery . AddressType ) discovery . Endpoint {
serving := podutil . IsPodReady ( pod )
terminating := pod . DeletionTimestamp != nil
// For compatibility reasons, "ready" should never be "true" if a pod is terminatng, unless
// publishNotReadyAddresses was set.
ready := service . Spec . PublishNotReadyAddresses || ( serving && ! terminating )
2019-12-12 01:27:03 +00:00
ep := discovery . Endpoint {
2020-12-01 01:06:26 +00:00
Addresses : getEndpointAddresses ( pod . Status , service , addressType ) ,
2019-09-27 21:51:53 +00:00
Conditions : discovery . EndpointConditions {
Ready : & ready ,
} ,
TargetRef : & corev1 . ObjectReference {
Kind : "Pod" ,
Namespace : pod . ObjectMeta . Namespace ,
Name : pod . ObjectMeta . Name ,
UID : pod . ObjectMeta . UID ,
ResourceVersion : pod . ObjectMeta . ResourceVersion ,
} ,
}
2019-12-12 01:27:03 +00:00
2020-12-01 01:06:26 +00:00
if utilfeature . DefaultFeatureGate . Enabled ( features . EndpointSliceTerminatingCondition ) {
ep . Conditions . Serving = & serving
ep . Conditions . Terminating = & terminating
}
2021-03-18 22:40:29 +00:00
if pod . Spec . NodeName != "" {
2020-12-01 01:06:26 +00:00
ep . NodeName = & pod . Spec . NodeName
}
2021-03-18 22:40:29 +00:00
if node != nil && node . Labels [ corev1 . LabelTopologyZone ] != "" {
zone := node . Labels [ corev1 . LabelTopologyZone ]
ep . Zone = & zone
}
2019-12-12 01:27:03 +00:00
if endpointutil . ShouldSetHostname ( pod , service ) {
ep . Hostname = & pod . Spec . Hostname
}
return ep
2019-09-27 21:51:53 +00:00
}
// getEndpointPorts returns a list of EndpointPorts generated from a Service
// and Pod.
func getEndpointPorts ( service * corev1 . Service , pod * corev1 . Pod ) [ ] discovery . EndpointPort {
endpointPorts := [ ] discovery . EndpointPort { }
// Allow headless service not to have ports.
if len ( service . Spec . Ports ) == 0 && service . Spec . ClusterIP == api . ClusterIPNone {
return endpointPorts
}
for i := range service . Spec . Ports {
servicePort := & service . Spec . Ports [ i ]
portName := servicePort . Name
portProto := servicePort . Protocol
portNum , err := podutil . FindPort ( pod , servicePort )
if err != nil {
klog . V ( 4 ) . Infof ( "Failed to find port for service %s/%s: %v" , service . Namespace , service . Name , err )
continue
}
i32PortNum := int32 ( portNum )
endpointPorts = append ( endpointPorts , discovery . EndpointPort {
2020-03-26 21:07:15 +00:00
Name : & portName ,
Port : & i32PortNum ,
Protocol : & portProto ,
AppProtocol : servicePort . AppProtocol ,
2019-09-27 21:51:53 +00:00
} )
}
return endpointPorts
}
// getEndpointAddresses returns a list of addresses generated from a pod status.
2020-12-01 01:06:26 +00:00
func getEndpointAddresses ( podStatus corev1 . PodStatus , service * corev1 . Service , addressType discovery . AddressType ) [ ] string {
2019-12-12 01:27:03 +00:00
addresses := [ ] string { }
for _ , podIP := range podStatus . PodIPs {
isIPv6PodIP := utilnet . IsIPv6String ( podIP . IP )
2020-12-01 01:06:26 +00:00
if isIPv6PodIP && addressType == discovery . AddressTypeIPv6 {
addresses = append ( addresses , podIP . IP )
}
if ! isIPv6PodIP && addressType == discovery . AddressTypeIPv4 {
2019-12-12 01:27:03 +00:00
addresses = append ( addresses , podIP . IP )
2019-09-27 21:51:53 +00:00
}
}
2019-12-12 01:27:03 +00:00
return addresses
}
2019-09-27 21:51:53 +00:00
// newEndpointSlice returns an EndpointSlice generated from a service and
// endpointMeta.
func newEndpointSlice ( service * corev1 . Service , endpointMeta * endpointMeta ) * discovery . EndpointSlice {
gvk := schema . GroupVersionKind { Version : "v1" , Kind : "Service" }
ownerRef := metav1 . NewControllerRef ( service , gvk )
2020-12-01 01:06:26 +00:00
epSlice := & discovery . EndpointSlice {
2019-09-27 21:51:53 +00:00
ObjectMeta : metav1 . ObjectMeta {
2020-12-01 01:06:26 +00:00
Labels : map [ string ] string { } ,
2019-09-27 21:51:53 +00:00
GenerateName : getEndpointSlicePrefix ( service . Name ) ,
OwnerReferences : [ ] metav1 . OwnerReference { * ownerRef } ,
Namespace : service . Namespace ,
} ,
Ports : endpointMeta . Ports ,
AddressType : endpointMeta . AddressType ,
Endpoints : [ ] discovery . Endpoint { } ,
}
2020-12-01 01:06:26 +00:00
// add parent service labels
epSlice . Labels , _ = setEndpointSliceLabels ( epSlice , service )
return epSlice
2019-09-27 21:51:53 +00:00
}
// getEndpointSlicePrefix returns a suitable prefix for an EndpointSlice name.
func getEndpointSlicePrefix ( serviceName string ) string {
// use the dash (if the name isn't too long) to make the pod name a bit prettier
prefix := fmt . Sprintf ( "%s-" , serviceName )
if len ( validation . ValidateEndpointSliceName ( prefix , true ) ) != 0 {
prefix = serviceName
}
return prefix
}
2020-10-14 19:03:41 +00:00
// ownedBy returns true if the provided EndpointSlice is owned by the provided
// Service.
func ownedBy ( endpointSlice * discovery . EndpointSlice , svc * corev1 . Service ) bool {
for _ , o := range endpointSlice . OwnerReferences {
if o . UID == svc . UID && o . Kind == "Service" && o . APIVersion == "v1" {
return true
}
}
return false
2019-09-27 21:51:53 +00:00
}
// getSliceToFill will return the EndpointSlice that will be closest to full
// when numEndpoints are added. If no EndpointSlice can be found, a nil pointer
// will be returned.
func getSliceToFill ( endpointSlices [ ] * discovery . EndpointSlice , numEndpoints , maxEndpoints int ) ( slice * discovery . EndpointSlice ) {
closestDiff := maxEndpoints
var closestSlice * discovery . EndpointSlice
for _ , endpointSlice := range endpointSlices {
currentDiff := maxEndpoints - ( numEndpoints + len ( endpointSlice . Endpoints ) )
if currentDiff >= 0 && currentDiff < closestDiff {
closestDiff = currentDiff
closestSlice = endpointSlice
if closestDiff == 0 {
return closestSlice
}
}
}
return closestSlice
}
2020-02-14 00:18:16 +00:00
// getEndpointSliceFromDeleteAction parses an EndpointSlice from a delete action.
func getEndpointSliceFromDeleteAction ( obj interface { } ) * discovery . EndpointSlice {
if endpointSlice , ok := obj . ( * discovery . EndpointSlice ) ; ok {
// Enqueue all the services that the pod used to be a member of.
// This is the same thing we do when we add a pod.
return endpointSlice
}
// If we reached here it means the pod was deleted but its final state is unrecorded.
tombstone , ok := obj . ( cache . DeletedFinalStateUnknown )
if ! ok {
utilruntime . HandleError ( fmt . Errorf ( "Couldn't get object from tombstone %#v" , obj ) )
return nil
}
endpointSlice , ok := tombstone . Obj . ( * discovery . EndpointSlice )
if ! ok {
utilruntime . HandleError ( fmt . Errorf ( "Tombstone contained object that is not a EndpointSlice: %#v" , obj ) )
return nil
}
return endpointSlice
}
2019-09-27 21:51:53 +00:00
// addTriggerTimeAnnotation adds a triggerTime annotation to an EndpointSlice
func addTriggerTimeAnnotation ( endpointSlice * discovery . EndpointSlice , triggerTime time . Time ) {
if endpointSlice . Annotations == nil {
endpointSlice . Annotations = make ( map [ string ] string )
}
if ! triggerTime . IsZero ( ) {
endpointSlice . Annotations [ corev1 . EndpointsLastChangeTriggerTime ] = triggerTime . Format ( time . RFC3339Nano )
} else { // No new trigger time, clear the annotation.
delete ( endpointSlice . Annotations , corev1 . EndpointsLastChangeTriggerTime )
}
}
2020-02-14 00:18:16 +00:00
// serviceControllerKey returns a controller key for a Service but derived from
// an EndpointSlice.
func serviceControllerKey ( endpointSlice * discovery . EndpointSlice ) ( string , error ) {
if endpointSlice == nil {
return "" , fmt . Errorf ( "nil EndpointSlice passed to serviceControllerKey()" )
}
serviceName , ok := endpointSlice . Labels [ discovery . LabelServiceName ]
if ! ok || serviceName == "" {
return "" , fmt . Errorf ( "EndpointSlice missing %s label" , discovery . LabelServiceName )
}
return fmt . Sprintf ( "%s/%s" , endpointSlice . Namespace , serviceName ) , nil
}
2020-12-01 01:06:26 +00:00
// setEndpointSliceLabels returns a map with the new endpoint slices labels and true if there was an update.
// Slices labels must be equivalent to the Service labels except for the reserved IsHeadlessService, LabelServiceName and LabelManagedBy labels
// Changes to IsHeadlessService, LabelServiceName and LabelManagedBy labels on the Service do not result in updates to EndpointSlice labels.
func setEndpointSliceLabels ( epSlice * discovery . EndpointSlice , service * corev1 . Service ) ( map [ string ] string , bool ) {
updated := false
epLabels := make ( map [ string ] string )
svcLabels := make ( map [ string ] string )
// check if the endpoint slice and the service have the same labels
// clone current slice labels except the reserved labels
for key , value := range epSlice . Labels {
if IsReservedLabelKey ( key ) {
continue
}
// copy endpoint slice labels
epLabels [ key ] = value
}
for key , value := range service . Labels {
if IsReservedLabelKey ( key ) {
klog . Warningf ( "Service %s/%s using reserved endpoint slices label, skipping label %s: %s" , service . Namespace , service . Name , key , value )
continue
}
// copy service labels
svcLabels [ key ] = value
}
// if the labels are not identical update the slice with the corresponding service labels
if ! apiequality . Semantic . DeepEqual ( epLabels , svcLabels ) {
updated = true
}
// add or remove headless label depending on the service Type
if ! helper . IsServiceIPSet ( service ) {
svcLabels [ v1 . IsHeadlessService ] = ""
} else {
delete ( svcLabels , v1 . IsHeadlessService )
}
// override endpoint slices reserved labels
svcLabels [ discovery . LabelServiceName ] = service . Name
svcLabels [ discovery . LabelManagedBy ] = controllerName
return svcLabels , updated
}
// IsReservedLabelKey return true if the label is one of the reserved label for slices
func IsReservedLabelKey ( label string ) bool {
if label == discovery . LabelServiceName ||
label == discovery . LabelManagedBy ||
label == v1 . IsHeadlessService {
return true
}
return false
}
2019-09-27 21:51:53 +00:00
// endpointSliceEndpointLen helps sort endpoint slices by the number of
// endpoints they contain.
type endpointSliceEndpointLen [ ] * discovery . EndpointSlice
func ( sl endpointSliceEndpointLen ) Len ( ) int { return len ( sl ) }
func ( sl endpointSliceEndpointLen ) Swap ( i , j int ) { sl [ i ] , sl [ j ] = sl [ j ] , sl [ i ] }
func ( sl endpointSliceEndpointLen ) Less ( i , j int ) bool {
return len ( sl [ i ] . Endpoints ) > len ( sl [ j ] . Endpoints )
}
2020-12-01 01:06:26 +00:00
// returns a map of address types used by a service
func getAddressTypesForService ( service * corev1 . Service ) map [ discovery . AddressType ] struct { } {
serviceSupportedAddresses := make ( map [ discovery . AddressType ] struct { } )
// TODO: (khenidak) when address types are removed in favor of
// v1.IPFamily this will need to be removed, and work directly with
// v1.IPFamily types
// IMPORTANT: we assume that IP of (discovery.AddressType enum) is never in use
// as it gets deprecated
for _ , family := range service . Spec . IPFamilies {
if family == corev1 . IPv4Protocol {
serviceSupportedAddresses [ discovery . AddressTypeIPv4 ] = struct { } { }
}
if family == corev1 . IPv6Protocol {
serviceSupportedAddresses [ discovery . AddressTypeIPv6 ] = struct { } { }
}
}
if len ( serviceSupportedAddresses ) > 0 {
return serviceSupportedAddresses // we have found families for this service
}
// TODO (khenidak) remove when (1) dual stack becomes
// enabled by default (2) v1.19 falls off supported versions
// Why do we need this:
// a cluster being upgraded to the new apis
// will have service.spec.IPFamilies: nil
// if the controller manager connected to old api
// server. This will have the nasty side effect of
// removing all slices already created for this service.
// this will disable all routing to service vip (ClusterIP)
// this ensures that this does not happen. Same for headless services
// we assume it is dual stack, until they get defaulted by *new* api-server
// this ensures that traffic is not disrupted until then. But *may*
// include undesired families for headless services until then.
if len ( service . Spec . ClusterIP ) > 0 && service . Spec . ClusterIP != corev1 . ClusterIPNone { // headfull
addrType := discovery . AddressTypeIPv4
if utilnet . IsIPv6String ( service . Spec . ClusterIP ) {
addrType = discovery . AddressTypeIPv6
}
serviceSupportedAddresses [ addrType ] = struct { } { }
2021-03-18 22:40:29 +00:00
klog . V ( 2 ) . Infof ( "couldn't find ipfamilies for service: %v/%v. This could happen if controller manager is connected to an old apiserver that does not support ip families yet. EndpointSlices for this Service will use %s as the IP Family based on familyOf(ClusterIP:%v)." , service . Namespace , service . Name , addrType , service . Spec . ClusterIP )
2020-12-01 01:06:26 +00:00
return serviceSupportedAddresses
}
// headless
// for now we assume two families. This should have minimal side effect
// if the service is headless with no selector, then this will remain the case
// if the service is headless with selector then chances are pods are still using single family
// since kubelet will need to restart in order to start patching pod status with multiple ips
serviceSupportedAddresses [ discovery . AddressTypeIPv4 ] = struct { } { }
serviceSupportedAddresses [ discovery . AddressTypeIPv6 ] = struct { } { }
klog . V ( 2 ) . Infof ( "couldn't find ipfamilies for headless service: %v/%v likely because controller manager is likely connected to an old apiserver that does not support ip families yet. The service endpoint slice will use dual stack families until api-server default it correctly" , service . Namespace , service . Name )
return serviceSupportedAddresses
}
2021-03-18 22:40:29 +00:00
func unchangedSlices ( existingSlices , slicesToUpdate , slicesToDelete [ ] * discovery . EndpointSlice ) [ ] * discovery . EndpointSlice {
changedSliceNames := sets . String { }
for _ , slice := range slicesToUpdate {
changedSliceNames . Insert ( slice . Name )
}
for _ , slice := range slicesToDelete {
changedSliceNames . Insert ( slice . Name )
}
unchangedSlices := [ ] * discovery . EndpointSlice { }
for _ , slice := range existingSlices {
if ! changedSliceNames . Has ( slice . Name ) {
unchangedSlices = append ( unchangedSlices , slice )
}
}
return unchangedSlices
}
// hintsEnabled returns true if the provided annotations include a
// corev1.AnnotationTopologyAwareHints key with a value set to "auto".
func hintsEnabled ( annotations map [ string ] string ) bool {
val , ok := annotations [ corev1 . AnnotationTopologyAwareHints ]
if ! ok {
return false
}
return val == "auto"
}