2015-07-13 14:27:35 +00:00
|
|
|
/*
|
|
|
|
Copyright 2015 The Kubernetes Authors All rights reserved.
|
|
|
|
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
you may not use this file except in compliance with the License.
|
|
|
|
You may obtain a copy of the License at
|
|
|
|
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
See the License for the specific language governing permissions and
|
|
|
|
limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package e2e
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
"time"
|
|
|
|
|
2015-08-05 22:03:47 +00:00
|
|
|
"k8s.io/kubernetes/pkg/api"
|
|
|
|
"k8s.io/kubernetes/pkg/api/resource"
|
2015-08-13 19:01:50 +00:00
|
|
|
client "k8s.io/kubernetes/pkg/client/unversioned"
|
2015-08-05 22:03:47 +00:00
|
|
|
"k8s.io/kubernetes/pkg/fields"
|
|
|
|
"k8s.io/kubernetes/pkg/labels"
|
|
|
|
"k8s.io/kubernetes/pkg/util"
|
2015-07-13 14:27:35 +00:00
|
|
|
|
|
|
|
. "github.com/onsi/ginkgo"
|
|
|
|
. "github.com/onsi/gomega"
|
|
|
|
)
|
|
|
|
|
2015-08-14 07:23:10 +00:00
|
|
|
// Returns a number of currently running and not running Pods.
|
|
|
|
func getPodsNumbers(pods *api.PodList) (runningPods, notRunningPods int) {
|
|
|
|
for _, pod := range pods.Items {
|
|
|
|
if pod.Status.Phase == api.PodRunning {
|
|
|
|
runningPods += 1
|
|
|
|
} else {
|
|
|
|
notRunningPods += 1
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2015-07-13 14:27:35 +00:00
|
|
|
// Simplified version of RunRC, that does not create RC, but creates plain Pods and
|
|
|
|
// requires passing whole Pod definition, which is needed to test various Scheduler predicates.
|
|
|
|
func startPods(c *client.Client, replicas int, ns string, podNamePrefix string, pod api.Pod) {
|
2015-08-14 07:23:10 +00:00
|
|
|
allPods, err := c.Pods(api.NamespaceAll).List(labels.Everything(), fields.Everything())
|
2015-07-13 14:27:35 +00:00
|
|
|
expectNoError(err)
|
2015-08-14 07:23:10 +00:00
|
|
|
podsRunningBefore, _ := getPodsNumbers(allPods)
|
2015-07-13 14:27:35 +00:00
|
|
|
|
|
|
|
for i := 0; i < replicas; i++ {
|
|
|
|
podName := fmt.Sprintf("%v-%v", podNamePrefix, i)
|
|
|
|
pod.ObjectMeta.Name = podName
|
|
|
|
pod.ObjectMeta.Labels["name"] = podName
|
|
|
|
pod.Spec.Containers[0].Name = podName
|
|
|
|
_, err = c.Pods(ns).Create(&pod)
|
|
|
|
expectNoError(err)
|
|
|
|
}
|
|
|
|
|
2015-08-05 05:59:30 +00:00
|
|
|
// Wait for pods to start running. Note: this is a functional
|
|
|
|
// test, not a performance test, so the timeout needs to be
|
|
|
|
// sufficiently long that it's only triggered if things are
|
|
|
|
// completely broken vs. running slowly.
|
|
|
|
timeout := 10 * time.Minute
|
2015-07-13 14:27:35 +00:00
|
|
|
startTime := time.Now()
|
|
|
|
currentlyRunningPods := 0
|
|
|
|
for podsRunningBefore+replicas != currentlyRunningPods {
|
|
|
|
allPods, err := c.Pods(api.NamespaceAll).List(labels.Everything(), fields.Everything())
|
|
|
|
expectNoError(err)
|
|
|
|
runningPods := 0
|
|
|
|
for _, pod := range allPods.Items {
|
|
|
|
if pod.Status.Phase == api.PodRunning {
|
|
|
|
runningPods += 1
|
|
|
|
}
|
|
|
|
}
|
|
|
|
currentlyRunningPods = runningPods
|
2015-08-05 05:59:30 +00:00
|
|
|
Logf("%v pods running", currentlyRunningPods)
|
2015-07-13 14:27:35 +00:00
|
|
|
if startTime.Add(timeout).Before(time.Now()) {
|
2015-08-05 05:59:30 +00:00
|
|
|
Logf("Timed out after %v waiting for pods to start running.", timeout)
|
2015-07-13 14:27:35 +00:00
|
|
|
break
|
|
|
|
}
|
|
|
|
time.Sleep(5 * time.Second)
|
|
|
|
}
|
|
|
|
Expect(currentlyRunningPods).To(Equal(podsRunningBefore + replicas))
|
|
|
|
}
|
|
|
|
|
|
|
|
func getRequestedCPU(pod api.Pod) int64 {
|
|
|
|
var result int64
|
|
|
|
for _, container := range pod.Spec.Containers {
|
|
|
|
result += container.Resources.Limits.Cpu().MilliValue()
|
|
|
|
}
|
|
|
|
return result
|
|
|
|
}
|
|
|
|
|
2015-08-14 07:23:10 +00:00
|
|
|
func verifyResult(c *client.Client, podName string, ns string, oldNotRunning int) {
|
2015-07-13 14:27:35 +00:00
|
|
|
allPods, err := c.Pods(api.NamespaceAll).List(labels.Everything(), fields.Everything())
|
|
|
|
expectNoError(err)
|
2015-08-14 07:23:10 +00:00
|
|
|
_, notRunningPods := getPodsNumbers(allPods)
|
2015-07-13 14:27:35 +00:00
|
|
|
|
|
|
|
schedEvents, err := c.Events(ns).List(
|
|
|
|
labels.Everything(),
|
|
|
|
fields.Set{
|
|
|
|
"involvedObject.kind": "Pod",
|
|
|
|
"involvedObject.name": podName,
|
|
|
|
"involvedObject.namespace": ns,
|
|
|
|
"source": "scheduler",
|
2015-08-14 07:23:10 +00:00
|
|
|
"reason": "FailedScheduling",
|
2015-07-13 14:27:35 +00:00
|
|
|
}.AsSelector())
|
|
|
|
expectNoError(err)
|
|
|
|
|
|
|
|
printed := false
|
|
|
|
printOnce := func(msg string) string {
|
|
|
|
if !printed {
|
|
|
|
printed = true
|
|
|
|
return msg
|
|
|
|
} else {
|
|
|
|
return ""
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-08-14 07:23:10 +00:00
|
|
|
Expect(notRunningPods).To(Equal(1+oldNotRunning), printOnce(fmt.Sprintf("Pods found in the cluster: %#v", allPods)))
|
2015-07-13 14:27:35 +00:00
|
|
|
Expect(schedEvents.Items).ToNot(BeEmpty(), printOnce(fmt.Sprintf("Pods found in the cluster: %#v", allPods)))
|
|
|
|
}
|
|
|
|
|
2015-08-19 09:29:35 +00:00
|
|
|
func cleanupPods(c *client.Client, ns string) {
|
|
|
|
By("Removing all pods in namespace " + ns)
|
|
|
|
pods, err := c.Pods(ns).List(labels.Everything(), fields.Everything())
|
|
|
|
expectNoError(err)
|
|
|
|
opt := api.NewDeleteOptions(0)
|
|
|
|
for _, p := range pods.Items {
|
|
|
|
expectNoError(c.Pods(ns).Delete(p.ObjectMeta.Name, opt))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-07-13 14:27:35 +00:00
|
|
|
var _ = Describe("SchedulerPredicates", func() {
|
|
|
|
var c *client.Client
|
|
|
|
var nodeList *api.NodeList
|
|
|
|
var nodeCount int
|
|
|
|
var totalPodCapacity int64
|
|
|
|
var RCName string
|
|
|
|
var ns string
|
|
|
|
var uuid string
|
|
|
|
|
|
|
|
BeforeEach(func() {
|
|
|
|
var err error
|
|
|
|
c, err = loadClient()
|
|
|
|
expectNoError(err)
|
|
|
|
nodeList, err = c.Nodes().List(labels.Everything(), fields.Everything())
|
|
|
|
expectNoError(err)
|
|
|
|
nodeCount = len(nodeList.Items)
|
|
|
|
Expect(nodeCount).NotTo(BeZero())
|
|
|
|
|
|
|
|
err = deleteTestingNS(c)
|
|
|
|
expectNoError(err)
|
|
|
|
|
|
|
|
nsForTesting, err := createTestingNS("sched-pred", c)
|
|
|
|
ns = nsForTesting.Name
|
|
|
|
expectNoError(err)
|
|
|
|
uuid = string(util.NewUUID())
|
|
|
|
})
|
|
|
|
|
|
|
|
AfterEach(func() {
|
|
|
|
rc, err := c.ReplicationControllers(ns).Get(RCName)
|
|
|
|
if err == nil && rc.Spec.Replicas != 0 {
|
|
|
|
By("Cleaning up the replication controller")
|
|
|
|
err := DeleteRC(c, ns, RCName)
|
|
|
|
expectNoError(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
By(fmt.Sprintf("Destroying namespace for this suite %v", ns))
|
2015-08-18 21:13:13 +00:00
|
|
|
if err := deleteNS(c, ns); err != nil {
|
2015-07-13 14:27:35 +00:00
|
|
|
Failf("Couldn't delete ns %s", err)
|
|
|
|
}
|
|
|
|
})
|
|
|
|
|
|
|
|
// This test verifies that max-pods flag works as advertised. It assumes that cluster add-on pods stay stable
|
|
|
|
// and cannot be run in parallel with any other test that touches Nodes or Pods. It is so because to check
|
|
|
|
// if max-pods is working we need to fully saturate the cluster and keep it in this state for few seconds.
|
|
|
|
It("validates MaxPods limit number of pods that are allowed to run.", func() {
|
|
|
|
totalPodCapacity = 0
|
|
|
|
|
|
|
|
for _, node := range nodeList.Items {
|
|
|
|
podCapacity, found := node.Status.Capacity["pods"]
|
|
|
|
Expect(found).To(Equal(true))
|
|
|
|
totalPodCapacity += podCapacity.Value()
|
|
|
|
Logf("Node: %v", node)
|
|
|
|
}
|
|
|
|
|
2015-08-14 07:23:10 +00:00
|
|
|
allPods, err := c.Pods(api.NamespaceAll).List(labels.Everything(), fields.Everything())
|
2015-07-13 14:27:35 +00:00
|
|
|
expectNoError(err)
|
2015-08-14 07:23:10 +00:00
|
|
|
currentlyRunningPods, currentlyDeadPods := getPodsNumbers(allPods)
|
2015-07-13 14:27:35 +00:00
|
|
|
podsNeededForSaturation := int(totalPodCapacity) - currentlyRunningPods
|
|
|
|
|
|
|
|
By(fmt.Sprintf("Starting additional %v Pods to fully saturate the cluster max pods and trying to start another one", podsNeededForSaturation))
|
|
|
|
|
|
|
|
startPods(c, podsNeededForSaturation, ns, "maxp", api.Pod{
|
|
|
|
TypeMeta: api.TypeMeta{
|
|
|
|
Kind: "Pod",
|
|
|
|
},
|
|
|
|
ObjectMeta: api.ObjectMeta{
|
|
|
|
Name: "",
|
|
|
|
Labels: map[string]string{"name": ""},
|
|
|
|
},
|
|
|
|
Spec: api.PodSpec{
|
|
|
|
Containers: []api.Container{
|
|
|
|
{
|
|
|
|
Name: "",
|
|
|
|
Image: "gcr.io/google_containers/pause:go",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
})
|
|
|
|
|
|
|
|
podName := "additional-pod"
|
|
|
|
_, err = c.Pods(ns).Create(&api.Pod{
|
|
|
|
TypeMeta: api.TypeMeta{
|
|
|
|
Kind: "Pod",
|
|
|
|
},
|
|
|
|
ObjectMeta: api.ObjectMeta{
|
|
|
|
Name: podName,
|
|
|
|
Labels: map[string]string{"name": "additional"},
|
|
|
|
},
|
|
|
|
Spec: api.PodSpec{
|
|
|
|
Containers: []api.Container{
|
|
|
|
{
|
|
|
|
Name: podName,
|
|
|
|
Image: "gcr.io/google_containers/pause:go",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
})
|
|
|
|
expectNoError(err)
|
|
|
|
// Wait a bit to allow scheduler to do its thing
|
2015-08-05 05:59:30 +00:00
|
|
|
// TODO: this is brittle; there's no guarantee the scheduler will have run in 10 seconds.
|
|
|
|
Logf("Sleeping 10 seconds and crossing our fingers that scheduler will run in that time.")
|
2015-07-13 14:27:35 +00:00
|
|
|
time.Sleep(10 * time.Second)
|
|
|
|
|
2015-08-14 07:23:10 +00:00
|
|
|
verifyResult(c, podName, ns, currentlyDeadPods)
|
2015-08-19 09:29:35 +00:00
|
|
|
cleanupPods(c, ns)
|
2015-07-13 14:27:35 +00:00
|
|
|
})
|
|
|
|
|
|
|
|
// This test verifies we don't allow scheduling of pods in a way that sum of limits of pods is greater than machines capacit.
|
|
|
|
// It assumes that cluster add-on pods stay stable and cannot be run in parallel with any other test that touches Nodes or Pods.
|
|
|
|
// It is so because we need to have precise control on what's running in the cluster.
|
|
|
|
It("validates resource limits of pods that are allowed to run.", func() {
|
|
|
|
nodeToCapacityMap := make(map[string]int64)
|
|
|
|
for _, node := range nodeList.Items {
|
|
|
|
capacity, found := node.Status.Capacity["cpu"]
|
|
|
|
Expect(found).To(Equal(true))
|
|
|
|
nodeToCapacityMap[node.Name] = capacity.MilliValue()
|
|
|
|
}
|
|
|
|
|
|
|
|
pods, err := c.Pods(api.NamespaceAll).List(labels.Everything(), fields.Everything())
|
|
|
|
expectNoError(err)
|
2015-08-14 07:23:10 +00:00
|
|
|
var currentlyDeadPods int
|
2015-07-13 14:27:35 +00:00
|
|
|
for _, pod := range pods.Items {
|
|
|
|
_, found := nodeToCapacityMap[pod.Spec.NodeName]
|
|
|
|
Expect(found).To(Equal(true))
|
2015-08-14 07:23:10 +00:00
|
|
|
if pod.Status.Phase == api.PodRunning {
|
|
|
|
Logf("Pod %v requesting capacity %v on Node %v", pod.Name, getRequestedCPU(pod), pod.Spec.NodeName)
|
|
|
|
nodeToCapacityMap[pod.Spec.NodeName] -= getRequestedCPU(pod)
|
|
|
|
} else {
|
|
|
|
currentlyDeadPods += 1
|
|
|
|
}
|
2015-07-13 14:27:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
var podsNeededForSaturation int
|
|
|
|
for name, leftCapacity := range nodeToCapacityMap {
|
|
|
|
Logf("Node: %v has capacity: %v", name, leftCapacity)
|
|
|
|
podsNeededForSaturation += (int)(leftCapacity / 100)
|
|
|
|
}
|
|
|
|
|
|
|
|
By(fmt.Sprintf("Starting additional %v Pods to fully saturate the cluster CPU and trying to start another one", podsNeededForSaturation))
|
|
|
|
|
|
|
|
startPods(c, podsNeededForSaturation, ns, "overcommit", api.Pod{
|
|
|
|
TypeMeta: api.TypeMeta{
|
|
|
|
Kind: "Pod",
|
|
|
|
},
|
|
|
|
ObjectMeta: api.ObjectMeta{
|
|
|
|
Name: "",
|
|
|
|
Labels: map[string]string{"name": ""},
|
|
|
|
},
|
|
|
|
Spec: api.PodSpec{
|
|
|
|
Containers: []api.Container{
|
|
|
|
{
|
|
|
|
Name: "",
|
|
|
|
Image: "gcr.io/google_containers/pause:go",
|
|
|
|
Resources: api.ResourceRequirements{
|
|
|
|
Limits: api.ResourceList{
|
|
|
|
"cpu": *resource.NewMilliQuantity(100, "DecimalSI"),
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
})
|
|
|
|
|
|
|
|
podName := "additional-pod"
|
|
|
|
_, err = c.Pods(ns).Create(&api.Pod{
|
|
|
|
TypeMeta: api.TypeMeta{
|
|
|
|
Kind: "Pod",
|
|
|
|
},
|
|
|
|
ObjectMeta: api.ObjectMeta{
|
|
|
|
Name: podName,
|
|
|
|
Labels: map[string]string{"name": "additional"},
|
|
|
|
},
|
|
|
|
Spec: api.PodSpec{
|
|
|
|
Containers: []api.Container{
|
|
|
|
{
|
|
|
|
Name: podName,
|
|
|
|
Image: "gcr.io/google_containers/pause:go",
|
|
|
|
Resources: api.ResourceRequirements{
|
|
|
|
Limits: api.ResourceList{
|
|
|
|
"cpu": *resource.NewMilliQuantity(100, "DecimalSI"),
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
})
|
|
|
|
expectNoError(err)
|
|
|
|
// Wait a bit to allow scheduler to do its thing
|
2015-08-05 05:59:30 +00:00
|
|
|
// TODO: this is brittle; there's no guarantee the scheduler will have run in 10 seconds.
|
|
|
|
Logf("Sleeping 10 seconds and crossing our fingers that scheduler will run in that time.")
|
2015-07-13 14:27:35 +00:00
|
|
|
time.Sleep(10 * time.Second)
|
|
|
|
|
2015-08-14 07:23:10 +00:00
|
|
|
verifyResult(c, podName, ns, currentlyDeadPods)
|
2015-08-19 09:29:35 +00:00
|
|
|
cleanupPods(c, ns)
|
2015-07-13 14:27:35 +00:00
|
|
|
})
|
|
|
|
|
|
|
|
// Test Nodes does not have any label, hence it should be impossible to schedule Pod with
|
|
|
|
// nonempty Selector set.
|
|
|
|
It("validates that NodeSelector is respected.", func() {
|
|
|
|
By("Trying to schedule Pod with nonempty NodeSelector.")
|
|
|
|
podName := "restricted-pod"
|
|
|
|
|
2015-08-14 07:23:10 +00:00
|
|
|
allPods, err := c.Pods(api.NamespaceAll).List(labels.Everything(), fields.Everything())
|
|
|
|
expectNoError(err)
|
|
|
|
_, currentlyDeadPods := getPodsNumbers(allPods)
|
|
|
|
|
|
|
|
_, err = c.Pods(ns).Create(&api.Pod{
|
2015-07-13 14:27:35 +00:00
|
|
|
TypeMeta: api.TypeMeta{
|
|
|
|
Kind: "Pod",
|
|
|
|
},
|
|
|
|
ObjectMeta: api.ObjectMeta{
|
|
|
|
Name: podName,
|
|
|
|
Labels: map[string]string{"name": "restricted"},
|
|
|
|
},
|
|
|
|
Spec: api.PodSpec{
|
|
|
|
Containers: []api.Container{
|
|
|
|
{
|
|
|
|
Name: podName,
|
|
|
|
Image: "gcr.io/google_containers/pause:go",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
NodeSelector: map[string]string{
|
|
|
|
"label": "nonempty",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
})
|
|
|
|
expectNoError(err)
|
|
|
|
// Wait a bit to allow scheduler to do its thing
|
2015-08-05 05:59:30 +00:00
|
|
|
// TODO: this is brittle; there's no guarantee the scheduler will have run in 10 seconds.
|
|
|
|
Logf("Sleeping 10 seconds and crossing our fingers that scheduler will run in that time.")
|
2015-07-13 14:27:35 +00:00
|
|
|
time.Sleep(10 * time.Second)
|
|
|
|
|
2015-08-14 07:23:10 +00:00
|
|
|
verifyResult(c, podName, ns, currentlyDeadPods)
|
2015-08-19 09:29:35 +00:00
|
|
|
cleanupPods(c, ns)
|
2015-07-13 14:27:35 +00:00
|
|
|
})
|
|
|
|
})
|