2015-02-23 14:50:40 +00:00
|
|
|
/*
Copyright 2015 Google Inc. All rights reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
|
|
|
|
|
|
|
|
package e2e
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
2015-03-27 10:14:54 +00:00
|
|
|
"strconv"
|
2015-03-10 23:59:26 +00:00
|
|
|
"sync"
|
2015-02-23 14:50:40 +00:00
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/GoogleCloudPlatform/kubernetes/pkg/api"
|
|
|
|
"github.com/GoogleCloudPlatform/kubernetes/pkg/client"
|
2015-04-10 10:08:36 +00:00
|
|
|
"github.com/GoogleCloudPlatform/kubernetes/pkg/fields"
|
2015-02-23 14:50:40 +00:00
|
|
|
"github.com/GoogleCloudPlatform/kubernetes/pkg/labels"
|
|
|
|
"github.com/GoogleCloudPlatform/kubernetes/pkg/util"
|
|
|
|
"github.com/GoogleCloudPlatform/kubernetes/pkg/util/wait"
|
|
|
|
|
2015-03-26 16:00:12 +00:00
|
|
|
"github.com/golang/glog"
|
2015-02-23 14:50:40 +00:00
|
|
|
. "github.com/onsi/ginkgo"
|
|
|
|
. "github.com/onsi/gomega"
|
|
|
|
)
|
|
|
|
|
2015-04-15 09:17:32 +00:00
|
|
|
// Convenient wrapper around listing pods supporting retries.
|
|
|
|
func listPods(c *client.Client, namespace string, label labels.Selector) (*api.PodList, error) {
|
2015-04-17 10:35:56 +00:00
|
|
|
maxRetries := 4
|
2015-04-15 09:17:32 +00:00
|
|
|
pods, err := c.Pods(namespace).List(label)
|
|
|
|
for i := 0; i < maxRetries; i++ {
|
|
|
|
if err == nil {
|
|
|
|
return pods, nil
|
|
|
|
}
|
|
|
|
pods, err = c.Pods(namespace).List(label)
|
|
|
|
}
|
|
|
|
return pods, err
|
|
|
|
}
|
|
|
|
|
2015-02-23 14:50:40 +00:00
|
|
|
// Delete a Replication Controller and all pods it spawned
|
|
|
|
func DeleteRC(c *client.Client, ns, name string) error {
|
|
|
|
rc, err := c.ReplicationControllers(ns).Get(name)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("Failed to find replication controller %s in namespace %s: %v", name, ns, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
rc.Spec.Replicas = 0
|
|
|
|
|
|
|
|
if _, err := c.ReplicationControllers(ns).Update(rc); err != nil {
|
|
|
|
return fmt.Errorf("Failed to resize replication controller %s to zero: %v", name, err)
|
|
|
|
}
|
|
|
|
|
2015-04-15 13:31:00 +00:00
|
|
|
// Wait up to 20 minutes until all replicas are killed.
|
|
|
|
endTime := time.Now().Add(time.Minute * 20)
|
|
|
|
for {
|
|
|
|
if time.Now().After(endTime) {
|
|
|
|
return fmt.Errorf("Timeout while waiting for replication controller %s replicas to 0", name)
|
|
|
|
}
|
|
|
|
remainingTime := endTime.Sub(time.Now())
|
|
|
|
err := wait.Poll(time.Second, remainingTime, client.ControllerHasDesiredReplicas(c, rc))
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("Error while waiting for replication controller %s replicas to read 0: %v", name, err)
|
|
|
|
} else {
|
|
|
|
break
|
|
|
|
}
|
2015-02-23 14:50:40 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Delete the replication controller.
|
|
|
|
if err := c.ReplicationControllers(ns).Delete(name); err != nil {
|
|
|
|
return fmt.Errorf("Failed to delete replication controller %s: %v", name, err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Launch a Replication Controller and wait for all pods it spawns
|
2015-03-25 19:35:54 +00:00
|
|
|
// to become running. The controller will need to be cleaned up external
|
|
|
|
// to this method
|
2015-02-23 14:50:40 +00:00
|
|
|
func RunRC(c *client.Client, name string, ns, image string, replicas int) {
|
|
|
|
defer GinkgoRecover()
|
|
|
|
|
|
|
|
var last int
|
|
|
|
current := 0
|
|
|
|
same := 0
|
|
|
|
|
|
|
|
By(fmt.Sprintf("Creating replication controller %s", name))
|
|
|
|
_, err := c.ReplicationControllers(ns).Create(&api.ReplicationController{
|
|
|
|
ObjectMeta: api.ObjectMeta{
|
|
|
|
Name: name,
|
|
|
|
},
|
|
|
|
Spec: api.ReplicationControllerSpec{
|
|
|
|
Replicas: replicas,
|
|
|
|
Selector: map[string]string{
|
|
|
|
"name": name,
|
|
|
|
},
|
|
|
|
Template: &api.PodTemplateSpec{
|
|
|
|
ObjectMeta: api.ObjectMeta{
|
|
|
|
Labels: map[string]string{"name": name},
|
|
|
|
},
|
|
|
|
Spec: api.PodSpec{
|
|
|
|
Containers: []api.Container{
|
|
|
|
{
|
|
|
|
Name: name,
|
|
|
|
Image: image,
|
|
|
|
Ports: []api.ContainerPort{{ContainerPort: 80}},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
})
|
|
|
|
Expect(err).NotTo(HaveOccurred())
|
|
|
|
|
|
|
|
By(fmt.Sprintf("Making sure all %d replicas exist", replicas))
|
|
|
|
label := labels.SelectorFromSet(labels.Set(map[string]string{"name": name}))
|
2015-04-15 09:17:32 +00:00
|
|
|
pods, err := listPods(c, ns, label)
|
2015-02-23 14:50:40 +00:00
|
|
|
Expect(err).NotTo(HaveOccurred())
|
|
|
|
current = len(pods.Items)
|
|
|
|
failCount := 5
|
|
|
|
for same < failCount && current < replicas {
|
2015-03-26 16:00:12 +00:00
|
|
|
glog.Infof("Controller %s: Found %d pods out of %d", name, current, replicas)
|
2015-02-23 14:50:40 +00:00
|
|
|
if last < current {
|
|
|
|
same = 0
|
|
|
|
} else if last == current {
|
|
|
|
same++
|
|
|
|
} else if current < last {
|
2015-03-25 19:35:54 +00:00
|
|
|
Failf("Controller %s: Number of submitted pods dropped from %d to %d", name, last, current)
|
2015-02-23 14:50:40 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if same >= failCount {
|
2015-03-26 16:00:12 +00:00
|
|
|
glog.Infof("No pods submitted for the last %d checks", failCount)
|
2015-02-23 14:50:40 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
last = current
|
|
|
|
time.Sleep(5 * time.Second)
|
2015-04-15 09:17:32 +00:00
|
|
|
pods, err = listPods(c, ns, label)
|
2015-02-23 14:50:40 +00:00
|
|
|
Expect(err).NotTo(HaveOccurred())
|
|
|
|
current = len(pods.Items)
|
|
|
|
}
|
|
|
|
Expect(current).To(Equal(replicas))
|
2015-03-26 16:00:12 +00:00
|
|
|
glog.Infof("Controller %s: Found %d pods out of %d", name, current, replicas)
|
2015-02-23 14:50:40 +00:00
|
|
|
|
|
|
|
By("Waiting for each pod to be running")
|
|
|
|
same = 0
|
|
|
|
last = 0
|
2015-03-26 16:00:12 +00:00
|
|
|
failCount = 10
|
2015-02-23 14:50:40 +00:00
|
|
|
current = 0
|
|
|
|
for same < failCount && current < replicas {
|
|
|
|
current = 0
|
2015-03-26 16:00:12 +00:00
|
|
|
waiting := 0
|
|
|
|
pending := 0
|
|
|
|
unknown := 0
|
2015-02-23 14:50:40 +00:00
|
|
|
time.Sleep(10 * time.Second)
|
2015-03-26 16:00:12 +00:00
|
|
|
|
2015-04-15 09:17:32 +00:00
|
|
|
currentPods, listErr := listPods(c, ns, label)
|
2015-03-26 16:00:12 +00:00
|
|
|
Expect(listErr).NotTo(HaveOccurred())
|
|
|
|
if len(currentPods.Items) != len(pods.Items) {
|
|
|
|
Failf("Number of reported pods changed: %d vs %d", len(currentPods.Items), len(pods.Items))
|
|
|
|
}
|
|
|
|
for _, p := range currentPods.Items {
|
2015-02-23 14:50:40 +00:00
|
|
|
if p.Status.Phase == api.PodRunning {
|
|
|
|
current++
|
|
|
|
} else if p.Status.Phase == api.PodPending {
|
2015-04-02 12:52:03 +00:00
|
|
|
if p.Spec.Host == "" {
|
2015-03-26 16:00:12 +00:00
|
|
|
waiting++
|
|
|
|
} else {
|
|
|
|
pending++
|
|
|
|
}
|
2015-02-23 14:50:40 +00:00
|
|
|
} else if p.Status.Phase == api.PodUnknown {
|
|
|
|
unknown++
|
|
|
|
}
|
|
|
|
}
|
2015-03-26 16:00:12 +00:00
|
|
|
glog.Infof("Pod States: %d running, %d pending, %d waiting, %d unknown ", current, pending, waiting, unknown)
|
2015-02-23 14:50:40 +00:00
|
|
|
if last < current {
|
|
|
|
same = 0
|
|
|
|
} else if last == current {
|
|
|
|
same++
|
|
|
|
} else if current < last {
|
|
|
|
Failf("Number of running pods dropped from %d to %d", last, current)
|
|
|
|
}
|
|
|
|
if same >= failCount {
|
2015-03-26 16:00:12 +00:00
|
|
|
glog.Infof("No pods started for the last %d checks", failCount)
|
2015-02-23 14:50:40 +00:00
|
|
|
}
|
|
|
|
last = current
|
|
|
|
}
|
|
|
|
Expect(current).To(Equal(replicas))
|
|
|
|
}
|
|
|
|
|
2015-03-25 23:28:04 +00:00
|
|
|
// This test suite can take a long time to run, so by default it is added to
|
|
|
|
// the ginkgo.skip list (see driver.go).
|
|
|
|
// To run this suite you must explicitly ask for it by setting the
|
|
|
|
// -t/--test flag or ginkgo.focus flag.
|
|
|
|
var _ = Describe("Density", func() {
|
2015-02-23 14:50:40 +00:00
|
|
|
var c *client.Client
|
|
|
|
var minionCount int
|
|
|
|
var RCName string
|
|
|
|
var ns string
|
|
|
|
|
|
|
|
BeforeEach(func() {
|
|
|
|
var err error
|
|
|
|
c, err = loadClient()
|
|
|
|
expectNoError(err)
|
2015-04-10 10:08:36 +00:00
|
|
|
minions, err := c.Nodes().List(labels.Everything(), fields.Everything())
|
2015-02-23 14:50:40 +00:00
|
|
|
expectNoError(err)
|
|
|
|
minionCount = len(minions.Items)
|
|
|
|
Expect(minionCount).NotTo(BeZero())
|
|
|
|
ns = api.NamespaceDefault
|
|
|
|
})
|
|
|
|
|
|
|
|
AfterEach(func() {
|
2015-03-12 16:29:00 +00:00
|
|
|
// Remove any remaining pods from this test if the
|
|
|
|
// replication controller still exists and the replica count
|
|
|
|
// isn't 0. This means the controller wasn't cleaned up
|
|
|
|
// during the test so clean it up here
|
|
|
|
rc, err := c.ReplicationControllers(ns).Get(RCName)
|
|
|
|
if err == nil && rc.Spec.Replicas != 0 {
|
2015-03-25 19:35:54 +00:00
|
|
|
By("Cleaning up the replication controller")
|
|
|
|
err := DeleteRC(c, ns, RCName)
|
|
|
|
expectNoError(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Clean up the namespace if a non-default one was used
|
|
|
|
if ns != api.NamespaceDefault {
|
|
|
|
By("Cleaning up the namespace")
|
|
|
|
err := c.Namespaces().Delete(ns)
|
|
|
|
expectNoError(err)
|
2015-03-12 16:29:00 +00:00
|
|
|
}
|
2015-02-23 14:50:40 +00:00
|
|
|
})
|
|
|
|
|
2015-03-27 10:14:54 +00:00
|
|
|
// Tests with "Skipped" substring in their name will be skipped when running
|
|
|
|
// e2e test suite without --ginkgo.focus & --ginkgo.skip flags.
|
2015-04-06 03:37:58 +00:00
|
|
|
type Density struct {
|
|
|
|
skip bool
|
|
|
|
podsPerMinion int
|
2015-03-27 10:14:54 +00:00
|
|
|
}
|
2015-03-10 23:59:26 +00:00
|
|
|
|
2015-04-07 11:26:52 +00:00
|
|
|
densityTests := []Density{
|
|
|
|
// This test should always run, even if larger densities are skipped.
|
|
|
|
{podsPerMinion: 3, skip: false},
|
2015-04-13 06:44:52 +00:00
|
|
|
{podsPerMinion: 30, skip: false},
|
|
|
|
// More than 30 pods per node is outside our v1.0 goals.
|
|
|
|
// We might want to enable those tests in the future.
|
2015-04-07 11:26:52 +00:00
|
|
|
{podsPerMinion: 50, skip: true},
|
|
|
|
{podsPerMinion: 100, skip: true},
|
|
|
|
}
|
2015-04-06 03:37:58 +00:00
|
|
|
|
2015-04-07 11:26:52 +00:00
|
|
|
for _, testArg := range densityTests {
|
|
|
|
name := fmt.Sprintf("should allow starting %d pods per node", testArg.podsPerMinion)
|
2015-04-14 11:41:48 +00:00
|
|
|
if testArg.podsPerMinion <= 30 {
|
|
|
|
name = "[Performance suite] " + name
|
|
|
|
}
|
2015-04-07 11:26:52 +00:00
|
|
|
if testArg.skip {
|
|
|
|
name = "[Skipped] " + name
|
|
|
|
}
|
|
|
|
itArg := testArg
|
|
|
|
It(name, func() {
|
2015-03-25 19:35:54 +00:00
|
|
|
uuid := string(util.NewUUID())
|
2015-04-07 11:26:52 +00:00
|
|
|
totalPods := itArg.podsPerMinion * minionCount
|
2015-03-25 19:35:54 +00:00
|
|
|
nameStr := strconv.Itoa(totalPods) + "-" + uuid
|
|
|
|
ns = "e2e-density" + nameStr
|
|
|
|
RCName = "my-hostname-density" + nameStr
|
2015-04-07 11:26:52 +00:00
|
|
|
RunRC(c, RCName, ns, "gcr.io/google_containers/pause:go", totalPods)
|
2015-03-25 19:35:54 +00:00
|
|
|
By("waiting for all events to be recorded")
|
|
|
|
last := -1
|
|
|
|
current := 0
|
|
|
|
var events *api.EventList
|
|
|
|
for last < current {
|
|
|
|
e, err := c.Events(ns).List(
|
|
|
|
labels.Everything(),
|
|
|
|
fields.Set{
|
|
|
|
"involvedObject.namespace": ns,
|
|
|
|
}.AsSelector(),
|
|
|
|
)
|
|
|
|
expectNoError(err)
|
|
|
|
last = current
|
|
|
|
current = len(e.Items)
|
|
|
|
events = e
|
|
|
|
time.Sleep(10 * time.Second)
|
|
|
|
}
|
|
|
|
Logf("Found %d events", current)
|
|
|
|
|
|
|
|
// Verify no pods were killed or failed to start
|
|
|
|
By("verifying no pods were killed or failed to start")
|
|
|
|
for _, e := range events.Items {
|
|
|
|
for _, s := range []string{"kill", "fail"} {
|
|
|
|
Expect(e.Reason).NotTo(ContainSubstring(s), "event:' %s', reason: '%s', message: '%s', field path: '%s'", e, e.ObjectMeta.Name, e.Message, e.InvolvedObject.FieldPath)
|
|
|
|
}
|
|
|
|
}
|
2015-04-07 11:26:52 +00:00
|
|
|
})
|
|
|
|
}
|
2015-04-06 03:37:58 +00:00
|
|
|
|
2015-04-07 11:26:52 +00:00
|
|
|
type Scalability struct {
|
|
|
|
skip bool
|
|
|
|
totalPods int
|
|
|
|
podsPerMinion int
|
|
|
|
rcsPerThread int
|
|
|
|
}
|
2015-04-06 03:37:58 +00:00
|
|
|
|
2015-04-07 11:26:52 +00:00
|
|
|
scalabilityTests := []Scalability{
|
|
|
|
{totalPods: 500, podsPerMinion: 10, rcsPerThread: 5, skip: true},
|
|
|
|
{totalPods: 500, podsPerMinion: 10, rcsPerThread: 25, skip: true},
|
|
|
|
}
|
2015-04-06 03:37:58 +00:00
|
|
|
|
2015-04-07 11:26:52 +00:00
|
|
|
for _, testArg := range scalabilityTests {
|
|
|
|
// # of threads calibrate to totalPods
|
|
|
|
threads := (testArg.totalPods / (testArg.podsPerMinion * testArg.rcsPerThread))
|
2015-04-06 03:37:58 +00:00
|
|
|
|
2015-04-07 11:26:52 +00:00
|
|
|
name := fmt.Sprintf(
|
|
|
|
"should be able to launch %v pods, %v per minion, in %v rcs/thread.",
|
|
|
|
testArg.totalPods, testArg.podsPerMinion, testArg.rcsPerThread)
|
|
|
|
if testArg.skip {
|
|
|
|
name = "[Skipped] " + name
|
|
|
|
}
|
2015-04-06 03:37:58 +00:00
|
|
|
|
2015-04-07 11:26:52 +00:00
|
|
|
itArg := testArg
|
|
|
|
It(name, func() {
|
2015-04-06 03:37:58 +00:00
|
|
|
podsLaunched := 0
|
2015-04-07 11:26:52 +00:00
|
|
|
var wg sync.WaitGroup
|
|
|
|
wg.Add(threads)
|
|
|
|
|
|
|
|
// Create queue of pending requests on the api server.
|
|
|
|
for i := 0; i < threads; i++ {
|
|
|
|
go func() {
|
|
|
|
defer wg.Done()
|
|
|
|
for i := 0; i < itArg.rcsPerThread; i++ {
|
|
|
|
name := "my-short-lived-pod" + string(util.NewUUID())
|
|
|
|
n := itArg.podsPerMinion * minionCount
|
|
|
|
RunRC(c, name, ns, "gcr.io/google_containers/pause:go", n)
|
|
|
|
podsLaunched += n
|
|
|
|
glog.Info("Launched %v pods so far...", podsLaunched)
|
2015-03-25 19:35:54 +00:00
|
|
|
err := DeleteRC(c, ns, name)
|
|
|
|
expectNoError(err)
|
2015-04-07 11:26:52 +00:00
|
|
|
}
|
|
|
|
}()
|
|
|
|
}
|
|
|
|
// Wait for all the pods from all the RC's to return.
|
|
|
|
wg.Wait()
|
|
|
|
glog.Info("%v pods out of %v launched", podsLaunched, itArg.totalPods)
|
|
|
|
})
|
2015-04-06 03:37:58 +00:00
|
|
|
}
|
2015-02-23 14:50:40 +00:00
|
|
|
})
|