mirror of https://github.com/k3s-io/k3s
144 lines
5.3 KiB
Go
144 lines
5.3 KiB
Go
/*
|
|
Copyright 2017 The Kubernetes Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package server
|
|
|
|
import (
|
|
"time"
|
|
|
|
"github.com/containerd/containerd/errdefs"
|
|
"github.com/docker/docker/pkg/signal"
|
|
"github.com/pkg/errors"
|
|
"github.com/sirupsen/logrus"
|
|
"golang.org/x/net/context"
|
|
"golang.org/x/sys/unix"
|
|
runtime "k8s.io/kubernetes/pkg/kubelet/apis/cri/runtime/v1alpha2"
|
|
|
|
"github.com/containerd/cri/pkg/store"
|
|
containerstore "github.com/containerd/cri/pkg/store/container"
|
|
)
|
|
|
|
// killContainerTimeout is the timeout that we wait for the container to
|
|
// be SIGKILLed.
|
|
// The timeout is set to 1 min, because the default CRI operation timeout
|
|
// for StopContainer is (2 min + stop timeout). Set to 1 min, so that we
|
|
// have enough time for kill(all=true) and kill(all=false).
|
|
const killContainerTimeout = 1 * time.Minute
|
|
|
|
// StopContainer stops a running container with a grace period (i.e., timeout).
|
|
func (c *criService) StopContainer(ctx context.Context, r *runtime.StopContainerRequest) (*runtime.StopContainerResponse, error) {
|
|
// Get container config from container store.
|
|
container, err := c.containerStore.Get(r.GetContainerId())
|
|
if err != nil {
|
|
return nil, errors.Wrapf(err, "an error occurred when try to find container %q", r.GetContainerId())
|
|
}
|
|
|
|
if err := c.stopContainer(ctx, container, time.Duration(r.GetTimeout())*time.Second); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return &runtime.StopContainerResponse{}, nil
|
|
}
|
|
|
|
// stopContainer stops a container based on the container metadata.
|
|
func (c *criService) stopContainer(ctx context.Context, container containerstore.Container, timeout time.Duration) error {
|
|
id := container.ID
|
|
|
|
// Return without error if container is not running. This makes sure that
|
|
// stop only takes real action after the container is started.
|
|
state := container.Status.Get().State()
|
|
if state != runtime.ContainerState_CONTAINER_RUNNING {
|
|
logrus.Infof("Container to stop %q is not running, current state %q",
|
|
id, criContainerStateToString(state))
|
|
return nil
|
|
}
|
|
|
|
task, err := container.Container.Task(ctx, nil)
|
|
if err != nil {
|
|
if !errdefs.IsNotFound(err) {
|
|
return errors.Wrapf(err, "failed to stop container, task not found for container %q", id)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// We only need to kill the task. The event handler will Delete the
|
|
// task from containerd after it handles the Exited event.
|
|
if timeout > 0 {
|
|
stopSignal := "SIGTERM"
|
|
if container.StopSignal != "" {
|
|
stopSignal = container.StopSignal
|
|
} else {
|
|
// The image may have been deleted, and the `StopSignal` field is
|
|
// just introduced to handle that.
|
|
// However, for containers created before the `StopSignal` field is
|
|
// introduced, still try to get the stop signal from the image config.
|
|
// If the image has been deleted, logging an error and using the
|
|
// default SIGTERM is still better than returning error and leaving
|
|
// the container unstoppable. (See issue #990)
|
|
// TODO(random-liu): Remove this logic when containerd 1.2 is deprecated.
|
|
image, err := c.imageStore.Get(container.ImageRef)
|
|
if err != nil {
|
|
if err != store.ErrNotExist {
|
|
return errors.Wrapf(err, "failed to get image %q", container.ImageRef)
|
|
}
|
|
logrus.Warningf("Image %q not found, stop container with signal %q", container.ImageRef, stopSignal)
|
|
} else {
|
|
if image.ImageSpec.Config.StopSignal != "" {
|
|
stopSignal = image.ImageSpec.Config.StopSignal
|
|
}
|
|
}
|
|
}
|
|
sig, err := signal.ParseSignal(stopSignal)
|
|
if err != nil {
|
|
return errors.Wrapf(err, "failed to parse stop signal %q", stopSignal)
|
|
}
|
|
logrus.Infof("Stop container %q with signal %v", id, sig)
|
|
if err = task.Kill(ctx, sig); err != nil && !errdefs.IsNotFound(err) {
|
|
return errors.Wrapf(err, "failed to stop container %q", id)
|
|
}
|
|
|
|
if err = c.waitContainerStop(ctx, container, timeout); err == nil {
|
|
return nil
|
|
}
|
|
logrus.WithError(err).Errorf("An error occurs during waiting for container %q to be stopped", id)
|
|
}
|
|
|
|
logrus.Infof("Kill container %q", id)
|
|
if err = task.Kill(ctx, unix.SIGKILL); err != nil && !errdefs.IsNotFound(err) {
|
|
return errors.Wrapf(err, "failed to kill container %q", id)
|
|
}
|
|
|
|
// Wait for a fixed timeout until container stop is observed by event monitor.
|
|
if err = c.waitContainerStop(ctx, container, killContainerTimeout); err == nil {
|
|
return nil
|
|
}
|
|
return errors.Wrapf(err, "an error occurs during waiting for container %q to be killed", id)
|
|
}
|
|
|
|
// waitContainerStop waits for container to be stopped until timeout exceeds or context is cancelled.
|
|
func (c *criService) waitContainerStop(ctx context.Context, container containerstore.Container, timeout time.Duration) error {
|
|
timeoutTimer := time.NewTimer(timeout)
|
|
defer timeoutTimer.Stop()
|
|
select {
|
|
case <-ctx.Done():
|
|
return errors.Errorf("wait container %q is cancelled", container.ID)
|
|
case <-timeoutTimer.C:
|
|
return errors.Errorf("wait container %q stop timeout", container.ID)
|
|
case <-container.Stopped():
|
|
return nil
|
|
}
|
|
}
|