// +build linux package fs2 import ( "fmt" "os" "strings" "github.com/opencontainers/runc/libcontainer/cgroups" "github.com/opencontainers/runc/libcontainer/cgroups/fscommon" "github.com/opencontainers/runc/libcontainer/configs" "github.com/pkg/errors" ) type manager struct { config *configs.Cgroup // dirPath is like "/sys/fs/cgroup/user.slice/user-1001.slice/session-1.scope" dirPath string // controllers is content of "cgroup.controllers" file. // excludes pseudo-controllers ("devices" and "freezer"). controllers map[string]struct{} rootless bool } // NewManager creates a manager for cgroup v2 unified hierarchy. // dirPath is like "/sys/fs/cgroup/user.slice/user-1001.slice/session-1.scope". // If dirPath is empty, it is automatically set using config. func NewManager(config *configs.Cgroup, dirPath string, rootless bool) (cgroups.Manager, error) { if config == nil { config = &configs.Cgroup{} } if dirPath == "" { var err error dirPath, err = defaultDirPath(config) if err != nil { return nil, err } } m := &manager{ config: config, dirPath: dirPath, rootless: rootless, } return m, nil } func (m *manager) getControllers() error { if m.controllers != nil { return nil } data, err := cgroups.ReadFile(m.dirPath, "cgroup.controllers") if err != nil { if m.rootless && m.config.Path == "" { return nil } return err } fields := strings.Fields(data) m.controllers = make(map[string]struct{}, len(fields)) for _, c := range fields { m.controllers[c] = struct{}{} } return nil } func (m *manager) Apply(pid int) error { if err := CreateCgroupPath(m.dirPath, m.config); err != nil { // Related tests: // - "runc create (no limits + no cgrouppath + no permission) succeeds" // - "runc create (rootless + no limits + cgrouppath + no permission) fails with permission error" // - "runc create (rootless + limits + no cgrouppath + no permission) fails with informative error" if m.rootless { if m.config.Path == "" { if blNeed, nErr := needAnyControllers(m.config.Resources); nErr == nil && !blNeed { return nil } return errors.Wrap(err, "rootless needs no limits + no cgrouppath when no permission is granted for cgroups") } } return err } if err := cgroups.WriteCgroupProc(m.dirPath, pid); err != nil { return err } return nil } func (m *manager) GetPids() ([]int, error) { return cgroups.GetPids(m.dirPath) } func (m *manager) GetAllPids() ([]int, error) { return cgroups.GetAllPids(m.dirPath) } func (m *manager) GetStats() (*cgroups.Stats, error) { var errs []error st := cgroups.NewStats() // pids (since kernel 4.5) if err := statPids(m.dirPath, st); err != nil { errs = append(errs, err) } // memory (since kernel 4.5) if err := statMemory(m.dirPath, st); err != nil && !os.IsNotExist(err) { errs = append(errs, err) } // io (since kernel 4.5) if err := statIo(m.dirPath, st); err != nil && !os.IsNotExist(err) { errs = append(errs, err) } // cpu (since kernel 4.15) // Note cpu.stat is available even if the controller is not enabled. if err := statCpu(m.dirPath, st); err != nil && !os.IsNotExist(err) { errs = append(errs, err) } // hugetlb (since kernel 5.6) if err := statHugeTlb(m.dirPath, st); err != nil && !os.IsNotExist(err) { errs = append(errs, err) } if len(errs) > 0 && !m.rootless { return st, errors.Errorf("error while statting cgroup v2: %+v", errs) } return st, nil } func (m *manager) Freeze(state configs.FreezerState) error { if err := setFreezer(m.dirPath, state); err != nil { return err } m.config.Resources.Freezer = state return nil } func (m *manager) Destroy() error { return cgroups.RemovePath(m.dirPath) } func (m *manager) Path(_ string) string { return m.dirPath } func (m *manager) Set(r *configs.Resources) error { if err := m.getControllers(); err != nil { return err } // pids (since kernel 4.5) if err := setPids(m.dirPath, r); err != nil { return err } // memory (since kernel 4.5) if err := setMemory(m.dirPath, r); err != nil { return err } // io (since kernel 4.5) if err := setIo(m.dirPath, r); err != nil { return err } // cpu (since kernel 4.15) if err := setCpu(m.dirPath, r); err != nil { return err } // devices (since kernel 4.15, pseudo-controller) // // When m.rootless is true, errors from the device subsystem are ignored because it is really not expected to work. // However, errors from other subsystems are not ignored. // see @test "runc create (rootless + limits + no cgrouppath + no permission) fails with informative error" if err := setDevices(m.dirPath, r); err != nil && !m.rootless { return err } // cpuset (since kernel 5.0) if err := setCpuset(m.dirPath, r); err != nil { return err } // hugetlb (since kernel 5.6) if err := setHugeTlb(m.dirPath, r); err != nil { return err } // freezer (since kernel 5.2, pseudo-controller) if err := setFreezer(m.dirPath, r.Freezer); err != nil { return err } if err := m.setUnified(r.Unified); err != nil { return err } m.config.Resources = r return nil } func (m *manager) setUnified(res map[string]string) error { for k, v := range res { if strings.Contains(k, "/") { return fmt.Errorf("unified resource %q must be a file name (no slashes)", k) } if err := cgroups.WriteFile(m.dirPath, k, v); err != nil { errC := errors.Cause(err) // Check for both EPERM and ENOENT since O_CREAT is used by WriteFile. if errors.Is(errC, os.ErrPermission) || errors.Is(errC, os.ErrNotExist) { // Check if a controller is available, // to give more specific error if not. sk := strings.SplitN(k, ".", 2) if len(sk) != 2 { return fmt.Errorf("unified resource %q must be in the form CONTROLLER.PARAMETER", k) } c := sk[0] if _, ok := m.controllers[c]; !ok && c != "cgroup" { return fmt.Errorf("unified resource %q can't be set: controller %q not available", k, c) } } return errors.Wrapf(err, "can't set unified resource %q", k) } } return nil } func (m *manager) GetPaths() map[string]string { paths := make(map[string]string, 1) paths[""] = m.dirPath return paths } func (m *manager) GetCgroups() (*configs.Cgroup, error) { return m.config, nil } func (m *manager) GetFreezerState() (configs.FreezerState, error) { return getFreezer(m.dirPath) } func (m *manager) Exists() bool { return cgroups.PathExists(m.dirPath) } func OOMKillCount(path string) (uint64, error) { return fscommon.GetValueByKey(path, "memory.events", "oom_kill") } func (m *manager) OOMKillCount() (uint64, error) { c, err := OOMKillCount(m.dirPath) if err != nil && m.rootless && os.IsNotExist(err) { err = nil } return c, err }