2016-02-05 00:03:17 +00:00
|
|
|
package executor
|
2016-02-02 21:38:38 +00:00
|
|
|
|
|
|
|
import (
|
2016-02-03 02:54:04 +00:00
|
|
|
"fmt"
|
2016-02-03 18:23:00 +00:00
|
|
|
"os"
|
|
|
|
"os/user"
|
2016-02-03 02:54:04 +00:00
|
|
|
"path/filepath"
|
2016-02-03 18:23:00 +00:00
|
|
|
"strconv"
|
2016-04-19 20:48:02 +00:00
|
|
|
"strings"
|
2016-02-03 18:23:00 +00:00
|
|
|
"syscall"
|
|
|
|
|
|
|
|
"github.com/hashicorp/go-multierror"
|
2016-02-03 19:41:49 +00:00
|
|
|
"github.com/opencontainers/runc/libcontainer/cgroups"
|
|
|
|
cgroupFs "github.com/opencontainers/runc/libcontainer/cgroups/fs"
|
|
|
|
cgroupConfig "github.com/opencontainers/runc/libcontainer/configs"
|
2016-02-03 18:23:00 +00:00
|
|
|
|
|
|
|
"github.com/hashicorp/nomad/client/allocdir"
|
2016-04-28 23:06:01 +00:00
|
|
|
cstructs "github.com/hashicorp/nomad/client/driver/structs"
|
2016-02-03 19:41:49 +00:00
|
|
|
"github.com/hashicorp/nomad/nomad/structs"
|
2016-02-03 18:23:00 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
// chrootEnv lists the directories on the host OS that we attempt to embed
// inside each task's chroot. Every entry currently maps a path to the very
// same path (presumably host source -> location inside the chroot; confirm
// against AllocDir.Embed, which consumes this map).
var chrootEnv = map[string]string{
	"/bin":            "/bin",
	"/etc":            "/etc",
	"/lib":            "/lib",
	"/lib32":          "/lib32",
	"/lib64":          "/lib64",
	"/run/resolvconf": "/run/resolvconf",
	"/sbin":           "/sbin",
	"/usr":            "/usr",
}
|
|
|
|
|
2016-02-05 00:18:10 +00:00
|
|
|
// configureIsolation configures chroot and creates cgroups
|
2016-02-04 00:03:43 +00:00
|
|
|
func (e *UniversalExecutor) configureIsolation() error {
|
2016-03-17 09:53:31 +00:00
|
|
|
if e.command.FSIsolation {
|
2016-02-04 00:03:43 +00:00
|
|
|
if err := e.configureChroot(); err != nil {
|
|
|
|
return err
|
2016-02-03 18:23:00 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-03-17 09:53:31 +00:00
|
|
|
if e.command.ResourceLimits {
|
|
|
|
if err := e.configureCgroups(e.ctx.Task.Resources); err != nil {
|
2016-02-04 00:03:43 +00:00
|
|
|
return fmt.Errorf("error creating cgroups: %v", err)
|
|
|
|
}
|
2016-02-03 19:41:49 +00:00
|
|
|
}
|
2016-02-04 00:03:43 +00:00
|
|
|
return nil
|
|
|
|
}
|
2016-02-03 19:41:49 +00:00
|
|
|
|
2016-02-05 00:18:10 +00:00
|
|
|
// applyLimits puts a process in a pre-configured cgroup
|
2016-02-05 08:11:09 +00:00
|
|
|
func (e *UniversalExecutor) applyLimits(pid int) error {
|
2016-03-17 09:53:31 +00:00
|
|
|
if !e.command.ResourceLimits {
|
2016-02-04 00:03:43 +00:00
|
|
|
return nil
|
2016-02-03 18:23:00 +00:00
|
|
|
}
|
2016-02-05 08:11:09 +00:00
|
|
|
|
|
|
|
// Entering the process in the cgroup
|
2016-04-02 08:06:41 +00:00
|
|
|
manager := getCgroupManager(e.groups, nil)
|
2016-02-05 08:11:09 +00:00
|
|
|
if err := manager.Apply(pid); err != nil {
|
2016-04-02 08:36:31 +00:00
|
|
|
e.logger.Printf("[ERR] executor: error applying pid to cgroup: %v", err)
|
2016-04-02 08:06:41 +00:00
|
|
|
if er := e.removeChrootMounts(); er != nil {
|
|
|
|
e.logger.Printf("[ERR] executor: error removing chroot: %v", er)
|
2016-02-03 19:41:49 +00:00
|
|
|
}
|
2016-02-04 00:03:43 +00:00
|
|
|
return err
|
2016-02-03 19:41:49 +00:00
|
|
|
}
|
2016-04-02 08:06:41 +00:00
|
|
|
e.cgPaths = manager.GetPaths()
|
2016-04-02 08:51:17 +00:00
|
|
|
cgConfig := cgroupConfig.Config{Cgroups: e.groups}
|
2016-04-02 08:36:31 +00:00
|
|
|
if err := manager.Set(&cgConfig); err != nil {
|
|
|
|
e.logger.Printf("[ERR] executor: error setting cgroup config: %v", err)
|
2016-04-19 00:20:11 +00:00
|
|
|
if er := DestroyCgroup(e.groups, e.cgPaths, os.Getpid()); er != nil {
|
2016-04-02 08:36:31 +00:00
|
|
|
e.logger.Printf("[ERR] executor: error destroying cgroup: %v", er)
|
|
|
|
}
|
2016-04-02 08:51:17 +00:00
|
|
|
if er := e.removeChrootMounts(); er != nil {
|
|
|
|
e.logger.Printf("[ERR] executor: error removing chroot: %v", er)
|
|
|
|
}
|
2016-04-02 08:36:31 +00:00
|
|
|
return err
|
|
|
|
}
|
2016-02-04 00:03:43 +00:00
|
|
|
return nil
|
2016-02-03 18:23:00 +00:00
|
|
|
}
|
|
|
|
|
2016-02-04 00:03:43 +00:00
|
|
|
// configureCgroups converts a Nomad Resources specification into the equivalent
|
|
|
|
// cgroup configuration. It returns an error if the resources are invalid.
|
|
|
|
func (e *UniversalExecutor) configureCgroups(resources *structs.Resources) error {
|
|
|
|
e.groups = &cgroupConfig.Cgroup{}
|
|
|
|
e.groups.Resources = &cgroupConfig.Resources{}
|
2016-03-02 00:53:56 +00:00
|
|
|
cgroupName := structs.GenerateUUID()
|
2016-04-02 08:06:41 +00:00
|
|
|
e.groups.Path = filepath.Join("/nomad", cgroupName)
|
2016-02-03 18:23:00 +00:00
|
|
|
|
2016-02-04 00:03:43 +00:00
|
|
|
// TODO: verify this is needed for things like network access
|
|
|
|
e.groups.Resources.AllowAllDevices = true
|
2016-02-03 18:23:00 +00:00
|
|
|
|
2016-02-04 00:03:43 +00:00
|
|
|
if resources.MemoryMB > 0 {
|
|
|
|
// Total amount of memory allowed to consume
|
|
|
|
e.groups.Resources.Memory = int64(resources.MemoryMB * 1024 * 1024)
|
|
|
|
// Disable swap to avoid issues on the machine
|
|
|
|
e.groups.Resources.MemorySwap = int64(-1)
|
2016-02-03 18:23:00 +00:00
|
|
|
}
|
|
|
|
|
2016-02-04 00:03:43 +00:00
|
|
|
if resources.CPU < 2 {
|
|
|
|
return fmt.Errorf("resources.CPU must be equal to or greater than 2: %v", resources.CPU)
|
2016-02-03 18:23:00 +00:00
|
|
|
}
|
|
|
|
|
2016-02-04 00:03:43 +00:00
|
|
|
// Set the relative CPU shares for this cgroup.
|
|
|
|
e.groups.Resources.CpuShares = int64(resources.CPU)
|
2016-02-03 18:23:00 +00:00
|
|
|
|
2016-02-04 00:03:43 +00:00
|
|
|
if resources.IOPS != 0 {
|
|
|
|
// Validate it is in an acceptable range.
|
|
|
|
if resources.IOPS < 10 || resources.IOPS > 1000 {
|
|
|
|
return fmt.Errorf("resources.IOPS must be between 10 and 1000: %d", resources.IOPS)
|
2016-02-03 18:23:00 +00:00
|
|
|
}
|
2016-02-04 00:03:43 +00:00
|
|
|
|
|
|
|
e.groups.Resources.BlkioWeight = uint16(resources.IOPS)
|
2016-02-03 18:23:00 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-04-28 23:06:01 +00:00
|
|
|
func (e *UniversalExecutor) Stats() (*cstructs.TaskResourceUsage, error) {
|
|
|
|
manager := getCgroupManager(e.groups, e.cgPaths)
|
|
|
|
stats, err := manager.GetStats()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
e.logger.Printf("DIPTANU stats %#v", stats.MemoryStats.Stats)
|
|
|
|
return &cstructs.TaskResourceUsage{}, nil
|
|
|
|
}
|
|
|
|
|
2016-02-03 18:23:00 +00:00
|
|
|
// runAs takes a user id as a string and looks up the user, and sets the command
|
|
|
|
// to execute as that user.
|
2016-02-04 00:03:43 +00:00
|
|
|
func (e *UniversalExecutor) runAs(userid string) error {
|
2016-02-03 18:23:00 +00:00
|
|
|
u, err := user.Lookup(userid)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("Failed to identify user %v: %v", userid, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Convert the uid and gid
|
|
|
|
uid, err := strconv.ParseUint(u.Uid, 10, 32)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("Unable to convert userid to uint32: %s", err)
|
|
|
|
}
|
|
|
|
gid, err := strconv.ParseUint(u.Gid, 10, 32)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("Unable to convert groupid to uint32: %s", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Set the command to run as that user and group.
|
|
|
|
if e.cmd.SysProcAttr == nil {
|
|
|
|
e.cmd.SysProcAttr = &syscall.SysProcAttr{}
|
|
|
|
}
|
|
|
|
if e.cmd.SysProcAttr.Credential == nil {
|
|
|
|
e.cmd.SysProcAttr.Credential = &syscall.Credential{}
|
|
|
|
}
|
|
|
|
e.cmd.SysProcAttr.Credential.Uid = uint32(uid)
|
|
|
|
e.cmd.SysProcAttr.Credential.Gid = uint32(gid)
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-02-05 00:18:10 +00:00
|
|
|
// configureChroot configures a chroot
|
2016-02-04 00:03:43 +00:00
|
|
|
func (e *UniversalExecutor) configureChroot() error {
|
|
|
|
allocDir := e.ctx.AllocDir
|
2016-03-17 09:53:31 +00:00
|
|
|
if err := allocDir.MountSharedDir(e.ctx.Task.Name); err != nil {
|
2016-02-04 00:03:43 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2016-03-17 09:53:31 +00:00
|
|
|
if err := allocDir.Embed(e.ctx.Task.Name, chrootEnv); err != nil {
|
2016-02-04 00:03:43 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Set the tasks AllocDir environment variable.
|
2016-03-29 00:24:10 +00:00
|
|
|
e.ctx.TaskEnv.
|
|
|
|
SetAllocDir(filepath.Join("/", allocdir.SharedAllocName)).
|
|
|
|
SetTaskLocalDir(filepath.Join("/", allocdir.TaskLocal)).
|
|
|
|
Build()
|
2016-02-04 00:03:43 +00:00
|
|
|
|
2016-02-03 18:23:00 +00:00
|
|
|
if e.cmd.SysProcAttr == nil {
|
|
|
|
e.cmd.SysProcAttr = &syscall.SysProcAttr{}
|
|
|
|
}
|
|
|
|
e.cmd.SysProcAttr.Chroot = e.taskDir
|
|
|
|
e.cmd.Dir = "/"
|
2016-02-04 00:03:43 +00:00
|
|
|
|
2016-02-08 22:11:53 +00:00
|
|
|
if err := allocDir.MountSpecialDirs(e.taskDir); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2016-02-04 00:03:43 +00:00
|
|
|
return nil
|
2016-02-03 18:23:00 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// cleanTaskDir is an idempotent operation to clean the task directory and
|
|
|
|
// should be called when tearing down the task.
|
2016-02-04 00:03:43 +00:00
|
|
|
func (e *UniversalExecutor) removeChrootMounts() error {
|
2016-02-03 18:23:00 +00:00
|
|
|
// Prevent a race between Wait/ForceStop
|
2016-03-17 09:53:31 +00:00
|
|
|
e.cgLock.Lock()
|
|
|
|
defer e.cgLock.Unlock()
|
2016-02-09 02:51:11 +00:00
|
|
|
return e.ctx.AllocDir.UnmountAll()
|
2016-02-02 21:38:38 +00:00
|
|
|
}
|
|
|
|
|
2016-02-03 19:41:49 +00:00
|
|
|
// destroyCgroup kills all processes in the cgroup and removes the cgroup
|
2016-04-19 20:48:02 +00:00
|
|
|
// configuration from the host. This function is idempotent.
|
2016-04-19 00:20:11 +00:00
|
|
|
func DestroyCgroup(groups *cgroupConfig.Cgroup, cgPaths map[string]string, executorPid int) error {
|
2016-04-19 20:48:02 +00:00
|
|
|
mErrs := new(multierror.Error)
|
2016-02-09 00:08:29 +00:00
|
|
|
if groups == nil {
|
2016-02-03 19:41:49 +00:00
|
|
|
return fmt.Errorf("Can't destroy: cgroup configuration empty")
|
|
|
|
}
|
|
|
|
|
2016-04-19 00:20:11 +00:00
|
|
|
// Move the executor into the global cgroup so that the task specific
|
|
|
|
// cgroup can be destroyed.
|
|
|
|
nilGroup := &cgroupConfig.Cgroup{}
|
|
|
|
nilGroup.Path = "/"
|
|
|
|
nilGroup.Resources = groups.Resources
|
|
|
|
nilManager := getCgroupManager(nilGroup, nil)
|
2016-04-19 20:48:02 +00:00
|
|
|
err := nilManager.Apply(executorPid)
|
|
|
|
if err != nil && !strings.Contains(err.Error(), "no such process") {
|
|
|
|
return fmt.Errorf("failed to remove executor pid %d: %v", executorPid, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Freeze the Cgroup so that it can not continue to fork/exec.
|
|
|
|
manager := getCgroupManager(groups, cgPaths)
|
|
|
|
err = manager.Freeze(cgroupConfig.Frozen)
|
|
|
|
if err != nil && !strings.Contains(err.Error(), "no such file or directory") {
|
|
|
|
return fmt.Errorf("failed to freeze cgroup: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
var procs []*os.Process
|
|
|
|
pids, err := manager.GetAllPids()
|
|
|
|
if err != nil {
|
|
|
|
multierror.Append(mErrs, fmt.Errorf("error getting pids: %v", err))
|
|
|
|
|
|
|
|
// Unfreeze the cgroup.
|
|
|
|
err = manager.Freeze(cgroupConfig.Thawed)
|
|
|
|
if err != nil && !strings.Contains(err.Error(), "no such file or directory") {
|
|
|
|
multierror.Append(mErrs, fmt.Errorf("failed to unfreeze cgroup: %v", err))
|
|
|
|
}
|
|
|
|
return mErrs.ErrorOrNil()
|
|
|
|
}
|
|
|
|
|
|
|
|
// Kill the processes in the cgroup
|
|
|
|
for _, pid := range pids {
|
|
|
|
proc, err := os.FindProcess(pid)
|
|
|
|
if err != nil {
|
|
|
|
multierror.Append(mErrs, fmt.Errorf("error finding process %v: %v", pid, err))
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
procs = append(procs, proc)
|
|
|
|
if e := proc.Kill(); e != nil {
|
|
|
|
multierror.Append(mErrs, fmt.Errorf("error killing process %v: %v", pid, e))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Unfreeze the cgroug so we can wait.
|
|
|
|
err = manager.Freeze(cgroupConfig.Thawed)
|
|
|
|
if err != nil && !strings.Contains(err.Error(), "no such file or directory") {
|
|
|
|
multierror.Append(mErrs, fmt.Errorf("failed to unfreeze cgroup: %v", err))
|
|
|
|
}
|
|
|
|
|
|
|
|
// Wait on the killed processes to ensure they are cleaned up.
|
|
|
|
for _, proc := range procs {
|
|
|
|
// Don't capture the error because we expect this to fail for
|
|
|
|
// processes we didn't fork.
|
|
|
|
proc.Wait()
|
2016-04-19 00:20:11 +00:00
|
|
|
}
|
|
|
|
|
2016-02-03 19:41:49 +00:00
|
|
|
// Remove the cgroup.
|
|
|
|
if err := manager.Destroy(); err != nil {
|
2016-04-19 20:48:02 +00:00
|
|
|
multierror.Append(mErrs, fmt.Errorf("failed to delete the cgroup directories: %v", err))
|
2016-02-03 19:41:49 +00:00
|
|
|
}
|
2016-04-19 20:48:02 +00:00
|
|
|
return mErrs.ErrorOrNil()
|
2016-02-03 19:41:49 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// getCgroupManager returns the correct libcontainer cgroup manager.
|
2016-04-02 08:06:41 +00:00
|
|
|
func getCgroupManager(groups *cgroupConfig.Cgroup, paths map[string]string) cgroups.Manager {
|
2016-04-15 21:55:30 +00:00
|
|
|
return &cgroupFs.Manager{Cgroups: groups, Paths: paths}
|
2016-02-03 19:41:49 +00:00
|
|
|
}
|