2015-12-01 19:56:08 +00:00
|
|
|
package runtime
|
2015-11-05 23:29:53 +00:00
|
|
|
|
2015-11-10 22:57:10 +00:00
|
|
|
import (
|
2016-05-09 17:25:52 +00:00
|
|
|
"bytes"
|
2016-02-01 19:02:41 +00:00
|
|
|
"encoding/json"
|
2016-04-26 20:29:35 +00:00
|
|
|
"fmt"
|
2016-02-29 22:15:16 +00:00
|
|
|
"io"
|
2016-02-01 19:02:41 +00:00
|
|
|
"io/ioutil"
|
2015-11-10 22:57:10 +00:00
|
|
|
"os"
|
2016-03-14 20:57:28 +00:00
|
|
|
"os/exec"
|
2016-02-01 19:02:41 +00:00
|
|
|
"path/filepath"
|
2016-04-26 20:29:35 +00:00
|
|
|
"strings"
|
|
|
|
"syscall"
|
2016-03-28 20:30:37 +00:00
|
|
|
"time"
|
2015-11-10 22:57:10 +00:00
|
|
|
|
2016-02-01 19:02:41 +00:00
|
|
|
"github.com/Sirupsen/logrus"
|
2016-02-29 18:48:39 +00:00
|
|
|
"github.com/docker/containerd/specs"
|
2016-04-26 20:29:35 +00:00
|
|
|
"github.com/opencontainers/runc/libcontainer"
|
|
|
|
ocs "github.com/opencontainers/runtime-spec/specs-go"
|
2015-11-10 22:57:10 +00:00
|
|
|
)
|
2015-11-10 21:44:35 +00:00
|
|
|
|
2015-11-05 23:29:53 +00:00
|
|
|
type Container interface {
|
2015-11-12 21:40:23 +00:00
|
|
|
// ID returns the container ID
|
2015-11-06 00:40:57 +00:00
|
|
|
ID() string
|
2015-11-12 21:40:23 +00:00
|
|
|
// Path returns the path to the bundle
|
2015-11-10 19:38:26 +00:00
|
|
|
Path() string
|
2016-01-06 21:32:46 +00:00
|
|
|
// Start starts the init process of the container
|
2016-02-03 21:56:15 +00:00
|
|
|
Start(checkpoint string, s Stdio) (Process, error)
|
2016-02-01 19:02:41 +00:00
|
|
|
// Exec starts another process in an existing container
|
2016-02-29 18:48:39 +00:00
|
|
|
Exec(string, specs.ProcessSpec, Stdio) (Process, error)
|
2016-01-06 21:32:46 +00:00
|
|
|
// Delete removes the container's state and any resources
|
2015-11-05 23:29:53 +00:00
|
|
|
Delete() error
|
2015-11-12 21:40:23 +00:00
|
|
|
// Processes returns all the containers processes that have been added
|
2015-11-10 21:44:35 +00:00
|
|
|
Processes() ([]Process, error)
|
2015-11-12 21:40:23 +00:00
|
|
|
// State returns the containers runtime state
|
|
|
|
State() State
|
|
|
|
// Resume resumes a paused container
|
|
|
|
Resume() error
|
|
|
|
// Pause pauses a running container
|
|
|
|
Pause() error
|
2016-02-01 23:07:02 +00:00
|
|
|
// RemoveProcess removes the specified process from the container
|
2016-02-01 19:02:41 +00:00
|
|
|
RemoveProcess(string) error
|
2015-12-07 22:47:03 +00:00
|
|
|
// Checkpoints returns all the checkpoints for a container
|
2016-02-01 23:07:02 +00:00
|
|
|
Checkpoints() ([]Checkpoint, error)
|
2015-12-07 22:47:03 +00:00
|
|
|
// Checkpoint creates a new checkpoint
|
2016-02-01 23:07:02 +00:00
|
|
|
Checkpoint(Checkpoint) error
|
2015-12-07 22:47:03 +00:00
|
|
|
// DeleteCheckpoint deletes the checkpoint for the provided name
|
2016-02-01 23:07:02 +00:00
|
|
|
DeleteCheckpoint(name string) error
|
2016-02-11 21:44:25 +00:00
|
|
|
// Labels are user provided labels for the container
|
|
|
|
Labels() []string
|
2016-02-11 22:07:34 +00:00
|
|
|
// Pids returns all pids inside the container
|
|
|
|
Pids() ([]int, error)
|
2015-12-08 18:04:31 +00:00
|
|
|
// Stats returns realtime container stats and resource information
|
2016-02-11 22:36:32 +00:00
|
|
|
Stats() (*Stat, error)
|
2016-02-25 20:59:34 +00:00
|
|
|
// Name or path of the OCI compliant runtime used to execute the container
|
|
|
|
Runtime() string
|
2016-02-11 22:36:32 +00:00
|
|
|
// OOM signals the channel if the container received an OOM notification
|
2016-02-29 22:15:16 +00:00
|
|
|
OOM() (OOM, error)
|
2016-03-07 23:23:52 +00:00
|
|
|
// UpdateResource updates the containers resources to new values
|
|
|
|
UpdateResources(*Resource) error
|
2016-04-22 19:49:55 +00:00
|
|
|
|
|
|
|
// Status return the current status of the container.
|
|
|
|
Status() (State, error)
|
2016-02-29 22:15:16 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// OOM is a handle on a container's out-of-memory notification channel.
type OOM interface {
	// Close releases the resources held by the handle.
	io.Closer
	// FD returns the file descriptor to watch for OOM notifications.
	FD() int
	// ContainerID returns the ID of the container the handle belongs to.
	ContainerID() string
	// Flush consumes a pending notification from the descriptor.
	Flush()
	// Removed reports whether the cgroup backing the notification is gone.
	Removed() bool
}
|
2016-02-01 19:02:41 +00:00
|
|
|
|
2016-02-03 21:56:15 +00:00
|
|
|
// Stdio holds the paths used for a process's standard streams.
type Stdio struct {
	Stdin  string
	Stdout string
	Stderr string
}

// NewStdio builds a Stdio from the given paths, substituting "/dev/null" for
// every path that is empty.
func NewStdio(stdin, stdout, stderr string) Stdio {
	orDevNull := func(path string) string {
		if path == "" {
			return "/dev/null"
		}
		return path
	}
	return Stdio{
		Stdin:  orDevNull(stdin),
		Stdout: orDevNull(stdout),
		Stderr: orDevNull(stderr),
	}
}
|
|
|
|
|
2016-03-30 21:25:42 +00:00
|
|
|
// ContainerOpts carries everything New needs to create a container.
type ContainerOpts struct {
	// Root is the directory under which per-container state is stored.
	Root string
	// ID is the container ID; state lives in Root/ID.
	ID string
	// Bundle is the path to the bundle.
	Bundle string
	// Runtime is the name or path of the OCI runtime binary.
	Runtime string
	// RuntimeArgs are extra arguments placed before the runtime subcommand.
	RuntimeArgs []string
	// Shim is the executable launched by Start and Exec.
	Shim string
	// Labels are user provided labels for the container.
	Labels []string
	// NoPivotRoot is stored with the container state.
	// NOTE(review): presumably forwarded to the runtime elsewhere — confirm.
	NoPivotRoot bool
	// Timeout bounds how long a process start is waited for.
	Timeout time.Duration
}
|
|
|
|
|
2016-02-01 19:02:41 +00:00
|
|
|
// New returns a new container
|
2016-03-30 21:25:42 +00:00
|
|
|
func New(opts ContainerOpts) (Container, error) {
|
2016-02-01 19:02:41 +00:00
|
|
|
c := &container{
|
2016-03-30 21:25:42 +00:00
|
|
|
root: opts.Root,
|
|
|
|
id: opts.ID,
|
|
|
|
bundle: opts.Bundle,
|
|
|
|
labels: opts.Labels,
|
2016-03-24 20:30:27 +00:00
|
|
|
processes: make(map[string]*process),
|
2016-03-30 21:25:42 +00:00
|
|
|
runtime: opts.Runtime,
|
|
|
|
runtimeArgs: opts.RuntimeArgs,
|
2016-04-06 06:42:47 +00:00
|
|
|
shim: opts.Shim,
|
2016-03-30 21:25:42 +00:00
|
|
|
noPivotRoot: opts.NoPivotRoot,
|
2016-03-28 20:30:37 +00:00
|
|
|
timeout: opts.Timeout,
|
2016-02-01 19:02:41 +00:00
|
|
|
}
|
2016-03-30 21:25:42 +00:00
|
|
|
if err := os.Mkdir(filepath.Join(c.root, c.id), 0755); err != nil {
|
2016-02-01 19:02:41 +00:00
|
|
|
return nil, err
|
|
|
|
}
|
2016-03-30 21:25:42 +00:00
|
|
|
f, err := os.Create(filepath.Join(c.root, c.id, StateFile))
|
2016-02-01 19:02:41 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
|
|
|
if err := json.NewEncoder(f).Encode(state{
|
2016-03-30 21:25:42 +00:00
|
|
|
Bundle: c.bundle,
|
|
|
|
Labels: c.labels,
|
|
|
|
Runtime: c.runtime,
|
|
|
|
RuntimeArgs: c.runtimeArgs,
|
2016-05-02 21:01:48 +00:00
|
|
|
Shim: c.shim,
|
2016-03-30 21:25:42 +00:00
|
|
|
NoPivotRoot: opts.NoPivotRoot,
|
2016-02-01 19:02:41 +00:00
|
|
|
}); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return c, nil
|
|
|
|
}
|
|
|
|
|
2016-05-02 21:03:01 +00:00
|
|
|
func Load(root, id string, timeout time.Duration) (Container, error) {
|
2016-02-01 19:02:41 +00:00
|
|
|
var s state
|
|
|
|
f, err := os.Open(filepath.Join(root, id, StateFile))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
|
|
|
if err := json.NewDecoder(f).Decode(&s); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
c := &container{
|
2016-03-24 20:30:27 +00:00
|
|
|
root: root,
|
|
|
|
id: id,
|
|
|
|
bundle: s.Bundle,
|
|
|
|
labels: s.Labels,
|
|
|
|
runtime: s.Runtime,
|
|
|
|
runtimeArgs: s.RuntimeArgs,
|
2016-04-06 06:42:47 +00:00
|
|
|
shim: s.Shim,
|
2016-03-30 21:25:42 +00:00
|
|
|
noPivotRoot: s.NoPivotRoot,
|
2016-03-24 20:30:27 +00:00
|
|
|
processes: make(map[string]*process),
|
2016-05-02 21:03:01 +00:00
|
|
|
timeout: timeout,
|
2016-02-01 19:02:41 +00:00
|
|
|
}
|
|
|
|
dirs, err := ioutil.ReadDir(filepath.Join(root, id))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
for _, d := range dirs {
|
|
|
|
if !d.IsDir() {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
pid := d.Name()
|
2016-02-03 21:56:15 +00:00
|
|
|
s, err := readProcessState(filepath.Join(root, id, pid))
|
2016-02-01 19:02:41 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2016-02-03 21:56:15 +00:00
|
|
|
p, err := loadProcess(filepath.Join(root, id, pid), pid, c, s)
|
2016-02-01 19:02:41 +00:00
|
|
|
if err != nil {
|
|
|
|
logrus.WithField("id", id).WithField("pid", pid).Debug("containerd: error loading process %s", err)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
c.processes[pid] = p
|
|
|
|
}
|
|
|
|
return c, nil
|
|
|
|
}
|
|
|
|
|
2016-02-03 21:56:15 +00:00
|
|
|
func readProcessState(dir string) (*ProcessState, error) {
|
2016-02-01 19:02:41 +00:00
|
|
|
f, err := os.Open(filepath.Join(dir, "process.json"))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
2016-02-03 21:56:15 +00:00
|
|
|
var s ProcessState
|
2016-02-01 19:02:41 +00:00
|
|
|
if err := json.NewDecoder(f).Decode(&s); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return &s, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
type container struct {
|
|
|
|
// path to store runtime state information
|
2016-03-24 20:30:27 +00:00
|
|
|
root string
|
|
|
|
id string
|
|
|
|
bundle string
|
|
|
|
runtime string
|
|
|
|
runtimeArgs []string
|
2016-04-06 06:42:47 +00:00
|
|
|
shim string
|
2016-03-24 20:30:27 +00:00
|
|
|
processes map[string]*process
|
|
|
|
labels []string
|
|
|
|
oomFds []int
|
2016-03-30 21:25:42 +00:00
|
|
|
noPivotRoot bool
|
2016-03-28 20:30:37 +00:00
|
|
|
timeout time.Duration
|
2016-02-01 19:02:41 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) ID() string {
|
|
|
|
return c.id
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Path() string {
|
|
|
|
return c.bundle
|
|
|
|
}
|
|
|
|
|
2016-02-11 21:44:25 +00:00
|
|
|
func (c *container) Labels() []string {
|
|
|
|
return c.labels
|
|
|
|
}
|
|
|
|
|
2016-03-15 18:31:32 +00:00
|
|
|
func (c *container) readSpec() (*specs.Spec, error) {
|
|
|
|
var spec specs.Spec
|
2016-02-01 19:02:41 +00:00
|
|
|
f, err := os.Open(filepath.Join(c.bundle, "config.json"))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
2016-03-11 07:08:54 +00:00
|
|
|
if err := json.NewDecoder(f).Decode(&spec); err != nil {
|
2016-02-01 19:02:41 +00:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return &spec, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Delete() error {
|
2016-03-14 20:57:28 +00:00
|
|
|
err := os.RemoveAll(filepath.Join(c.root, c.id))
|
2016-03-29 17:26:37 +00:00
|
|
|
|
|
|
|
args := c.runtimeArgs
|
|
|
|
args = append(args, "delete", c.id)
|
2016-03-28 20:30:37 +00:00
|
|
|
if derr := exec.Command(c.runtime, args...).Run(); err == nil {
|
|
|
|
err = derr
|
|
|
|
}
|
2016-03-14 20:57:28 +00:00
|
|
|
return err
|
2016-02-01 19:02:41 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Processes() ([]Process, error) {
|
|
|
|
out := []Process{}
|
|
|
|
for _, p := range c.processes {
|
|
|
|
out = append(out, p)
|
|
|
|
}
|
|
|
|
return out, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) RemoveProcess(pid string) error {
|
|
|
|
delete(c.processes, pid)
|
2016-02-03 21:56:15 +00:00
|
|
|
return os.RemoveAll(filepath.Join(c.root, c.id, pid))
|
2016-02-01 19:02:41 +00:00
|
|
|
}
|
2016-03-07 23:23:52 +00:00
|
|
|
|
2016-05-09 17:25:52 +00:00
|
|
|
// u64Ptr returns a pointer to a fresh copy of i.
func u64Ptr(i uint64) *uint64 {
	p := new(uint64)
	*p = i
	return p
}
|
|
|
|
|
2016-03-07 23:23:52 +00:00
|
|
|
func (c *container) UpdateResources(r *Resource) error {
|
2016-05-09 17:25:52 +00:00
|
|
|
sr := ocs.Resources{
|
|
|
|
Memory: &ocs.Memory{
|
|
|
|
Limit: u64Ptr(uint64(r.Memory)),
|
|
|
|
Reservation: u64Ptr(uint64(r.MemoryReservation)),
|
|
|
|
Swap: u64Ptr(uint64(r.MemorySwap)),
|
|
|
|
Kernel: u64Ptr(uint64(r.KernelMemory)),
|
|
|
|
},
|
|
|
|
CPU: &ocs.CPU{
|
|
|
|
Shares: u64Ptr(uint64(r.CPUShares)),
|
|
|
|
Quota: u64Ptr(uint64(r.CPUQuota)),
|
|
|
|
Period: u64Ptr(uint64(r.CPUPeriod)),
|
|
|
|
Cpus: &r.CpusetCpus,
|
|
|
|
Mems: &r.CpusetMems,
|
|
|
|
},
|
|
|
|
BlockIO: &ocs.BlockIO{
|
|
|
|
Weight: &r.BlkioWeight,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
srStr := bytes.NewBuffer(nil)
|
|
|
|
if err := json.NewEncoder(srStr).Encode(&sr); err != nil {
|
2016-03-07 23:23:52 +00:00
|
|
|
return err
|
|
|
|
}
|
2016-05-09 17:25:52 +00:00
|
|
|
|
|
|
|
args := c.runtimeArgs
|
|
|
|
args = append(args, "update", "-r", "-", c.id)
|
|
|
|
cmd := exec.Command(c.runtime, args...)
|
|
|
|
cmd.Stdin = srStr
|
|
|
|
b, err := cmd.CombinedOutput()
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf(string(b))
|
|
|
|
}
|
|
|
|
return nil
|
2016-03-07 23:23:52 +00:00
|
|
|
}
|
2016-04-26 20:29:35 +00:00
|
|
|
|
|
|
|
func getRootIDs(s *specs.Spec) (int, int, error) {
|
|
|
|
if s == nil {
|
|
|
|
return 0, 0, nil
|
|
|
|
}
|
|
|
|
var hasUserns bool
|
|
|
|
for _, ns := range s.Linux.Namespaces {
|
|
|
|
if ns.Type == ocs.UserNamespace {
|
|
|
|
hasUserns = true
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if !hasUserns {
|
|
|
|
return 0, 0, nil
|
|
|
|
}
|
|
|
|
uid := hostIDFromMap(0, s.Linux.UIDMappings)
|
|
|
|
gid := hostIDFromMap(0, s.Linux.GIDMappings)
|
|
|
|
return uid, gid, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) State() State {
|
|
|
|
proc := c.processes["init"]
|
|
|
|
if proc == nil {
|
|
|
|
return Stopped
|
|
|
|
}
|
|
|
|
return proc.State()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Runtime() string {
|
|
|
|
return c.runtime
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Pause() error {
|
|
|
|
args := c.runtimeArgs
|
|
|
|
args = append(args, "pause", c.id)
|
|
|
|
b, err := exec.Command(c.runtime, args...).CombinedOutput()
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf(string(b))
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Resume() error {
|
|
|
|
args := c.runtimeArgs
|
|
|
|
args = append(args, "resume", c.id)
|
|
|
|
b, err := exec.Command(c.runtime, args...).CombinedOutput()
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf(string(b))
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Checkpoints() ([]Checkpoint, error) {
|
|
|
|
dirs, err := ioutil.ReadDir(filepath.Join(c.bundle, "checkpoints"))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
var out []Checkpoint
|
|
|
|
for _, d := range dirs {
|
|
|
|
if !d.IsDir() {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
path := filepath.Join(c.bundle, "checkpoints", d.Name(), "config.json")
|
|
|
|
data, err := ioutil.ReadFile(path)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
var cpt Checkpoint
|
|
|
|
if err := json.Unmarshal(data, &cpt); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
out = append(out, cpt)
|
|
|
|
}
|
|
|
|
return out, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Checkpoint(cpt Checkpoint) error {
|
|
|
|
if err := os.MkdirAll(filepath.Join(c.bundle, "checkpoints"), 0755); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
path := filepath.Join(c.bundle, "checkpoints", cpt.Name)
|
|
|
|
if err := os.Mkdir(path, 0755); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
f, err := os.Create(filepath.Join(path, "config.json"))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
cpt.Created = time.Now()
|
|
|
|
err = json.NewEncoder(f).Encode(cpt)
|
|
|
|
f.Close()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
args := []string{
|
|
|
|
"checkpoint",
|
|
|
|
"--image-path", path,
|
|
|
|
}
|
|
|
|
add := func(flags ...string) {
|
|
|
|
args = append(args, flags...)
|
|
|
|
}
|
|
|
|
add(c.runtimeArgs...)
|
|
|
|
if !cpt.Exit {
|
|
|
|
add("--leave-running")
|
|
|
|
}
|
|
|
|
if cpt.Shell {
|
|
|
|
add("--shell-job")
|
|
|
|
}
|
|
|
|
if cpt.Tcp {
|
|
|
|
add("--tcp-established")
|
|
|
|
}
|
|
|
|
if cpt.UnixSockets {
|
|
|
|
add("--ext-unix-sk")
|
|
|
|
}
|
|
|
|
add(c.id)
|
|
|
|
out, err := exec.Command(c.runtime, args...).CombinedOutput()
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("%s: %s", err.Error(), string(out))
|
|
|
|
}
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) DeleteCheckpoint(name string) error {
|
|
|
|
return os.RemoveAll(filepath.Join(c.bundle, "checkpoints", name))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Start(checkpoint string, s Stdio) (Process, error) {
|
|
|
|
processRoot := filepath.Join(c.root, c.id, InitProcessID)
|
|
|
|
if err := os.Mkdir(processRoot, 0755); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
cmd := exec.Command(c.shim,
|
|
|
|
c.id, c.bundle, c.runtime,
|
|
|
|
)
|
|
|
|
cmd.Dir = processRoot
|
|
|
|
cmd.SysProcAttr = &syscall.SysProcAttr{
|
|
|
|
Setpgid: true,
|
|
|
|
}
|
|
|
|
spec, err := c.readSpec()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
config := &processConfig{
|
|
|
|
checkpoint: checkpoint,
|
|
|
|
root: processRoot,
|
|
|
|
id: InitProcessID,
|
|
|
|
c: c,
|
|
|
|
stdio: s,
|
|
|
|
spec: spec,
|
|
|
|
processSpec: specs.ProcessSpec(spec.Process),
|
|
|
|
}
|
|
|
|
p, err := newProcess(config)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if err := c.startCmd(InitProcessID, cmd, p); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return p, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Exec(pid string, pspec specs.ProcessSpec, s Stdio) (pp Process, err error) {
|
|
|
|
processRoot := filepath.Join(c.root, c.id, pid)
|
|
|
|
if err := os.Mkdir(processRoot, 0755); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer func() {
|
|
|
|
if err != nil {
|
|
|
|
c.RemoveProcess(pid)
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
cmd := exec.Command(c.shim,
|
|
|
|
c.id, c.bundle, c.runtime,
|
|
|
|
)
|
|
|
|
cmd.Dir = processRoot
|
|
|
|
cmd.SysProcAttr = &syscall.SysProcAttr{
|
|
|
|
Setpgid: true,
|
|
|
|
}
|
|
|
|
spec, err := c.readSpec()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
config := &processConfig{
|
|
|
|
exec: true,
|
|
|
|
id: pid,
|
|
|
|
root: processRoot,
|
|
|
|
c: c,
|
|
|
|
processSpec: pspec,
|
|
|
|
spec: spec,
|
|
|
|
stdio: s,
|
|
|
|
}
|
|
|
|
p, err := newProcess(config)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if err := c.startCmd(pid, cmd, p); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return p, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) startCmd(pid string, cmd *exec.Cmd, p *process) error {
|
2016-04-27 19:00:29 +00:00
|
|
|
p.cmd = cmd
|
2016-04-26 20:29:35 +00:00
|
|
|
if err := cmd.Start(); err != nil {
|
|
|
|
if exErr, ok := err.(*exec.Error); ok {
|
|
|
|
if exErr.Err == exec.ErrNotFound || exErr.Err == os.ErrNotExist {
|
|
|
|
return fmt.Errorf("%s not installed on system", c.shim)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err := c.waitForStart(p, cmd); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
c.processes[pid] = p
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) getLibctContainer() (libcontainer.Container, error) {
|
|
|
|
runtimeRoot := "/run/runc"
|
|
|
|
|
|
|
|
// Check that the root wasn't changed
|
|
|
|
for _, opt := range c.runtimeArgs {
|
|
|
|
if strings.HasPrefix(opt, "--root=") {
|
|
|
|
runtimeRoot = strings.TrimPrefix(opt, "--root=")
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
f, err := libcontainer.New(runtimeRoot, libcontainer.Cgroupfs)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return f.Load(c.id)
|
|
|
|
}
|
|
|
|
|
|
|
|
func hostIDFromMap(id uint32, mp []ocs.IDMapping) int {
|
|
|
|
for _, m := range mp {
|
|
|
|
if (id >= m.ContainerID) && (id <= (m.ContainerID + m.Size - 1)) {
|
|
|
|
return int(m.HostID + (id - m.ContainerID))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return 0
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Pids() ([]int, error) {
|
2016-04-26 22:01:24 +00:00
|
|
|
args := c.runtimeArgs
|
|
|
|
args = append(args, "ps", "--format=json", c.id)
|
|
|
|
out, err := exec.Command(c.runtime, args...).CombinedOutput()
|
2016-04-26 20:29:35 +00:00
|
|
|
if err != nil {
|
2016-04-26 21:57:30 +00:00
|
|
|
return nil, fmt.Errorf("%s", out)
|
2016-04-26 21:40:05 +00:00
|
|
|
}
|
|
|
|
var pids []int
|
|
|
|
if err := json.Unmarshal(out, &pids); err != nil {
|
2016-04-26 20:29:35 +00:00
|
|
|
return nil, err
|
|
|
|
}
|
2016-04-26 21:40:05 +00:00
|
|
|
return pids, nil
|
2016-04-26 20:29:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) Stats() (*Stat, error) {
|
|
|
|
now := time.Now()
|
2016-04-26 22:01:24 +00:00
|
|
|
args := c.runtimeArgs
|
|
|
|
args = append(args, "events", "--stats", c.id)
|
|
|
|
out, err := exec.Command(c.runtime, args...).CombinedOutput()
|
2016-04-26 20:29:35 +00:00
|
|
|
if err != nil {
|
2016-04-26 21:57:30 +00:00
|
|
|
return nil, fmt.Errorf("%s", out)
|
|
|
|
}
|
|
|
|
s := struct {
|
|
|
|
Data *Stat `json:"data"`
|
|
|
|
}{}
|
|
|
|
if err := json.Unmarshal(out, &s); err != nil {
|
2016-04-26 20:29:35 +00:00
|
|
|
return nil, err
|
|
|
|
}
|
2016-04-26 21:57:30 +00:00
|
|
|
s.Data.Timestamp = now
|
|
|
|
return s.Data, nil
|
2016-04-26 20:29:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) OOM() (OOM, error) {
|
|
|
|
container, err := c.getLibctContainer()
|
|
|
|
if err != nil {
|
|
|
|
if lerr, ok := err.(libcontainer.Error); ok {
|
|
|
|
// with oom registration sometimes the container can run, exit, and be destroyed
|
|
|
|
// faster than we can get the state back so we can just ignore this
|
|
|
|
if lerr.Code() == libcontainer.ContainerNotExists {
|
|
|
|
return nil, ErrContainerExited
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
state, err := container.State()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
memoryPath := state.CgroupPaths["memory"]
|
|
|
|
return c.getMemeoryEventFD(memoryPath)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Status implements the runtime Container interface.
|
|
|
|
func (c *container) Status() (State, error) {
|
|
|
|
args := c.runtimeArgs
|
|
|
|
args = append(args, "state", c.id)
|
|
|
|
|
|
|
|
out, err := exec.Command(c.runtime, args...).CombinedOutput()
|
|
|
|
if err != nil {
|
2016-04-26 21:57:30 +00:00
|
|
|
return "", fmt.Errorf("%s", out)
|
2016-04-26 20:29:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// We only require the runtime json output to have a top level Status field.
|
|
|
|
var s struct {
|
|
|
|
Status State `json:"status"`
|
|
|
|
}
|
|
|
|
if err := json.Unmarshal(out, &s); err != nil {
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
return s.Status, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) getMemeoryEventFD(root string) (*oom, error) {
|
|
|
|
f, err := os.Open(filepath.Join(root, "memory.oom_control"))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
fd, _, serr := syscall.RawSyscall(syscall.SYS_EVENTFD2, 0, syscall.FD_CLOEXEC, 0)
|
|
|
|
if serr != 0 {
|
|
|
|
f.Close()
|
|
|
|
return nil, serr
|
|
|
|
}
|
|
|
|
if err := c.writeEventFD(root, int(f.Fd()), int(fd)); err != nil {
|
|
|
|
syscall.Close(int(fd))
|
|
|
|
f.Close()
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return &oom{
|
|
|
|
root: root,
|
|
|
|
id: c.id,
|
|
|
|
eventfd: int(fd),
|
|
|
|
control: f,
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *container) writeEventFD(root string, cfd, efd int) error {
|
|
|
|
f, err := os.OpenFile(filepath.Join(root, "cgroup.event_control"), os.O_WRONLY, 0)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
|
|
|
_, err = f.WriteString(fmt.Sprintf("%d %d", efd, cfd))
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// waitArgs pairs a pid with an error.
// NOTE(review): nothing in this file uses the type — confirm it is still needed.
type waitArgs struct {
	pid int
	err error
}
|
|
|
|
|
|
|
|
func (c *container) waitForStart(p *process, cmd *exec.Cmd) error {
|
|
|
|
wc := make(chan error, 1)
|
|
|
|
go func() {
|
|
|
|
for {
|
|
|
|
if _, err := p.getPidFromFile(); err != nil {
|
|
|
|
if os.IsNotExist(err) || err == errInvalidPidInt {
|
|
|
|
alive, err := isAlive(cmd)
|
|
|
|
if err != nil {
|
|
|
|
wc <- err
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if !alive {
|
|
|
|
// runc could have failed to run the container so lets get the error
|
|
|
|
// out of the logs or the shim could have encountered an error
|
|
|
|
messages, err := readLogMessages(filepath.Join(p.root, "shim-log.json"))
|
|
|
|
if err != nil {
|
|
|
|
wc <- err
|
|
|
|
return
|
|
|
|
}
|
|
|
|
for _, m := range messages {
|
|
|
|
if m.Level == "error" {
|
|
|
|
wc <- fmt.Errorf("shim error: %v", m.Msg)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// no errors reported back from shim, check for runc/runtime errors
|
|
|
|
messages, err = readLogMessages(filepath.Join(p.root, "log.json"))
|
|
|
|
if err != nil {
|
|
|
|
if os.IsNotExist(err) {
|
|
|
|
err = ErrContainerNotStarted
|
|
|
|
}
|
|
|
|
wc <- err
|
|
|
|
return
|
|
|
|
}
|
|
|
|
for _, m := range messages {
|
|
|
|
if m.Level == "error" {
|
|
|
|
wc <- fmt.Errorf("oci runtime error: %v", m.Msg)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
wc <- ErrContainerNotStarted
|
|
|
|
return
|
|
|
|
}
|
|
|
|
time.Sleep(15 * time.Millisecond)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
wc <- err
|
|
|
|
return
|
|
|
|
}
|
|
|
|
// the pid file was read successfully
|
|
|
|
wc <- nil
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
select {
|
|
|
|
case err := <-wc:
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
case <-time.After(c.timeout):
|
|
|
|
cmd.Process.Kill()
|
|
|
|
cmd.Wait()
|
|
|
|
return ErrContainerStartTimeout
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// isAlive checks if the shim that launched the container is still alive.
//
// A successful non-blocking wait on the shim's pid counts as alive. Otherwise
// the pid is probed with signal 0: ESRCH means the shim is gone, any other
// probe error is returned to the caller.
func isAlive(cmd *exec.Cmd) (bool, error) {
	pid := cmd.Process.Pid

	_, waitErr := syscall.Wait4(pid, nil, syscall.WNOHANG, nil)
	if waitErr == nil {
		return true, nil
	}

	switch probeErr := syscall.Kill(pid, 0); probeErr {
	case nil:
		return true, nil
	case syscall.ESRCH:
		return false, nil
	default:
		return false, probeErr
	}
}
|
|
|
|
|
|
|
|
// oom is the OOM handle for one container: an eventfd registered with the
// container's memory cgroup plus the open control file it was registered for.
type oom struct {
	id      string
	root    string
	control *os.File
	eventfd int
}

// ContainerID returns the ID of the container the handle belongs to.
func (o *oom) ContainerID() string { return o.id }

// FD returns the eventfd descriptor.
func (o *oom) FD() int { return o.eventfd }

// Flush reads one 8-byte value from the eventfd; the result of the read is
// deliberately ignored.
func (o *oom) Flush() {
	var counter [8]byte
	syscall.Read(o.eventfd, counter[:])
}

// Removed reports whether "cgroup.event_control" no longer exists in the
// handle's cgroup directory.
func (o *oom) Removed() bool {
	if _, err := os.Lstat(filepath.Join(o.root, "cgroup.event_control")); err != nil {
		return os.IsNotExist(err)
	}
	return false
}

// Close closes the eventfd and the control file. Both are always closed; the
// eventfd error takes precedence over the control file error.
func (o *oom) Close() error {
	fdErr := syscall.Close(o.eventfd)
	controlErr := o.control.Close()
	if fdErr != nil {
		return fdErr
	}
	return controlErr
}
|
|
|
|
|
|
|
|
// message is one entry of a JSON log file.
type message struct {
	Level string `json:"level"`
	Msg   string `json:"msg"`
}

// readLogMessages decodes the stream of JSON objects stored in the file at
// path and returns them in order. An empty file yields a nil slice; a decode
// error discards everything read so far.
func readLogMessages(path string) ([]message, error) {
	logFile, err := os.Open(path)
	if err != nil {
		return nil, err
	}
	defer logFile.Close()

	var (
		entries []message
		decoder = json.NewDecoder(logFile)
	)
	for {
		var entry message
		switch err := decoder.Decode(&entry); err {
		case nil:
			entries = append(entries, entry)
		case io.EOF:
			return entries, nil
		default:
			return nil, err
		}
	}
}
|