Skip to content
This repository has been archived by the owner on May 12, 2021. It is now read-only.

Commit

Permalink
shimv2: monitor sandbox liveness
Browse files Browse the repository at this point in the history
When sandbox quits unexpected, clean things up as much as we can.

Fixes: #1896
Signed-off-by: Peng Tao <bergwolf@hyper.sh>
  • Loading branch information
bergwolf committed Jul 23, 2019
1 parent 262484d commit e02f6dc
Show file tree
Hide file tree
Showing 3 changed files with 47 additions and 0 deletions.
1 change: 1 addition & 0 deletions containerd-shim-v2/service.go
Original file line number Diff line number Diff line change
Expand Up @@ -114,6 +114,7 @@ type service struct {
containers map[string]*container
config *oci.RuntimeConfig
events chan interface{}
monitor chan error

cancel func()

Expand Down
6 changes: 6 additions & 0 deletions containerd-shim-v2/start.go
Original file line number Diff line number Diff line change
Expand Up @@ -30,6 +30,12 @@ func startContainer(ctx context.Context, s *service, c *container) error {
if err != nil {
return err
}
// Start monitor after starting sandbox
s.monitor, err = s.sandbox.Monitor()
if err != nil {
return err
}
go watchSandbox(s)
} else {
_, err := s.sandbox.StartContainer(c.id)
if err != nil {
Expand Down
40 changes: 40 additions & 0 deletions containerd-shim-v2/wait.go
Original file line number Diff line number Diff line change
Expand Up @@ -6,9 +6,11 @@
package containerdshim

import (
"path"
"time"

"github.com/containerd/containerd/api/types/task"
"github.com/containerd/containerd/mount"
"github.com/sirupsen/logrus"
)

Expand Down Expand Up @@ -82,3 +84,41 @@ func wait(s *service, c *container, execID string) (int32, error) {

return ret, nil
}

func watchSandbox(s *service) {
if s.monitor == nil {
return
}
err := <-s.monitor
if err == nil {
return
}
s.monitor = nil

s.mu.Lock()
defer s.mu.Unlock()
// sandbox malfunctioning, cleanup as much as we can
logrus.WithError(err).Warn("sandbox stopped unexpectedly")
err = s.sandbox.Stop(true)
if err != nil {
logrus.WithError(err).Warn("stop sandbox failed")
}
err = s.sandbox.Delete()
if err != nil {
logrus.WithError(err).Warn("delete sandbox failed")
}

if s.mount {
for _, c := range s.containers {
rootfs := path.Join(c.bundle, "rootfs")
logrus.WithField("rootfs", rootfs).WithField("id", c.id).Debug("container umount rootfs")
if err := mount.UnmountAll(rootfs, 0); err != nil {
logrus.WithError(err).Warn("failed to cleanup rootfs mount")
}
}
}
s.containers = make(map[string]*container)

// Existing container/exec will be cleaned up by its waiters.
// No need to send async events here.
}

0 comments on commit e02f6dc

Please sign in to comment.