220 lines
		
	
	
		
			6.9 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			220 lines
		
	
	
		
			6.9 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| /*
 | |
|    Copyright The containerd Authors.
 | |
| 
 | |
|    Licensed under the Apache License, Version 2.0 (the "License");
 | |
|    you may not use this file except in compliance with the License.
 | |
|    You may obtain a copy of the License at
 | |
| 
 | |
|        http://www.apache.org/licenses/LICENSE-2.0
 | |
| 
 | |
|    Unless required by applicable law or agreed to in writing, software
 | |
|    distributed under the License is distributed on an "AS IS" BASIS,
 | |
|    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
|    See the License for the specific language governing permissions and
 | |
|    limitations under the License.
 | |
| */
 | |
| 
 | |
| // Package restart enables containers to have labels added and monitored to
 | |
| // keep the container's task running if it is killed.
 | |
| //
 | |
| // Setting the StatusLabel on a container instructs the restart monitor to keep
 | |
| // that container's task in a specific status.
 | |
| // Setting the LogURILabel on a container will set up the task's IO to be redirected
 | |
| // to a log file when running a task within the restart manager.
 | |
| //
 | |
| // The restart labels can be cleared off of a container using the WithNoRestarts Opt.
 | |
| //
 | |
| // The restart monitor has one option in the containerd config under the [plugins.restart]
 | |
| // section.  `interval = "10s"` sets the reconcile interval that the restart monitor checks
 | |
| // for task state and reconciles the desired status for that task.
 | |
| package restart
 | |
| 
 | |
| import (
 | |
| 	"context"
 | |
| 	"fmt"
 | |
| 	"net/url"
 | |
| 	"strconv"
 | |
| 	"strings"
 | |
| 
 | |
| 	"github.com/containerd/containerd"
 | |
| 	"github.com/containerd/containerd/cio"
 | |
| 	"github.com/containerd/containerd/containers"
 | |
| 	"github.com/sirupsen/logrus"
 | |
| )
 | |
| 
 | |
// Container label keys read and written by the restart package.
const (
	// StatusLabel is the label key holding the restart status of a container.
	StatusLabel = "containerd.io/restart.status"

	// LogURILabel is the label key holding the restart log URI of a container.
	LogURILabel = "containerd.io/restart.loguri"

	// PolicyLabel is the label key holding the restart policy of a container.
	PolicyLabel = "containerd.io/restart.policy"

	// CountLabel is the label key holding the restart count of a container.
	CountLabel = "containerd.io/restart.count"

	// ExplicitlyStoppedLabel is the label key recording that a container was
	// explicitly stopped.
	ExplicitlyStoppedLabel = "containerd.io/restart.explicitly-stopped"
)
 | |
| 
 | |
// Policy represents the restart policy of a container: a policy name plus,
// for "on-failure", an optional maximum retry count.
type Policy struct {
	// name is the normalized policy name: "no", "always", "on-failure" or
	// "unless-stopped".
	name string
	// maximumRetryCount is the retry limit parsed from "on-failure:N".
	// Zero means no limit was given.
	maximumRetryCount int
}

// NewPolicy creates a restart policy from its string form.
//
// The following restart policies are supported:
//   - no: do not restart the container.
//   - always: always restart the container regardless of the exit status.
//   - on-failure[:max-retries]: restart only if the container exits with a
//     non-zero exit status.
//   - unless-stopped: always restart the container unless it is stopped.
//
// An empty string is treated as "always". An error is returned when the name
// is unknown, when a retry count is attached to a policy other than
// "on-failure", when the retry count is not a non-negative integer, or when
// the string has more than one ":" separated suffix.
func NewPolicy(policy string) (*Policy, error) {
	fields := strings.Split(policy, ":")
	name := fields[0]
	retryCount := 0

	switch name {
	case "", "no", "always", "unless-stopped":
		if len(fields) > 1 {
			return nil, fmt.Errorf("restart policy %q not support max retry count", name)
		}
		if name == "" {
			name = "always"
		}
	case "on-failure":
		// Only "on-failure" and "on-failure:N" are well formed; anything after
		// a second ":" used to be silently dropped.
		if len(fields) > 2 {
			return nil, fmt.Errorf("invalid restart policy %q: too many fields", policy)
		}
		if len(fields) == 2 {
			n, err := strconv.Atoi(fields[1])
			// A negative limit has no meaning: String would drop it and
			// Reconcile would never allow a restart, so reject it up front.
			if err != nil || n < 0 {
				return nil, fmt.Errorf("invalid max retry count: %s", fields[1])
			}
			retryCount = n
		}
	default:
		return nil, fmt.Errorf("restart policy %q not supported", policy)
	}

	return &Policy{
		name:              name,
		maximumRetryCount: retryCount,
	}, nil
}

// String returns the policy in the form accepted by NewPolicy: the policy
// name, followed by ":<count>" when the maximum retry count is positive.
func (rp *Policy) String() string {
	if rp.maximumRetryCount > 0 {
		return fmt.Sprintf("%s:%d", rp.name, rp.maximumRetryCount)
	}
	return rp.name
}

// Name returns the policy name without any retry count.
func (rp *Policy) Name() string {
	return rp.name
}

// MaximumRetryCount returns the maximum retry count of the policy; it is zero
// when no count was specified.
func (rp *Policy) MaximumRetryCount() int {
	return rp.maximumRetryCount
}
 | |
| 
 | |
| // Reconcile reconciles the restart policy of a container.
 | |
| func Reconcile(status containerd.Status, labels map[string]string) bool {
 | |
| 	rp, err := NewPolicy(labels[PolicyLabel])
 | |
| 	if err != nil {
 | |
| 		logrus.WithError(err).Error("policy reconcile")
 | |
| 		return false
 | |
| 	}
 | |
| 	switch rp.Name() {
 | |
| 	case "", "always":
 | |
| 		return true
 | |
| 	case "on-failure":
 | |
| 		restartCount, err := strconv.Atoi(labels[CountLabel])
 | |
| 		if err != nil && labels[CountLabel] != "" {
 | |
| 			logrus.WithError(err).Error("policy reconcile")
 | |
| 			return false
 | |
| 		}
 | |
| 		if status.ExitStatus != 0 && (rp.maximumRetryCount == 0 || restartCount < rp.maximumRetryCount) {
 | |
| 			return true
 | |
| 		}
 | |
| 	case "unless-stopped":
 | |
| 		explicitlyStopped, _ := strconv.ParseBool(labels[ExplicitlyStoppedLabel])
 | |
| 		if !explicitlyStopped {
 | |
| 			return true
 | |
| 		}
 | |
| 	}
 | |
| 	return false
 | |
| }
 | |
| 
 | |
| // WithLogURI sets the specified log uri for a container.
 | |
| func WithLogURI(uri *url.URL) func(context.Context, *containerd.Client, *containers.Container) error {
 | |
| 	return WithLogURIString(uri.String())
 | |
| }
 | |
| 
 | |
| // WithLogURIString sets the specified log uri string for a container.
 | |
| func WithLogURIString(uriString string) func(context.Context, *containerd.Client, *containers.Container) error {
 | |
| 	return func(_ context.Context, _ *containerd.Client, c *containers.Container) error {
 | |
| 		ensureLabels(c)
 | |
| 		c.Labels[LogURILabel] = uriString
 | |
| 		return nil
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // WithBinaryLogURI sets the binary-type log uri for a container.
 | |
| //
 | |
| // Deprecated(in release 1.5): use WithLogURI
 | |
| func WithBinaryLogURI(binary string, args map[string]string) func(context.Context, *containerd.Client, *containers.Container) error {
 | |
| 	uri, err := cio.LogURIGenerator("binary", binary, args)
 | |
| 	if err != nil {
 | |
| 		return func(context.Context, *containerd.Client, *containers.Container) error {
 | |
| 			return err
 | |
| 		}
 | |
| 	}
 | |
| 	return WithLogURI(uri)
 | |
| }
 | |
| 
 | |
| // WithFileLogURI sets the file-type log uri for a container.
 | |
| //
 | |
| // Deprecated(in release 1.5): use WithLogURI
 | |
| func WithFileLogURI(path string) func(context.Context, *containerd.Client, *containers.Container) error {
 | |
| 	uri, err := cio.LogURIGenerator("file", path, nil)
 | |
| 	if err != nil {
 | |
| 		return func(context.Context, *containerd.Client, *containers.Container) error {
 | |
| 			return err
 | |
| 		}
 | |
| 	}
 | |
| 	return WithLogURI(uri)
 | |
| }
 | |
| 
 | |
| // WithStatus sets the status for a container
 | |
| func WithStatus(status containerd.ProcessStatus) func(context.Context, *containerd.Client, *containers.Container) error {
 | |
| 	return func(_ context.Context, _ *containerd.Client, c *containers.Container) error {
 | |
| 		ensureLabels(c)
 | |
| 		c.Labels[StatusLabel] = string(status)
 | |
| 		return nil
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // WithPolicy sets the restart policy for a container
 | |
| func WithPolicy(policy *Policy) func(context.Context, *containerd.Client, *containers.Container) error {
 | |
| 	return func(_ context.Context, _ *containerd.Client, c *containers.Container) error {
 | |
| 		ensureLabels(c)
 | |
| 		c.Labels[PolicyLabel] = policy.String()
 | |
| 		return nil
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // WithNoRestarts clears any restart information from the container
 | |
| func WithNoRestarts(_ context.Context, _ *containerd.Client, c *containers.Container) error {
 | |
| 	if c.Labels == nil {
 | |
| 		return nil
 | |
| 	}
 | |
| 	delete(c.Labels, StatusLabel)
 | |
| 	delete(c.Labels, PolicyLabel)
 | |
| 	delete(c.Labels, LogURILabel)
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| func ensureLabels(c *containers.Container) {
 | |
| 	if c.Labels == nil {
 | |
| 		c.Labels = make(map[string]string)
 | |
| 	}
 | |
| }
 | 
