Provide a flag which configures a lease to only hold reference to its given references and ignore label references during garbage collection rooted from the lease. Signed-off-by: Derek McGowan <derek@mcgstyle.net>
		
			
				
	
	
		
			514 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			514 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
/*
 | 
						|
   Copyright The containerd Authors.
 | 
						|
 | 
						|
   Licensed under the Apache License, Version 2.0 (the "License");
 | 
						|
   you may not use this file except in compliance with the License.
 | 
						|
   You may obtain a copy of the License at
 | 
						|
 | 
						|
       http://www.apache.org/licenses/LICENSE-2.0
 | 
						|
 | 
						|
   Unless required by applicable law or agreed to in writing, software
 | 
						|
   distributed under the License is distributed on an "AS IS" BASIS,
 | 
						|
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | 
						|
   See the License for the specific language governing permissions and
 | 
						|
   limitations under the License.
 | 
						|
*/
 | 
						|
 | 
						|
package metadata
 | 
						|
 | 
						|
import (
 | 
						|
	"bytes"
 | 
						|
	"context"
 | 
						|
	"fmt"
 | 
						|
	"strings"
 | 
						|
	"time"
 | 
						|
 | 
						|
	"github.com/containerd/containerd/gc"
 | 
						|
	"github.com/containerd/containerd/log"
 | 
						|
	"github.com/pkg/errors"
 | 
						|
	bolt "go.etcd.io/bbolt"
 | 
						|
)
 | 
						|
 | 
						|
const (
 | 
						|
	// ResourceUnknown specifies an unknown resource
 | 
						|
	ResourceUnknown gc.ResourceType = iota
 | 
						|
	// ResourceContent specifies a content resource
 | 
						|
	ResourceContent
 | 
						|
	// ResourceSnapshot specifies a snapshot resource
 | 
						|
	ResourceSnapshot
 | 
						|
	// ResourceContainer specifies a container resource
 | 
						|
	ResourceContainer
 | 
						|
	// ResourceTask specifies a task resource
 | 
						|
	ResourceTask
 | 
						|
	// ResourceLease specifies a lease
 | 
						|
	ResourceLease
 | 
						|
	// ResourceIngest specifies a content ingest
 | 
						|
	ResourceIngest
 | 
						|
)
 | 
						|
 | 
						|
const (
 | 
						|
	resourceContentFlat  = ResourceContent | 0x20
 | 
						|
	resourceSnapshotFlat = ResourceSnapshot | 0x20
 | 
						|
)
 | 
						|
 | 
						|
// Label keys which influence garbage collection.
var (
	// labelGCRoot, when present on a content blob or snapshot, makes that
	// object a root (see isRootRef). The label value is currently ignored.
	labelGCRoot = []byte("containerd.io/gc.root")
	// labelGCSnapRef is the key prefix for snapshot references. The text
	// following the prefix, up to an optional '/', names the snapshotter and
	// the label value is the snapshot key (see sendLabelRefs).
	labelGCSnapRef = []byte("containerd.io/gc.ref.snapshot.")
	// labelGCContentRef is the key (or key prefix, when followed by '.' or
	// '/') for content references; the label value is the content key
	// (see sendLabelRefs).
	labelGCContentRef = []byte("containerd.io/gc.ref.content")
	// labelGCExpire holds an RFC 3339 timestamp on a lease; scanRoots skips
	// leases whose timestamp is in the past.
	labelGCExpire = []byte("containerd.io/gc.expire")
	// labelGCFlat, when present on a lease (with any value), makes scanRoots
	// emit the lease's content and snapshots as flat resources.
	labelGCFlat = []byte("containerd.io/gc.flat")
)
 | 
						|
 | 
						|
func scanRoots(ctx context.Context, tx *bolt.Tx, nc chan<- gc.Node) error {
 | 
						|
	v1bkt := tx.Bucket(bucketKeyVersion)
 | 
						|
	if v1bkt == nil {
 | 
						|
		return nil
 | 
						|
	}
 | 
						|
 | 
						|
	expThreshold := time.Now()
 | 
						|
 | 
						|
	// iterate through each namespace
 | 
						|
	v1c := v1bkt.Cursor()
 | 
						|
 | 
						|
	// cerr indicates the scan did not successfully send all
 | 
						|
	// the roots. The scan does not need to be cancelled but
 | 
						|
	// must return error at the end.
 | 
						|
	var cerr error
 | 
						|
	fn := func(n gc.Node) {
 | 
						|
		select {
 | 
						|
		case nc <- n:
 | 
						|
		case <-ctx.Done():
 | 
						|
			cerr = ctx.Err()
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	for k, v := v1c.First(); k != nil; k, v = v1c.Next() {
 | 
						|
		if v != nil {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		nbkt := v1bkt.Bucket(k)
 | 
						|
		ns := string(k)
 | 
						|
 | 
						|
		lbkt := nbkt.Bucket(bucketKeyObjectLeases)
 | 
						|
		if lbkt != nil {
 | 
						|
			if err := lbkt.ForEach(func(k, v []byte) error {
 | 
						|
				if v != nil {
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
				libkt := lbkt.Bucket(k)
 | 
						|
				var flat bool
 | 
						|
 | 
						|
				if lblbkt := libkt.Bucket(bucketKeyObjectLabels); lblbkt != nil {
 | 
						|
					if expV := lblbkt.Get(labelGCExpire); expV != nil {
 | 
						|
						exp, err := time.Parse(time.RFC3339, string(expV))
 | 
						|
						if err != nil {
 | 
						|
							// label not used, log and continue to use lease
 | 
						|
							log.G(ctx).WithError(err).WithField("lease", string(k)).Infof("ignoring invalid expiration value %q", string(expV))
 | 
						|
						} else if expThreshold.After(exp) {
 | 
						|
							// lease has expired, skip
 | 
						|
							return nil
 | 
						|
						}
 | 
						|
					}
 | 
						|
 | 
						|
					if flatV := lblbkt.Get(labelGCFlat); flatV != nil {
 | 
						|
						flat = true
 | 
						|
					}
 | 
						|
				}
 | 
						|
 | 
						|
				fn(gcnode(ResourceLease, ns, string(k)))
 | 
						|
 | 
						|
				// Emit content and snapshots as roots instead of implementing
 | 
						|
				// in references. Since leases cannot be referenced there is
 | 
						|
				// no need to allow the lookup to be recursive, handling here
 | 
						|
				// therefore reduces the number of database seeks.
 | 
						|
 | 
						|
				ctype := ResourceContent
 | 
						|
				if flat {
 | 
						|
					ctype = resourceContentFlat
 | 
						|
				}
 | 
						|
 | 
						|
				cbkt := libkt.Bucket(bucketKeyObjectContent)
 | 
						|
				if cbkt != nil {
 | 
						|
					if err := cbkt.ForEach(func(k, v []byte) error {
 | 
						|
						fn(gcnode(ctype, ns, string(k)))
 | 
						|
						return nil
 | 
						|
					}); err != nil {
 | 
						|
						return err
 | 
						|
					}
 | 
						|
				}
 | 
						|
 | 
						|
				stype := ResourceSnapshot
 | 
						|
				if flat {
 | 
						|
					stype = resourceSnapshotFlat
 | 
						|
				}
 | 
						|
 | 
						|
				sbkt := libkt.Bucket(bucketKeyObjectSnapshots)
 | 
						|
				if sbkt != nil {
 | 
						|
					if err := sbkt.ForEach(func(sk, sv []byte) error {
 | 
						|
						if sv != nil {
 | 
						|
							return nil
 | 
						|
						}
 | 
						|
						snbkt := sbkt.Bucket(sk)
 | 
						|
 | 
						|
						return snbkt.ForEach(func(k, v []byte) error {
 | 
						|
							fn(gcnode(stype, ns, fmt.Sprintf("%s/%s", sk, k)))
 | 
						|
							return nil
 | 
						|
						})
 | 
						|
					}); err != nil {
 | 
						|
						return err
 | 
						|
					}
 | 
						|
				}
 | 
						|
 | 
						|
				ibkt := libkt.Bucket(bucketKeyObjectIngests)
 | 
						|
				if ibkt != nil {
 | 
						|
					if err := ibkt.ForEach(func(k, v []byte) error {
 | 
						|
						fn(gcnode(ResourceIngest, ns, string(k)))
 | 
						|
						return nil
 | 
						|
					}); err != nil {
 | 
						|
						return err
 | 
						|
					}
 | 
						|
				}
 | 
						|
 | 
						|
				return nil
 | 
						|
			}); err != nil {
 | 
						|
				return err
 | 
						|
			}
 | 
						|
		}
 | 
						|
 | 
						|
		ibkt := nbkt.Bucket(bucketKeyObjectImages)
 | 
						|
		if ibkt != nil {
 | 
						|
			if err := ibkt.ForEach(func(k, v []byte) error {
 | 
						|
				if v != nil {
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
 | 
						|
				target := ibkt.Bucket(k).Bucket(bucketKeyTarget)
 | 
						|
				if target != nil {
 | 
						|
					contentKey := string(target.Get(bucketKeyDigest))
 | 
						|
					fn(gcnode(ResourceContent, ns, contentKey))
 | 
						|
				}
 | 
						|
				return sendLabelRefs(ns, ibkt.Bucket(k), fn)
 | 
						|
			}); err != nil {
 | 
						|
				return err
 | 
						|
			}
 | 
						|
		}
 | 
						|
 | 
						|
		cbkt := nbkt.Bucket(bucketKeyObjectContent)
 | 
						|
		if cbkt != nil {
 | 
						|
			ibkt := cbkt.Bucket(bucketKeyObjectIngests)
 | 
						|
			if ibkt != nil {
 | 
						|
				if err := ibkt.ForEach(func(k, v []byte) error {
 | 
						|
					if v != nil {
 | 
						|
						return nil
 | 
						|
					}
 | 
						|
					ea, err := readExpireAt(ibkt.Bucket(k))
 | 
						|
					if err != nil {
 | 
						|
						return err
 | 
						|
					}
 | 
						|
					if ea == nil || expThreshold.After(*ea) {
 | 
						|
						return nil
 | 
						|
					}
 | 
						|
					fn(gcnode(ResourceIngest, ns, string(k)))
 | 
						|
					return nil
 | 
						|
				}); err != nil {
 | 
						|
					return err
 | 
						|
				}
 | 
						|
			}
 | 
						|
			cbkt = cbkt.Bucket(bucketKeyObjectBlob)
 | 
						|
			if cbkt != nil {
 | 
						|
				if err := cbkt.ForEach(func(k, v []byte) error {
 | 
						|
					if v != nil {
 | 
						|
						return nil
 | 
						|
					}
 | 
						|
 | 
						|
					if isRootRef(cbkt.Bucket(k)) {
 | 
						|
						fn(gcnode(ResourceContent, ns, string(k)))
 | 
						|
					}
 | 
						|
 | 
						|
					return nil
 | 
						|
				}); err != nil {
 | 
						|
					return err
 | 
						|
				}
 | 
						|
			}
 | 
						|
		}
 | 
						|
 | 
						|
		cbkt = nbkt.Bucket(bucketKeyObjectContainers)
 | 
						|
		if cbkt != nil {
 | 
						|
			if err := cbkt.ForEach(func(k, v []byte) error {
 | 
						|
				if v != nil {
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
 | 
						|
				cibkt := cbkt.Bucket(k)
 | 
						|
				snapshotter := string(cibkt.Get(bucketKeySnapshotter))
 | 
						|
				if snapshotter != "" {
 | 
						|
					ss := string(cibkt.Get(bucketKeySnapshotKey))
 | 
						|
					fn(gcnode(ResourceSnapshot, ns, fmt.Sprintf("%s/%s", snapshotter, ss)))
 | 
						|
				}
 | 
						|
 | 
						|
				return sendLabelRefs(ns, cibkt, fn)
 | 
						|
			}); err != nil {
 | 
						|
				return err
 | 
						|
			}
 | 
						|
		}
 | 
						|
 | 
						|
		sbkt := nbkt.Bucket(bucketKeyObjectSnapshots)
 | 
						|
		if sbkt != nil {
 | 
						|
			if err := sbkt.ForEach(func(sk, sv []byte) error {
 | 
						|
				if sv != nil {
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
				snbkt := sbkt.Bucket(sk)
 | 
						|
 | 
						|
				return snbkt.ForEach(func(k, v []byte) error {
 | 
						|
					if v != nil {
 | 
						|
						return nil
 | 
						|
					}
 | 
						|
					if isRootRef(snbkt.Bucket(k)) {
 | 
						|
						fn(gcnode(ResourceSnapshot, ns, fmt.Sprintf("%s/%s", sk, k)))
 | 
						|
					}
 | 
						|
					return nil
 | 
						|
				})
 | 
						|
			}); err != nil {
 | 
						|
				return err
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return cerr
 | 
						|
}
 | 
						|
 | 
						|
func references(ctx context.Context, tx *bolt.Tx, node gc.Node, fn func(gc.Node)) error {
 | 
						|
	switch node.Type {
 | 
						|
	case ResourceContent:
 | 
						|
		bkt := getBucket(tx, bucketKeyVersion, []byte(node.Namespace), bucketKeyObjectContent, bucketKeyObjectBlob, []byte(node.Key))
 | 
						|
		if bkt == nil {
 | 
						|
			// Node may be created from dead edge
 | 
						|
			return nil
 | 
						|
		}
 | 
						|
 | 
						|
		return sendLabelRefs(node.Namespace, bkt, fn)
 | 
						|
	case ResourceSnapshot, resourceSnapshotFlat:
 | 
						|
		parts := strings.SplitN(node.Key, "/", 2)
 | 
						|
		if len(parts) != 2 {
 | 
						|
			return errors.Errorf("invalid snapshot gc key %s", node.Key)
 | 
						|
		}
 | 
						|
		ss := parts[0]
 | 
						|
		name := parts[1]
 | 
						|
 | 
						|
		bkt := getBucket(tx, bucketKeyVersion, []byte(node.Namespace), bucketKeyObjectSnapshots, []byte(ss), []byte(name))
 | 
						|
		if bkt == nil {
 | 
						|
			// Node may be created from dead edge
 | 
						|
			return nil
 | 
						|
		}
 | 
						|
 | 
						|
		if pv := bkt.Get(bucketKeyParent); len(pv) > 0 {
 | 
						|
			fn(gcnode(node.Type, node.Namespace, fmt.Sprintf("%s/%s", ss, pv)))
 | 
						|
		}
 | 
						|
 | 
						|
		// Do not send labeled references for flat snapshot refs
 | 
						|
		if node.Type == resourceSnapshotFlat {
 | 
						|
			return nil
 | 
						|
		}
 | 
						|
 | 
						|
		return sendLabelRefs(node.Namespace, bkt, fn)
 | 
						|
	case ResourceIngest:
 | 
						|
		// Send expected value
 | 
						|
		bkt := getBucket(tx, bucketKeyVersion, []byte(node.Namespace), bucketKeyObjectContent, bucketKeyObjectIngests, []byte(node.Key))
 | 
						|
		if bkt == nil {
 | 
						|
			// Node may be created from dead edge
 | 
						|
			return nil
 | 
						|
		}
 | 
						|
		// Load expected
 | 
						|
		expected := bkt.Get(bucketKeyExpected)
 | 
						|
		if len(expected) > 0 {
 | 
						|
			fn(gcnode(ResourceContent, node.Namespace, string(expected)))
 | 
						|
		}
 | 
						|
		return nil
 | 
						|
	}
 | 
						|
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
func scanAll(ctx context.Context, tx *bolt.Tx, fn func(ctx context.Context, n gc.Node) error) error {
 | 
						|
	v1bkt := tx.Bucket(bucketKeyVersion)
 | 
						|
	if v1bkt == nil {
 | 
						|
		return nil
 | 
						|
	}
 | 
						|
 | 
						|
	// iterate through each namespace
 | 
						|
	v1c := v1bkt.Cursor()
 | 
						|
 | 
						|
	for k, v := v1c.First(); k != nil; k, v = v1c.Next() {
 | 
						|
		if v != nil {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		nbkt := v1bkt.Bucket(k)
 | 
						|
		ns := string(k)
 | 
						|
 | 
						|
		lbkt := nbkt.Bucket(bucketKeyObjectLeases)
 | 
						|
		if lbkt != nil {
 | 
						|
			if err := lbkt.ForEach(func(k, v []byte) error {
 | 
						|
				if v != nil {
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
				return fn(ctx, gcnode(ResourceLease, ns, string(k)))
 | 
						|
			}); err != nil {
 | 
						|
				return err
 | 
						|
			}
 | 
						|
		}
 | 
						|
 | 
						|
		sbkt := nbkt.Bucket(bucketKeyObjectSnapshots)
 | 
						|
		if sbkt != nil {
 | 
						|
			if err := sbkt.ForEach(func(sk, sv []byte) error {
 | 
						|
				if sv != nil {
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
				snbkt := sbkt.Bucket(sk)
 | 
						|
				return snbkt.ForEach(func(k, v []byte) error {
 | 
						|
					if v != nil {
 | 
						|
						return nil
 | 
						|
					}
 | 
						|
					node := gcnode(ResourceSnapshot, ns, fmt.Sprintf("%s/%s", sk, k))
 | 
						|
					return fn(ctx, node)
 | 
						|
				})
 | 
						|
			}); err != nil {
 | 
						|
				return err
 | 
						|
			}
 | 
						|
		}
 | 
						|
 | 
						|
		cbkt := nbkt.Bucket(bucketKeyObjectContent)
 | 
						|
		if cbkt != nil {
 | 
						|
			ibkt := cbkt.Bucket(bucketKeyObjectIngests)
 | 
						|
			if ibkt != nil {
 | 
						|
				if err := ibkt.ForEach(func(k, v []byte) error {
 | 
						|
					if v != nil {
 | 
						|
						return nil
 | 
						|
					}
 | 
						|
					node := gcnode(ResourceIngest, ns, string(k))
 | 
						|
					return fn(ctx, node)
 | 
						|
				}); err != nil {
 | 
						|
					return err
 | 
						|
				}
 | 
						|
			}
 | 
						|
 | 
						|
			cbkt = cbkt.Bucket(bucketKeyObjectBlob)
 | 
						|
			if cbkt != nil {
 | 
						|
				if err := cbkt.ForEach(func(k, v []byte) error {
 | 
						|
					if v != nil {
 | 
						|
						return nil
 | 
						|
					}
 | 
						|
					node := gcnode(ResourceContent, ns, string(k))
 | 
						|
					return fn(ctx, node)
 | 
						|
				}); err != nil {
 | 
						|
					return err
 | 
						|
				}
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
func remove(ctx context.Context, tx *bolt.Tx, node gc.Node) error {
 | 
						|
	v1bkt := tx.Bucket(bucketKeyVersion)
 | 
						|
	if v1bkt == nil {
 | 
						|
		return nil
 | 
						|
	}
 | 
						|
 | 
						|
	nsbkt := v1bkt.Bucket([]byte(node.Namespace))
 | 
						|
	if nsbkt == nil {
 | 
						|
		return nil
 | 
						|
	}
 | 
						|
 | 
						|
	switch node.Type {
 | 
						|
	case ResourceContent:
 | 
						|
		cbkt := nsbkt.Bucket(bucketKeyObjectContent)
 | 
						|
		if cbkt != nil {
 | 
						|
			cbkt = cbkt.Bucket(bucketKeyObjectBlob)
 | 
						|
		}
 | 
						|
		if cbkt != nil {
 | 
						|
			log.G(ctx).WithField("key", node.Key).Debug("remove content")
 | 
						|
			return cbkt.DeleteBucket([]byte(node.Key))
 | 
						|
		}
 | 
						|
	case ResourceSnapshot:
 | 
						|
		sbkt := nsbkt.Bucket(bucketKeyObjectSnapshots)
 | 
						|
		if sbkt != nil {
 | 
						|
			parts := strings.SplitN(node.Key, "/", 2)
 | 
						|
			if len(parts) != 2 {
 | 
						|
				return errors.Errorf("invalid snapshot gc key %s", node.Key)
 | 
						|
			}
 | 
						|
			ssbkt := sbkt.Bucket([]byte(parts[0]))
 | 
						|
			if ssbkt != nil {
 | 
						|
				log.G(ctx).WithField("key", parts[1]).WithField("snapshotter", parts[0]).Debug("remove snapshot")
 | 
						|
				return ssbkt.DeleteBucket([]byte(parts[1]))
 | 
						|
			}
 | 
						|
		}
 | 
						|
	case ResourceLease:
 | 
						|
		lbkt := nsbkt.Bucket(bucketKeyObjectLeases)
 | 
						|
		if lbkt != nil {
 | 
						|
			return lbkt.DeleteBucket([]byte(node.Key))
 | 
						|
		}
 | 
						|
	case ResourceIngest:
 | 
						|
		ibkt := nsbkt.Bucket(bucketKeyObjectContent)
 | 
						|
		if ibkt != nil {
 | 
						|
			ibkt = ibkt.Bucket(bucketKeyObjectIngests)
 | 
						|
		}
 | 
						|
		if ibkt != nil {
 | 
						|
			log.G(ctx).WithField("ref", node.Key).Debug("remove ingest")
 | 
						|
			return ibkt.DeleteBucket([]byte(node.Key))
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
// sendLabelRefs sends all snapshot and content references referred to by the labels in the bkt
 | 
						|
func sendLabelRefs(ns string, bkt *bolt.Bucket, fn func(gc.Node)) error {
 | 
						|
	lbkt := bkt.Bucket(bucketKeyObjectLabels)
 | 
						|
	if lbkt != nil {
 | 
						|
		lc := lbkt.Cursor()
 | 
						|
 | 
						|
		labelRef := string(labelGCContentRef)
 | 
						|
		for k, v := lc.Seek(labelGCContentRef); k != nil && strings.HasPrefix(string(k), labelRef); k, v = lc.Next() {
 | 
						|
			if ks := string(k); ks != labelRef {
 | 
						|
				// Allow reference naming separated by . or /, ignore names
 | 
						|
				if ks[len(labelRef)] != '.' && ks[len(labelRef)] != '/' {
 | 
						|
					continue
 | 
						|
				}
 | 
						|
			}
 | 
						|
 | 
						|
			fn(gcnode(ResourceContent, ns, string(v)))
 | 
						|
		}
 | 
						|
 | 
						|
		for k, v := lc.Seek(labelGCSnapRef); k != nil && strings.HasPrefix(string(k), string(labelGCSnapRef)); k, v = lc.Next() {
 | 
						|
			snapshotter := k[len(labelGCSnapRef):]
 | 
						|
			if i := bytes.IndexByte(snapshotter, '/'); i >= 0 {
 | 
						|
				snapshotter = snapshotter[:i]
 | 
						|
			}
 | 
						|
			fn(gcnode(ResourceSnapshot, ns, fmt.Sprintf("%s/%s", snapshotter, v)))
 | 
						|
		}
 | 
						|
 | 
						|
	}
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
func isRootRef(bkt *bolt.Bucket) bool {
 | 
						|
	lbkt := bkt.Bucket(bucketKeyObjectLabels)
 | 
						|
	if lbkt != nil {
 | 
						|
		rv := lbkt.Get(labelGCRoot)
 | 
						|
		if rv != nil {
 | 
						|
			// TODO: interpret rv as a timestamp and skip if expired
 | 
						|
			return true
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return false
 | 
						|
}
 | 
						|
 | 
						|
func gcnode(t gc.ResourceType, ns, key string) gc.Node {
 | 
						|
	return gc.Node{
 | 
						|
		Type:      t,
 | 
						|
		Namespace: ns,
 | 
						|
		Key:       key,
 | 
						|
	}
 | 
						|
}
 |