386 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			386 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| //go:build linux && !no_btrfs && cgo
 | |
| 
 | |
| /*
 | |
|    Copyright The containerd Authors.
 | |
| 
 | |
|    Licensed under the Apache License, Version 2.0 (the "License");
 | |
|    you may not use this file except in compliance with the License.
 | |
|    You may obtain a copy of the License at
 | |
| 
 | |
|        http://www.apache.org/licenses/LICENSE-2.0
 | |
| 
 | |
|    Unless required by applicable law or agreed to in writing, software
 | |
|    distributed under the License is distributed on an "AS IS" BASIS,
 | |
|    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
|    See the License for the specific language governing permissions and
 | |
|    limitations under the License.
 | |
| */
 | |
| 
 | |
| package btrfs
 | |
| 
 | |
| import (
 | |
| 	"context"
 | |
| 	"fmt"
 | |
| 	"os"
 | |
| 	"path/filepath"
 | |
| 	"strings"
 | |
| 
 | |
| 	"github.com/containerd/btrfs"
 | |
| 	"github.com/containerd/continuity/fs"
 | |
| 
 | |
| 	"github.com/containerd/containerd/log"
 | |
| 	"github.com/containerd/containerd/mount"
 | |
| 	"github.com/containerd/containerd/plugin"
 | |
| 	"github.com/containerd/containerd/snapshots"
 | |
| 	"github.com/containerd/containerd/snapshots/storage"
 | |
| 
 | |
| 	"github.com/sirupsen/logrus"
 | |
| )
 | |
| 
 | |
| type snapshotter struct {
 | |
| 	device string // device of the root
 | |
| 	root   string // root provides paths for internal storage.
 | |
| 	ms     *storage.MetaStore
 | |
| }
 | |
| 
 | |
| // NewSnapshotter returns a Snapshotter using btrfs. Uses the provided
 | |
| // root directory for snapshots and stores the metadata in
 | |
| // a file in the provided root.
 | |
| // root needs to be a mount point of btrfs.
 | |
| func NewSnapshotter(root string) (snapshots.Snapshotter, error) {
 | |
| 	// If directory does not exist, create it
 | |
| 	if st, err := os.Stat(root); err != nil {
 | |
| 		if !os.IsNotExist(err) {
 | |
| 			return nil, err
 | |
| 		}
 | |
| 		if err := os.Mkdir(root, 0700); err != nil {
 | |
| 			return nil, err
 | |
| 		}
 | |
| 	} else if st.Mode()&os.ModePerm != 0700 {
 | |
| 		if err := os.Chmod(root, 0700); err != nil {
 | |
| 			return nil, err
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	mnt, err := mount.Lookup(root)
 | |
| 	if err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 	if mnt.FSType != "btrfs" {
 | |
| 		return nil, fmt.Errorf("path %s (%s) must be a btrfs filesystem to be used with the btrfs snapshotter: %w", root, mnt.FSType, plugin.ErrSkipPlugin)
 | |
| 	}
 | |
| 	var (
 | |
| 		active    = filepath.Join(root, "active")
 | |
| 		view      = filepath.Join(root, "view")
 | |
| 		snapshots = filepath.Join(root, "snapshots")
 | |
| 	)
 | |
| 
 | |
| 	for _, path := range []string{
 | |
| 		active,
 | |
| 		view,
 | |
| 		snapshots,
 | |
| 	} {
 | |
| 		if err := os.Mkdir(path, 0755); err != nil && !os.IsExist(err) {
 | |
| 			return nil, err
 | |
| 		}
 | |
| 	}
 | |
| 	ms, err := storage.NewMetaStore(filepath.Join(root, "metadata.db"))
 | |
| 	if err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 
 | |
| 	return &snapshotter{
 | |
| 		device: mnt.Source,
 | |
| 		root:   root,
 | |
| 		ms:     ms,
 | |
| 	}, nil
 | |
| }
 | |
| 
 | |
| // Stat returns the info for an active or committed snapshot by name or
 | |
| // key.
 | |
| //
 | |
| // Should be used for parent resolution, existence checks and to discern
 | |
| // the kind of snapshot.
 | |
| func (b *snapshotter) Stat(ctx context.Context, key string) (info snapshots.Info, err error) {
 | |
| 	err = b.ms.WithTransaction(ctx, false, func(ctx context.Context) error {
 | |
| 		_, info, _, err = storage.GetInfo(ctx, key)
 | |
| 		return err
 | |
| 	})
 | |
| 
 | |
| 	if err != nil {
 | |
| 		return snapshots.Info{}, err
 | |
| 	}
 | |
| 
 | |
| 	return info, nil
 | |
| }
 | |
| 
 | |
| func (b *snapshotter) Update(ctx context.Context, info snapshots.Info, fieldpaths ...string) (_ snapshots.Info, err error) {
 | |
| 	err = b.ms.WithTransaction(ctx, true, func(ctx context.Context) error {
 | |
| 		info, err = storage.UpdateInfo(ctx, info, fieldpaths...)
 | |
| 		return err
 | |
| 	})
 | |
| 
 | |
| 	if err != nil {
 | |
| 		return snapshots.Info{}, err
 | |
| 	}
 | |
| 
 | |
| 	return info, nil
 | |
| }
 | |
| 
 | |
| // Usage retrieves the disk usage of the top-level snapshot.
 | |
| func (b *snapshotter) Usage(ctx context.Context, key string) (snapshots.Usage, error) {
 | |
| 	return b.usage(ctx, key)
 | |
| }
 | |
| 
 | |
| func (b *snapshotter) usage(ctx context.Context, key string) (usage snapshots.Usage, err error) {
 | |
| 	var (
 | |
| 		id, parentID string
 | |
| 		info         snapshots.Info
 | |
| 	)
 | |
| 
 | |
| 	err = b.ms.WithTransaction(ctx, false, func(ctx context.Context) error {
 | |
| 		id, info, usage, err = storage.GetInfo(ctx, key)
 | |
| 
 | |
| 		if err == nil && info.Kind == snapshots.KindActive && info.Parent != "" {
 | |
| 			parentID, _, _, err = storage.GetInfo(ctx, info.Parent)
 | |
| 		}
 | |
| 		return err
 | |
| 	})
 | |
| 
 | |
| 	if err != nil {
 | |
| 		return snapshots.Usage{}, err
 | |
| 	}
 | |
| 
 | |
| 	if info.Kind == snapshots.KindActive {
 | |
| 		var du fs.Usage
 | |
| 		p := filepath.Join(b.root, "active", id)
 | |
| 		if parentID != "" {
 | |
| 			du, err = fs.DiffUsage(ctx, filepath.Join(b.root, "snapshots", parentID), p)
 | |
| 		} else {
 | |
| 			du, err = fs.DiskUsage(ctx, p)
 | |
| 		}
 | |
| 		if err != nil {
 | |
| 			// TODO(stevvooe): Consider not reporting an error in this case.
 | |
| 			return snapshots.Usage{}, err
 | |
| 		}
 | |
| 
 | |
| 		usage = snapshots.Usage(du)
 | |
| 	}
 | |
| 
 | |
| 	return usage, nil
 | |
| }
 | |
| 
 | |
| // Walk the committed snapshots.
 | |
| func (b *snapshotter) Walk(ctx context.Context, fn snapshots.WalkFunc, fs ...string) (err error) {
 | |
| 	return b.ms.WithTransaction(ctx, false, func(ctx context.Context) error {
 | |
| 		return storage.WalkInfo(ctx, fn, fs...)
 | |
| 	})
 | |
| }
 | |
| 
 | |
| func (b *snapshotter) Prepare(ctx context.Context, key, parent string, opts ...snapshots.Opt) ([]mount.Mount, error) {
 | |
| 	return b.makeSnapshot(ctx, snapshots.KindActive, key, parent, opts)
 | |
| }
 | |
| 
 | |
| func (b *snapshotter) View(ctx context.Context, key, parent string, opts ...snapshots.Opt) ([]mount.Mount, error) {
 | |
| 	return b.makeSnapshot(ctx, snapshots.KindView, key, parent, opts)
 | |
| }
 | |
| 
 | |
| func (b *snapshotter) makeSnapshot(ctx context.Context, kind snapshots.Kind, key, parent string, opts []snapshots.Opt) (_ []mount.Mount, err error) {
 | |
| 	var (
 | |
| 		target string
 | |
| 		s      storage.Snapshot
 | |
| 	)
 | |
| 
 | |
| 	err = b.ms.WithTransaction(ctx, true, func(ctx context.Context) error {
 | |
| 		s, err = storage.CreateSnapshot(ctx, kind, key, parent, opts...)
 | |
| 		if err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		target = filepath.Join(b.root, strings.ToLower(s.Kind.String()), s.ID)
 | |
| 
 | |
| 		if len(s.ParentIDs) == 0 {
 | |
| 			// create new subvolume
 | |
| 			// btrfs subvolume create /dir
 | |
| 			return btrfs.SubvolCreate(target)
 | |
| 		}
 | |
| 		parentp := filepath.Join(b.root, "snapshots", s.ParentIDs[0])
 | |
| 
 | |
| 		// btrfs subvolume snapshot /parent /subvol
 | |
| 		readOnly := kind == snapshots.KindView
 | |
| 		return btrfs.SubvolSnapshot(target, parentp, readOnly)
 | |
| 	})
 | |
| 
 | |
| 	if err != nil {
 | |
| 		if target != "" {
 | |
| 			if derr := btrfs.SubvolDelete(target); derr != nil {
 | |
| 				log.G(ctx).WithError(derr).WithField("subvolume", target).Error("failed to delete subvolume")
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		return nil, err
 | |
| 	}
 | |
| 
 | |
| 	return b.mounts(target, s)
 | |
| }
 | |
| 
 | |
| func (b *snapshotter) mounts(dir string, s storage.Snapshot) ([]mount.Mount, error) {
 | |
| 	var options []string
 | |
| 
 | |
| 	// get the subvolume id back out for the mount
 | |
| 	sid, err := btrfs.SubvolID(dir)
 | |
| 	if err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 
 | |
| 	options = append(options, fmt.Sprintf("subvolid=%d", sid))
 | |
| 
 | |
| 	if s.Kind != snapshots.KindActive {
 | |
| 		options = append(options, "ro")
 | |
| 	}
 | |
| 
 | |
| 	return []mount.Mount{
 | |
| 		{
 | |
| 			Type:   "btrfs",
 | |
| 			Source: b.device,
 | |
| 			// NOTE(stevvooe): While it would be nice to use to uuids for
 | |
| 			// mounts, they don't work reliably if the uuids are missing.
 | |
| 			Options: options,
 | |
| 		},
 | |
| 	}, nil
 | |
| }
 | |
| 
 | |
| func (b *snapshotter) Commit(ctx context.Context, name, key string, opts ...snapshots.Opt) (err error) {
 | |
| 	var usage snapshots.Usage
 | |
| 	usage, err = b.usage(ctx, key)
 | |
| 	if err != nil {
 | |
| 		return fmt.Errorf("failed to compute usage: %w", err)
 | |
| 	}
 | |
| 
 | |
| 	var source, target string
 | |
| 	err = b.ms.WithTransaction(ctx, true, func(ctx context.Context) error {
 | |
| 		id, err := storage.CommitActive(ctx, key, name, usage, opts...) // TODO(stevvooe): Resolve a usage value for btrfs
 | |
| 		if err != nil {
 | |
| 			return fmt.Errorf("failed to commit: %w", err)
 | |
| 		}
 | |
| 
 | |
| 		source = filepath.Join(b.root, "active", id)
 | |
| 		target = filepath.Join(b.root, "snapshots", id)
 | |
| 
 | |
| 		return btrfs.SubvolSnapshot(target, source, true)
 | |
| 	})
 | |
| 
 | |
| 	if err != nil {
 | |
| 		if target != "" {
 | |
| 			if derr := btrfs.SubvolDelete(target); derr != nil {
 | |
| 				log.G(ctx).WithError(derr).WithField("subvolume", target).Error("failed to delete subvolume")
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		return err
 | |
| 	}
 | |
| 
 | |
| 	if source != "" {
 | |
| 		if derr := btrfs.SubvolDelete(source); derr != nil {
 | |
| 			// Log as warning, only needed for cleanup, will not cause name collision
 | |
| 			log.G(ctx).WithError(derr).WithField("subvolume", source).Warn("failed to delete subvolume")
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| // Mounts returns the mounts for the transaction identified by key. Can be
 | |
| // called on an read-write or readonly transaction.
 | |
| //
 | |
| // This can be used to recover mounts after calling View or Prepare.
 | |
| func (b *snapshotter) Mounts(ctx context.Context, key string) (_ []mount.Mount, err error) {
 | |
| 	var s storage.Snapshot
 | |
| 
 | |
| 	err = b.ms.WithTransaction(ctx, false, func(ctx context.Context) error {
 | |
| 		s, err = storage.GetSnapshot(ctx, key)
 | |
| 		return err
 | |
| 	})
 | |
| 
 | |
| 	if err != nil {
 | |
| 		return nil, fmt.Errorf("failed to get active snapshot: %w", err)
 | |
| 	}
 | |
| 
 | |
| 	dir := filepath.Join(b.root, strings.ToLower(s.Kind.String()), s.ID)
 | |
| 	return b.mounts(dir, s)
 | |
| }
 | |
| 
 | |
| // Remove abandons the transaction identified by key. All resources
 | |
| // associated with the key will be removed.
 | |
| func (b *snapshotter) Remove(ctx context.Context, key string) (err error) {
 | |
| 	var (
 | |
| 		source, removed   string
 | |
| 		readonly, restore bool
 | |
| 	)
 | |
| 
 | |
| 	defer func() {
 | |
| 		if removed != "" {
 | |
| 			if derr := btrfs.SubvolDelete(removed); derr != nil {
 | |
| 				log.G(ctx).WithError(derr).WithField("subvolume", removed).Warn("failed to delete subvolume")
 | |
| 			}
 | |
| 		}
 | |
| 	}()
 | |
| 
 | |
| 	err = b.ms.WithTransaction(ctx, true, func(ctx context.Context) error {
 | |
| 		id, k, err := storage.Remove(ctx, key)
 | |
| 		if err != nil {
 | |
| 			return fmt.Errorf("failed to remove snapshot: %w", err)
 | |
| 		}
 | |
| 
 | |
| 		switch k {
 | |
| 		case snapshots.KindView:
 | |
| 			source = filepath.Join(b.root, "view", id)
 | |
| 			removed = filepath.Join(b.root, "view", "rm-"+id)
 | |
| 			readonly = true
 | |
| 		case snapshots.KindActive:
 | |
| 			source = filepath.Join(b.root, "active", id)
 | |
| 			removed = filepath.Join(b.root, "active", "rm-"+id)
 | |
| 		case snapshots.KindCommitted:
 | |
| 			source = filepath.Join(b.root, "snapshots", id)
 | |
| 			removed = filepath.Join(b.root, "snapshots", "rm-"+id)
 | |
| 			readonly = true
 | |
| 		}
 | |
| 
 | |
| 		if err = btrfs.SubvolSnapshot(removed, source, readonly); err != nil {
 | |
| 			removed = ""
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		if err = btrfs.SubvolDelete(source); err != nil {
 | |
| 			return fmt.Errorf("failed to remove snapshot %v: %w", source, err)
 | |
| 		}
 | |
| 
 | |
| 		restore = true
 | |
| 		return nil
 | |
| 	})
 | |
| 
 | |
| 	if err != nil {
 | |
| 		if restore { // means failed to commit transaction
 | |
| 			// Attempt to restore source
 | |
| 			if err1 := btrfs.SubvolSnapshot(source, removed, readonly); err1 != nil {
 | |
| 				log.G(ctx).WithFields(logrus.Fields{
 | |
| 					logrus.ErrorKey: err1,
 | |
| 					"subvolume":     source,
 | |
| 					"renamed":       removed,
 | |
| 				}).Error("failed to restore subvolume from renamed")
 | |
| 				// Keep removed to allow for manual restore
 | |
| 				removed = ""
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		return err
 | |
| 	}
 | |
| 
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| // Close closes the snapshotter
 | |
| func (b *snapshotter) Close() error {
 | |
| 	return b.ms.Close()
 | |
| }
 | 
