Fix hardlinks with unmodified files

Previously hardlinking to an unmodified file or linking to a file
which was touched by not detected as modified caused a new file
to be created on unpack. This new file and the original source file
were not linked since no link record was created in the tar. This
change addresses this by adding links for all hardlinks to a file
when it is detected as changed. These links will be written after
the source file is written and may occur out of order in regard to
file name.

Signed-off-by: Derek McGowan <derek@mcgstyle.net>
This commit is contained in:
Derek McGowan 2017-04-04 13:32:56 -07:00
parent 2b186fd1f6
commit 51b8e468e5
No known key found for this signature in database
GPG Key ID: F58C5D0A4405ACDB
8 changed files with 94 additions and 44 deletions

View File

@ -260,18 +260,20 @@ func Apply(ctx context.Context, root string, r io.Reader) (int64, error) {
} }
type changeWriter struct { type changeWriter struct {
tw *tar.Writer tw *tar.Writer
source string source string
whiteoutT time.Time whiteoutT time.Time
inodeCache map[uint64]string inodeSrc map[uint64]string
inodeRefs map[uint64][]string
} }
func newChangeWriter(w io.Writer, source string) *changeWriter { func newChangeWriter(w io.Writer, source string) *changeWriter {
return &changeWriter{ return &changeWriter{
tw: tar.NewWriter(w), tw: tar.NewWriter(w),
source: source, source: source,
whiteoutT: time.Now(), whiteoutT: time.Now(),
inodeCache: map[uint64]string{}, inodeSrc: map[uint64]string{},
inodeRefs: map[uint64][]string{},
} }
} }
@ -334,15 +336,28 @@ func (cw *changeWriter) HandleChange(k fs.ChangeKind, p string, f os.FileInfo, e
return errors.Wrap(err, "failed to set device headers") return errors.Wrap(err, "failed to set device headers")
} }
linkname, err := fs.GetLinkSource(name, f, cw.inodeCache) // additionalLinks stores file names which must be linked to
if err != nil { // this file when this file is added
return errors.Wrap(err, "failed to get hardlink") var additionalLinks []string
} inode, isHardlink := fs.GetLinkInfo(f)
if isHardlink {
if linkname != "" { // If the inode has a source, always link to it
hdr.Typeflag = tar.TypeLink if source, ok := cw.inodeSrc[inode]; ok {
hdr.Linkname = linkname hdr.Typeflag = tar.TypeLink
hdr.Size = 0 hdr.Linkname = source
hdr.Size = 0
} else {
if k == fs.ChangeKindUnmodified {
cw.inodeRefs[inode] = append(cw.inodeRefs[inode], name)
return nil
}
cw.inodeSrc[inode] = name
additionalLinks = cw.inodeRefs[inode]
delete(cw.inodeRefs, inode)
}
} else if k == fs.ChangeKindUnmodified {
// Nothing to write to diff
return nil
} }
if capability, err := getxattr(source, "security.capability"); err != nil { if capability, err := getxattr(source, "security.capability"); err != nil {
@ -374,6 +389,19 @@ func (cw *changeWriter) HandleChange(k fs.ChangeKind, p string, f os.FileInfo, e
return errors.New("short write copying file") return errors.New("short write copying file")
} }
} }
if additionalLinks != nil {
source = hdr.Name
for _, extra := range additionalLinks {
hdr.Name = extra
hdr.Typeflag = tar.TypeLink
hdr.Linkname = source
hdr.Size = 0
if err := cw.tw.WriteHeader(hdr); err != nil {
return errors.Wrap(err, "failed to write file header")
}
}
}
} }
return nil return nil
} }

View File

@ -65,7 +65,7 @@ func copyDirectory(dst, src string, inodes map[uint64]string) error {
} }
continue continue
case (fi.Mode() & os.ModeType) == 0: case (fi.Mode() & os.ModeType) == 0:
link, err := GetLinkSource(target, fi, inodes) link, err := getLinkSource(target, fi, inodes)
if err != nil { if err != nil {
return errors.Wrap(err, "failed to get hardlink") return errors.Wrap(err, "failed to get hardlink")
} }

View File

@ -16,9 +16,13 @@ import (
type ChangeKind int type ChangeKind int
const ( const (
// ChangeKindUnmodified represents an unmodified
// file
ChangeKindUnmodified = iota
// ChangeKindAdd represents an addition of // ChangeKindAdd represents an addition of
// a file // a file
ChangeKindAdd = iota ChangeKindAdd
// ChangeKindModify represents a change to // ChangeKindModify represents a change to
// an existing file // an existing file
@ -31,6 +35,8 @@ const (
func (k ChangeKind) String() string { func (k ChangeKind) String() string {
switch k { switch k {
case ChangeKindUnmodified:
return "unmodified"
case ChangeKindAdd: case ChangeKindAdd:
return "add" return "add"
case ChangeKindModify: case ChangeKindModify:
@ -287,7 +293,10 @@ func doubleWalkDiff(ctx context.Context, changeFn ChangeFunc, a, b string) (err
f1 = nil f1 = nil
f2 = nil f2 = nil
if same { if same {
continue if !isLinked(f) {
continue
}
k = ChangeKindUnmodified
} }
} }
if err := changeFn(k, p, f, nil); err != nil { if err := changeFn(k, p, f, nil); err != nil {

View File

@ -90,3 +90,11 @@ func compareCapabilities(p1, p2 string) (bool, error) {
} }
return bytes.Equal(c1, c2), nil return bytes.Equal(c1, c2), nil
} }
func isLinked(f os.FileInfo) bool {
s, ok := f.Sys().(*syscall.Stat_t)
if !ok {
return false
}
return !f.IsDir() && s.Nlink > 1
}

View File

@ -1,5 +1,7 @@
package fs package fs
import "os"
func detectDirDiff(upper, lower string) *diffDirOptions { func detectDirDiff(upper, lower string) *diffDirOptions {
return nil return nil
} }
@ -13,3 +15,7 @@ func compareCapabilities(p1, p2 string) (bool, error) {
// TODO: Use windows equivalent // TODO: Use windows equivalent
return true, nil return true, nil
} }
func isLinked(os.FileInfo) bool {
return false
}

View File

@ -2,11 +2,26 @@ package fs
import "os" import "os"
// GetLinkSource returns a path for the given name and // GetLinkID returns an identifier representing the node a hardlink is pointing
// to. If the file is not hard linked then 0 will be returned.
func GetLinkInfo(fi os.FileInfo) (uint64, bool) {
return getLinkInfo(fi)
}
// getLinkSource returns a path for the given name and
// file info to its link source in the provided inode // file info to its link source in the provided inode
// map. If the given file name is not in the map and // map. If the given file name is not in the map and
// has other links, it is added to the inode map // has other links, it is added to the inode map
// to be a source for other link locations. // to be a source for other link locations.
func GetLinkSource(name string, fi os.FileInfo, inodes map[uint64]string) (string, error) { func getLinkSource(name string, fi os.FileInfo, inodes map[uint64]string) (string, error) {
return getHardLink(name, fi, inodes) inode, isHardlink := getLinkInfo(fi)
if !isHardlink {
return "", nil
}
path, ok := inodes[inode]
if !ok {
inodes[inode] = name
}
return path, nil
} }

View File

@ -3,31 +3,15 @@
package fs package fs
import ( import (
"errors"
"os" "os"
"syscall" "syscall"
) )
func getHardLink(name string, fi os.FileInfo, inodes map[uint64]string) (string, error) { func getLinkInfo(fi os.FileInfo) (uint64, bool) {
if fi.IsDir() {
return "", nil
}
s, ok := fi.Sys().(*syscall.Stat_t) s, ok := fi.Sys().(*syscall.Stat_t)
if !ok { if !ok {
return "", errors.New("unsupported stat type") return 0, false
} }
// If inode is not hardlinked, no reason to lookup or save inode return uint64(s.Ino), !fi.IsDir() && s.Nlink > 1
if s.Nlink == 1 {
return "", nil
}
inode := uint64(s.Ino)
path, ok := inodes[inode]
if !ok {
inodes[inode] = name
}
return path, nil
} }

View File

@ -2,6 +2,6 @@ package fs
import "os" import "os"
func getHardLink(string, os.FileInfo, map[uint64]string) (string, error) { func getLinkInfo(fi os.FileInfo) (uint64, bool) {
return "", nil return 0, false
} }