From 5e82e37ae0e974f8af904fa5582419b137bea5f6 Mon Sep 17 00:00:00 2001 From: Mathias Fredriksson Date: Fri, 30 Aug 2024 08:25:02 +0000 Subject: [PATCH 1/2] Fix directory contents cache in imagefs --- pkg/executor/cache_probe_test.go | 3 +- pkg/imagefs/imagefs.go | 67 +++++++++++++++++++++++--------- pkg/util/fs_util.go | 2 +- 3 files changed, 50 insertions(+), 22 deletions(-) diff --git a/pkg/executor/cache_probe_test.go b/pkg/executor/cache_probe_test.go index e028db9813..86b54848b2 100644 --- a/pkg/executor/cache_probe_test.go +++ b/pkg/executor/cache_probe_test.go @@ -177,8 +177,7 @@ COPY foo/baz.txt copied/ ENV test test From scratch as second - COPY --from=first copied/bam.txt output/bam.txt - COPY --from=first copied/bam.link output/bam.link` + COPY --from=first copied/ output/` err := filesystem.WriteFile(filepath.Join(testDir, "workspace", "Dockerfile"), []byte(dockerFile), 0o755) testutil.CheckNoError(t, err) opts := &config.KanikoOptions{ diff --git a/pkg/imagefs/imagefs.go b/pkg/imagefs/imagefs.go index 05fe13896c..6c21d1c152 100644 --- a/pkg/imagefs/imagefs.go +++ b/pkg/imagefs/imagefs.go @@ -54,8 +54,16 @@ type imageFSFile interface { } func New(parent vfs.FS, root string, image v1.Image, filesToCache []string) (vfs.FS, error) { - var ifs *imageFS + if image == nil { + return nil, errors.New("imagefs: image cannot be nil") + } + + layers, err := image.Layers() + if err != nil { + return nil, errors.Wrap(err, "imagefs: get layers failed") + } + var ifs *imageFS // Multiple layers of imageFS might get confusing, enable delayering. if pfs, ok := parent.(*imageFS); ok { pfs.mu.Lock() @@ -75,39 +83,60 @@ func New(parent vfs.FS, root string, image v1.Image, filesToCache []string) (vfs } } + logrus.Debugf("imagefs: Caching files for %s", root) + + // Keep track of directories so we can cache all of their contents. + var dirsToCache []string // Walk the image and cache file info and hash of the requested files. - _, err := util.GetFSFromImage(root, image, func(dest string, hdr *tar.Header, cleanedName string, tr io.Reader) error { + _, err = util.GetFSFromLayers(root, layers, util.ExtractFunc(func(dest string, hdr *tar.Header, cleanedName string, tr io.Reader) error { // Trim prefix for consistent path. cleanedName = strings.TrimPrefix(cleanedName, "/") + path := filepath.Join(dest, cleanedName) + + cacheFile := func() error { + logrus.Debugf("imagefs: Found cacheable file /%s (path=%s) (%d:%d)", cleanedName, path, hdr.Uid, hdr.Gid) + + cf := newCachedFileInfo(path, hdr) + if cf.IsDir() { + dirsToCache = append(dirsToCache, cleanedName) + } + + sum, err := hashFile(hdr, tr) + if err != nil { + return errors.Wrap(err, "imagefs: hash file failed") + } + ifs.files[path] = newCachedFileInfoWithMD5Sum(cf, sum) + + return nil + } + + // All files inside a cached directory should be cached as well. + for _, dir := range dirsToCache { + if strings.HasPrefix(cleanedName, dir+"/") { + return cacheFile() + } + } for _, f := range filesToCache { - dest := filepath.Join(root, cleanedName) f = strings.TrimPrefix(f, "/") + f = strings.TrimSuffix(f, "/") // Check if the file matches the requested file. if ok, err := filepath.Match(f, cleanedName); ok && err == nil { - logrus.Debugf("imagefs: Found cacheable file %q (%s) (%d:%d)", f, dest, hdr.Uid, hdr.Gid) - - sum, err := hashFile(hdr, tr) - if err != nil { - return errors.Wrap(err, "imagefs: hash file failed") - } - - f := newCachedFileInfo(dest, hdr) - ifs.files[dest] = newCachedFileInfoWithMD5Sum(f, sum) - - return nil + return cacheFile() } - // Parent directories are needed for lookup. + // Cache parent directories for directory lookups. if cleanedName == "" || strings.HasPrefix(f, cleanedName+"/") { - logrus.Debugf("imagefs: Found cacheable file parent %q (%s)", f, dest) - - ifs.files[dest] = newCachedFileInfo(dest, hdr) + if _, ok := ifs.files[path]; !ok { + logrus.Debugf("imagefs: Found cacheable file parent /%s (file=/%s)", cleanedName, f) + ifs.files[path] = newCachedFileInfo(dest, hdr) + } } } + return nil - }) + })) if err != nil { return nil, errors.Wrap(err, "imagefs: walk image failed") } diff --git a/pkg/util/fs_util.go b/pkg/util/fs_util.go index f2c9bd7de0..d5b0307d59 100644 --- a/pkg/util/fs_util.go +++ b/pkg/util/fs_util.go @@ -483,7 +483,7 @@ func ExtractFile(dest string, hdr *tar.Header, cleanedName string, tr io.Reader) } } link := filepath.Clean(filepath.Join(dest, hdr.Linkname)) - if err := os.Link(link, path); err != nil { + if err := filesystem.FS.Link(link, path); err != nil { return err } From ce77d363c0ed9694d1e4dcc4054d6efc3c441ea8 Mon Sep 17 00:00:00 2001 From: Mathias Fredriksson Date: Fri, 30 Aug 2024 08:40:23 +0000 Subject: [PATCH 2/2] More logs --- pkg/imagefs/imagefs.go | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/pkg/imagefs/imagefs.go b/pkg/imagefs/imagefs.go index 6c21d1c152..dc148b3b31 100644 --- a/pkg/imagefs/imagefs.go +++ b/pkg/imagefs/imagefs.go @@ -141,6 +141,8 @@ func New(parent vfs.FS, root string, image v1.Image, filesToCache []string) (vfs return nil, errors.Wrap(err, "imagefs: walk image failed") } + logrus.Debugf("imagefs: Creating cached directories for %s", root) + for dir, d := range ifs.files { if !d.IsDir() { continue @@ -153,6 +155,8 @@ func New(parent vfs.FS, root string, image v1.Image, filesToCache []string) (vfs } } + logrus.Debugf("imagefs: Cached files for %s", root) + return ifs, nil }