Skip to content

Commit

Permalink
Resolve filepaths before scanning for changes
Browse files Browse the repository at this point in the history
  • Loading branch information
cvgw committed Feb 20, 2020
1 parent f5f1c3a commit a675ad9
Show file tree
Hide file tree
Showing 6 changed files with 429 additions and 57 deletions.
10 changes: 10 additions & 0 deletions integration/dockerfiles/Dockerfile_test_issue_1039
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
# Integration test image, named after issue 1039.
# NOTE(review): presumably reproduces the scenario from that issue — confirm.
# The base image is pinned to an exact UBI 7 tag.
FROM registry.access.redhat.com/ubi7/ubi:7.7-214

# Update installed packages, install pinned versions of GCC, GCC-C++ and make
# for the build environment, then clean the yum caches. Everything runs in a
# single RUN instruction, and the subscription-manager yum plugin is disabled
# on every yum invocation.
RUN yum --disableplugin=subscription-manager update -y \
&& yum --disableplugin=subscription-manager install -y \
gcc-4.8.5-39.el7 \
gcc-c++-4.8.5-39.el7 \
make-3.82-24.el7 \
&& yum --disableplugin=subscription-manager clean all
158 changes: 158 additions & 0 deletions pkg/filesystem/resolve.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,158 @@
/*
Copyright 2020 Google LLC
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package filesystem

import (
"os"
"path/filepath"

"github.com/GoogleContainerTools/kaniko/pkg/util"
"github.com/pkg/errors"
"github.com/sirupsen/logrus"
)

// ResolvePaths takes a slice of file paths and a slice of whitelist entries. It resolves each
// file path according to a set of rules and then returns a slice of resolved paths or an error.
// File paths are resolved according to the following rules:
// * If path is whitelisted, skip it.
// * If path is, or lies beneath, a symlink, add its ancestor link (see resolveSymlinkAncestor)
//   to the output set; otherwise add the path itself.
// * If path resolves to a different target, add the target to the output set unless the
//   target is whitelisted. A target that does not exist (dangling link) is skipped.
// * Add all ancestors of each collected path to the output set.
//
// On error the returned slice is nil.
func ResolvePaths(paths []string, wl []util.WhitelistEntry) (pathsToAdd []string, err error) {
	logrus.Info("Resolving paths")

	// fileSet tracks what has already been appended so pathsToAdd stays duplicate free.
	fileSet := make(map[string]bool)

	for _, f := range paths {
		// If the given path is part of the whitelist ignore it
		if util.IsInProvidedWhitelist(f, wl) {
			logrus.Debugf("path %s is whitelisted, ignoring it", f)
			continue
		}

		link, e := resolveSymlinkAncestor(f)
		if e != nil {
			return nil, e
		}

		if f != link {
			logrus.Tracef("updated link %s to %s", f, link)
		}

		if !fileSet[link] {
			pathsToAdd = append(pathsToAdd, link)
			fileSet[link] = true
		}

		// If the path is a symlink we need to also consider the target of that
		// link
		evaled, e := filepath.EvalSymlinks(f)
		if e != nil {
			if !os.IsNotExist(e) {
				logrus.Errorf("couldn't eval %s with link %s", f, link)
				return nil, e
			}

			// A dangling link has no target to add. Skip it here so that an empty
			// path is never appended and the not-exist error cannot leak into the
			// function's result.
			logrus.Debugf("symlink path %s, target does not exist", f)
			continue
		}

		// If the given path is a symlink and the target is part of the whitelist
		// ignore the target
		if util.IsInProvidedWhitelist(evaled, wl) {
			logrus.Debugf("path %s is whitelisted, ignoring it", evaled)
			continue
		}

		if !fileSet[evaled] {
			pathsToAdd = append(pathsToAdd, evaled)
			fileSet[evaled] = true
		}
	}

	// Also add parent directories to keep the permission of them correctly.
	return filesWithParentDirs(pathsToAdd), nil
}

// filesWithParentDirs returns the cleaned form of every provided file path together with
// the cleaned form of each directory that util.ParentDirectories reports for it. The result
// contains no duplicates and is in no particular order (it is collected from a map).
// I.E. /foo/bar/baz/boom.txt => [/, /foo, /foo/bar, /foo/bar/baz, /foo/bar/baz/boom.txt]
func filesWithParentDirs(files []string) []string {
	seen := make(map[string]bool)

	for _, f := range files {
		cleaned := filepath.Clean(f)
		seen[cleaned] = true

		for _, parent := range util.ParentDirectories(cleaned) {
			seen[filepath.Clean(parent)] = true
		}
	}

	// Always hand back a non-nil slice, even when nothing was collected.
	result := make([]string, 0, len(seen))
	for p := range seen {
		result = append(result, p)
	}

	return result
}

// resolveSymlinkAncestor returns the ancestor link of the provided symlink path, or the
// (cleaned) path itself if no node along it is a link. The ancestor link is the filenode
// closest to the root whose type is a symlink.
// E.G. /baz/boom/bar.txt resolves to /usr/bin/bar.txt but /baz/boom/bar.txt itself is not a
// link. Instead /baz/boom is actually a link to /usr/bin. In this case resolveSymlinkAncestor
// would return /baz/boom.
//
// path must be absolute, otherwise an error is returned. An error is also returned when a
// visited node cannot be lstat'ed or its symlinks cannot be evaluated.
func resolveSymlinkAncestor(path string) (string, error) {
	if !filepath.IsAbs(path) {
		return "", errors.New("dest path must be abs")
	}

	last := ""
	// Clean first: EvalSymlinks returns a cleaned path, so an unclean input (for example one
	// with a trailing slash) would otherwise compare as "different" below and be mistaken
	// for a path that contains a link.
	newPath := filepath.Clean(path)

	for newPath != "/" {
		fi, err := os.Lstat(newPath)
		if err != nil {
			return "", errors.Wrap(err, "failed to lstat")
		}

		if fi.Mode()&os.ModeSymlink != 0 {
			// The node itself is a link; remember it and keep walking up.
			last = filepath.Base(newPath)
			newPath = filepath.Dir(newPath)
			continue
		}

		// Even if the node is not a link, one of its ancestors could be. If evaluating the
		// symlinks changes the path, some node further up is a link.
		target, err := filepath.EvalSymlinks(newPath)
		if err != nil {
			return "", err
		}

		if target == newPath {
			// Everything from here up to the root is link free.
			break
		}

		last = filepath.Base(newPath)
		newPath = filepath.Dir(newPath)
	}

	// Join also cleans the result; with an empty last this is just newPath.
	return filepath.Join(newPath, last), nil
}
185 changes: 185 additions & 0 deletions pkg/filesystem/resolve_test.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,185 @@
/*
Copyright 2020 Google LLC
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package filesystem

import (
"io/ioutil"
"os"
"path/filepath"
"reflect"
"sort"
"testing"

"github.com/GoogleContainerTools/kaniko/pkg/util"
)

// Test_ResolvePaths exercises ResolvePaths against a temporary directory tree containing
// symlinked files and a symlinked directory, with and without whitelist entries, and
// against an empty input.
func Test_ResolvePaths(t *testing.T) {
	// validateResults fails the test if err is non-nil or if the two path lists differ
	// once sorted. Both slices are sorted in place.
	validateResults := func(
		t *testing.T,
		actualFiles,
		expectedFiles []string,
		err error,
	) {
		// Report failures at the caller's line rather than inside this helper.
		t.Helper()

		if err != nil {
			t.Errorf("expected err to be nil but was %s", err)
		}

		// Sort so that comparison is against consistent order
		sort.Strings(actualFiles)
		sort.Strings(expectedFiles)

		if !reflect.DeepEqual(actualFiles, expectedFiles) {
			t.Errorf("expected files to equal %s but was %s",
				expectedFiles, actualFiles,
			)
		}
	}

	t.Run("list of files", func(t *testing.T) {
		dir, err := ioutil.TempDir("", "snapshot-test")
		if err != nil {
			t.Fatal(err)
		}

		defer os.RemoveAll(dir)

		// The temp root may itself sit beneath a symlink (e.g. /var on macOS). Resolve it
		// so the expectations below are built from link-free prefixes; otherwise
		// ResolvePaths would report that outer link instead of the paths created here.
		dir, err = filepath.EvalSymlinks(dir)
		if err != nil {
			t.Fatal(err)
		}

		files := []string{
			"/foo/bar.txt",
			"/baz/boom.txt",
		}

		t.Run("all are symlinks", func(t *testing.T) {
			// Create <dir>/target/<f> as a real file and <dir>/link/<f> as a symlink to it.
			for _, f := range files {
				fLink := filepath.Join(dir, "link", f)
				fTarget := filepath.Join(dir, "target", f)

				if err := os.MkdirAll(filepath.Dir(fTarget), 0777); err != nil {
					t.Fatal(err)
				}

				if err := ioutil.WriteFile(fTarget, []byte{}, 0777); err != nil {
					t.Fatal(err)
				}

				if err := os.MkdirAll(filepath.Dir(fLink), 0777); err != nil {
					t.Fatal(err)
				}

				if err := os.Symlink(fTarget, fLink); err != nil {
					t.Fatal(err)
				}
			}

			t.Run("none are whitelisted", func(t *testing.T) {
				wl := []util.WhitelistEntry{}

				inputFiles := []string{}
				expectedFiles := []string{}

				// Every link and every link target is expected in the output.
				for _, f := range files {
					link := filepath.Join(dir, "link", f)
					expectedFiles = append(expectedFiles, link)
					inputFiles = append(inputFiles, link)

					target := filepath.Join(dir, "target", f)
					expectedFiles = append(expectedFiles, target)
				}

				expectedFiles = filesWithParentDirs(expectedFiles)

				actual, err := ResolvePaths(inputFiles, wl)

				validateResults(t, actual, expectedFiles, err)
			})

			t.Run("some are whitelisted", func(t *testing.T) {
				wl := []util.WhitelistEntry{
					{
						Path: filepath.Join(dir, "link", "baz"),
					},
					{
						Path: filepath.Join(dir, "target", "foo"),
					},
				}

				expectedFiles := []string{}
				inputFiles := []string{}

				// A whitelisted link contributes nothing; a whitelisted target contributes
				// only its link.
				for _, f := range files {
					link := filepath.Join(dir, "link", f)
					inputFiles = append(inputFiles, link)

					if util.IsInProvidedWhitelist(link, wl) {
						t.Logf("skipping %s", link)
						continue
					}

					expectedFiles = append(expectedFiles, link)

					target := filepath.Join(dir, "target", f)

					if util.IsInProvidedWhitelist(target, wl) {
						t.Logf("skipping %s", target)
						continue
					}

					expectedFiles = append(expectedFiles, target)
				}

				// Add a symlinked directory: <dir>/link/zoom -> <dir>/target/zaam, and
				// pass in a regular file reached through that link.
				link := filepath.Join(dir, "link", "zoom/")

				target := filepath.Join(dir, "target", "zaam/")
				if err := os.MkdirAll(target, 0777); err != nil {
					t.Fatal(err)
				}

				if err := ioutil.WriteFile(filepath.Join(target, "meow.txt"), []byte{}, 0777); err != nil {
					t.Fatal(err)
				}

				if err := os.Symlink(target, link); err != nil {
					t.Fatal(err)
				}

				file := filepath.Join(link, "meow.txt")
				inputFiles = append(inputFiles, file)

				// The directory link itself is expected, not the path beneath it.
				expectedFiles = append(expectedFiles, link)

				targetFile := filepath.Join(target, "meow.txt")
				expectedFiles = append(expectedFiles, targetFile)

				expectedFiles = filesWithParentDirs(expectedFiles)

				actual, err := ResolvePaths(inputFiles, wl)

				validateResults(t, actual, expectedFiles, err)
			})
		})
	})

	t.Run("empty set of files", func(t *testing.T) {
		inputFiles := []string{}
		expectedFiles := []string{}

		wl := []util.WhitelistEntry{}

		actual, err := ResolvePaths(inputFiles, wl)

		validateResults(t, actual, expectedFiles, err)
	})
}
Loading

0 comments on commit a675ad9

Please sign in to comment.