123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545 |
- package dockerfile // import "github.com/docker/docker/builder/dockerfile"
- import (
- "fmt"
- "io"
- "mime"
- "net/http"
- "net/url"
- "os"
- "path/filepath"
- "runtime"
- "sort"
- "strings"
- "time"
- "github.com/docker/docker/builder"
- "github.com/docker/docker/builder/remotecontext"
- "github.com/docker/docker/builder/remotecontext/urlutil"
- "github.com/docker/docker/pkg/archive"
- "github.com/docker/docker/pkg/containerfs"
- "github.com/docker/docker/pkg/idtools"
- "github.com/docker/docker/pkg/longpath"
- "github.com/docker/docker/pkg/progress"
- "github.com/docker/docker/pkg/streamformatter"
- "github.com/docker/docker/pkg/system"
- "github.com/moby/buildkit/frontend/dockerfile/instructions"
- ocispec "github.com/opencontainers/image-spec/specs-go/v1"
- "github.com/pkg/errors"
- )
- const unnamedFilename = "__unnamed__"
- type pathCache interface {
- Load(key interface{}) (value interface{}, ok bool)
- Store(key, value interface{})
- }
- // copyInfo is a data object which stores the metadata about each source file in
- // a copyInstruction
- type copyInfo struct {
- root string
- path string
- hash string
- noDecompress bool
- }
- func (c copyInfo) fullPath() (string, error) {
- return containerfs.ResolveScopedPath(c.root, c.path)
- }
- func newCopyInfoFromSource(source builder.Source, path string, hash string) copyInfo {
- return copyInfo{root: source.Root(), path: path, hash: hash}
- }
- func newCopyInfos(copyInfos ...copyInfo) []copyInfo {
- return copyInfos
- }
- // copyInstruction is a fully parsed COPY or ADD command that is passed to
- // Builder.performCopy to copy files into the image filesystem
- type copyInstruction struct {
- cmdName string
- infos []copyInfo
- dest string
- chownStr string
- allowLocalDecompression bool
- preserveOwnership bool
- }
- // copier reads a raw COPY or ADD command, fetches remote sources using a downloader,
- // and creates a copyInstruction
- type copier struct {
- imageSource *imageMount
- source builder.Source
- pathCache pathCache
- download sourceDownloader
- platform *ocispec.Platform
- // for cleanup. TODO: having copier.cleanup() is error prone and hard to
- // follow. Code calling performCopy should manage the lifecycle of its params.
- // Copier should take override source as input, not imageMount.
- activeLayer builder.RWLayer
- tmpPaths []string
- }
- func copierFromDispatchRequest(req dispatchRequest, download sourceDownloader, imageSource *imageMount) copier {
- platform := req.builder.platform
- if platform == nil {
- // May be nil if not explicitly set in API/dockerfile
- platform = &ocispec.Platform{}
- }
- if platform.OS == "" {
- // Default to the dispatch requests operating system if not explicit in API/dockerfile
- platform.OS = req.state.operatingSystem
- }
- if platform.OS == "" {
- // This is a failsafe just in case. Shouldn't be hit.
- platform.OS = runtime.GOOS
- }
- return copier{
- source: req.source,
- pathCache: req.builder.pathCache,
- download: download,
- imageSource: imageSource,
- platform: platform,
- }
- }
- func (o *copier) createCopyInstruction(sourcesAndDest instructions.SourcesAndDest, cmdName string) (copyInstruction, error) {
- inst := copyInstruction{
- cmdName: cmdName,
- dest: filepath.FromSlash(sourcesAndDest.DestPath),
- }
- infos, err := o.getCopyInfosForSourcePaths(sourcesAndDest.SourcePaths, inst.dest)
- if err != nil {
- return inst, errors.Wrapf(err, "%s failed", cmdName)
- }
- if len(infos) > 1 && !strings.HasSuffix(inst.dest, string(os.PathSeparator)) {
- return inst, errors.Errorf("When using %s with more than one source file, the destination must be a directory and end with a /", cmdName)
- }
- inst.infos = infos
- return inst, nil
- }
- // getCopyInfosForSourcePaths iterates over the source files and calculate the info
- // needed to copy (e.g. hash value if cached)
- // The dest is used in case source is URL (and ends with "/")
- func (o *copier) getCopyInfosForSourcePaths(sources []string, dest string) ([]copyInfo, error) {
- var infos []copyInfo
- for _, orig := range sources {
- subinfos, err := o.getCopyInfoForSourcePath(orig, dest)
- if err != nil {
- return nil, err
- }
- infos = append(infos, subinfos...)
- }
- if len(infos) == 0 {
- return nil, errors.New("no source files were specified")
- }
- return infos, nil
- }
- func (o *copier) getCopyInfoForSourcePath(orig, dest string) ([]copyInfo, error) {
- if !urlutil.IsURL(orig) {
- return o.calcCopyInfo(orig, true)
- }
- remote, path, err := o.download(orig)
- if err != nil {
- return nil, err
- }
- // If path == "" then we are unable to determine filename from src
- // We have to make sure dest is available
- if path == "" {
- if strings.HasSuffix(dest, "/") {
- return nil, errors.Errorf("cannot determine filename for source %s", orig)
- }
- path = unnamedFilename
- }
- o.tmpPaths = append(o.tmpPaths, remote.Root())
- hash, err := remote.Hash(path)
- ci := newCopyInfoFromSource(remote, path, hash)
- ci.noDecompress = true // data from http shouldn't be extracted even on ADD
- return newCopyInfos(ci), err
- }
- // Cleanup removes any temporary directories created as part of downloading
- // remote files.
- func (o *copier) Cleanup() {
- for _, path := range o.tmpPaths {
- os.RemoveAll(path)
- }
- o.tmpPaths = []string{}
- if o.activeLayer != nil {
- o.activeLayer.Release()
- o.activeLayer = nil
- }
- }
- // TODO: allowWildcards can probably be removed by refactoring this function further.
- func (o *copier) calcCopyInfo(origPath string, allowWildcards bool) ([]copyInfo, error) {
- imageSource := o.imageSource
- if err := validateCopySourcePath(imageSource, origPath); err != nil {
- return nil, err
- }
- // TODO: do this when creating copier. Requires validateCopySourcePath
- // (and other below) to be aware of the difference sources. Why is it only
- // done on image Source?
- if imageSource != nil && o.activeLayer == nil {
- // this needs to be protected against repeated calls as wildcard copy
- // will call it multiple times for a single COPY
- var err error
- rwLayer, err := imageSource.NewRWLayer()
- if err != nil {
- return nil, err
- }
- o.activeLayer = rwLayer
- o.source, err = remotecontext.NewLazySource(rwLayer.Root())
- if err != nil {
- return nil, errors.Wrapf(err, "failed to create context for copy from %s", rwLayer.Root())
- }
- }
- if o.source == nil {
- return nil, errors.Errorf("missing build context")
- }
- // Work in daemon-specific OS filepath semantics
- origPath = filepath.FromSlash(origPath)
- origPath = strings.TrimPrefix(origPath, string(os.PathSeparator))
- origPath = strings.TrimPrefix(origPath, "."+string(os.PathSeparator))
- // Deal with wildcards
- if allowWildcards && containsWildcards(origPath) {
- return o.copyWithWildcards(origPath)
- }
- if imageSource != nil && imageSource.ImageID() != "" {
- // return a cached copy if one exists
- if h, ok := o.pathCache.Load(imageSource.ImageID() + origPath); ok {
- return newCopyInfos(newCopyInfoFromSource(o.source, origPath, h.(string))), nil
- }
- }
- // Deal with the single file case
- copyInfo, err := copyInfoForFile(o.source, origPath)
- switch {
- case imageSource == nil && errors.Is(err, os.ErrNotExist):
- return nil, errors.Wrapf(err, "file not found in build context or excluded by .dockerignore")
- case err != nil:
- return nil, err
- case copyInfo.hash != "":
- o.storeInPathCache(imageSource, origPath, copyInfo.hash)
- return newCopyInfos(copyInfo), err
- }
- // TODO: remove, handle dirs in Hash()
- subfiles, err := walkSource(o.source, origPath)
- if err != nil {
- return nil, err
- }
- hash := hashStringSlice("dir", subfiles)
- o.storeInPathCache(imageSource, origPath, hash)
- return newCopyInfos(newCopyInfoFromSource(o.source, origPath, hash)), nil
- }
- func (o *copier) storeInPathCache(im *imageMount, path string, hash string) {
- if im != nil {
- o.pathCache.Store(im.ImageID()+path, hash)
- }
- }
- func (o *copier) copyWithWildcards(origPath string) ([]copyInfo, error) {
- root := o.source.Root()
- var copyInfos []copyInfo
- if err := filepath.WalkDir(root, func(path string, _ os.DirEntry, err error) error {
- if err != nil {
- return err
- }
- rel, err := remotecontext.Rel(root, path)
- if err != nil {
- return err
- }
- if rel == "." {
- return nil
- }
- if match, _ := filepath.Match(origPath, rel); !match {
- return nil
- }
- // Note we set allowWildcards to false in case the name has
- // a * in it
- subInfos, err := o.calcCopyInfo(rel, false)
- if err != nil {
- return err
- }
- copyInfos = append(copyInfos, subInfos...)
- return nil
- }); err != nil {
- return nil, err
- }
- return copyInfos, nil
- }
- func copyInfoForFile(source builder.Source, path string) (copyInfo, error) {
- fi, err := remotecontext.StatAt(source, path)
- if err != nil {
- if errors.Is(err, os.ErrNotExist) {
- // return the relative path in the error, which is more user-friendly than the full path to the tmp-dir
- return copyInfo{}, errors.WithStack(&os.PathError{Op: "stat", Path: path, Err: os.ErrNotExist})
- }
- return copyInfo{}, err
- }
- if fi.IsDir() {
- return copyInfo{}, nil
- }
- hash, err := source.Hash(path)
- if err != nil {
- return copyInfo{}, err
- }
- return newCopyInfoFromSource(source, path, "file:"+hash), nil
- }
- // TODO: dedupe with copyWithWildcards()
- func walkSource(source builder.Source, origPath string) ([]string, error) {
- fp, err := remotecontext.FullPath(source, origPath)
- if err != nil {
- return nil, err
- }
- // Must be a dir
- var subfiles []string
- err = filepath.WalkDir(fp, func(path string, _ os.DirEntry, err error) error {
- if err != nil {
- return err
- }
- rel, err := remotecontext.Rel(source.Root(), path)
- if err != nil {
- return err
- }
- if rel == "." {
- return nil
- }
- hash, err := source.Hash(rel)
- if err != nil {
- return nil
- }
- // we already checked handleHash above
- subfiles = append(subfiles, hash)
- return nil
- })
- if err != nil {
- return nil, err
- }
- sort.Strings(subfiles)
- return subfiles, nil
- }
- type sourceDownloader func(string) (builder.Source, string, error)
- func newRemoteSourceDownloader(output, stdout io.Writer) sourceDownloader {
- return func(url string) (builder.Source, string, error) {
- return downloadSource(output, stdout, url)
- }
- }
- func errOnSourceDownload(_ string) (builder.Source, string, error) {
- return nil, "", errors.New("source can't be a URL for COPY")
- }
- func getFilenameForDownload(path string, resp *http.Response) string {
- // Guess filename based on source
- if path != "" && !strings.HasSuffix(path, "/") {
- if filename := filepath.Base(filepath.FromSlash(path)); filename != "" {
- return filename
- }
- }
- // Guess filename based on Content-Disposition
- if contentDisposition := resp.Header.Get("Content-Disposition"); contentDisposition != "" {
- if _, params, err := mime.ParseMediaType(contentDisposition); err == nil {
- if params["filename"] != "" && !strings.HasSuffix(params["filename"], "/") {
- if filename := filepath.Base(filepath.FromSlash(params["filename"])); filename != "" {
- return filename
- }
- }
- }
- }
- return ""
- }
- func downloadSource(output io.Writer, stdout io.Writer, srcURL string) (remote builder.Source, p string, err error) {
- u, err := url.Parse(srcURL)
- if err != nil {
- return
- }
- resp, err := remotecontext.GetWithStatusError(srcURL)
- if err != nil {
- return
- }
- filename := getFilenameForDownload(u.Path, resp)
- // Prepare file in a tmp dir
- tmpDir, err := longpath.MkdirTemp("", "docker-remote")
- if err != nil {
- return
- }
- defer func() {
- if err != nil {
- os.RemoveAll(tmpDir)
- }
- }()
- // If filename is empty, the returned filename will be "" but
- // the tmp filename will be created as "__unnamed__"
- tmpFileName := filename
- if filename == "" {
- tmpFileName = unnamedFilename
- }
- tmpFileName = filepath.Join(tmpDir, tmpFileName)
- tmpFile, err := os.OpenFile(tmpFileName, os.O_RDWR|os.O_CREATE|os.O_EXCL, 0o600)
- if err != nil {
- return
- }
- progressOutput := streamformatter.NewJSONProgressOutput(output, true)
- progressReader := progress.NewProgressReader(resp.Body, progressOutput, resp.ContentLength, "", "Downloading")
- // Download and dump result to tmp file
- // TODO: add filehash directly
- if _, err = io.Copy(tmpFile, progressReader); err != nil {
- tmpFile.Close()
- return
- }
- // TODO: how important is this random blank line to the output?
- fmt.Fprintln(stdout)
- // Set the mtime to the Last-Modified header value if present
- // Otherwise just remove atime and mtime
- mTime := time.Time{}
- lastMod := resp.Header.Get("Last-Modified")
- if lastMod != "" {
- // If we can't parse it then just let it default to 'zero'
- // otherwise use the parsed time value
- if parsedMTime, err := http.ParseTime(lastMod); err == nil {
- mTime = parsedMTime
- }
- }
- tmpFile.Close()
- if err = system.Chtimes(tmpFileName, mTime, mTime); err != nil {
- return
- }
- lc, err := remotecontext.NewLazySource(tmpDir)
- return lc, filename, err
- }
- type copyFileOptions struct {
- decompress bool
- identity *idtools.Identity
- archiver *archive.Archiver
- }
- func performCopyForInfo(dest copyInfo, source copyInfo, options copyFileOptions) error {
- srcPath, err := source.fullPath()
- if err != nil {
- return err
- }
- destPath, err := dest.fullPath()
- if err != nil {
- return err
- }
- archiver := options.archiver
- src, err := os.Stat(srcPath)
- if err != nil {
- return errors.Wrapf(err, "source path not found")
- }
- if src.IsDir() {
- return copyDirectory(archiver, srcPath, destPath, options.identity)
- }
- if options.decompress && archive.IsArchivePath(srcPath) && !source.noDecompress {
- return archiver.UntarPath(srcPath, destPath)
- }
- destExistsAsDir, err := isExistingDirectory(destPath)
- if err != nil {
- return err
- }
- // dest.path must be used because destPath has already been cleaned of any
- // trailing slash
- if endsInSlash(dest.path) || destExistsAsDir {
- // source.path must be used to get the correct filename when the source
- // is a symlink
- destPath = filepath.Join(destPath, filepath.Base(source.path))
- }
- return copyFile(archiver, srcPath, destPath, options.identity)
- }
- func copyDirectory(archiver *archive.Archiver, source, dest string, identity *idtools.Identity) error {
- destExists, err := isExistingDirectory(dest)
- if err != nil {
- return errors.Wrapf(err, "failed to query destination path")
- }
- if err := archiver.CopyWithTar(source, dest); err != nil {
- return errors.Wrapf(err, "failed to copy directory")
- }
- if identity != nil {
- return fixPermissions(source, dest, *identity, !destExists)
- }
- return nil
- }
- func copyFile(archiver *archive.Archiver, source, dest string, identity *idtools.Identity) error {
- if identity == nil {
- // Use system.MkdirAll here, which is a custom version of os.MkdirAll
- // modified for use on Windows to handle volume GUID paths. These paths
- // are of the form \\?\Volume{<GUID>}\<path>. An example would be:
- // \\?\Volume{dae8d3ac-b9a1-11e9-88eb-e8554b2ba1db}\bin\busybox.exe
- if err := system.MkdirAll(filepath.Dir(dest), 0o755); err != nil {
- return err
- }
- } else {
- if err := idtools.MkdirAllAndChownNew(filepath.Dir(dest), 0o755, *identity); err != nil {
- return errors.Wrapf(err, "failed to create new directory")
- }
- }
- if err := archiver.CopyFileWithTar(source, dest); err != nil {
- return errors.Wrapf(err, "failed to copy file")
- }
- if identity != nil {
- return fixPermissions(source, dest, *identity, false)
- }
- return nil
- }
- func endsInSlash(path string) bool {
- return strings.HasSuffix(path, string(filepath.Separator))
- }
- // isExistingDirectory returns true if the path exists and is a directory
- func isExistingDirectory(path string) (bool, error) {
- destStat, err := os.Stat(path)
- switch {
- case errors.Is(err, os.ErrNotExist):
- return false, nil
- case err != nil:
- return false, err
- }
- return destStat.IsDir(), nil
- }
|