archive_linux.go 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265
  1. package archive // import "github.com/docker/docker/pkg/archive"
  2. import (
  3. "archive/tar"
  4. "fmt"
  5. "io/ioutil"
  6. "os"
  7. "path/filepath"
  8. "strings"
  9. "syscall"
  10. "github.com/containerd/continuity/fs"
  11. "github.com/docker/docker/pkg/system"
  12. "github.com/pkg/errors"
  13. "golang.org/x/sys/unix"
  14. )
  15. func getWhiteoutConverter(format WhiteoutFormat, inUserNS bool) tarWhiteoutConverter {
  16. if format == OverlayWhiteoutFormat {
  17. return overlayWhiteoutConverter{inUserNS: inUserNS}
  18. }
  19. return nil
  20. }
  21. type overlayWhiteoutConverter struct {
  22. inUserNS bool
  23. }
  24. func (overlayWhiteoutConverter) ConvertWrite(hdr *tar.Header, path string, fi os.FileInfo) (wo *tar.Header, err error) {
  25. // convert whiteouts to AUFS format
  26. if fi.Mode()&os.ModeCharDevice != 0 && hdr.Devmajor == 0 && hdr.Devminor == 0 {
  27. // we just rename the file and make it normal
  28. dir, filename := filepath.Split(hdr.Name)
  29. hdr.Name = filepath.Join(dir, WhiteoutPrefix+filename)
  30. hdr.Mode = 0600
  31. hdr.Typeflag = tar.TypeReg
  32. hdr.Size = 0
  33. }
  34. if fi.Mode()&os.ModeDir != 0 {
  35. // convert opaque dirs to AUFS format by writing an empty file with the prefix
  36. opaque, err := system.Lgetxattr(path, "trusted.overlay.opaque")
  37. if err != nil {
  38. return nil, err
  39. }
  40. if len(opaque) == 1 && opaque[0] == 'y' {
  41. if hdr.Xattrs != nil {
  42. delete(hdr.Xattrs, "trusted.overlay.opaque")
  43. }
  44. // create a header for the whiteout file
  45. // it should inherit some properties from the parent, but be a regular file
  46. wo = &tar.Header{
  47. Typeflag: tar.TypeReg,
  48. Mode: hdr.Mode & int64(os.ModePerm),
  49. Name: filepath.Join(hdr.Name, WhiteoutOpaqueDir),
  50. Size: 0,
  51. Uid: hdr.Uid,
  52. Uname: hdr.Uname,
  53. Gid: hdr.Gid,
  54. Gname: hdr.Gname,
  55. AccessTime: hdr.AccessTime,
  56. ChangeTime: hdr.ChangeTime,
  57. }
  58. }
  59. }
  60. return
  61. }
  62. func (c overlayWhiteoutConverter) ConvertRead(hdr *tar.Header, path string) (bool, error) {
  63. base := filepath.Base(path)
  64. dir := filepath.Dir(path)
  65. // if a directory is marked as opaque by the AUFS special file, we need to translate that to overlay
  66. if base == WhiteoutOpaqueDir {
  67. err := unix.Setxattr(dir, "trusted.overlay.opaque", []byte{'y'}, 0)
  68. if err != nil {
  69. if c.inUserNS {
  70. if err = replaceDirWithOverlayOpaque(dir); err != nil {
  71. return false, errors.Wrapf(err, "replaceDirWithOverlayOpaque(%q) failed", dir)
  72. }
  73. } else {
  74. return false, errors.Wrapf(err, "setxattr(%q, trusted.overlay.opaque=y)", dir)
  75. }
  76. }
  77. // don't write the file itself
  78. return false, err
  79. }
  80. // if a file was deleted and we are using overlay, we need to create a character device
  81. if strings.HasPrefix(base, WhiteoutPrefix) {
  82. originalBase := base[len(WhiteoutPrefix):]
  83. originalPath := filepath.Join(dir, originalBase)
  84. if err := unix.Mknod(originalPath, unix.S_IFCHR, 0); err != nil {
  85. if c.inUserNS {
  86. // Ubuntu and a few distros support overlayfs in userns.
  87. //
  88. // Although we can't call mknod directly in userns (at least on bionic kernel 4.15),
  89. // we can still create 0,0 char device using mknodChar0Overlay().
  90. //
  91. // NOTE: we don't need this hack for the containerd snapshotter+unpack model.
  92. if err := mknodChar0Overlay(originalPath); err != nil {
  93. return false, errors.Wrapf(err, "failed to mknodChar0UserNS(%q)", originalPath)
  94. }
  95. } else {
  96. return false, errors.Wrapf(err, "failed to mknod(%q, S_IFCHR, 0)", originalPath)
  97. }
  98. }
  99. if err := os.Chown(originalPath, hdr.Uid, hdr.Gid); err != nil {
  100. return false, err
  101. }
  102. // don't write the file itself
  103. return false, nil
  104. }
  105. return true, nil
  106. }
  107. // mknodChar0Overlay creates 0,0 char device by mounting overlayfs and unlinking.
  108. // This function can be used for creating 0,0 char device in userns on Ubuntu.
  109. //
  110. // Steps:
  111. // * Mkdir lower,upper,merged,work
  112. // * Create lower/dummy
  113. // * Mount overlayfs
  114. // * Unlink merged/dummy
  115. // * Unmount overlayfs
  116. // * Make sure a 0,0 char device is created as upper/dummy
  117. // * Rename upper/dummy to cleansedOriginalPath
  118. func mknodChar0Overlay(cleansedOriginalPath string) error {
  119. dir := filepath.Dir(cleansedOriginalPath)
  120. tmp, err := ioutil.TempDir(dir, "mc0o")
  121. if err != nil {
  122. return errors.Wrapf(err, "failed to create a tmp directory under %s", dir)
  123. }
  124. defer os.RemoveAll(tmp)
  125. lower := filepath.Join(tmp, "l")
  126. upper := filepath.Join(tmp, "u")
  127. work := filepath.Join(tmp, "w")
  128. merged := filepath.Join(tmp, "m")
  129. for _, s := range []string{lower, upper, work, merged} {
  130. if err := os.MkdirAll(s, 0700); err != nil {
  131. return errors.Wrapf(err, "failed to mkdir %s", s)
  132. }
  133. }
  134. dummyBase := "d"
  135. lowerDummy := filepath.Join(lower, dummyBase)
  136. if err := ioutil.WriteFile(lowerDummy, []byte{}, 0600); err != nil {
  137. return errors.Wrapf(err, "failed to create a dummy lower file %s", lowerDummy)
  138. }
  139. // lowerdir needs ":" to be escaped: https://github.com/moby/moby/issues/40939#issuecomment-627098286
  140. lowerEscaped := strings.ReplaceAll(lower, ":", "\\:")
  141. mOpts := fmt.Sprintf("lowerdir=%s,upperdir=%s,workdir=%s", lowerEscaped, upper, work)
  142. // docker/pkg/mount.Mount() requires procfs to be mounted. So we use syscall.Mount() directly instead.
  143. if err := syscall.Mount("overlay", merged, "overlay", uintptr(0), mOpts); err != nil {
  144. return errors.Wrapf(err, "failed to mount overlay (%s) on %s", mOpts, merged)
  145. }
  146. mergedDummy := filepath.Join(merged, dummyBase)
  147. if err := os.Remove(mergedDummy); err != nil {
  148. syscall.Unmount(merged, 0)
  149. return errors.Wrapf(err, "failed to unlink %s", mergedDummy)
  150. }
  151. if err := syscall.Unmount(merged, 0); err != nil {
  152. return errors.Wrapf(err, "failed to unmount %s", merged)
  153. }
  154. upperDummy := filepath.Join(upper, dummyBase)
  155. if err := isChar0(upperDummy); err != nil {
  156. return err
  157. }
  158. if err := os.Rename(upperDummy, cleansedOriginalPath); err != nil {
  159. return errors.Wrapf(err, "failed to rename %s to %s", upperDummy, cleansedOriginalPath)
  160. }
  161. return nil
  162. }
  163. func isChar0(path string) error {
  164. osStat, err := os.Stat(path)
  165. if err != nil {
  166. return errors.Wrapf(err, "failed to stat %s", path)
  167. }
  168. st, ok := osStat.Sys().(*syscall.Stat_t)
  169. if !ok {
  170. return errors.Errorf("got unsupported stat for %s", path)
  171. }
  172. if os.FileMode(st.Mode)&syscall.S_IFMT != syscall.S_IFCHR {
  173. return errors.Errorf("%s is not a character device, got mode=%d", path, st.Mode)
  174. }
  175. if st.Rdev != 0 {
  176. return errors.Errorf("%s is not a 0,0 character device, got Rdev=%d", path, st.Rdev)
  177. }
  178. return nil
  179. }
  180. // replaceDirWithOverlayOpaque replaces path with a new directory with trusted.overlay.opaque
  181. // xattr. The contents of the directory are preserved.
  182. func replaceDirWithOverlayOpaque(path string) error {
  183. if path == "/" {
  184. return errors.New("replaceDirWithOverlayOpaque: path must not be \"/\"")
  185. }
  186. dir := filepath.Dir(path)
  187. tmp, err := ioutil.TempDir(dir, "rdwoo")
  188. if err != nil {
  189. return errors.Wrapf(err, "failed to create a tmp directory under %s", dir)
  190. }
  191. defer os.RemoveAll(tmp)
  192. // newPath is a new empty directory crafted with trusted.overlay.opaque xattr.
  193. // we copy the content of path into newPath, remove path, and rename newPath to path.
  194. newPath, err := createDirWithOverlayOpaque(tmp)
  195. if err != nil {
  196. return errors.Wrapf(err, "createDirWithOverlayOpaque(%q) failed", tmp)
  197. }
  198. if err := fs.CopyDir(newPath, path); err != nil {
  199. return errors.Wrapf(err, "CopyDir(%q, %q) failed", newPath, path)
  200. }
  201. if err := os.RemoveAll(path); err != nil {
  202. return err
  203. }
  204. return os.Rename(newPath, path)
  205. }
  206. // createDirWithOverlayOpaque creates a directory with trusted.overlay.opaque xattr,
  207. // without calling setxattr, so as to allow creating opaque dir in userns on Ubuntu.
  208. func createDirWithOverlayOpaque(tmp string) (string, error) {
  209. lower := filepath.Join(tmp, "l")
  210. upper := filepath.Join(tmp, "u")
  211. work := filepath.Join(tmp, "w")
  212. merged := filepath.Join(tmp, "m")
  213. for _, s := range []string{lower, upper, work, merged} {
  214. if err := os.MkdirAll(s, 0700); err != nil {
  215. return "", errors.Wrapf(err, "failed to mkdir %s", s)
  216. }
  217. }
  218. dummyBase := "d"
  219. lowerDummy := filepath.Join(lower, dummyBase)
  220. if err := os.MkdirAll(lowerDummy, 0700); err != nil {
  221. return "", errors.Wrapf(err, "failed to create a dummy lower directory %s", lowerDummy)
  222. }
  223. // lowerdir needs ":" to be escaped: https://github.com/moby/moby/issues/40939#issuecomment-627098286
  224. lowerEscaped := strings.ReplaceAll(lower, ":", "\\:")
  225. mOpts := fmt.Sprintf("lowerdir=%s,upperdir=%s,workdir=%s", lowerEscaped, upper, work)
  226. // docker/pkg/mount.Mount() requires procfs to be mounted. So we use syscall.Mount() directly instead.
  227. if err := syscall.Mount("overlay", merged, "overlay", uintptr(0), mOpts); err != nil {
  228. return "", errors.Wrapf(err, "failed to mount overlay (%s) on %s", mOpts, merged)
  229. }
  230. mergedDummy := filepath.Join(merged, dummyBase)
  231. if err := os.Remove(mergedDummy); err != nil {
  232. syscall.Unmount(merged, 0)
  233. return "", errors.Wrapf(err, "failed to rmdir %s", mergedDummy)
  234. }
  235. // upperDummy becomes a 0,0-char device file here
  236. if err := os.Mkdir(mergedDummy, 0700); err != nil {
  237. syscall.Unmount(merged, 0)
  238. return "", errors.Wrapf(err, "failed to mkdir %s", mergedDummy)
  239. }
  240. // upperDummy becomes a directory with trusted.overlay.opaque xattr
  241. // (but can't be verified in userns)
  242. if err := syscall.Unmount(merged, 0); err != nil {
  243. return "", errors.Wrapf(err, "failed to unmount %s", merged)
  244. }
  245. upperDummy := filepath.Join(upper, dummyBase)
  246. return upperDummy, nil
  247. }