123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686 |
- // +build linux
- package btrfs // import "github.com/docker/docker/daemon/graphdriver/btrfs"
- /*
- #include <stdlib.h>
- #include <dirent.h>
- #include <btrfs/ioctl.h>
- #include <btrfs/ctree.h>
- static void set_name_btrfs_ioctl_vol_args_v2(struct btrfs_ioctl_vol_args_v2* btrfs_struct, const char* value) {
- snprintf(btrfs_struct->name, BTRFS_SUBVOL_NAME_MAX, "%s", value);
- }
- */
- import "C"
- import (
- "fmt"
- "io/ioutil"
- "math"
- "os"
- "path"
- "path/filepath"
- "strconv"
- "strings"
- "sync"
- "unsafe"
- "github.com/docker/docker/daemon/graphdriver"
- "github.com/docker/docker/pkg/containerfs"
- "github.com/docker/docker/pkg/idtools"
- "github.com/docker/docker/pkg/mount"
- "github.com/docker/docker/pkg/parsers"
- "github.com/docker/docker/pkg/system"
- units "github.com/docker/go-units"
- "github.com/opencontainers/selinux/go-selinux/label"
- "github.com/pkg/errors"
- "github.com/sirupsen/logrus"
- "golang.org/x/sys/unix"
- )
- func init() {
- graphdriver.Register("btrfs", Init)
- }
- type btrfsOptions struct {
- minSpace uint64
- size uint64
- }
- // Init returns a new BTRFS driver.
- // An error is returned if BTRFS is not supported.
- func Init(home string, options []string, uidMaps, gidMaps []idtools.IDMap) (graphdriver.Driver, error) {
- // Perform feature detection on /var/lib/docker/btrfs if it's an existing directory.
- // This covers situations where /var/lib/docker/btrfs is a mount, and on a different
- // filesystem than /var/lib/docker.
- // If the path does not exist, fall back to using /var/lib/docker for feature detection.
- testdir := home
- if _, err := os.Stat(testdir); os.IsNotExist(err) {
- testdir = filepath.Dir(testdir)
- }
- fsMagic, err := graphdriver.GetFSMagic(testdir)
- if err != nil {
- return nil, err
- }
- if fsMagic != graphdriver.FsMagicBtrfs {
- return nil, graphdriver.ErrPrerequisites
- }
- rootUID, rootGID, err := idtools.GetRootUIDGID(uidMaps, gidMaps)
- if err != nil {
- return nil, err
- }
- if err := idtools.MkdirAllAndChown(home, 0700, idtools.Identity{UID: rootUID, GID: rootGID}); err != nil {
- return nil, err
- }
- opt, userDiskQuota, err := parseOptions(options)
- if err != nil {
- return nil, err
- }
- // For some reason shared mount propagation between a container
- // and the host does not work for btrfs, and a remedy is to bind
- // mount graphdriver home to itself (even without changing the
- // propagation mode).
- err = mount.MakeMount(home)
- if err != nil {
- return nil, errors.Wrapf(err, "failed to make %s a mount", home)
- }
- driver := &Driver{
- home: home,
- uidMaps: uidMaps,
- gidMaps: gidMaps,
- options: opt,
- }
- if userDiskQuota {
- if err := driver.subvolEnableQuota(); err != nil {
- return nil, err
- }
- }
- return graphdriver.NewNaiveDiffDriver(driver, uidMaps, gidMaps), nil
- }
- func parseOptions(opt []string) (btrfsOptions, bool, error) {
- var options btrfsOptions
- userDiskQuota := false
- for _, option := range opt {
- key, val, err := parsers.ParseKeyValueOpt(option)
- if err != nil {
- return options, userDiskQuota, err
- }
- key = strings.ToLower(key)
- switch key {
- case "btrfs.min_space":
- minSpace, err := units.RAMInBytes(val)
- if err != nil {
- return options, userDiskQuota, err
- }
- userDiskQuota = true
- options.minSpace = uint64(minSpace)
- default:
- return options, userDiskQuota, fmt.Errorf("Unknown option %s", key)
- }
- }
- return options, userDiskQuota, nil
- }
- // Driver contains information about the filesystem mounted.
- type Driver struct {
- // root of the file system
- home string
- uidMaps []idtools.IDMap
- gidMaps []idtools.IDMap
- options btrfsOptions
- quotaEnabled bool
- once sync.Once
- }
- // String prints the name of the driver (btrfs).
- func (d *Driver) String() string {
- return "btrfs"
- }
- // Status returns current driver information in a two dimensional string array.
- // Output contains "Build Version" and "Library Version" of the btrfs libraries used.
- // Version information can be used to check compatibility with your kernel.
- func (d *Driver) Status() [][2]string {
- status := [][2]string{}
- if bv := btrfsBuildVersion(); bv != "-" {
- status = append(status, [2]string{"Build Version", bv})
- }
- if lv := btrfsLibVersion(); lv != -1 {
- status = append(status, [2]string{"Library Version", fmt.Sprintf("%d", lv)})
- }
- return status
- }
- // GetMetadata returns empty metadata for this driver.
- func (d *Driver) GetMetadata(id string) (map[string]string, error) {
- return nil, nil
- }
- // Cleanup unmounts the home directory.
- func (d *Driver) Cleanup() error {
- err := d.subvolDisableQuota()
- umountErr := mount.Unmount(d.home)
- // in case we have two errors, prefer the one from disableQuota()
- if err != nil {
- return err
- }
- if umountErr != nil {
- return umountErr
- }
- return nil
- }
- func free(p *C.char) {
- C.free(unsafe.Pointer(p))
- }
- func openDir(path string) (*C.DIR, error) {
- Cpath := C.CString(path)
- defer free(Cpath)
- dir := C.opendir(Cpath)
- if dir == nil {
- return nil, fmt.Errorf("Can't open dir")
- }
- return dir, nil
- }
- func closeDir(dir *C.DIR) {
- if dir != nil {
- C.closedir(dir)
- }
- }
- func getDirFd(dir *C.DIR) uintptr {
- return uintptr(C.dirfd(dir))
- }
- func subvolCreate(path, name string) error {
- dir, err := openDir(path)
- if err != nil {
- return err
- }
- defer closeDir(dir)
- var args C.struct_btrfs_ioctl_vol_args
- for i, c := range []byte(name) {
- args.name[i] = C.char(c)
- }
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_SUBVOL_CREATE,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return fmt.Errorf("Failed to create btrfs subvolume: %v", errno.Error())
- }
- return nil
- }
- func subvolSnapshot(src, dest, name string) error {
- srcDir, err := openDir(src)
- if err != nil {
- return err
- }
- defer closeDir(srcDir)
- destDir, err := openDir(dest)
- if err != nil {
- return err
- }
- defer closeDir(destDir)
- var args C.struct_btrfs_ioctl_vol_args_v2
- args.fd = C.__s64(getDirFd(srcDir))
- var cs = C.CString(name)
- C.set_name_btrfs_ioctl_vol_args_v2(&args, cs)
- C.free(unsafe.Pointer(cs))
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(destDir), C.BTRFS_IOC_SNAP_CREATE_V2,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return fmt.Errorf("Failed to create btrfs snapshot: %v", errno.Error())
- }
- return nil
- }
- func isSubvolume(p string) (bool, error) {
- var bufStat unix.Stat_t
- if err := unix.Lstat(p, &bufStat); err != nil {
- return false, err
- }
- // return true if it is a btrfs subvolume
- return bufStat.Ino == C.BTRFS_FIRST_FREE_OBJECTID, nil
- }
- func subvolDelete(dirpath, name string, quotaEnabled bool) error {
- dir, err := openDir(dirpath)
- if err != nil {
- return err
- }
- defer closeDir(dir)
- fullPath := path.Join(dirpath, name)
- var args C.struct_btrfs_ioctl_vol_args
- // walk the btrfs subvolumes
- walkSubvolumes := func(p string, f os.FileInfo, err error) error {
- if err != nil {
- if os.IsNotExist(err) && p != fullPath {
- // missing most likely because the path was a subvolume that got removed in the previous iteration
- // since it's gone anyway, we don't care
- return nil
- }
- return fmt.Errorf("error walking subvolumes: %v", err)
- }
- // we want to check children only so skip itself
- // it will be removed after the filepath walk anyways
- if f.IsDir() && p != fullPath {
- sv, err := isSubvolume(p)
- if err != nil {
- return fmt.Errorf("Failed to test if %s is a btrfs subvolume: %v", p, err)
- }
- if sv {
- if err := subvolDelete(path.Dir(p), f.Name(), quotaEnabled); err != nil {
- return fmt.Errorf("Failed to destroy btrfs child subvolume (%s) of parent (%s): %v", p, dirpath, err)
- }
- }
- }
- return nil
- }
- if err := filepath.Walk(path.Join(dirpath, name), walkSubvolumes); err != nil {
- return fmt.Errorf("Recursively walking subvolumes for %s failed: %v", dirpath, err)
- }
- if quotaEnabled {
- if qgroupid, err := subvolLookupQgroup(fullPath); err == nil {
- var args C.struct_btrfs_ioctl_qgroup_create_args
- args.qgroupid = C.__u64(qgroupid)
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_QGROUP_CREATE,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- logrus.WithField("storage-driver", "btrfs").Errorf("Failed to delete btrfs qgroup %v for %s: %v", qgroupid, fullPath, errno.Error())
- }
- } else {
- logrus.WithField("storage-driver", "btrfs").Errorf("Failed to lookup btrfs qgroup for %s: %v", fullPath, err.Error())
- }
- }
- // all subvolumes have been removed
- // now remove the one originally passed in
- for i, c := range []byte(name) {
- args.name[i] = C.char(c)
- }
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_SNAP_DESTROY,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return fmt.Errorf("Failed to destroy btrfs snapshot %s for %s: %v", dirpath, name, errno.Error())
- }
- return nil
- }
- func (d *Driver) updateQuotaStatus() {
- d.once.Do(func() {
- if !d.quotaEnabled {
- // In case quotaEnabled is not set, check qgroup and update quotaEnabled as needed
- if err := subvolQgroupStatus(d.home); err != nil {
- // quota is still not enabled
- return
- }
- d.quotaEnabled = true
- }
- })
- }
- func (d *Driver) subvolEnableQuota() error {
- d.updateQuotaStatus()
- if d.quotaEnabled {
- return nil
- }
- dir, err := openDir(d.home)
- if err != nil {
- return err
- }
- defer closeDir(dir)
- var args C.struct_btrfs_ioctl_quota_ctl_args
- args.cmd = C.BTRFS_QUOTA_CTL_ENABLE
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_QUOTA_CTL,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return fmt.Errorf("Failed to enable btrfs quota for %s: %v", dir, errno.Error())
- }
- d.quotaEnabled = true
- return nil
- }
- func (d *Driver) subvolDisableQuota() error {
- d.updateQuotaStatus()
- if !d.quotaEnabled {
- return nil
- }
- dir, err := openDir(d.home)
- if err != nil {
- return err
- }
- defer closeDir(dir)
- var args C.struct_btrfs_ioctl_quota_ctl_args
- args.cmd = C.BTRFS_QUOTA_CTL_DISABLE
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_QUOTA_CTL,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return fmt.Errorf("Failed to disable btrfs quota for %s: %v", dir, errno.Error())
- }
- d.quotaEnabled = false
- return nil
- }
- func (d *Driver) subvolRescanQuota() error {
- d.updateQuotaStatus()
- if !d.quotaEnabled {
- return nil
- }
- dir, err := openDir(d.home)
- if err != nil {
- return err
- }
- defer closeDir(dir)
- var args C.struct_btrfs_ioctl_quota_rescan_args
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_QUOTA_RESCAN_WAIT,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return fmt.Errorf("Failed to rescan btrfs quota for %s: %v", dir, errno.Error())
- }
- return nil
- }
- func subvolLimitQgroup(path string, size uint64) error {
- dir, err := openDir(path)
- if err != nil {
- return err
- }
- defer closeDir(dir)
- var args C.struct_btrfs_ioctl_qgroup_limit_args
- args.lim.max_referenced = C.__u64(size)
- args.lim.flags = C.BTRFS_QGROUP_LIMIT_MAX_RFER
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_QGROUP_LIMIT,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return fmt.Errorf("Failed to limit qgroup for %s: %v", dir, errno.Error())
- }
- return nil
- }
- // subvolQgroupStatus performs a BTRFS_IOC_TREE_SEARCH on the root path
- // with search key of BTRFS_QGROUP_STATUS_KEY.
- // In case qgroup is enabled, the retuned key type will match BTRFS_QGROUP_STATUS_KEY.
- // For more details please see https://github.com/kdave/btrfs-progs/blob/v4.9/qgroup.c#L1035
- func subvolQgroupStatus(path string) error {
- dir, err := openDir(path)
- if err != nil {
- return err
- }
- defer closeDir(dir)
- var args C.struct_btrfs_ioctl_search_args
- args.key.tree_id = C.BTRFS_QUOTA_TREE_OBJECTID
- args.key.min_type = C.BTRFS_QGROUP_STATUS_KEY
- args.key.max_type = C.BTRFS_QGROUP_STATUS_KEY
- args.key.max_objectid = C.__u64(math.MaxUint64)
- args.key.max_offset = C.__u64(math.MaxUint64)
- args.key.max_transid = C.__u64(math.MaxUint64)
- args.key.nr_items = 4096
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_TREE_SEARCH,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return fmt.Errorf("Failed to search qgroup for %s: %v", path, errno.Error())
- }
- sh := (*C.struct_btrfs_ioctl_search_header)(unsafe.Pointer(&args.buf))
- if sh._type != C.BTRFS_QGROUP_STATUS_KEY {
- return fmt.Errorf("Invalid qgroup search header type for %s: %v", path, sh._type)
- }
- return nil
- }
- func subvolLookupQgroup(path string) (uint64, error) {
- dir, err := openDir(path)
- if err != nil {
- return 0, err
- }
- defer closeDir(dir)
- var args C.struct_btrfs_ioctl_ino_lookup_args
- args.objectid = C.BTRFS_FIRST_FREE_OBJECTID
- _, _, errno := unix.Syscall(unix.SYS_IOCTL, getDirFd(dir), C.BTRFS_IOC_INO_LOOKUP,
- uintptr(unsafe.Pointer(&args)))
- if errno != 0 {
- return 0, fmt.Errorf("Failed to lookup qgroup for %s: %v", dir, errno.Error())
- }
- if args.treeid == 0 {
- return 0, fmt.Errorf("Invalid qgroup id for %s: 0", dir)
- }
- return uint64(args.treeid), nil
- }
- func (d *Driver) subvolumesDir() string {
- return path.Join(d.home, "subvolumes")
- }
- func (d *Driver) subvolumesDirID(id string) string {
- return path.Join(d.subvolumesDir(), id)
- }
- func (d *Driver) quotasDir() string {
- return path.Join(d.home, "quotas")
- }
- func (d *Driver) quotasDirID(id string) string {
- return path.Join(d.quotasDir(), id)
- }
- // CreateReadWrite creates a layer that is writable for use as a container
- // file system.
- func (d *Driver) CreateReadWrite(id, parent string, opts *graphdriver.CreateOpts) error {
- return d.Create(id, parent, opts)
- }
- // Create the filesystem with given id.
- func (d *Driver) Create(id, parent string, opts *graphdriver.CreateOpts) error {
- quotas := path.Join(d.home, "quotas")
- subvolumes := path.Join(d.home, "subvolumes")
- rootUID, rootGID, err := idtools.GetRootUIDGID(d.uidMaps, d.gidMaps)
- if err != nil {
- return err
- }
- if err := idtools.MkdirAllAndChown(subvolumes, 0700, idtools.Identity{UID: rootUID, GID: rootGID}); err != nil {
- return err
- }
- if parent == "" {
- if err := subvolCreate(subvolumes, id); err != nil {
- return err
- }
- } else {
- parentDir := d.subvolumesDirID(parent)
- st, err := os.Stat(parentDir)
- if err != nil {
- return err
- }
- if !st.IsDir() {
- return fmt.Errorf("%s: not a directory", parentDir)
- }
- if err := subvolSnapshot(parentDir, subvolumes, id); err != nil {
- return err
- }
- }
- var storageOpt map[string]string
- if opts != nil {
- storageOpt = opts.StorageOpt
- }
- if _, ok := storageOpt["size"]; ok {
- driver := &Driver{}
- if err := d.parseStorageOpt(storageOpt, driver); err != nil {
- return err
- }
- if err := d.setStorageSize(path.Join(subvolumes, id), driver); err != nil {
- return err
- }
- if err := idtools.MkdirAllAndChown(quotas, 0700, idtools.Identity{UID: rootUID, GID: rootGID}); err != nil {
- return err
- }
- if err := ioutil.WriteFile(path.Join(quotas, id), []byte(fmt.Sprint(driver.options.size)), 0644); err != nil {
- return err
- }
- }
- // if we have a remapped root (user namespaces enabled), change the created snapshot
- // dir ownership to match
- if rootUID != 0 || rootGID != 0 {
- if err := os.Chown(path.Join(subvolumes, id), rootUID, rootGID); err != nil {
- return err
- }
- }
- mountLabel := ""
- if opts != nil {
- mountLabel = opts.MountLabel
- }
- return label.Relabel(path.Join(subvolumes, id), mountLabel, false)
- }
- // Parse btrfs storage options
- func (d *Driver) parseStorageOpt(storageOpt map[string]string, driver *Driver) error {
- // Read size to change the subvolume disk quota per container
- for key, val := range storageOpt {
- key := strings.ToLower(key)
- switch key {
- case "size":
- size, err := units.RAMInBytes(val)
- if err != nil {
- return err
- }
- driver.options.size = uint64(size)
- default:
- return fmt.Errorf("Unknown option %s", key)
- }
- }
- return nil
- }
- // Set btrfs storage size
- func (d *Driver) setStorageSize(dir string, driver *Driver) error {
- if driver.options.size == 0 {
- return fmt.Errorf("btrfs: invalid storage size: %s", units.HumanSize(float64(driver.options.size)))
- }
- if d.options.minSpace > 0 && driver.options.size < d.options.minSpace {
- return fmt.Errorf("btrfs: storage size cannot be less than %s", units.HumanSize(float64(d.options.minSpace)))
- }
- if err := d.subvolEnableQuota(); err != nil {
- return err
- }
- return subvolLimitQgroup(dir, driver.options.size)
- }
- // Remove the filesystem with given id.
- func (d *Driver) Remove(id string) error {
- dir := d.subvolumesDirID(id)
- if _, err := os.Stat(dir); err != nil {
- return err
- }
- quotasDir := d.quotasDirID(id)
- if _, err := os.Stat(quotasDir); err == nil {
- if err := os.Remove(quotasDir); err != nil {
- return err
- }
- } else if !os.IsNotExist(err) {
- return err
- }
- // Call updateQuotaStatus() to invoke status update
- d.updateQuotaStatus()
- if err := subvolDelete(d.subvolumesDir(), id, d.quotaEnabled); err != nil {
- return err
- }
- if err := system.EnsureRemoveAll(dir); err != nil {
- return err
- }
- return d.subvolRescanQuota()
- }
- // Get the requested filesystem id.
- func (d *Driver) Get(id, mountLabel string) (containerfs.ContainerFS, error) {
- dir := d.subvolumesDirID(id)
- st, err := os.Stat(dir)
- if err != nil {
- return nil, err
- }
- if !st.IsDir() {
- return nil, fmt.Errorf("%s: not a directory", dir)
- }
- if quota, err := ioutil.ReadFile(d.quotasDirID(id)); err == nil {
- if size, err := strconv.ParseUint(string(quota), 10, 64); err == nil && size >= d.options.minSpace {
- if err := d.subvolEnableQuota(); err != nil {
- return nil, err
- }
- if err := subvolLimitQgroup(dir, size); err != nil {
- return nil, err
- }
- }
- }
- return containerfs.NewLocalContainerFS(dir), nil
- }
- // Put is not implemented for BTRFS as there is no cleanup required for the id.
- func (d *Driver) Put(id string) error {
- // Get() creates no runtime resources (like e.g. mounts)
- // so this doesn't need to do anything.
- return nil
- }
- // Exists checks if the id exists in the filesystem.
- func (d *Driver) Exists(id string) bool {
- dir := d.subvolumesDirID(id)
- _, err := os.Stat(dir)
- return err == nil
- }
|