1e9be9d5eSMiklos Szeredi /* 2e9be9d5eSMiklos Szeredi * 3e9be9d5eSMiklos Szeredi * Copyright (C) 2011 Novell Inc. 4e9be9d5eSMiklos Szeredi * 5e9be9d5eSMiklos Szeredi * This program is free software; you can redistribute it and/or modify it 6e9be9d5eSMiklos Szeredi * under the terms of the GNU General Public License version 2 as published by 7e9be9d5eSMiklos Szeredi * the Free Software Foundation. 8e9be9d5eSMiklos Szeredi */ 9e9be9d5eSMiklos Szeredi 10e9be9d5eSMiklos Szeredi #include <linux/fs.h> 11e9be9d5eSMiklos Szeredi #include <linux/slab.h> 125b825c3aSIngo Molnar #include <linux/cred.h> 13e9be9d5eSMiklos Szeredi #include <linux/xattr.h> 145201dc44SMiklos Szeredi #include <linux/posix_acl.h> 155f8415d6SAmir Goldstein #include <linux/ratelimit.h> 16e9be9d5eSMiklos Szeredi #include "overlayfs.h" 17e9be9d5eSMiklos Szeredi 18ba1e563cSChandan Rajendra 19e9be9d5eSMiklos Szeredi int ovl_setattr(struct dentry *dentry, struct iattr *attr) 20e9be9d5eSMiklos Szeredi { 21e9be9d5eSMiklos Szeredi int err; 22e9be9d5eSMiklos Szeredi struct dentry *upperdentry; 231175b6b8SVivek Goyal const struct cred *old_cred; 24e9be9d5eSMiklos Szeredi 25cf9a6784SMiklos Szeredi /* 26cf9a6784SMiklos Szeredi * Check for permissions before trying to copy-up. This is redundant 27cf9a6784SMiklos Szeredi * since it will be rechecked later by ->setattr() on upper dentry. But 28cf9a6784SMiklos Szeredi * without this, copy-up can be triggered by just about anybody. 29cf9a6784SMiklos Szeredi * 30cf9a6784SMiklos Szeredi * We don't initialize inode->size, which just means that 31cf9a6784SMiklos Szeredi * inode_newsize_ok() will always check against MAX_LFS_FILESIZE and not 32cf9a6784SMiklos Szeredi * check for a swapfile (which this won't be anyway). 33cf9a6784SMiklos Szeredi */ 3431051c85SJan Kara err = setattr_prepare(dentry, attr); 35cf9a6784SMiklos Szeredi if (err) 36cf9a6784SMiklos Szeredi return err; 37cf9a6784SMiklos Szeredi 38e9be9d5eSMiklos Szeredi err = ovl_want_write(dentry); 39e9be9d5eSMiklos Szeredi if (err) 40e9be9d5eSMiklos Szeredi goto out; 41e9be9d5eSMiklos Szeredi 42acff81ecSMiklos Szeredi err = ovl_copy_up(dentry); 43acff81ecSMiklos Szeredi if (!err) { 44e9be9d5eSMiklos Szeredi upperdentry = ovl_dentry_upper(dentry); 45acff81ecSMiklos Szeredi 46b99c2d91SMiklos Szeredi if (attr->ia_valid & (ATTR_KILL_SUID|ATTR_KILL_SGID)) 47b99c2d91SMiklos Szeredi attr->ia_valid &= ~ATTR_MODE; 48b99c2d91SMiklos Szeredi 495955102cSAl Viro inode_lock(upperdentry->d_inode); 501175b6b8SVivek Goyal old_cred = ovl_override_creds(dentry->d_sb); 51e9be9d5eSMiklos Szeredi err = notify_change(upperdentry, attr, NULL); 521175b6b8SVivek Goyal revert_creds(old_cred); 53b81de061SKonstantin Khlebnikov if (!err) 54b81de061SKonstantin Khlebnikov ovl_copyattr(upperdentry->d_inode, dentry->d_inode); 555955102cSAl Viro inode_unlock(upperdentry->d_inode); 56e9be9d5eSMiklos Szeredi } 57e9be9d5eSMiklos Szeredi ovl_drop_write(dentry); 58e9be9d5eSMiklos Szeredi out: 59e9be9d5eSMiklos Szeredi return err; 60e9be9d5eSMiklos Szeredi } 61e9be9d5eSMiklos Szeredi 62da309e8cSAmir Goldstein static int ovl_map_dev_ino(struct dentry *dentry, struct kstat *stat, 63da309e8cSAmir Goldstein struct ovl_layer *lower_layer) 64da309e8cSAmir Goldstein { 65da309e8cSAmir Goldstein bool samefs = ovl_same_sb(dentry->d_sb); 66e487d889SAmir Goldstein unsigned int xinobits = ovl_xino_bits(dentry->d_sb); 67da309e8cSAmir Goldstein 68da309e8cSAmir Goldstein if (samefs) { 69da309e8cSAmir Goldstein /* 70da309e8cSAmir Goldstein * When all layers are on the same fs, all real inode 71da309e8cSAmir Goldstein * number are unique, so we use the overlay st_dev, 72da309e8cSAmir Goldstein * which is friendly to du -x. 73da309e8cSAmir Goldstein */ 74da309e8cSAmir Goldstein stat->dev = dentry->d_sb->s_dev; 75e487d889SAmir Goldstein return 0; 76e487d889SAmir Goldstein } else if (xinobits) { 77e487d889SAmir Goldstein unsigned int shift = 64 - xinobits; 78e487d889SAmir Goldstein /* 79e487d889SAmir Goldstein * All inode numbers of underlying fs should not be using the 80e487d889SAmir Goldstein * high xinobits, so we use high xinobits to partition the 81e487d889SAmir Goldstein * overlay st_ino address space. The high bits holds the fsid 82e487d889SAmir Goldstein * (upper fsid is 0). This way overlay inode numbers are unique 83e487d889SAmir Goldstein * and all inodes use overlay st_dev. Inode numbers are also 84e487d889SAmir Goldstein * persistent for a given layer configuration. 85e487d889SAmir Goldstein */ 86e487d889SAmir Goldstein if (stat->ino >> shift) { 87e487d889SAmir Goldstein pr_warn_ratelimited("overlayfs: inode number too big (%pd2, ino=%llu, xinobits=%d)\n", 88e487d889SAmir Goldstein dentry, stat->ino, xinobits); 89e487d889SAmir Goldstein } else { 90e487d889SAmir Goldstein if (lower_layer) 91e487d889SAmir Goldstein stat->ino |= ((u64)lower_layer->fsid) << shift; 92e487d889SAmir Goldstein 93e487d889SAmir Goldstein stat->dev = dentry->d_sb->s_dev; 94e487d889SAmir Goldstein return 0; 95e487d889SAmir Goldstein } 96e487d889SAmir Goldstein } 97e487d889SAmir Goldstein 98e487d889SAmir Goldstein /* The inode could not be mapped to a unified st_ino address space */ 99e487d889SAmir Goldstein if (S_ISDIR(dentry->d_inode->i_mode)) { 100da309e8cSAmir Goldstein /* 101da309e8cSAmir Goldstein * Always use the overlay st_dev for directories, so 'find 102da309e8cSAmir Goldstein * -xdev' will scan the entire overlay mount and won't cross the 103da309e8cSAmir Goldstein * overlay mount boundaries. 104da309e8cSAmir Goldstein * 105da309e8cSAmir Goldstein * If not all layers are on the same fs the pair {real st_ino; 106da309e8cSAmir Goldstein * overlay st_dev} is not unique, so use the non persistent 107da309e8cSAmir Goldstein * overlay st_ino for directories. 108da309e8cSAmir Goldstein */ 109da309e8cSAmir Goldstein stat->dev = dentry->d_sb->s_dev; 110da309e8cSAmir Goldstein stat->ino = dentry->d_inode->i_ino; 1115148626bSAmir Goldstein } else if (lower_layer && lower_layer->fsid) { 112da309e8cSAmir Goldstein /* 113da309e8cSAmir Goldstein * For non-samefs setup, if we cannot map all layers st_ino 114da309e8cSAmir Goldstein * to a unified address space, we need to make sure that st_dev 1155148626bSAmir Goldstein * is unique per lower fs. Upper layer uses real st_dev and 1165148626bSAmir Goldstein * lower layers use the unique anonymous bdev assigned to the 1175148626bSAmir Goldstein * lower fs. 118da309e8cSAmir Goldstein */ 1195148626bSAmir Goldstein stat->dev = lower_layer->fs->pseudo_dev; 120da309e8cSAmir Goldstein } 121da309e8cSAmir Goldstein 122da309e8cSAmir Goldstein return 0; 123da309e8cSAmir Goldstein } 124da309e8cSAmir Goldstein 1255b712091SMiklos Szeredi int ovl_getattr(const struct path *path, struct kstat *stat, 126a528d35eSDavid Howells u32 request_mask, unsigned int flags) 127e9be9d5eSMiklos Szeredi { 128a528d35eSDavid Howells struct dentry *dentry = path->dentry; 12972b608f0SAmir Goldstein enum ovl_path_type type; 130e9be9d5eSMiklos Szeredi struct path realpath; 1311175b6b8SVivek Goyal const struct cred *old_cred; 1325b712091SMiklos Szeredi bool is_dir = S_ISDIR(dentry->d_inode->i_mode); 133a0c5ad30SAmir Goldstein bool samefs = ovl_same_sb(dentry->d_sb); 134da309e8cSAmir Goldstein struct ovl_layer *lower_layer = NULL; 1351175b6b8SVivek Goyal int err; 136e9be9d5eSMiklos Szeredi 13772b608f0SAmir Goldstein type = ovl_path_real(dentry, &realpath); 1381175b6b8SVivek Goyal old_cred = ovl_override_creds(dentry->d_sb); 139a528d35eSDavid Howells err = vfs_getattr(&realpath, stat, request_mask, flags); 14072b608f0SAmir Goldstein if (err) 14172b608f0SAmir Goldstein goto out; 14272b608f0SAmir Goldstein 14372b608f0SAmir Goldstein /* 144da309e8cSAmir Goldstein * For non-dir or same fs, we use st_ino of the copy up origin. 145da309e8cSAmir Goldstein * This guaranties constant st_dev/st_ino across copy up. 146e487d889SAmir Goldstein * With xino feature and non-samefs, we use st_ino of the copy up 147e487d889SAmir Goldstein * origin masked with high bits that represent the layer id. 14872b608f0SAmir Goldstein * 149da309e8cSAmir Goldstein * If lower filesystem supports NFS file handles, this also guaranties 15072b608f0SAmir Goldstein * persistent st_ino across mount cycle. 15172b608f0SAmir Goldstein */ 152e487d889SAmir Goldstein if (!is_dir || samefs || ovl_xino_bits(dentry->d_sb)) { 153da309e8cSAmir Goldstein if (!OVL_TYPE_UPPER(type)) { 154da309e8cSAmir Goldstein lower_layer = ovl_layer_lower(dentry); 155da309e8cSAmir Goldstein } else if (OVL_TYPE_ORIGIN(type)) { 15672b608f0SAmir Goldstein struct kstat lowerstat; 1575b712091SMiklos Szeredi u32 lowermask = STATX_INO | (!is_dir ? STATX_NLINK : 0); 15872b608f0SAmir Goldstein 15972b608f0SAmir Goldstein ovl_path_lower(dentry, &realpath); 16072b608f0SAmir Goldstein err = vfs_getattr(&realpath, &lowerstat, 1615b712091SMiklos Szeredi lowermask, flags); 16272b608f0SAmir Goldstein if (err) 16372b608f0SAmir Goldstein goto out; 16472b608f0SAmir Goldstein 16572b608f0SAmir Goldstein /* 166359f392cSAmir Goldstein * Lower hardlinks may be broken on copy up to different 16772b608f0SAmir Goldstein * upper files, so we cannot use the lower origin st_ino 16872b608f0SAmir Goldstein * for those different files, even for the same fs case. 16986eaa130SAmir Goldstein * 17086eaa130SAmir Goldstein * Similarly, several redirected dirs can point to the 17186eaa130SAmir Goldstein * same dir on a lower layer. With the "verify_lower" 17286eaa130SAmir Goldstein * feature, we do not use the lower origin st_ino, if 17386eaa130SAmir Goldstein * we haven't verified that this redirect is unique. 17486eaa130SAmir Goldstein * 175359f392cSAmir Goldstein * With inodes index enabled, it is safe to use st_ino 17686eaa130SAmir Goldstein * of an indexed origin. The index validates that the 17786eaa130SAmir Goldstein * upper hardlink is not broken and that a redirected 17886eaa130SAmir Goldstein * dir is the only redirect to that origin. 17972b608f0SAmir Goldstein */ 18086eaa130SAmir Goldstein if (ovl_test_flag(OVL_INDEX, d_inode(dentry)) || 18186eaa130SAmir Goldstein (!ovl_verify_lower(dentry->d_sb) && 1829f99e50dSAmir Goldstein (is_dir || lowerstat.nlink == 1))) { 18372b608f0SAmir Goldstein stat->ino = lowerstat.ino; 184da309e8cSAmir Goldstein lower_layer = ovl_layer_lower(dentry); 18572b608f0SAmir Goldstein } 1869f99e50dSAmir Goldstein } 187a0c5ad30SAmir Goldstein } 188da309e8cSAmir Goldstein 189da309e8cSAmir Goldstein err = ovl_map_dev_ino(dentry, stat, lower_layer); 190da309e8cSAmir Goldstein if (err) 191da309e8cSAmir Goldstein goto out; 1925b712091SMiklos Szeredi 1935b712091SMiklos Szeredi /* 1945b712091SMiklos Szeredi * It's probably not worth it to count subdirs to get the 1955b712091SMiklos Szeredi * correct link count. nlink=1 seems to pacify 'find' and 1965b712091SMiklos Szeredi * other utilities. 1975b712091SMiklos Szeredi */ 1985b712091SMiklos Szeredi if (is_dir && OVL_TYPE_MERGE(type)) 1995b712091SMiklos Szeredi stat->nlink = 1; 2005b712091SMiklos Szeredi 2015f8415d6SAmir Goldstein /* 2025f8415d6SAmir Goldstein * Return the overlay inode nlinks for indexed upper inodes. 2035f8415d6SAmir Goldstein * Overlay inode nlink counts the union of the upper hardlinks 2045f8415d6SAmir Goldstein * and non-covered lower hardlinks. It does not include the upper 2055f8415d6SAmir Goldstein * index hardlink. 2065f8415d6SAmir Goldstein */ 2075f8415d6SAmir Goldstein if (!is_dir && ovl_test_flag(OVL_INDEX, d_inode(dentry))) 2085f8415d6SAmir Goldstein stat->nlink = dentry->d_inode->i_nlink; 2095f8415d6SAmir Goldstein 21072b608f0SAmir Goldstein out: 2111175b6b8SVivek Goyal revert_creds(old_cred); 21272b608f0SAmir Goldstein 2131175b6b8SVivek Goyal return err; 214e9be9d5eSMiklos Szeredi } 215e9be9d5eSMiklos Szeredi 216e9be9d5eSMiklos Szeredi int ovl_permission(struct inode *inode, int mask) 217e9be9d5eSMiklos Szeredi { 21809d8b586SMiklos Szeredi struct inode *upperinode = ovl_inode_upper(inode); 21909d8b586SMiklos Szeredi struct inode *realinode = upperinode ?: ovl_inode_lower(inode); 220c0ca3d70SVivek Goyal const struct cred *old_cred; 221e9be9d5eSMiklos Szeredi int err; 222e9be9d5eSMiklos Szeredi 223e9be9d5eSMiklos Szeredi /* Careful in RCU walk mode */ 224e9be9d5eSMiklos Szeredi if (!realinode) { 225e9be9d5eSMiklos Szeredi WARN_ON(!(mask & MAY_NOT_BLOCK)); 226a999d7e1SMiklos Szeredi return -ECHILD; 227e9be9d5eSMiklos Szeredi } 228e9be9d5eSMiklos Szeredi 229c0ca3d70SVivek Goyal /* 230c0ca3d70SVivek Goyal * Check overlay inode with the creds of task and underlying inode 231c0ca3d70SVivek Goyal * with creds of mounter 232c0ca3d70SVivek Goyal */ 233c0ca3d70SVivek Goyal err = generic_permission(inode, mask); 234c0ca3d70SVivek Goyal if (err) 235c0ca3d70SVivek Goyal return err; 236c0ca3d70SVivek Goyal 237c0ca3d70SVivek Goyal old_cred = ovl_override_creds(inode->i_sb); 23809d8b586SMiklos Szeredi if (!upperinode && 23909d8b586SMiklos Szeredi !special_file(realinode->i_mode) && mask & MAY_WRITE) { 240754f8cb7SVivek Goyal mask &= ~(MAY_WRITE | MAY_APPEND); 241500cac3cSVivek Goyal /* Make sure mounter can read file for copy up later */ 242500cac3cSVivek Goyal mask |= MAY_READ; 243500cac3cSVivek Goyal } 2449c630ebeSMiklos Szeredi err = inode_permission(realinode, mask); 245c0ca3d70SVivek Goyal revert_creds(old_cred); 246c0ca3d70SVivek Goyal 247c0ca3d70SVivek Goyal return err; 248e9be9d5eSMiklos Szeredi } 249e9be9d5eSMiklos Szeredi 2506b255391SAl Viro static const char *ovl_get_link(struct dentry *dentry, 251fceef393SAl Viro struct inode *inode, 252fceef393SAl Viro struct delayed_call *done) 253e9be9d5eSMiklos Szeredi { 2541175b6b8SVivek Goyal const struct cred *old_cred; 2551175b6b8SVivek Goyal const char *p; 256e9be9d5eSMiklos Szeredi 2576b255391SAl Viro if (!dentry) 2586b255391SAl Viro return ERR_PTR(-ECHILD); 2596b255391SAl Viro 2601175b6b8SVivek Goyal old_cred = ovl_override_creds(dentry->d_sb); 2617764235bSMiklos Szeredi p = vfs_get_link(ovl_dentry_real(dentry), done); 2621175b6b8SVivek Goyal revert_creds(old_cred); 2631175b6b8SVivek Goyal return p; 264e9be9d5eSMiklos Szeredi } 265e9be9d5eSMiklos Szeredi 2660956254aSMiklos Szeredi bool ovl_is_private_xattr(const char *name) 267e9be9d5eSMiklos Szeredi { 268fe2b7595SAndreas Gruenbacher return strncmp(name, OVL_XATTR_PREFIX, 269fe2b7595SAndreas Gruenbacher sizeof(OVL_XATTR_PREFIX) - 1) == 0; 270e9be9d5eSMiklos Szeredi } 271e9be9d5eSMiklos Szeredi 2721d88f183SMiklos Szeredi int ovl_xattr_set(struct dentry *dentry, struct inode *inode, const char *name, 2731d88f183SMiklos Szeredi const void *value, size_t size, int flags) 274e9be9d5eSMiklos Szeredi { 275e9be9d5eSMiklos Szeredi int err; 2761d88f183SMiklos Szeredi struct dentry *upperdentry = ovl_i_dentry_upper(inode); 2771d88f183SMiklos Szeredi struct dentry *realdentry = upperdentry ?: ovl_dentry_lower(dentry); 2781175b6b8SVivek Goyal const struct cred *old_cred; 279e9be9d5eSMiklos Szeredi 280e9be9d5eSMiklos Szeredi err = ovl_want_write(dentry); 281e9be9d5eSMiklos Szeredi if (err) 282e9be9d5eSMiklos Szeredi goto out; 283e9be9d5eSMiklos Szeredi 2841d88f183SMiklos Szeredi if (!value && !upperdentry) { 2851d88f183SMiklos Szeredi err = vfs_getxattr(realdentry, name, NULL, 0); 2860e585cccSAndreas Gruenbacher if (err < 0) 2870e585cccSAndreas Gruenbacher goto out_drop_write; 2880e585cccSAndreas Gruenbacher } 2890e585cccSAndreas Gruenbacher 2901d88f183SMiklos Szeredi if (!upperdentry) { 291e9be9d5eSMiklos Szeredi err = ovl_copy_up(dentry); 292e9be9d5eSMiklos Szeredi if (err) 293e9be9d5eSMiklos Szeredi goto out_drop_write; 294e9be9d5eSMiklos Szeredi 2951d88f183SMiklos Szeredi realdentry = ovl_dentry_upper(dentry); 2961d88f183SMiklos Szeredi } 2970e585cccSAndreas Gruenbacher 2981175b6b8SVivek Goyal old_cred = ovl_override_creds(dentry->d_sb); 2990e585cccSAndreas Gruenbacher if (value) 3001d88f183SMiklos Szeredi err = vfs_setxattr(realdentry, name, value, size, flags); 3010e585cccSAndreas Gruenbacher else { 3020e585cccSAndreas Gruenbacher WARN_ON(flags != XATTR_REPLACE); 3031d88f183SMiklos Szeredi err = vfs_removexattr(realdentry, name); 3040e585cccSAndreas Gruenbacher } 3051175b6b8SVivek Goyal revert_creds(old_cred); 306e9be9d5eSMiklos Szeredi 307e9be9d5eSMiklos Szeredi out_drop_write: 308e9be9d5eSMiklos Szeredi ovl_drop_write(dentry); 309e9be9d5eSMiklos Szeredi out: 310e9be9d5eSMiklos Szeredi return err; 311e9be9d5eSMiklos Szeredi } 312e9be9d5eSMiklos Szeredi 3131d88f183SMiklos Szeredi int ovl_xattr_get(struct dentry *dentry, struct inode *inode, const char *name, 3140eb45fc3SAndreas Gruenbacher void *value, size_t size) 315e9be9d5eSMiklos Szeredi { 3161175b6b8SVivek Goyal ssize_t res; 3171175b6b8SVivek Goyal const struct cred *old_cred; 3181d88f183SMiklos Szeredi struct dentry *realdentry = 3191d88f183SMiklos Szeredi ovl_i_dentry_upper(inode) ?: ovl_dentry_lower(dentry); 32052148463SMiklos Szeredi 3211175b6b8SVivek Goyal old_cred = ovl_override_creds(dentry->d_sb); 3221175b6b8SVivek Goyal res = vfs_getxattr(realdentry, name, value, size); 3231175b6b8SVivek Goyal revert_creds(old_cred); 3241175b6b8SVivek Goyal return res; 325e9be9d5eSMiklos Szeredi } 326e9be9d5eSMiklos Szeredi 327a082c6f6SMiklos Szeredi static bool ovl_can_list(const char *s) 328a082c6f6SMiklos Szeredi { 329a082c6f6SMiklos Szeredi /* List all non-trusted xatts */ 330a082c6f6SMiklos Szeredi if (strncmp(s, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN) != 0) 331a082c6f6SMiklos Szeredi return true; 332a082c6f6SMiklos Szeredi 333a082c6f6SMiklos Szeredi /* Never list trusted.overlay, list other trusted for superuser only */ 334a082c6f6SMiklos Szeredi return !ovl_is_private_xattr(s) && capable(CAP_SYS_ADMIN); 335a082c6f6SMiklos Szeredi } 336a082c6f6SMiklos Szeredi 337e9be9d5eSMiklos Szeredi ssize_t ovl_listxattr(struct dentry *dentry, char *list, size_t size) 338e9be9d5eSMiklos Szeredi { 339b581755bSMiklos Szeredi struct dentry *realdentry = ovl_dentry_real(dentry); 340e9be9d5eSMiklos Szeredi ssize_t res; 3417cb35119SMiklos Szeredi size_t len; 3427cb35119SMiklos Szeredi char *s; 3431175b6b8SVivek Goyal const struct cred *old_cred; 344e9be9d5eSMiklos Szeredi 3451175b6b8SVivek Goyal old_cred = ovl_override_creds(dentry->d_sb); 346b581755bSMiklos Szeredi res = vfs_listxattr(realdentry, list, size); 3471175b6b8SVivek Goyal revert_creds(old_cred); 348e9be9d5eSMiklos Szeredi if (res <= 0 || size == 0) 349e9be9d5eSMiklos Szeredi return res; 350e9be9d5eSMiklos Szeredi 351e9be9d5eSMiklos Szeredi /* filter out private xattrs */ 3527cb35119SMiklos Szeredi for (s = list, len = res; len;) { 3537cb35119SMiklos Szeredi size_t slen = strnlen(s, len) + 1; 354e9be9d5eSMiklos Szeredi 3557cb35119SMiklos Szeredi /* underlying fs providing us with an broken xattr list? */ 3567cb35119SMiklos Szeredi if (WARN_ON(slen > len)) 3577cb35119SMiklos Szeredi return -EIO; 358e9be9d5eSMiklos Szeredi 3597cb35119SMiklos Szeredi len -= slen; 360a082c6f6SMiklos Szeredi if (!ovl_can_list(s)) { 361e9be9d5eSMiklos Szeredi res -= slen; 3627cb35119SMiklos Szeredi memmove(s, s + slen, len); 363e9be9d5eSMiklos Szeredi } else { 3647cb35119SMiklos Szeredi s += slen; 365e9be9d5eSMiklos Szeredi } 366e9be9d5eSMiklos Szeredi } 367e9be9d5eSMiklos Szeredi 368e9be9d5eSMiklos Szeredi return res; 369e9be9d5eSMiklos Szeredi } 370e9be9d5eSMiklos Szeredi 37139a25b2bSVivek Goyal struct posix_acl *ovl_get_acl(struct inode *inode, int type) 37239a25b2bSVivek Goyal { 37309d8b586SMiklos Szeredi struct inode *realinode = ovl_inode_real(inode); 3741175b6b8SVivek Goyal const struct cred *old_cred; 3751175b6b8SVivek Goyal struct posix_acl *acl; 37639a25b2bSVivek Goyal 3775201dc44SMiklos Szeredi if (!IS_ENABLED(CONFIG_FS_POSIX_ACL) || !IS_POSIXACL(realinode)) 37839a25b2bSVivek Goyal return NULL; 37939a25b2bSVivek Goyal 3801175b6b8SVivek Goyal old_cred = ovl_override_creds(inode->i_sb); 3815201dc44SMiklos Szeredi acl = get_acl(realinode, type); 3821175b6b8SVivek Goyal revert_creds(old_cred); 3831175b6b8SVivek Goyal 3841175b6b8SVivek Goyal return acl; 38539a25b2bSVivek Goyal } 38639a25b2bSVivek Goyal 38759be0971SAmir Goldstein static bool ovl_open_need_copy_up(struct dentry *dentry, int flags) 388e9be9d5eSMiklos Szeredi { 389aa3ff3c1SAmir Goldstein /* Copy up of disconnected dentry does not set upper alias */ 39059be0971SAmir Goldstein if (ovl_dentry_upper(dentry) && 391aa3ff3c1SAmir Goldstein (ovl_dentry_has_upper_alias(dentry) || 392aa3ff3c1SAmir Goldstein (dentry->d_flags & DCACHE_DISCONNECTED))) 393e9be9d5eSMiklos Szeredi return false; 394e9be9d5eSMiklos Szeredi 39559be0971SAmir Goldstein if (special_file(d_inode(dentry)->i_mode)) 396e9be9d5eSMiklos Szeredi return false; 397e9be9d5eSMiklos Szeredi 398e9be9d5eSMiklos Szeredi if (!(OPEN_FMODE(flags) & FMODE_WRITE) && !(flags & O_TRUNC)) 399e9be9d5eSMiklos Szeredi return false; 400e9be9d5eSMiklos Szeredi 401e9be9d5eSMiklos Szeredi return true; 402e9be9d5eSMiklos Szeredi } 403e9be9d5eSMiklos Szeredi 4042d902671SMiklos Szeredi int ovl_open_maybe_copy_up(struct dentry *dentry, unsigned int file_flags) 405e9be9d5eSMiklos Szeredi { 4062d902671SMiklos Szeredi int err = 0; 407e9be9d5eSMiklos Szeredi 40859be0971SAmir Goldstein if (ovl_open_need_copy_up(dentry, file_flags)) { 409e9be9d5eSMiklos Szeredi err = ovl_want_write(dentry); 4102d902671SMiklos Szeredi if (!err) { 4119aba6521SAmir Goldstein err = ovl_copy_up_flags(dentry, file_flags); 412f25801eeSDavid Howells ovl_drop_write(dentry); 4132d902671SMiklos Szeredi } 414e9be9d5eSMiklos Szeredi } 415e9be9d5eSMiklos Szeredi 4162d902671SMiklos Szeredi return err; 417e9be9d5eSMiklos Szeredi } 418e9be9d5eSMiklos Szeredi 419d719e8f2SMiklos Szeredi int ovl_update_time(struct inode *inode, struct timespec *ts, int flags) 420d719e8f2SMiklos Szeredi { 4218f35cf51SMiklos Szeredi if (flags & S_ATIME) { 4228f35cf51SMiklos Szeredi struct ovl_fs *ofs = inode->i_sb->s_fs_info; 4238f35cf51SMiklos Szeredi struct path upperpath = { 4248f35cf51SMiklos Szeredi .mnt = ofs->upper_mnt, 4258f35cf51SMiklos Szeredi .dentry = ovl_upperdentry_dereference(OVL_I(inode)), 4268f35cf51SMiklos Szeredi }; 427d719e8f2SMiklos Szeredi 428d719e8f2SMiklos Szeredi if (upperpath.dentry) { 429d719e8f2SMiklos Szeredi touch_atime(&upperpath); 430d719e8f2SMiklos Szeredi inode->i_atime = d_inode(upperpath.dentry)->i_atime; 431d719e8f2SMiklos Szeredi } 4328f35cf51SMiklos Szeredi } 433d719e8f2SMiklos Szeredi return 0; 434d719e8f2SMiklos Szeredi } 435d719e8f2SMiklos Szeredi 436e9be9d5eSMiklos Szeredi static const struct inode_operations ovl_file_inode_operations = { 437e9be9d5eSMiklos Szeredi .setattr = ovl_setattr, 438e9be9d5eSMiklos Szeredi .permission = ovl_permission, 439e9be9d5eSMiklos Szeredi .getattr = ovl_getattr, 440e9be9d5eSMiklos Szeredi .listxattr = ovl_listxattr, 44139a25b2bSVivek Goyal .get_acl = ovl_get_acl, 442d719e8f2SMiklos Szeredi .update_time = ovl_update_time, 443e9be9d5eSMiklos Szeredi }; 444e9be9d5eSMiklos Szeredi 445e9be9d5eSMiklos Szeredi static const struct inode_operations ovl_symlink_inode_operations = { 446e9be9d5eSMiklos Szeredi .setattr = ovl_setattr, 4476b255391SAl Viro .get_link = ovl_get_link, 448e9be9d5eSMiklos Szeredi .getattr = ovl_getattr, 449e9be9d5eSMiklos Szeredi .listxattr = ovl_listxattr, 450d719e8f2SMiklos Szeredi .update_time = ovl_update_time, 451e9be9d5eSMiklos Szeredi }; 452e9be9d5eSMiklos Szeredi 453b1eaa950SAmir Goldstein /* 454b1eaa950SAmir Goldstein * It is possible to stack overlayfs instance on top of another 455b1eaa950SAmir Goldstein * overlayfs instance as lower layer. We need to annonate the 456b1eaa950SAmir Goldstein * stackable i_mutex locks according to stack level of the super 457b1eaa950SAmir Goldstein * block instance. An overlayfs instance can never be in stack 458b1eaa950SAmir Goldstein * depth 0 (there is always a real fs below it). An overlayfs 459b1eaa950SAmir Goldstein * inode lock will use the lockdep annotaion ovl_i_mutex_key[depth]. 460b1eaa950SAmir Goldstein * 461b1eaa950SAmir Goldstein * For example, here is a snip from /proc/lockdep_chains after 462b1eaa950SAmir Goldstein * dir_iterate of nested overlayfs: 463b1eaa950SAmir Goldstein * 464b1eaa950SAmir Goldstein * [...] &ovl_i_mutex_dir_key[depth] (stack_depth=2) 465b1eaa950SAmir Goldstein * [...] &ovl_i_mutex_dir_key[depth]#2 (stack_depth=1) 466b1eaa950SAmir Goldstein * [...] &type->i_mutex_dir_key (stack_depth=0) 467b1eaa950SAmir Goldstein */ 468b1eaa950SAmir Goldstein #define OVL_MAX_NESTING FILESYSTEM_MAX_STACK_DEPTH 469b1eaa950SAmir Goldstein 470b1eaa950SAmir Goldstein static inline void ovl_lockdep_annotate_inode_mutex_key(struct inode *inode) 471b1eaa950SAmir Goldstein { 472b1eaa950SAmir Goldstein #ifdef CONFIG_LOCKDEP 473b1eaa950SAmir Goldstein static struct lock_class_key ovl_i_mutex_key[OVL_MAX_NESTING]; 474b1eaa950SAmir Goldstein static struct lock_class_key ovl_i_mutex_dir_key[OVL_MAX_NESTING]; 4754eae06deSAmir Goldstein static struct lock_class_key ovl_i_lock_key[OVL_MAX_NESTING]; 476b1eaa950SAmir Goldstein 477b1eaa950SAmir Goldstein int depth = inode->i_sb->s_stack_depth - 1; 478b1eaa950SAmir Goldstein 479b1eaa950SAmir Goldstein if (WARN_ON_ONCE(depth < 0 || depth >= OVL_MAX_NESTING)) 480b1eaa950SAmir Goldstein depth = 0; 481b1eaa950SAmir Goldstein 482b1eaa950SAmir Goldstein if (S_ISDIR(inode->i_mode)) 483b1eaa950SAmir Goldstein lockdep_set_class(&inode->i_rwsem, &ovl_i_mutex_dir_key[depth]); 484b1eaa950SAmir Goldstein else 485b1eaa950SAmir Goldstein lockdep_set_class(&inode->i_rwsem, &ovl_i_mutex_key[depth]); 4864eae06deSAmir Goldstein 4874eae06deSAmir Goldstein lockdep_set_class(&OVL_I(inode)->lock, &ovl_i_lock_key[depth]); 488b1eaa950SAmir Goldstein #endif 489b1eaa950SAmir Goldstein } 490b1eaa950SAmir Goldstein 491695b46e7SAmir Goldstein static void ovl_fill_inode(struct inode *inode, umode_t mode, dev_t rdev, 49212574a9fSAmir Goldstein unsigned long ino, int fsid) 493e9be9d5eSMiklos Szeredi { 49412574a9fSAmir Goldstein int xinobits = ovl_xino_bits(inode->i_sb); 49512574a9fSAmir Goldstein 496695b46e7SAmir Goldstein /* 497695b46e7SAmir Goldstein * When NFS export is enabled and d_ino is consistent with st_ino 49812574a9fSAmir Goldstein * (samefs or i_ino has enough bits to encode layer), set the same 49912574a9fSAmir Goldstein * value used for d_ino to i_ino, because nfsd readdirplus compares 50012574a9fSAmir Goldstein * d_ino values to i_ino values of child entries. When called from 50112574a9fSAmir Goldstein * ovl_new_inode(), ino arg is 0, so i_ino will be updated to real 502695b46e7SAmir Goldstein * upper inode i_ino on ovl_inode_init() or ovl_inode_update(). 503695b46e7SAmir Goldstein */ 50412574a9fSAmir Goldstein if (inode->i_sb->s_export_op && 50512574a9fSAmir Goldstein (ovl_same_sb(inode->i_sb) || xinobits)) { 506695b46e7SAmir Goldstein inode->i_ino = ino; 50712574a9fSAmir Goldstein if (xinobits && fsid && !(ino >> (64 - xinobits))) 50812574a9fSAmir Goldstein inode->i_ino |= (unsigned long)fsid << (64 - xinobits); 50912574a9fSAmir Goldstein } else { 510e9be9d5eSMiklos Szeredi inode->i_ino = get_next_ino(); 51112574a9fSAmir Goldstein } 512e9be9d5eSMiklos Szeredi inode->i_mode = mode; 513d719e8f2SMiklos Szeredi inode->i_flags |= S_NOCMTIME; 5142a3a2a3fSMiklos Szeredi #ifdef CONFIG_FS_POSIX_ACL 5152a3a2a3fSMiklos Szeredi inode->i_acl = inode->i_default_acl = ACL_DONT_CACHE; 5162a3a2a3fSMiklos Szeredi #endif 517e9be9d5eSMiklos Szeredi 518b1eaa950SAmir Goldstein ovl_lockdep_annotate_inode_mutex_key(inode); 519b1eaa950SAmir Goldstein 520ca4c8a3aSMiklos Szeredi switch (mode & S_IFMT) { 521ca4c8a3aSMiklos Szeredi case S_IFREG: 522ca4c8a3aSMiklos Szeredi inode->i_op = &ovl_file_inode_operations; 523ca4c8a3aSMiklos Szeredi break; 524ca4c8a3aSMiklos Szeredi 525e9be9d5eSMiklos Szeredi case S_IFDIR: 526e9be9d5eSMiklos Szeredi inode->i_op = &ovl_dir_inode_operations; 527e9be9d5eSMiklos Szeredi inode->i_fop = &ovl_dir_operations; 528e9be9d5eSMiklos Szeredi break; 529e9be9d5eSMiklos Szeredi 530e9be9d5eSMiklos Szeredi case S_IFLNK: 531e9be9d5eSMiklos Szeredi inode->i_op = &ovl_symlink_inode_operations; 532e9be9d5eSMiklos Szeredi break; 533e9be9d5eSMiklos Szeredi 53451f7e52dSMiklos Szeredi default: 535e9be9d5eSMiklos Szeredi inode->i_op = &ovl_file_inode_operations; 536ca4c8a3aSMiklos Szeredi init_special_inode(inode, mode, rdev); 537e9be9d5eSMiklos Szeredi break; 53851f7e52dSMiklos Szeredi } 53951f7e52dSMiklos Szeredi } 540e9be9d5eSMiklos Szeredi 5415f8415d6SAmir Goldstein /* 5425f8415d6SAmir Goldstein * With inodes index enabled, an overlay inode nlink counts the union of upper 5435f8415d6SAmir Goldstein * hardlinks and non-covered lower hardlinks. During the lifetime of a non-pure 5445f8415d6SAmir Goldstein * upper inode, the following nlink modifying operations can happen: 5455f8415d6SAmir Goldstein * 5465f8415d6SAmir Goldstein * 1. Lower hardlink copy up 5475f8415d6SAmir Goldstein * 2. Upper hardlink created, unlinked or renamed over 5485f8415d6SAmir Goldstein * 3. Lower hardlink whiteout or renamed over 5495f8415d6SAmir Goldstein * 5505f8415d6SAmir Goldstein * For the first, copy up case, the union nlink does not change, whether the 5515f8415d6SAmir Goldstein * operation succeeds or fails, but the upper inode nlink may change. 5525f8415d6SAmir Goldstein * Therefore, before copy up, we store the union nlink value relative to the 5535f8415d6SAmir Goldstein * lower inode nlink in the index inode xattr trusted.overlay.nlink. 5545f8415d6SAmir Goldstein * 5555f8415d6SAmir Goldstein * For the second, upper hardlink case, the union nlink should be incremented 5565f8415d6SAmir Goldstein * or decremented IFF the operation succeeds, aligned with nlink change of the 5575f8415d6SAmir Goldstein * upper inode. Therefore, before link/unlink/rename, we store the union nlink 5585f8415d6SAmir Goldstein * value relative to the upper inode nlink in the index inode. 5595f8415d6SAmir Goldstein * 5605f8415d6SAmir Goldstein * For the last, lower cover up case, we simplify things by preceding the 5615f8415d6SAmir Goldstein * whiteout or cover up with copy up. This makes sure that there is an index 5625f8415d6SAmir Goldstein * upper inode where the nlink xattr can be stored before the copied up upper 5635f8415d6SAmir Goldstein * entry is unlink. 5645f8415d6SAmir Goldstein */ 5655f8415d6SAmir Goldstein #define OVL_NLINK_ADD_UPPER (1 << 0) 5665f8415d6SAmir Goldstein 5675f8415d6SAmir Goldstein /* 5685f8415d6SAmir Goldstein * On-disk format for indexed nlink: 5695f8415d6SAmir Goldstein * 5705f8415d6SAmir Goldstein * nlink relative to the upper inode - "U[+-]NUM" 5715f8415d6SAmir Goldstein * nlink relative to the lower inode - "L[+-]NUM" 5725f8415d6SAmir Goldstein */ 5735f8415d6SAmir Goldstein 5745f8415d6SAmir Goldstein static int ovl_set_nlink_common(struct dentry *dentry, 5755f8415d6SAmir Goldstein struct dentry *realdentry, const char *format) 5765f8415d6SAmir Goldstein { 5775f8415d6SAmir Goldstein struct inode *inode = d_inode(dentry); 5785f8415d6SAmir Goldstein struct inode *realinode = d_inode(realdentry); 5795f8415d6SAmir Goldstein char buf[13]; 5805f8415d6SAmir Goldstein int len; 5815f8415d6SAmir Goldstein 5825f8415d6SAmir Goldstein len = snprintf(buf, sizeof(buf), format, 5835f8415d6SAmir Goldstein (int) (inode->i_nlink - realinode->i_nlink)); 5845f8415d6SAmir Goldstein 5856787341aSMiklos Szeredi if (WARN_ON(len >= sizeof(buf))) 5866787341aSMiklos Szeredi return -EIO; 5876787341aSMiklos Szeredi 5885f8415d6SAmir Goldstein return ovl_do_setxattr(ovl_dentry_upper(dentry), 5895f8415d6SAmir Goldstein OVL_XATTR_NLINK, buf, len, 0); 5905f8415d6SAmir Goldstein } 5915f8415d6SAmir Goldstein 5925f8415d6SAmir Goldstein int ovl_set_nlink_upper(struct dentry *dentry) 5935f8415d6SAmir Goldstein { 5945f8415d6SAmir Goldstein return ovl_set_nlink_common(dentry, ovl_dentry_upper(dentry), "U%+i"); 5955f8415d6SAmir Goldstein } 5965f8415d6SAmir Goldstein 5975f8415d6SAmir Goldstein int ovl_set_nlink_lower(struct dentry *dentry) 5985f8415d6SAmir Goldstein { 5995f8415d6SAmir Goldstein return ovl_set_nlink_common(dentry, ovl_dentry_lower(dentry), "L%+i"); 6005f8415d6SAmir Goldstein } 6015f8415d6SAmir Goldstein 602caf70cb2SAmir Goldstein unsigned int ovl_get_nlink(struct dentry *lowerdentry, 6035f8415d6SAmir Goldstein struct dentry *upperdentry, 6045f8415d6SAmir Goldstein unsigned int fallback) 6055f8415d6SAmir Goldstein { 6065f8415d6SAmir Goldstein int nlink_diff; 6075f8415d6SAmir Goldstein int nlink; 6085f8415d6SAmir Goldstein char buf[13]; 6095f8415d6SAmir Goldstein int err; 6105f8415d6SAmir Goldstein 6115f8415d6SAmir Goldstein if (!lowerdentry || !upperdentry || d_inode(lowerdentry)->i_nlink == 1) 6125f8415d6SAmir Goldstein return fallback; 6135f8415d6SAmir Goldstein 6145f8415d6SAmir Goldstein err = vfs_getxattr(upperdentry, OVL_XATTR_NLINK, &buf, sizeof(buf) - 1); 6155f8415d6SAmir Goldstein if (err < 0) 6165f8415d6SAmir Goldstein goto fail; 6175f8415d6SAmir Goldstein 6185f8415d6SAmir Goldstein buf[err] = '\0'; 6195f8415d6SAmir Goldstein if ((buf[0] != 'L' && buf[0] != 'U') || 6205f8415d6SAmir Goldstein (buf[1] != '+' && buf[1] != '-')) 6215f8415d6SAmir Goldstein goto fail; 6225f8415d6SAmir Goldstein 6235f8415d6SAmir Goldstein err = kstrtoint(buf + 1, 10, &nlink_diff); 6245f8415d6SAmir Goldstein if (err < 0) 6255f8415d6SAmir Goldstein goto fail; 6265f8415d6SAmir Goldstein 6275f8415d6SAmir Goldstein nlink = d_inode(buf[0] == 'L' ? lowerdentry : upperdentry)->i_nlink; 6285f8415d6SAmir Goldstein nlink += nlink_diff; 6295f8415d6SAmir Goldstein 6305f8415d6SAmir Goldstein if (nlink <= 0) 6315f8415d6SAmir Goldstein goto fail; 6325f8415d6SAmir Goldstein 6335f8415d6SAmir Goldstein return nlink; 6345f8415d6SAmir Goldstein 6355f8415d6SAmir Goldstein fail: 6365f8415d6SAmir Goldstein pr_warn_ratelimited("overlayfs: failed to get index nlink (%pd2, err=%i)\n", 6375f8415d6SAmir Goldstein upperdentry, err); 6385f8415d6SAmir Goldstein return fallback; 6395f8415d6SAmir Goldstein } 6405f8415d6SAmir Goldstein 641ca4c8a3aSMiklos Szeredi struct inode *ovl_new_inode(struct super_block *sb, umode_t mode, dev_t rdev) 64251f7e52dSMiklos Szeredi { 64351f7e52dSMiklos Szeredi struct inode *inode; 64451f7e52dSMiklos Szeredi 64551f7e52dSMiklos Szeredi inode = new_inode(sb); 64651f7e52dSMiklos Szeredi if (inode) 64712574a9fSAmir Goldstein ovl_fill_inode(inode, mode, rdev, 0, 0); 64851f7e52dSMiklos Szeredi 64951f7e52dSMiklos Szeredi return inode; 65051f7e52dSMiklos Szeredi } 65151f7e52dSMiklos Szeredi 65251f7e52dSMiklos Szeredi static int ovl_inode_test(struct inode *inode, void *data) 65351f7e52dSMiklos Szeredi { 65425b7713aSMiklos Szeredi return inode->i_private == data; 65551f7e52dSMiklos Szeredi } 65651f7e52dSMiklos Szeredi 65751f7e52dSMiklos Szeredi static int ovl_inode_set(struct inode *inode, void *data) 65851f7e52dSMiklos Szeredi { 65925b7713aSMiklos Szeredi inode->i_private = data; 66051f7e52dSMiklos Szeredi return 0; 66151f7e52dSMiklos Szeredi } 66251f7e52dSMiklos Szeredi 663b9ac5c27SMiklos Szeredi static bool ovl_verify_inode(struct inode *inode, struct dentry *lowerdentry, 6644b91c30aSAmir Goldstein struct dentry *upperdentry, bool strict) 665b9ac5c27SMiklos Szeredi { 6664b91c30aSAmir Goldstein /* 6674b91c30aSAmir Goldstein * For directories, @strict verify from lookup path performs consistency 6684b91c30aSAmir Goldstein * checks, so NULL lower/upper in dentry must match NULL lower/upper in 6694b91c30aSAmir Goldstein * inode. Non @strict verify from NFS handle decode path passes NULL for 6704b91c30aSAmir Goldstein * 'unknown' lower/upper. 6714b91c30aSAmir Goldstein */ 6724b91c30aSAmir Goldstein if (S_ISDIR(inode->i_mode) && strict) { 67331747edaSAmir Goldstein /* Real lower dir moved to upper layer under us? */ 67431747edaSAmir Goldstein if (!lowerdentry && ovl_inode_lower(inode)) 67531747edaSAmir Goldstein return false; 67631747edaSAmir Goldstein 67731747edaSAmir Goldstein /* Lookup of an uncovered redirect origin? */ 67831747edaSAmir Goldstein if (!upperdentry && ovl_inode_upper(inode)) 67931747edaSAmir Goldstein return false; 68031747edaSAmir Goldstein } 68131747edaSAmir Goldstein 682939ae4efSAmir Goldstein /* 683939ae4efSAmir Goldstein * Allow non-NULL lower inode in ovl_inode even if lowerdentry is NULL. 684939ae4efSAmir Goldstein * This happens when finding a copied up overlay inode for a renamed 685939ae4efSAmir Goldstein * or hardlinked overlay dentry and lower dentry cannot be followed 686939ae4efSAmir Goldstein * by origin because lower fs does not support file handles. 687939ae4efSAmir Goldstein */ 688939ae4efSAmir Goldstein if (lowerdentry && ovl_inode_lower(inode) != d_inode(lowerdentry)) 689b9ac5c27SMiklos Szeredi return false; 690b9ac5c27SMiklos Szeredi 691b9ac5c27SMiklos Szeredi /* 692b9ac5c27SMiklos Szeredi * Allow non-NULL __upperdentry in inode even if upperdentry is NULL. 693b9ac5c27SMiklos Szeredi * This happens when finding a lower alias for a copied up hard link. 694b9ac5c27SMiklos Szeredi */ 695b9ac5c27SMiklos Szeredi if (upperdentry && ovl_inode_upper(inode) != d_inode(upperdentry)) 696b9ac5c27SMiklos Szeredi return false; 697b9ac5c27SMiklos Szeredi 698b9ac5c27SMiklos Szeredi return true; 699b9ac5c27SMiklos Szeredi } 700b9ac5c27SMiklos Szeredi 7014b91c30aSAmir Goldstein struct inode *ovl_lookup_inode(struct super_block *sb, struct dentry *real, 7024b91c30aSAmir Goldstein bool is_upper) 7039436a1a3SAmir Goldstein { 7044b91c30aSAmir Goldstein struct inode *inode, *key = d_inode(real); 7059436a1a3SAmir Goldstein 7069436a1a3SAmir Goldstein inode = ilookup5(sb, (unsigned long) key, ovl_inode_test, key); 7079436a1a3SAmir Goldstein if (!inode) 7089436a1a3SAmir Goldstein return NULL; 7099436a1a3SAmir Goldstein 7104b91c30aSAmir Goldstein if (!ovl_verify_inode(inode, is_upper ? NULL : real, 7114b91c30aSAmir Goldstein is_upper ? real : NULL, false)) { 7129436a1a3SAmir Goldstein iput(inode); 7139436a1a3SAmir Goldstein return ERR_PTR(-ESTALE); 7149436a1a3SAmir Goldstein } 7159436a1a3SAmir Goldstein 7169436a1a3SAmir Goldstein return inode; 7179436a1a3SAmir Goldstein } 7189436a1a3SAmir Goldstein 719764baba8SAmir Goldstein /* 720764baba8SAmir Goldstein * Does overlay inode need to be hashed by lower inode? 721764baba8SAmir Goldstein */ 722764baba8SAmir Goldstein static bool ovl_hash_bylower(struct super_block *sb, struct dentry *upper, 723764baba8SAmir Goldstein struct dentry *lower, struct dentry *index) 724764baba8SAmir Goldstein { 725764baba8SAmir Goldstein struct ovl_fs *ofs = sb->s_fs_info; 726764baba8SAmir Goldstein 727764baba8SAmir Goldstein /* No, if pure upper */ 728764baba8SAmir Goldstein if (!lower) 729764baba8SAmir Goldstein return false; 730764baba8SAmir Goldstein 731764baba8SAmir Goldstein /* Yes, if already indexed */ 732764baba8SAmir Goldstein if (index) 733764baba8SAmir Goldstein return true; 734764baba8SAmir Goldstein 735764baba8SAmir Goldstein /* Yes, if won't be copied up */ 736764baba8SAmir Goldstein if (!ofs->upper_mnt) 737764baba8SAmir Goldstein return true; 738764baba8SAmir Goldstein 739764baba8SAmir Goldstein /* No, if lower hardlink is or will be broken on copy up */ 740764baba8SAmir Goldstein if ((upper || !ovl_indexdir(sb)) && 741764baba8SAmir Goldstein !d_is_dir(lower) && d_inode(lower)->i_nlink > 1) 742764baba8SAmir Goldstein return false; 743764baba8SAmir Goldstein 744764baba8SAmir Goldstein /* No, if non-indexed upper with NFS export */ 745764baba8SAmir Goldstein if (sb->s_export_op && upper) 746764baba8SAmir Goldstein return false; 747764baba8SAmir Goldstein 748764baba8SAmir Goldstein /* Otherwise, hash by lower inode for fsnotify */ 749764baba8SAmir Goldstein return true; 750764baba8SAmir Goldstein } 751764baba8SAmir Goldstein 752*01b39dccSAmir Goldstein static struct inode *ovl_iget5(struct super_block *sb, struct inode *newinode, 753*01b39dccSAmir Goldstein struct inode *key) 754*01b39dccSAmir Goldstein { 755*01b39dccSAmir Goldstein return newinode ? inode_insert5(newinode, (unsigned long) key, 756*01b39dccSAmir Goldstein ovl_inode_test, ovl_inode_set, key) : 757*01b39dccSAmir Goldstein iget5_locked(sb, (unsigned long) key, 758*01b39dccSAmir Goldstein ovl_inode_test, ovl_inode_set, key); 759*01b39dccSAmir Goldstein } 760*01b39dccSAmir Goldstein 761ac6a52ebSVivek Goyal struct inode *ovl_get_inode(struct super_block *sb, 762ac6a52ebSVivek Goyal struct ovl_inode_params *oip) 76351f7e52dSMiklos Szeredi { 764ac6a52ebSVivek Goyal struct dentry *upperdentry = oip->upperdentry; 765ac6a52ebSVivek Goyal struct ovl_path *lowerpath = oip->lowerpath; 76609d8b586SMiklos Szeredi struct inode *realinode = upperdentry ? d_inode(upperdentry) : NULL; 76751f7e52dSMiklos Szeredi struct inode *inode; 76812574a9fSAmir Goldstein struct dentry *lowerdentry = lowerpath ? lowerpath->dentry : NULL; 769ac6a52ebSVivek Goyal bool bylower = ovl_hash_bylower(sb, upperdentry, lowerdentry, 770ac6a52ebSVivek Goyal oip->index); 771ac6a52ebSVivek Goyal int fsid = bylower ? oip->lowerpath->layer->fsid : 0; 77231747edaSAmir Goldstein bool is_dir; 773695b46e7SAmir Goldstein unsigned long ino = 0; 7746eaf0111SAmir Goldstein 77509d8b586SMiklos Szeredi if (!realinode) 77609d8b586SMiklos Szeredi realinode = d_inode(lowerdentry); 77709d8b586SMiklos Szeredi 7786eaf0111SAmir Goldstein /* 779764baba8SAmir Goldstein * Copy up origin (lower) may exist for non-indexed upper, but we must 780764baba8SAmir Goldstein * not use lower as hash key if this is a broken hardlink. 7816eaf0111SAmir Goldstein */ 78231747edaSAmir Goldstein is_dir = S_ISDIR(realinode->i_mode); 783764baba8SAmir Goldstein if (upperdentry || bylower) { 784764baba8SAmir Goldstein struct inode *key = d_inode(bylower ? lowerdentry : 785764baba8SAmir Goldstein upperdentry); 78631747edaSAmir Goldstein unsigned int nlink = is_dir ? 1 : realinode->i_nlink; 787b9ac5c27SMiklos Szeredi 788*01b39dccSAmir Goldstein inode = ovl_iget5(sb, oip->newinode, key); 78909d8b586SMiklos Szeredi if (!inode) 790b9ac5c27SMiklos Szeredi goto out_nomem; 79109d8b586SMiklos Szeredi if (!(inode->i_state & I_NEW)) { 792b9ac5c27SMiklos Szeredi /* 793b9ac5c27SMiklos Szeredi * Verify that the underlying files stored in the inode 794b9ac5c27SMiklos Szeredi * match those in the dentry. 795b9ac5c27SMiklos Szeredi */ 7964b91c30aSAmir Goldstein if (!ovl_verify_inode(inode, lowerdentry, upperdentry, 7974b91c30aSAmir Goldstein true)) { 798b9ac5c27SMiklos Szeredi iput(inode); 799b9ac5c27SMiklos Szeredi inode = ERR_PTR(-ESTALE); 800b9ac5c27SMiklos Szeredi goto out; 801b9ac5c27SMiklos Szeredi } 802b9ac5c27SMiklos Szeredi 80309d8b586SMiklos Szeredi dput(upperdentry); 80409d8b586SMiklos Szeredi goto out; 80509d8b586SMiklos Szeredi } 806e9be9d5eSMiklos Szeredi 80731747edaSAmir Goldstein /* Recalculate nlink for non-dir due to indexing */ 80831747edaSAmir Goldstein if (!is_dir) 80931747edaSAmir Goldstein nlink = ovl_get_nlink(lowerdentry, upperdentry, nlink); 8105f8415d6SAmir Goldstein set_nlink(inode, nlink); 811695b46e7SAmir Goldstein ino = key->i_ino; 812e6d2ebddSMiklos Szeredi } else { 813764baba8SAmir Goldstein /* Lower hardlink that will be broken on copy up */ 8140aceb53eSAmir Goldstein inode = new_inode(sb); 815e6d2ebddSMiklos Szeredi if (!inode) 816b9ac5c27SMiklos Szeredi goto out_nomem; 817e6d2ebddSMiklos Szeredi } 81812574a9fSAmir Goldstein ovl_fill_inode(inode, realinode->i_mode, realinode->i_rdev, ino, fsid); 81909d8b586SMiklos Szeredi ovl_inode_init(inode, upperdentry, lowerdentry); 82013c72075SMiklos Szeredi 82113c72075SMiklos Szeredi if (upperdentry && ovl_is_impuredir(upperdentry)) 82213c72075SMiklos Szeredi ovl_set_flag(OVL_IMPURE, inode); 82313c72075SMiklos Szeredi 824ac6a52ebSVivek Goyal if (oip->index) 8250471a9cdSVivek Goyal ovl_set_flag(OVL_INDEX, inode); 8260471a9cdSVivek Goyal 827b79e05aaSAmir Goldstein /* Check for non-merge dir that may have whiteouts */ 82831747edaSAmir Goldstein if (is_dir) { 829ac6a52ebSVivek Goyal if (((upperdentry && lowerdentry) || oip->numlower > 1) || 830b79e05aaSAmir Goldstein ovl_check_origin_xattr(upperdentry ?: lowerdentry)) { 831b79e05aaSAmir Goldstein ovl_set_flag(OVL_WHITEOUTS, inode); 832b79e05aaSAmir Goldstein } 833b79e05aaSAmir Goldstein } 834b79e05aaSAmir Goldstein 835e6d2ebddSMiklos Szeredi if (inode->i_state & I_NEW) 836e6d2ebddSMiklos Szeredi unlock_new_inode(inode); 837e6d2ebddSMiklos Szeredi out: 838e9be9d5eSMiklos Szeredi return inode; 839b9ac5c27SMiklos Szeredi 840b9ac5c27SMiklos Szeredi out_nomem: 841b9ac5c27SMiklos Szeredi inode = ERR_PTR(-ENOMEM); 842b9ac5c27SMiklos Szeredi goto out; 843e9be9d5eSMiklos Szeredi } 844