13d14c5d2SYehuda Sadeh #include <linux/ceph/ceph_debug.h> 2*25e6bae3SYan, Zheng #include <linux/ceph/pagelist.h> 33d14c5d2SYehuda Sadeh 4355da1ebSSage Weil #include "super.h" 53d14c5d2SYehuda Sadeh #include "mds_client.h" 63d14c5d2SYehuda Sadeh 73d14c5d2SYehuda Sadeh #include <linux/ceph/decode.h> 8355da1ebSSage Weil 9355da1ebSSage Weil #include <linux/xattr.h> 104db658eaSLinus Torvalds #include <linux/posix_acl_xattr.h> 115a0e3ad6STejun Heo #include <linux/slab.h> 12355da1ebSSage Weil 1322891907SAlex Elder #define XATTR_CEPH_PREFIX "ceph." 1422891907SAlex Elder #define XATTR_CEPH_PREFIX_LEN (sizeof (XATTR_CEPH_PREFIX) - 1) 1522891907SAlex Elder 16bcdfeb2eSYan, Zheng static int __remove_xattr(struct ceph_inode_info *ci, 17bcdfeb2eSYan, Zheng struct ceph_inode_xattr *xattr); 18bcdfeb2eSYan, Zheng 197221fe4cSGuangliang Zhao /* 207221fe4cSGuangliang Zhao * List of handlers for synthetic system.* attributes. Other 217221fe4cSGuangliang Zhao * attributes are handled directly. 227221fe4cSGuangliang Zhao */ 237221fe4cSGuangliang Zhao const struct xattr_handler *ceph_xattr_handlers[] = { 247221fe4cSGuangliang Zhao #ifdef CONFIG_CEPH_FS_POSIX_ACL 254db658eaSLinus Torvalds &posix_acl_access_xattr_handler, 264db658eaSLinus Torvalds &posix_acl_default_xattr_handler, 277221fe4cSGuangliang Zhao #endif 287221fe4cSGuangliang Zhao NULL, 297221fe4cSGuangliang Zhao }; 307221fe4cSGuangliang Zhao 31355da1ebSSage Weil static bool ceph_is_valid_xattr(const char *name) 32355da1ebSSage Weil { 3322891907SAlex Elder return !strncmp(name, XATTR_CEPH_PREFIX, XATTR_CEPH_PREFIX_LEN) || 341a756278SSage Weil !strncmp(name, XATTR_SECURITY_PREFIX, 35355da1ebSSage Weil XATTR_SECURITY_PREFIX_LEN) || 367221fe4cSGuangliang Zhao !strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN) || 37355da1ebSSage Weil !strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN) || 38355da1ebSSage Weil !strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN); 39355da1ebSSage Weil } 40355da1ebSSage Weil 41355da1ebSSage Weil /* 42355da1ebSSage Weil * These define virtual xattrs exposing the recursive directory 43355da1ebSSage Weil * statistics and layout metadata. 44355da1ebSSage Weil */ 45881a5fa2SAlex Elder struct ceph_vxattr { 46355da1ebSSage Weil char *name; 473ce6cd12SAlex Elder size_t name_size; /* strlen(name) + 1 (for '\0') */ 48355da1ebSSage Weil size_t (*getxattr_cb)(struct ceph_inode_info *ci, char *val, 49355da1ebSSage Weil size_t size); 508860147aSSage Weil bool readonly, hidden; 51f36e4472SSage Weil bool (*exists_cb)(struct ceph_inode_info *ci); 52355da1ebSSage Weil }; 53355da1ebSSage Weil 5432ab0bd7SSage Weil /* layouts */ 5532ab0bd7SSage Weil 5632ab0bd7SSage Weil static bool ceph_vxattrcb_layout_exists(struct ceph_inode_info *ci) 5732ab0bd7SSage Weil { 5832ab0bd7SSage Weil size_t s; 5932ab0bd7SSage Weil char *p = (char *)&ci->i_layout; 6032ab0bd7SSage Weil 6132ab0bd7SSage Weil for (s = 0; s < sizeof(ci->i_layout); s++, p++) 6232ab0bd7SSage Weil if (*p) 6332ab0bd7SSage Weil return true; 6432ab0bd7SSage Weil return false; 6532ab0bd7SSage Weil } 6632ab0bd7SSage Weil 6732ab0bd7SSage Weil static size_t ceph_vxattrcb_layout(struct ceph_inode_info *ci, char *val, 6832ab0bd7SSage Weil size_t size) 6932ab0bd7SSage Weil { 7032ab0bd7SSage Weil int ret; 7132ab0bd7SSage Weil struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 7232ab0bd7SSage Weil struct ceph_osd_client *osdc = &fsc->client->osdc; 7332ab0bd7SSage Weil s64 pool = ceph_file_layout_pg_pool(ci->i_layout); 7432ab0bd7SSage Weil const char *pool_name; 751e5c6649SYan, Zheng char buf[128]; 7632ab0bd7SSage Weil 7732ab0bd7SSage Weil dout("ceph_vxattrcb_layout %p\n", &ci->vfs_inode); 7832ab0bd7SSage Weil down_read(&osdc->map_sem); 7932ab0bd7SSage Weil pool_name = ceph_pg_pool_name_by_id(osdc->osdmap, pool); 801e5c6649SYan, Zheng if (pool_name) { 811e5c6649SYan, Zheng size_t len = strlen(pool_name); 821e5c6649SYan, Zheng ret = snprintf(buf, sizeof(buf), 831e5c6649SYan, Zheng "stripe_unit=%lld stripe_count=%lld object_size=%lld pool=", 8432ab0bd7SSage Weil (unsigned long long)ceph_file_layout_su(ci->i_layout), 8532ab0bd7SSage Weil (unsigned long long)ceph_file_layout_stripe_count(ci->i_layout), 861e5c6649SYan, Zheng (unsigned long long)ceph_file_layout_object_size(ci->i_layout)); 871e5c6649SYan, Zheng if (!size) { 881e5c6649SYan, Zheng ret += len; 891e5c6649SYan, Zheng } else if (ret + len > size) { 901e5c6649SYan, Zheng ret = -ERANGE; 911e5c6649SYan, Zheng } else { 921e5c6649SYan, Zheng memcpy(val, buf, ret); 931e5c6649SYan, Zheng memcpy(val + ret, pool_name, len); 941e5c6649SYan, Zheng ret += len; 951e5c6649SYan, Zheng } 961e5c6649SYan, Zheng } else { 971e5c6649SYan, Zheng ret = snprintf(buf, sizeof(buf), 9832ab0bd7SSage Weil "stripe_unit=%lld stripe_count=%lld object_size=%lld pool=%lld", 9932ab0bd7SSage Weil (unsigned long long)ceph_file_layout_su(ci->i_layout), 10032ab0bd7SSage Weil (unsigned long long)ceph_file_layout_stripe_count(ci->i_layout), 10132ab0bd7SSage Weil (unsigned long long)ceph_file_layout_object_size(ci->i_layout), 10232ab0bd7SSage Weil (unsigned long long)pool); 1031e5c6649SYan, Zheng if (size) { 1041e5c6649SYan, Zheng if (ret <= size) 1051e5c6649SYan, Zheng memcpy(val, buf, ret); 1061e5c6649SYan, Zheng else 1071e5c6649SYan, Zheng ret = -ERANGE; 1081e5c6649SYan, Zheng } 1091e5c6649SYan, Zheng } 11032ab0bd7SSage Weil up_read(&osdc->map_sem); 11132ab0bd7SSage Weil return ret; 11232ab0bd7SSage Weil } 11332ab0bd7SSage Weil 114695b7119SSage Weil static size_t ceph_vxattrcb_layout_stripe_unit(struct ceph_inode_info *ci, 115695b7119SSage Weil char *val, size_t size) 116695b7119SSage Weil { 117695b7119SSage Weil return snprintf(val, size, "%lld", 118695b7119SSage Weil (unsigned long long)ceph_file_layout_su(ci->i_layout)); 119695b7119SSage Weil } 120695b7119SSage Weil 121695b7119SSage Weil static size_t ceph_vxattrcb_layout_stripe_count(struct ceph_inode_info *ci, 122695b7119SSage Weil char *val, size_t size) 123695b7119SSage Weil { 124695b7119SSage Weil return snprintf(val, size, "%lld", 125695b7119SSage Weil (unsigned long long)ceph_file_layout_stripe_count(ci->i_layout)); 126695b7119SSage Weil } 127695b7119SSage Weil 128695b7119SSage Weil static size_t ceph_vxattrcb_layout_object_size(struct ceph_inode_info *ci, 129695b7119SSage Weil char *val, size_t size) 130695b7119SSage Weil { 131695b7119SSage Weil return snprintf(val, size, "%lld", 132695b7119SSage Weil (unsigned long long)ceph_file_layout_object_size(ci->i_layout)); 133695b7119SSage Weil } 134695b7119SSage Weil 135695b7119SSage Weil static size_t ceph_vxattrcb_layout_pool(struct ceph_inode_info *ci, 136695b7119SSage Weil char *val, size_t size) 137695b7119SSage Weil { 138695b7119SSage Weil int ret; 139695b7119SSage Weil struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 140695b7119SSage Weil struct ceph_osd_client *osdc = &fsc->client->osdc; 141695b7119SSage Weil s64 pool = ceph_file_layout_pg_pool(ci->i_layout); 142695b7119SSage Weil const char *pool_name; 143695b7119SSage Weil 144695b7119SSage Weil down_read(&osdc->map_sem); 145695b7119SSage Weil pool_name = ceph_pg_pool_name_by_id(osdc->osdmap, pool); 146695b7119SSage Weil if (pool_name) 147695b7119SSage Weil ret = snprintf(val, size, "%s", pool_name); 148695b7119SSage Weil else 149695b7119SSage Weil ret = snprintf(val, size, "%lld", (unsigned long long)pool); 150695b7119SSage Weil up_read(&osdc->map_sem); 151695b7119SSage Weil return ret; 152695b7119SSage Weil } 153695b7119SSage Weil 154355da1ebSSage Weil /* directories */ 155355da1ebSSage Weil 156aa4066edSAlex Elder static size_t ceph_vxattrcb_dir_entries(struct ceph_inode_info *ci, char *val, 157355da1ebSSage Weil size_t size) 158355da1ebSSage Weil { 159355da1ebSSage Weil return snprintf(val, size, "%lld", ci->i_files + ci->i_subdirs); 160355da1ebSSage Weil } 161355da1ebSSage Weil 162aa4066edSAlex Elder static size_t ceph_vxattrcb_dir_files(struct ceph_inode_info *ci, char *val, 163355da1ebSSage Weil size_t size) 164355da1ebSSage Weil { 165355da1ebSSage Weil return snprintf(val, size, "%lld", ci->i_files); 166355da1ebSSage Weil } 167355da1ebSSage Weil 168aa4066edSAlex Elder static size_t ceph_vxattrcb_dir_subdirs(struct ceph_inode_info *ci, char *val, 169355da1ebSSage Weil size_t size) 170355da1ebSSage Weil { 171355da1ebSSage Weil return snprintf(val, size, "%lld", ci->i_subdirs); 172355da1ebSSage Weil } 173355da1ebSSage Weil 174aa4066edSAlex Elder static size_t ceph_vxattrcb_dir_rentries(struct ceph_inode_info *ci, char *val, 175355da1ebSSage Weil size_t size) 176355da1ebSSage Weil { 177355da1ebSSage Weil return snprintf(val, size, "%lld", ci->i_rfiles + ci->i_rsubdirs); 178355da1ebSSage Weil } 179355da1ebSSage Weil 180aa4066edSAlex Elder static size_t ceph_vxattrcb_dir_rfiles(struct ceph_inode_info *ci, char *val, 181355da1ebSSage Weil size_t size) 182355da1ebSSage Weil { 183355da1ebSSage Weil return snprintf(val, size, "%lld", ci->i_rfiles); 184355da1ebSSage Weil } 185355da1ebSSage Weil 186aa4066edSAlex Elder static size_t ceph_vxattrcb_dir_rsubdirs(struct ceph_inode_info *ci, char *val, 187355da1ebSSage Weil size_t size) 188355da1ebSSage Weil { 189355da1ebSSage Weil return snprintf(val, size, "%lld", ci->i_rsubdirs); 190355da1ebSSage Weil } 191355da1ebSSage Weil 192aa4066edSAlex Elder static size_t ceph_vxattrcb_dir_rbytes(struct ceph_inode_info *ci, char *val, 193355da1ebSSage Weil size_t size) 194355da1ebSSage Weil { 195355da1ebSSage Weil return snprintf(val, size, "%lld", ci->i_rbytes); 196355da1ebSSage Weil } 197355da1ebSSage Weil 198aa4066edSAlex Elder static size_t ceph_vxattrcb_dir_rctime(struct ceph_inode_info *ci, char *val, 199355da1ebSSage Weil size_t size) 200355da1ebSSage Weil { 2013489b42aSAlex Elder return snprintf(val, size, "%ld.09%ld", (long)ci->i_rctime.tv_sec, 202355da1ebSSage Weil (long)ci->i_rctime.tv_nsec); 203355da1ebSSage Weil } 204355da1ebSSage Weil 20532ab0bd7SSage Weil 206eb788084SAlex Elder #define CEPH_XATTR_NAME(_type, _name) XATTR_CEPH_PREFIX #_type "." #_name 207695b7119SSage Weil #define CEPH_XATTR_NAME2(_type, _name, _name2) \ 208695b7119SSage Weil XATTR_CEPH_PREFIX #_type "." #_name "." #_name2 209eb788084SAlex Elder 210eb788084SAlex Elder #define XATTR_NAME_CEPH(_type, _name) \ 211eb788084SAlex Elder { \ 212eb788084SAlex Elder .name = CEPH_XATTR_NAME(_type, _name), \ 2133ce6cd12SAlex Elder .name_size = sizeof (CEPH_XATTR_NAME(_type, _name)), \ 214aa4066edSAlex Elder .getxattr_cb = ceph_vxattrcb_ ## _type ## _ ## _name, \ 215eb788084SAlex Elder .readonly = true, \ 2168860147aSSage Weil .hidden = false, \ 217f36e4472SSage Weil .exists_cb = NULL, \ 218eb788084SAlex Elder } 219695b7119SSage Weil #define XATTR_LAYOUT_FIELD(_type, _name, _field) \ 220695b7119SSage Weil { \ 221695b7119SSage Weil .name = CEPH_XATTR_NAME2(_type, _name, _field), \ 222695b7119SSage Weil .name_size = sizeof (CEPH_XATTR_NAME2(_type, _name, _field)), \ 223695b7119SSage Weil .getxattr_cb = ceph_vxattrcb_ ## _name ## _ ## _field, \ 224695b7119SSage Weil .readonly = false, \ 225695b7119SSage Weil .hidden = true, \ 226695b7119SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, \ 227695b7119SSage Weil } 228eb788084SAlex Elder 229881a5fa2SAlex Elder static struct ceph_vxattr ceph_dir_vxattrs[] = { 2301f08f2b0SSage Weil { 2311f08f2b0SSage Weil .name = "ceph.dir.layout", 2321f08f2b0SSage Weil .name_size = sizeof("ceph.dir.layout"), 2331f08f2b0SSage Weil .getxattr_cb = ceph_vxattrcb_layout, 2341f08f2b0SSage Weil .readonly = false, 235cc48c3e8SYan, Zheng .hidden = true, 2361f08f2b0SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, 2371f08f2b0SSage Weil }, 238695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, stripe_unit), 239695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, stripe_count), 240695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, object_size), 241695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, pool), 242eb788084SAlex Elder XATTR_NAME_CEPH(dir, entries), 243eb788084SAlex Elder XATTR_NAME_CEPH(dir, files), 244eb788084SAlex Elder XATTR_NAME_CEPH(dir, subdirs), 245eb788084SAlex Elder XATTR_NAME_CEPH(dir, rentries), 246eb788084SAlex Elder XATTR_NAME_CEPH(dir, rfiles), 247eb788084SAlex Elder XATTR_NAME_CEPH(dir, rsubdirs), 248eb788084SAlex Elder XATTR_NAME_CEPH(dir, rbytes), 249eb788084SAlex Elder XATTR_NAME_CEPH(dir, rctime), 2502c3dd4ffSAlex Elder { .name = NULL, 0 } /* Required table terminator */ 251355da1ebSSage Weil }; 2523ce6cd12SAlex Elder static size_t ceph_dir_vxattrs_name_size; /* total size of all names */ 253355da1ebSSage Weil 254355da1ebSSage Weil /* files */ 255355da1ebSSage Weil 256881a5fa2SAlex Elder static struct ceph_vxattr ceph_file_vxattrs[] = { 25732ab0bd7SSage Weil { 25832ab0bd7SSage Weil .name = "ceph.file.layout", 25932ab0bd7SSage Weil .name_size = sizeof("ceph.file.layout"), 26032ab0bd7SSage Weil .getxattr_cb = ceph_vxattrcb_layout, 26132ab0bd7SSage Weil .readonly = false, 262cc48c3e8SYan, Zheng .hidden = true, 26332ab0bd7SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, 26432ab0bd7SSage Weil }, 265695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, stripe_unit), 266695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, stripe_count), 267695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, object_size), 268695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, pool), 2692c3dd4ffSAlex Elder { .name = NULL, 0 } /* Required table terminator */ 270355da1ebSSage Weil }; 2713ce6cd12SAlex Elder static size_t ceph_file_vxattrs_name_size; /* total size of all names */ 272355da1ebSSage Weil 273881a5fa2SAlex Elder static struct ceph_vxattr *ceph_inode_vxattrs(struct inode *inode) 274355da1ebSSage Weil { 275355da1ebSSage Weil if (S_ISDIR(inode->i_mode)) 276355da1ebSSage Weil return ceph_dir_vxattrs; 277355da1ebSSage Weil else if (S_ISREG(inode->i_mode)) 278355da1ebSSage Weil return ceph_file_vxattrs; 279355da1ebSSage Weil return NULL; 280355da1ebSSage Weil } 281355da1ebSSage Weil 2823ce6cd12SAlex Elder static size_t ceph_vxattrs_name_size(struct ceph_vxattr *vxattrs) 2833ce6cd12SAlex Elder { 2843ce6cd12SAlex Elder if (vxattrs == ceph_dir_vxattrs) 2853ce6cd12SAlex Elder return ceph_dir_vxattrs_name_size; 2863ce6cd12SAlex Elder if (vxattrs == ceph_file_vxattrs) 2873ce6cd12SAlex Elder return ceph_file_vxattrs_name_size; 2880abb43dcSYan, Zheng BUG_ON(vxattrs); 2893ce6cd12SAlex Elder return 0; 2903ce6cd12SAlex Elder } 2913ce6cd12SAlex Elder 2923ce6cd12SAlex Elder /* 2933ce6cd12SAlex Elder * Compute the aggregate size (including terminating '\0') of all 2943ce6cd12SAlex Elder * virtual extended attribute names in the given vxattr table. 2953ce6cd12SAlex Elder */ 2963ce6cd12SAlex Elder static size_t __init vxattrs_name_size(struct ceph_vxattr *vxattrs) 2973ce6cd12SAlex Elder { 2983ce6cd12SAlex Elder struct ceph_vxattr *vxattr; 2993ce6cd12SAlex Elder size_t size = 0; 3003ce6cd12SAlex Elder 3013ce6cd12SAlex Elder for (vxattr = vxattrs; vxattr->name; vxattr++) 3028860147aSSage Weil if (!vxattr->hidden) 3033ce6cd12SAlex Elder size += vxattr->name_size; 3043ce6cd12SAlex Elder 3053ce6cd12SAlex Elder return size; 3063ce6cd12SAlex Elder } 3073ce6cd12SAlex Elder 3083ce6cd12SAlex Elder /* Routines called at initialization and exit time */ 3093ce6cd12SAlex Elder 3103ce6cd12SAlex Elder void __init ceph_xattr_init(void) 3113ce6cd12SAlex Elder { 3123ce6cd12SAlex Elder ceph_dir_vxattrs_name_size = vxattrs_name_size(ceph_dir_vxattrs); 3133ce6cd12SAlex Elder ceph_file_vxattrs_name_size = vxattrs_name_size(ceph_file_vxattrs); 3143ce6cd12SAlex Elder } 3153ce6cd12SAlex Elder 3163ce6cd12SAlex Elder void ceph_xattr_exit(void) 3173ce6cd12SAlex Elder { 3183ce6cd12SAlex Elder ceph_dir_vxattrs_name_size = 0; 3193ce6cd12SAlex Elder ceph_file_vxattrs_name_size = 0; 3203ce6cd12SAlex Elder } 3213ce6cd12SAlex Elder 322881a5fa2SAlex Elder static struct ceph_vxattr *ceph_match_vxattr(struct inode *inode, 323355da1ebSSage Weil const char *name) 324355da1ebSSage Weil { 325881a5fa2SAlex Elder struct ceph_vxattr *vxattr = ceph_inode_vxattrs(inode); 32606476a69SAlex Elder 32706476a69SAlex Elder if (vxattr) { 32806476a69SAlex Elder while (vxattr->name) { 32906476a69SAlex Elder if (!strcmp(vxattr->name, name)) 330355da1ebSSage Weil return vxattr; 331355da1ebSSage Weil vxattr++; 33206476a69SAlex Elder } 33306476a69SAlex Elder } 33406476a69SAlex Elder 335355da1ebSSage Weil return NULL; 336355da1ebSSage Weil } 337355da1ebSSage Weil 338355da1ebSSage Weil static int __set_xattr(struct ceph_inode_info *ci, 339355da1ebSSage Weil const char *name, int name_len, 340355da1ebSSage Weil const char *val, int val_len, 341fbc0b970SYan, Zheng int flags, int update_xattr, 342355da1ebSSage Weil struct ceph_inode_xattr **newxattr) 343355da1ebSSage Weil { 344355da1ebSSage Weil struct rb_node **p; 345355da1ebSSage Weil struct rb_node *parent = NULL; 346355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 347355da1ebSSage Weil int c; 348355da1ebSSage Weil int new = 0; 349355da1ebSSage Weil 350355da1ebSSage Weil p = &ci->i_xattrs.index.rb_node; 351355da1ebSSage Weil while (*p) { 352355da1ebSSage Weil parent = *p; 353355da1ebSSage Weil xattr = rb_entry(parent, struct ceph_inode_xattr, node); 354355da1ebSSage Weil c = strncmp(name, xattr->name, min(name_len, xattr->name_len)); 355355da1ebSSage Weil if (c < 0) 356355da1ebSSage Weil p = &(*p)->rb_left; 357355da1ebSSage Weil else if (c > 0) 358355da1ebSSage Weil p = &(*p)->rb_right; 359355da1ebSSage Weil else { 360355da1ebSSage Weil if (name_len == xattr->name_len) 361355da1ebSSage Weil break; 362355da1ebSSage Weil else if (name_len < xattr->name_len) 363355da1ebSSage Weil p = &(*p)->rb_left; 364355da1ebSSage Weil else 365355da1ebSSage Weil p = &(*p)->rb_right; 366355da1ebSSage Weil } 367355da1ebSSage Weil xattr = NULL; 368355da1ebSSage Weil } 369355da1ebSSage Weil 370fbc0b970SYan, Zheng if (update_xattr) { 371fbc0b970SYan, Zheng int err = 0; 372fbc0b970SYan, Zheng if (xattr && (flags & XATTR_CREATE)) 373fbc0b970SYan, Zheng err = -EEXIST; 374fbc0b970SYan, Zheng else if (!xattr && (flags & XATTR_REPLACE)) 375fbc0b970SYan, Zheng err = -ENODATA; 376fbc0b970SYan, Zheng if (err) { 377fbc0b970SYan, Zheng kfree(name); 378fbc0b970SYan, Zheng kfree(val); 379fbc0b970SYan, Zheng return err; 380fbc0b970SYan, Zheng } 381bcdfeb2eSYan, Zheng if (update_xattr < 0) { 382bcdfeb2eSYan, Zheng if (xattr) 383bcdfeb2eSYan, Zheng __remove_xattr(ci, xattr); 384bcdfeb2eSYan, Zheng kfree(name); 385bcdfeb2eSYan, Zheng return 0; 386bcdfeb2eSYan, Zheng } 387fbc0b970SYan, Zheng } 388fbc0b970SYan, Zheng 389355da1ebSSage Weil if (!xattr) { 390355da1ebSSage Weil new = 1; 391355da1ebSSage Weil xattr = *newxattr; 392355da1ebSSage Weil xattr->name = name; 393355da1ebSSage Weil xattr->name_len = name_len; 394fbc0b970SYan, Zheng xattr->should_free_name = update_xattr; 395355da1ebSSage Weil 396355da1ebSSage Weil ci->i_xattrs.count++; 397355da1ebSSage Weil dout("__set_xattr count=%d\n", ci->i_xattrs.count); 398355da1ebSSage Weil } else { 399355da1ebSSage Weil kfree(*newxattr); 400355da1ebSSage Weil *newxattr = NULL; 401355da1ebSSage Weil if (xattr->should_free_val) 402355da1ebSSage Weil kfree((void *)xattr->val); 403355da1ebSSage Weil 404fbc0b970SYan, Zheng if (update_xattr) { 405355da1ebSSage Weil kfree((void *)name); 406355da1ebSSage Weil name = xattr->name; 407355da1ebSSage Weil } 408355da1ebSSage Weil ci->i_xattrs.names_size -= xattr->name_len; 409355da1ebSSage Weil ci->i_xattrs.vals_size -= xattr->val_len; 410355da1ebSSage Weil } 411355da1ebSSage Weil ci->i_xattrs.names_size += name_len; 412355da1ebSSage Weil ci->i_xattrs.vals_size += val_len; 413355da1ebSSage Weil if (val) 414355da1ebSSage Weil xattr->val = val; 415355da1ebSSage Weil else 416355da1ebSSage Weil xattr->val = ""; 417355da1ebSSage Weil 418355da1ebSSage Weil xattr->val_len = val_len; 419fbc0b970SYan, Zheng xattr->dirty = update_xattr; 420fbc0b970SYan, Zheng xattr->should_free_val = (val && update_xattr); 421355da1ebSSage Weil 422355da1ebSSage Weil if (new) { 423355da1ebSSage Weil rb_link_node(&xattr->node, parent, p); 424355da1ebSSage Weil rb_insert_color(&xattr->node, &ci->i_xattrs.index); 425355da1ebSSage Weil dout("__set_xattr_val p=%p\n", p); 426355da1ebSSage Weil } 427355da1ebSSage Weil 428355da1ebSSage Weil dout("__set_xattr_val added %llx.%llx xattr %p %s=%.*s\n", 429355da1ebSSage Weil ceph_vinop(&ci->vfs_inode), xattr, name, val_len, val); 430355da1ebSSage Weil 431355da1ebSSage Weil return 0; 432355da1ebSSage Weil } 433355da1ebSSage Weil 434355da1ebSSage Weil static struct ceph_inode_xattr *__get_xattr(struct ceph_inode_info *ci, 435355da1ebSSage Weil const char *name) 436355da1ebSSage Weil { 437355da1ebSSage Weil struct rb_node **p; 438355da1ebSSage Weil struct rb_node *parent = NULL; 439355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 44017db143fSSage Weil int name_len = strlen(name); 441355da1ebSSage Weil int c; 442355da1ebSSage Weil 443355da1ebSSage Weil p = &ci->i_xattrs.index.rb_node; 444355da1ebSSage Weil while (*p) { 445355da1ebSSage Weil parent = *p; 446355da1ebSSage Weil xattr = rb_entry(parent, struct ceph_inode_xattr, node); 447355da1ebSSage Weil c = strncmp(name, xattr->name, xattr->name_len); 44817db143fSSage Weil if (c == 0 && name_len > xattr->name_len) 44917db143fSSage Weil c = 1; 450355da1ebSSage Weil if (c < 0) 451355da1ebSSage Weil p = &(*p)->rb_left; 452355da1ebSSage Weil else if (c > 0) 453355da1ebSSage Weil p = &(*p)->rb_right; 454355da1ebSSage Weil else { 455355da1ebSSage Weil dout("__get_xattr %s: found %.*s\n", name, 456355da1ebSSage Weil xattr->val_len, xattr->val); 457355da1ebSSage Weil return xattr; 458355da1ebSSage Weil } 459355da1ebSSage Weil } 460355da1ebSSage Weil 461355da1ebSSage Weil dout("__get_xattr %s: not found\n", name); 462355da1ebSSage Weil 463355da1ebSSage Weil return NULL; 464355da1ebSSage Weil } 465355da1ebSSage Weil 466355da1ebSSage Weil static void __free_xattr(struct ceph_inode_xattr *xattr) 467355da1ebSSage Weil { 468355da1ebSSage Weil BUG_ON(!xattr); 469355da1ebSSage Weil 470355da1ebSSage Weil if (xattr->should_free_name) 471355da1ebSSage Weil kfree((void *)xattr->name); 472355da1ebSSage Weil if (xattr->should_free_val) 473355da1ebSSage Weil kfree((void *)xattr->val); 474355da1ebSSage Weil 475355da1ebSSage Weil kfree(xattr); 476355da1ebSSage Weil } 477355da1ebSSage Weil 478355da1ebSSage Weil static int __remove_xattr(struct ceph_inode_info *ci, 479355da1ebSSage Weil struct ceph_inode_xattr *xattr) 480355da1ebSSage Weil { 481355da1ebSSage Weil if (!xattr) 482524186acSYan, Zheng return -ENODATA; 483355da1ebSSage Weil 484355da1ebSSage Weil rb_erase(&xattr->node, &ci->i_xattrs.index); 485355da1ebSSage Weil 486355da1ebSSage Weil if (xattr->should_free_name) 487355da1ebSSage Weil kfree((void *)xattr->name); 488355da1ebSSage Weil if (xattr->should_free_val) 489355da1ebSSage Weil kfree((void *)xattr->val); 490355da1ebSSage Weil 491355da1ebSSage Weil ci->i_xattrs.names_size -= xattr->name_len; 492355da1ebSSage Weil ci->i_xattrs.vals_size -= xattr->val_len; 493355da1ebSSage Weil ci->i_xattrs.count--; 494355da1ebSSage Weil kfree(xattr); 495355da1ebSSage Weil 496355da1ebSSage Weil return 0; 497355da1ebSSage Weil } 498355da1ebSSage Weil 499355da1ebSSage Weil static int __remove_xattr_by_name(struct ceph_inode_info *ci, 500355da1ebSSage Weil const char *name) 501355da1ebSSage Weil { 502355da1ebSSage Weil struct rb_node **p; 503355da1ebSSage Weil struct ceph_inode_xattr *xattr; 504355da1ebSSage Weil int err; 505355da1ebSSage Weil 506355da1ebSSage Weil p = &ci->i_xattrs.index.rb_node; 507355da1ebSSage Weil xattr = __get_xattr(ci, name); 508355da1ebSSage Weil err = __remove_xattr(ci, xattr); 509355da1ebSSage Weil return err; 510355da1ebSSage Weil } 511355da1ebSSage Weil 512355da1ebSSage Weil static char *__copy_xattr_names(struct ceph_inode_info *ci, 513355da1ebSSage Weil char *dest) 514355da1ebSSage Weil { 515355da1ebSSage Weil struct rb_node *p; 516355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 517355da1ebSSage Weil 518355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 519355da1ebSSage Weil dout("__copy_xattr_names count=%d\n", ci->i_xattrs.count); 520355da1ebSSage Weil 521355da1ebSSage Weil while (p) { 522355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 523355da1ebSSage Weil memcpy(dest, xattr->name, xattr->name_len); 524355da1ebSSage Weil dest[xattr->name_len] = '\0'; 525355da1ebSSage Weil 526355da1ebSSage Weil dout("dest=%s %p (%s) (%d/%d)\n", dest, xattr, xattr->name, 527355da1ebSSage Weil xattr->name_len, ci->i_xattrs.names_size); 528355da1ebSSage Weil 529355da1ebSSage Weil dest += xattr->name_len + 1; 530355da1ebSSage Weil p = rb_next(p); 531355da1ebSSage Weil } 532355da1ebSSage Weil 533355da1ebSSage Weil return dest; 534355da1ebSSage Weil } 535355da1ebSSage Weil 536355da1ebSSage Weil void __ceph_destroy_xattrs(struct ceph_inode_info *ci) 537355da1ebSSage Weil { 538355da1ebSSage Weil struct rb_node *p, *tmp; 539355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 540355da1ebSSage Weil 541355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 542355da1ebSSage Weil 543355da1ebSSage Weil dout("__ceph_destroy_xattrs p=%p\n", p); 544355da1ebSSage Weil 545355da1ebSSage Weil while (p) { 546355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 547355da1ebSSage Weil tmp = p; 548355da1ebSSage Weil p = rb_next(tmp); 549355da1ebSSage Weil dout("__ceph_destroy_xattrs next p=%p (%.*s)\n", p, 550355da1ebSSage Weil xattr->name_len, xattr->name); 551355da1ebSSage Weil rb_erase(tmp, &ci->i_xattrs.index); 552355da1ebSSage Weil 553355da1ebSSage Weil __free_xattr(xattr); 554355da1ebSSage Weil } 555355da1ebSSage Weil 556355da1ebSSage Weil ci->i_xattrs.names_size = 0; 557355da1ebSSage Weil ci->i_xattrs.vals_size = 0; 558355da1ebSSage Weil ci->i_xattrs.index_version = 0; 559355da1ebSSage Weil ci->i_xattrs.count = 0; 560355da1ebSSage Weil ci->i_xattrs.index = RB_ROOT; 561355da1ebSSage Weil } 562355da1ebSSage Weil 563355da1ebSSage Weil static int __build_xattrs(struct inode *inode) 564be655596SSage Weil __releases(ci->i_ceph_lock) 565be655596SSage Weil __acquires(ci->i_ceph_lock) 566355da1ebSSage Weil { 567355da1ebSSage Weil u32 namelen; 568355da1ebSSage Weil u32 numattr = 0; 569355da1ebSSage Weil void *p, *end; 570355da1ebSSage Weil u32 len; 571355da1ebSSage Weil const char *name, *val; 572355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 573355da1ebSSage Weil int xattr_version; 574355da1ebSSage Weil struct ceph_inode_xattr **xattrs = NULL; 57563ff78b2SSage Weil int err = 0; 576355da1ebSSage Weil int i; 577355da1ebSSage Weil 578355da1ebSSage Weil dout("__build_xattrs() len=%d\n", 579355da1ebSSage Weil ci->i_xattrs.blob ? (int)ci->i_xattrs.blob->vec.iov_len : 0); 580355da1ebSSage Weil 581355da1ebSSage Weil if (ci->i_xattrs.index_version >= ci->i_xattrs.version) 582355da1ebSSage Weil return 0; /* already built */ 583355da1ebSSage Weil 584355da1ebSSage Weil __ceph_destroy_xattrs(ci); 585355da1ebSSage Weil 586355da1ebSSage Weil start: 587355da1ebSSage Weil /* updated internal xattr rb tree */ 588355da1ebSSage Weil if (ci->i_xattrs.blob && ci->i_xattrs.blob->vec.iov_len > 4) { 589355da1ebSSage Weil p = ci->i_xattrs.blob->vec.iov_base; 590355da1ebSSage Weil end = p + ci->i_xattrs.blob->vec.iov_len; 591355da1ebSSage Weil ceph_decode_32_safe(&p, end, numattr, bad); 592355da1ebSSage Weil xattr_version = ci->i_xattrs.version; 593be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 594355da1ebSSage Weil 5957e8a2952SIlya Dryomov xattrs = kcalloc(numattr, sizeof(struct ceph_inode_xattr *), 596355da1ebSSage Weil GFP_NOFS); 597355da1ebSSage Weil err = -ENOMEM; 598355da1ebSSage Weil if (!xattrs) 599355da1ebSSage Weil goto bad_lock; 6001a295bd8SIlya Dryomov 601355da1ebSSage Weil for (i = 0; i < numattr; i++) { 602355da1ebSSage Weil xattrs[i] = kmalloc(sizeof(struct ceph_inode_xattr), 603355da1ebSSage Weil GFP_NOFS); 604355da1ebSSage Weil if (!xattrs[i]) 605355da1ebSSage Weil goto bad_lock; 606355da1ebSSage Weil } 607355da1ebSSage Weil 608be655596SSage Weil spin_lock(&ci->i_ceph_lock); 609355da1ebSSage Weil if (ci->i_xattrs.version != xattr_version) { 610355da1ebSSage Weil /* lost a race, retry */ 611355da1ebSSage Weil for (i = 0; i < numattr; i++) 612355da1ebSSage Weil kfree(xattrs[i]); 613355da1ebSSage Weil kfree(xattrs); 61421ec6ffaSAlan Cox xattrs = NULL; 615355da1ebSSage Weil goto start; 616355da1ebSSage Weil } 617355da1ebSSage Weil err = -EIO; 618355da1ebSSage Weil while (numattr--) { 619355da1ebSSage Weil ceph_decode_32_safe(&p, end, len, bad); 620355da1ebSSage Weil namelen = len; 621355da1ebSSage Weil name = p; 622355da1ebSSage Weil p += len; 623355da1ebSSage Weil ceph_decode_32_safe(&p, end, len, bad); 624355da1ebSSage Weil val = p; 625355da1ebSSage Weil p += len; 626355da1ebSSage Weil 627355da1ebSSage Weil err = __set_xattr(ci, name, namelen, val, len, 628fbc0b970SYan, Zheng 0, 0, &xattrs[numattr]); 629355da1ebSSage Weil 630355da1ebSSage Weil if (err < 0) 631355da1ebSSage Weil goto bad; 632355da1ebSSage Weil } 633355da1ebSSage Weil kfree(xattrs); 634355da1ebSSage Weil } 635355da1ebSSage Weil ci->i_xattrs.index_version = ci->i_xattrs.version; 636355da1ebSSage Weil ci->i_xattrs.dirty = false; 637355da1ebSSage Weil 638355da1ebSSage Weil return err; 639355da1ebSSage Weil bad_lock: 640be655596SSage Weil spin_lock(&ci->i_ceph_lock); 641355da1ebSSage Weil bad: 642355da1ebSSage Weil if (xattrs) { 643355da1ebSSage Weil for (i = 0; i < numattr; i++) 644355da1ebSSage Weil kfree(xattrs[i]); 645355da1ebSSage Weil kfree(xattrs); 646355da1ebSSage Weil } 647355da1ebSSage Weil ci->i_xattrs.names_size = 0; 648355da1ebSSage Weil return err; 649355da1ebSSage Weil } 650355da1ebSSage Weil 651355da1ebSSage Weil static int __get_required_blob_size(struct ceph_inode_info *ci, int name_size, 652355da1ebSSage Weil int val_size) 653355da1ebSSage Weil { 654355da1ebSSage Weil /* 655355da1ebSSage Weil * 4 bytes for the length, and additional 4 bytes per each xattr name, 656355da1ebSSage Weil * 4 bytes per each value 657355da1ebSSage Weil */ 658355da1ebSSage Weil int size = 4 + ci->i_xattrs.count*(4 + 4) + 659355da1ebSSage Weil ci->i_xattrs.names_size + 660355da1ebSSage Weil ci->i_xattrs.vals_size; 661355da1ebSSage Weil dout("__get_required_blob_size c=%d names.size=%d vals.size=%d\n", 662355da1ebSSage Weil ci->i_xattrs.count, ci->i_xattrs.names_size, 663355da1ebSSage Weil ci->i_xattrs.vals_size); 664355da1ebSSage Weil 665355da1ebSSage Weil if (name_size) 666355da1ebSSage Weil size += 4 + 4 + name_size + val_size; 667355da1ebSSage Weil 668355da1ebSSage Weil return size; 669355da1ebSSage Weil } 670355da1ebSSage Weil 671355da1ebSSage Weil /* 672355da1ebSSage Weil * If there are dirty xattrs, reencode xattrs into the prealloc_blob 673355da1ebSSage Weil * and swap into place. 674355da1ebSSage Weil */ 675355da1ebSSage Weil void __ceph_build_xattrs_blob(struct ceph_inode_info *ci) 676355da1ebSSage Weil { 677355da1ebSSage Weil struct rb_node *p; 678355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 679355da1ebSSage Weil void *dest; 680355da1ebSSage Weil 681355da1ebSSage Weil dout("__build_xattrs_blob %p\n", &ci->vfs_inode); 682355da1ebSSage Weil if (ci->i_xattrs.dirty) { 683355da1ebSSage Weil int need = __get_required_blob_size(ci, 0, 0); 684355da1ebSSage Weil 685355da1ebSSage Weil BUG_ON(need > ci->i_xattrs.prealloc_blob->alloc_len); 686355da1ebSSage Weil 687355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 688355da1ebSSage Weil dest = ci->i_xattrs.prealloc_blob->vec.iov_base; 689355da1ebSSage Weil 690355da1ebSSage Weil ceph_encode_32(&dest, ci->i_xattrs.count); 691355da1ebSSage Weil while (p) { 692355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 693355da1ebSSage Weil 694355da1ebSSage Weil ceph_encode_32(&dest, xattr->name_len); 695355da1ebSSage Weil memcpy(dest, xattr->name, xattr->name_len); 696355da1ebSSage Weil dest += xattr->name_len; 697355da1ebSSage Weil ceph_encode_32(&dest, xattr->val_len); 698355da1ebSSage Weil memcpy(dest, xattr->val, xattr->val_len); 699355da1ebSSage Weil dest += xattr->val_len; 700355da1ebSSage Weil 701355da1ebSSage Weil p = rb_next(p); 702355da1ebSSage Weil } 703355da1ebSSage Weil 704355da1ebSSage Weil /* adjust buffer len; it may be larger than we need */ 705355da1ebSSage Weil ci->i_xattrs.prealloc_blob->vec.iov_len = 706355da1ebSSage Weil dest - ci->i_xattrs.prealloc_blob->vec.iov_base; 707355da1ebSSage Weil 708b6c1d5b8SSage Weil if (ci->i_xattrs.blob) 709355da1ebSSage Weil ceph_buffer_put(ci->i_xattrs.blob); 710355da1ebSSage Weil ci->i_xattrs.blob = ci->i_xattrs.prealloc_blob; 711355da1ebSSage Weil ci->i_xattrs.prealloc_blob = NULL; 712355da1ebSSage Weil ci->i_xattrs.dirty = false; 7134a625be4SSage Weil ci->i_xattrs.version++; 714355da1ebSSage Weil } 715355da1ebSSage Weil } 716355da1ebSSage Weil 7177221fe4cSGuangliang Zhao ssize_t __ceph_getxattr(struct inode *inode, const char *name, void *value, 718355da1ebSSage Weil size_t size) 719355da1ebSSage Weil { 720355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 721355da1ebSSage Weil int err; 722355da1ebSSage Weil struct ceph_inode_xattr *xattr; 723881a5fa2SAlex Elder struct ceph_vxattr *vxattr = NULL; 724355da1ebSSage Weil 725355da1ebSSage Weil if (!ceph_is_valid_xattr(name)) 726355da1ebSSage Weil return -ENODATA; 727355da1ebSSage Weil 7280bee82fbSSage Weil /* let's see if a virtual xattr was requested */ 7290bee82fbSSage Weil vxattr = ceph_match_vxattr(inode, name); 7300bee82fbSSage Weil if (vxattr && !(vxattr->exists_cb && !vxattr->exists_cb(ci))) { 7310bee82fbSSage Weil err = vxattr->getxattr_cb(ci, value, size); 732a1dc1937Smajianpeng return err; 7330bee82fbSSage Weil } 7340bee82fbSSage Weil 735a1dc1937Smajianpeng spin_lock(&ci->i_ceph_lock); 736a1dc1937Smajianpeng dout("getxattr %p ver=%lld index_ver=%lld\n", inode, 737a1dc1937Smajianpeng ci->i_xattrs.version, ci->i_xattrs.index_version); 738a1dc1937Smajianpeng 739508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || 740508b32d8SYan, Zheng !__ceph_caps_issued_mask(ci, CEPH_CAP_XATTR_SHARED, 1)) { 741be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 742355da1ebSSage Weil /* get xattrs from mds (if we don't already have them) */ 743508b32d8SYan, Zheng err = ceph_do_getattr(inode, CEPH_STAT_CAP_XATTR, true); 744355da1ebSSage Weil if (err) 745355da1ebSSage Weil return err; 746be655596SSage Weil spin_lock(&ci->i_ceph_lock); 747508b32d8SYan, Zheng } 748355da1ebSSage Weil 749355da1ebSSage Weil err = __build_xattrs(inode); 750355da1ebSSage Weil if (err < 0) 751355da1ebSSage Weil goto out; 752355da1ebSSage Weil 753355da1ebSSage Weil err = -ENODATA; /* == ENOATTR */ 754355da1ebSSage Weil xattr = __get_xattr(ci, name); 7550bee82fbSSage Weil if (!xattr) 756355da1ebSSage Weil goto out; 757355da1ebSSage Weil 758355da1ebSSage Weil err = -ERANGE; 759355da1ebSSage Weil if (size && size < xattr->val_len) 760355da1ebSSage Weil goto out; 761355da1ebSSage Weil 762355da1ebSSage Weil err = xattr->val_len; 763355da1ebSSage Weil if (size == 0) 764355da1ebSSage Weil goto out; 765355da1ebSSage Weil 766355da1ebSSage Weil memcpy(value, xattr->val, xattr->val_len); 767355da1ebSSage Weil 768355da1ebSSage Weil out: 769be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 770355da1ebSSage Weil return err; 771355da1ebSSage Weil } 772355da1ebSSage Weil 7737221fe4cSGuangliang Zhao ssize_t ceph_getxattr(struct dentry *dentry, const char *name, void *value, 7747221fe4cSGuangliang Zhao size_t size) 7757221fe4cSGuangliang Zhao { 7767221fe4cSGuangliang Zhao if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN)) 7777221fe4cSGuangliang Zhao return generic_getxattr(dentry, name, value, size); 7787221fe4cSGuangliang Zhao 7797221fe4cSGuangliang Zhao return __ceph_getxattr(dentry->d_inode, name, value, size); 7807221fe4cSGuangliang Zhao } 7817221fe4cSGuangliang Zhao 782355da1ebSSage Weil ssize_t ceph_listxattr(struct dentry *dentry, char *names, size_t size) 783355da1ebSSage Weil { 784355da1ebSSage Weil struct inode *inode = dentry->d_inode; 785355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 786881a5fa2SAlex Elder struct ceph_vxattr *vxattrs = ceph_inode_vxattrs(inode); 787355da1ebSSage Weil u32 vir_namelen = 0; 788355da1ebSSage Weil u32 namelen; 789355da1ebSSage Weil int err; 790355da1ebSSage Weil u32 len; 791355da1ebSSage Weil int i; 792355da1ebSSage Weil 793be655596SSage Weil spin_lock(&ci->i_ceph_lock); 794355da1ebSSage Weil dout("listxattr %p ver=%lld index_ver=%lld\n", inode, 795355da1ebSSage Weil ci->i_xattrs.version, ci->i_xattrs.index_version); 796355da1ebSSage Weil 797508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || 798508b32d8SYan, Zheng !__ceph_caps_issued_mask(ci, CEPH_CAP_XATTR_SHARED, 1)) { 799be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 800508b32d8SYan, Zheng err = ceph_do_getattr(inode, CEPH_STAT_CAP_XATTR, true); 801355da1ebSSage Weil if (err) 802355da1ebSSage Weil return err; 803be655596SSage Weil spin_lock(&ci->i_ceph_lock); 804508b32d8SYan, Zheng } 805355da1ebSSage Weil 806355da1ebSSage Weil err = __build_xattrs(inode); 807355da1ebSSage Weil if (err < 0) 808355da1ebSSage Weil goto out; 8093ce6cd12SAlex Elder /* 8103ce6cd12SAlex Elder * Start with virtual dir xattr names (if any) (including 8113ce6cd12SAlex Elder * terminating '\0' characters for each). 8123ce6cd12SAlex Elder */ 8133ce6cd12SAlex Elder vir_namelen = ceph_vxattrs_name_size(vxattrs); 8143ce6cd12SAlex Elder 815355da1ebSSage Weil /* adding 1 byte per each variable due to the null termination */ 816b65917ddSSage Weil namelen = ci->i_xattrs.names_size + ci->i_xattrs.count; 817355da1ebSSage Weil err = -ERANGE; 818b65917ddSSage Weil if (size && vir_namelen + namelen > size) 819355da1ebSSage Weil goto out; 820355da1ebSSage Weil 821b65917ddSSage Weil err = namelen + vir_namelen; 822355da1ebSSage Weil if (size == 0) 823355da1ebSSage Weil goto out; 824355da1ebSSage Weil 825355da1ebSSage Weil names = __copy_xattr_names(ci, names); 826355da1ebSSage Weil 827355da1ebSSage Weil /* virtual xattr names, too */ 828b65917ddSSage Weil err = namelen; 829b65917ddSSage Weil if (vxattrs) { 830355da1ebSSage Weil for (i = 0; vxattrs[i].name; i++) { 831b65917ddSSage Weil if (!vxattrs[i].hidden && 832b65917ddSSage Weil !(vxattrs[i].exists_cb && 833b65917ddSSage Weil !vxattrs[i].exists_cb(ci))) { 834355da1ebSSage Weil len = sprintf(names, "%s", vxattrs[i].name); 835355da1ebSSage Weil names += len + 1; 836b65917ddSSage Weil err += len + 1; 837b65917ddSSage Weil } 838b65917ddSSage Weil } 839355da1ebSSage Weil } 840355da1ebSSage Weil 841355da1ebSSage Weil out: 842be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 843355da1ebSSage Weil return err; 844355da1ebSSage Weil } 845355da1ebSSage Weil 846355da1ebSSage Weil static int ceph_sync_setxattr(struct dentry *dentry, const char *name, 847355da1ebSSage Weil const char *value, size_t size, int flags) 848355da1ebSSage Weil { 8493d14c5d2SYehuda Sadeh struct ceph_fs_client *fsc = ceph_sb_to_client(dentry->d_sb); 850355da1ebSSage Weil struct inode *inode = dentry->d_inode; 851355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 852355da1ebSSage Weil struct ceph_mds_request *req; 8533d14c5d2SYehuda Sadeh struct ceph_mds_client *mdsc = fsc->mdsc; 854*25e6bae3SYan, Zheng struct ceph_pagelist *pagelist = NULL; 855355da1ebSSage Weil int err; 856355da1ebSSage Weil 857*25e6bae3SYan, Zheng if (value) { 858*25e6bae3SYan, Zheng /* copy value into pagelist */ 859*25e6bae3SYan, Zheng pagelist = kmalloc(sizeof(*pagelist), GFP_NOFS); 860*25e6bae3SYan, Zheng if (!pagelist) 861355da1ebSSage Weil return -ENOMEM; 862*25e6bae3SYan, Zheng 863*25e6bae3SYan, Zheng ceph_pagelist_init(pagelist); 864*25e6bae3SYan, Zheng err = ceph_pagelist_append(pagelist, value, size); 865*25e6bae3SYan, Zheng if (err) 866355da1ebSSage Weil goto out; 867*25e6bae3SYan, Zheng } else { 868*25e6bae3SYan, Zheng flags |= CEPH_XATTR_REMOVE; 869355da1ebSSage Weil } 870355da1ebSSage Weil 871355da1ebSSage Weil dout("setxattr value=%.*s\n", (int)size, value); 872355da1ebSSage Weil 873355da1ebSSage Weil /* do request */ 874355da1ebSSage Weil req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETXATTR, 875355da1ebSSage Weil USE_AUTH_MDS); 87660d87733SJulia Lawall if (IS_ERR(req)) { 87760d87733SJulia Lawall err = PTR_ERR(req); 87860d87733SJulia Lawall goto out; 87960d87733SJulia Lawall } 88070b666c3SSage Weil req->r_inode = inode; 88170b666c3SSage Weil ihold(inode); 882355da1ebSSage Weil req->r_inode_drop = CEPH_CAP_XATTR_SHARED; 883355da1ebSSage Weil req->r_num_caps = 1; 884355da1ebSSage Weil req->r_args.setxattr.flags = cpu_to_le32(flags); 885355da1ebSSage Weil req->r_path2 = kstrdup(name, GFP_NOFS); 886355da1ebSSage Weil 887*25e6bae3SYan, Zheng req->r_pagelist = pagelist; 888*25e6bae3SYan, Zheng pagelist = NULL; 889355da1ebSSage Weil 890355da1ebSSage Weil dout("xattr.ver (before): %lld\n", ci->i_xattrs.version); 891752c8bdcSSage Weil err = ceph_mdsc_do_request(mdsc, NULL, req); 892355da1ebSSage Weil ceph_mdsc_put_request(req); 893355da1ebSSage Weil dout("xattr.ver (after): %lld\n", ci->i_xattrs.version); 894355da1ebSSage Weil 895355da1ebSSage Weil out: 896*25e6bae3SYan, Zheng if (pagelist) 897*25e6bae3SYan, Zheng ceph_pagelist_release(pagelist); 898355da1ebSSage Weil return err; 899355da1ebSSage Weil } 900355da1ebSSage Weil 9017221fe4cSGuangliang Zhao int __ceph_setxattr(struct dentry *dentry, const char *name, 902355da1ebSSage Weil const void *value, size_t size, int flags) 903355da1ebSSage Weil { 904355da1ebSSage Weil struct inode *inode = dentry->d_inode; 905881a5fa2SAlex Elder struct ceph_vxattr *vxattr; 906355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 90718fa8b3fSAlex Elder int issued; 908355da1ebSSage Weil int err; 909fbc0b970SYan, Zheng int dirty = 0; 910355da1ebSSage Weil int name_len = strlen(name); 911355da1ebSSage Weil int val_len = size; 912355da1ebSSage Weil char *newname = NULL; 913355da1ebSSage Weil char *newval = NULL; 914355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 915355da1ebSSage Weil int required_blob_size; 916355da1ebSSage Weil 917355da1ebSSage Weil if (!ceph_is_valid_xattr(name)) 918355da1ebSSage Weil return -EOPNOTSUPP; 919355da1ebSSage Weil 92006476a69SAlex Elder vxattr = ceph_match_vxattr(inode, name); 921355da1ebSSage Weil if (vxattr && vxattr->readonly) 922355da1ebSSage Weil return -EOPNOTSUPP; 923355da1ebSSage Weil 9243adf654dSSage Weil /* pass any unhandled ceph.* xattrs through to the MDS */ 9253adf654dSSage Weil if (!strncmp(name, XATTR_CEPH_PREFIX, XATTR_CEPH_PREFIX_LEN)) 9263adf654dSSage Weil goto do_sync_unlocked; 9273adf654dSSage Weil 928355da1ebSSage Weil /* preallocate memory for xattr name, value, index node */ 929355da1ebSSage Weil err = -ENOMEM; 93061413c2fSJulia Lawall newname = kmemdup(name, name_len + 1, GFP_NOFS); 931355da1ebSSage Weil if (!newname) 932355da1ebSSage Weil goto out; 933355da1ebSSage Weil 934355da1ebSSage Weil if (val_len) { 935b829c195SAlex Elder newval = kmemdup(value, val_len, GFP_NOFS); 936355da1ebSSage Weil if (!newval) 937355da1ebSSage Weil goto out; 938355da1ebSSage Weil } 939355da1ebSSage Weil 940355da1ebSSage Weil xattr = kmalloc(sizeof(struct ceph_inode_xattr), GFP_NOFS); 941355da1ebSSage Weil if (!xattr) 942355da1ebSSage Weil goto out; 943355da1ebSSage Weil 944be655596SSage Weil spin_lock(&ci->i_ceph_lock); 945355da1ebSSage Weil retry: 946355da1ebSSage Weil issued = __ceph_caps_issued(ci, NULL); 94718fa8b3fSAlex Elder dout("setxattr %p issued %s\n", inode, ceph_cap_string(issued)); 948508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || !(issued & CEPH_CAP_XATTR_EXCL)) 949355da1ebSSage Weil goto do_sync; 950355da1ebSSage Weil __build_xattrs(inode); 951355da1ebSSage Weil 952355da1ebSSage Weil required_blob_size = __get_required_blob_size(ci, name_len, val_len); 953355da1ebSSage Weil 954355da1ebSSage Weil if (!ci->i_xattrs.prealloc_blob || 955355da1ebSSage Weil required_blob_size > ci->i_xattrs.prealloc_blob->alloc_len) { 95618fa8b3fSAlex Elder struct ceph_buffer *blob; 957355da1ebSSage Weil 958be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 959355da1ebSSage Weil dout(" preaallocating new blob size=%d\n", required_blob_size); 960b6c1d5b8SSage Weil blob = ceph_buffer_new(required_blob_size, GFP_NOFS); 961355da1ebSSage Weil if (!blob) 962355da1ebSSage Weil goto out; 963be655596SSage Weil spin_lock(&ci->i_ceph_lock); 964b6c1d5b8SSage Weil if (ci->i_xattrs.prealloc_blob) 965355da1ebSSage Weil ceph_buffer_put(ci->i_xattrs.prealloc_blob); 966355da1ebSSage Weil ci->i_xattrs.prealloc_blob = blob; 967355da1ebSSage Weil goto retry; 968355da1ebSSage Weil } 969355da1ebSSage Weil 970bcdfeb2eSYan, Zheng err = __set_xattr(ci, newname, name_len, newval, val_len, 971bcdfeb2eSYan, Zheng flags, value ? 1 : -1, &xattr); 97218fa8b3fSAlex Elder 973fbc0b970SYan, Zheng if (!err) { 974fca65b4aSSage Weil dirty = __ceph_mark_dirty_caps(ci, CEPH_CAP_XATTR_EXCL); 975355da1ebSSage Weil ci->i_xattrs.dirty = true; 976355da1ebSSage Weil inode->i_ctime = CURRENT_TIME; 977fbc0b970SYan, Zheng } 97818fa8b3fSAlex Elder 979be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 980fca65b4aSSage Weil if (dirty) 981fca65b4aSSage Weil __mark_inode_dirty(inode, dirty); 982355da1ebSSage Weil return err; 983355da1ebSSage Weil 984355da1ebSSage Weil do_sync: 985be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 9863adf654dSSage Weil do_sync_unlocked: 987355da1ebSSage Weil err = ceph_sync_setxattr(dentry, name, value, size, flags); 988355da1ebSSage Weil out: 989355da1ebSSage Weil kfree(newname); 990355da1ebSSage Weil kfree(newval); 991355da1ebSSage Weil kfree(xattr); 992355da1ebSSage Weil return err; 993355da1ebSSage Weil } 994355da1ebSSage Weil 9957221fe4cSGuangliang Zhao int ceph_setxattr(struct dentry *dentry, const char *name, 9967221fe4cSGuangliang Zhao const void *value, size_t size, int flags) 9977221fe4cSGuangliang Zhao { 9987221fe4cSGuangliang Zhao if (ceph_snap(dentry->d_inode) != CEPH_NOSNAP) 9997221fe4cSGuangliang Zhao return -EROFS; 10007221fe4cSGuangliang Zhao 10017221fe4cSGuangliang Zhao if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN)) 10027221fe4cSGuangliang Zhao return generic_setxattr(dentry, name, value, size, flags); 10037221fe4cSGuangliang Zhao 10047221fe4cSGuangliang Zhao return __ceph_setxattr(dentry, name, value, size, flags); 10057221fe4cSGuangliang Zhao } 10067221fe4cSGuangliang Zhao 1007355da1ebSSage Weil static int ceph_send_removexattr(struct dentry *dentry, const char *name) 1008355da1ebSSage Weil { 10093d14c5d2SYehuda Sadeh struct ceph_fs_client *fsc = ceph_sb_to_client(dentry->d_sb); 10103d14c5d2SYehuda Sadeh struct ceph_mds_client *mdsc = fsc->mdsc; 1011355da1ebSSage Weil struct inode *inode = dentry->d_inode; 1012355da1ebSSage Weil struct ceph_mds_request *req; 1013355da1ebSSage Weil int err; 1014355da1ebSSage Weil 1015355da1ebSSage Weil req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_RMXATTR, 1016355da1ebSSage Weil USE_AUTH_MDS); 1017355da1ebSSage Weil if (IS_ERR(req)) 1018355da1ebSSage Weil return PTR_ERR(req); 101970b666c3SSage Weil req->r_inode = inode; 102070b666c3SSage Weil ihold(inode); 1021355da1ebSSage Weil req->r_inode_drop = CEPH_CAP_XATTR_SHARED; 1022355da1ebSSage Weil req->r_num_caps = 1; 1023355da1ebSSage Weil req->r_path2 = kstrdup(name, GFP_NOFS); 1024355da1ebSSage Weil 1025752c8bdcSSage Weil err = ceph_mdsc_do_request(mdsc, NULL, req); 1026355da1ebSSage Weil ceph_mdsc_put_request(req); 1027355da1ebSSage Weil return err; 1028355da1ebSSage Weil } 1029355da1ebSSage Weil 10307221fe4cSGuangliang Zhao int __ceph_removexattr(struct dentry *dentry, const char *name) 1031355da1ebSSage Weil { 1032355da1ebSSage Weil struct inode *inode = dentry->d_inode; 1033881a5fa2SAlex Elder struct ceph_vxattr *vxattr; 1034355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 1035355da1ebSSage Weil int issued; 1036355da1ebSSage Weil int err; 103783eb26afSAlex Elder int required_blob_size; 1038fca65b4aSSage Weil int dirty; 1039355da1ebSSage Weil 1040355da1ebSSage Weil if (!ceph_is_valid_xattr(name)) 1041355da1ebSSage Weil return -EOPNOTSUPP; 1042355da1ebSSage Weil 104306476a69SAlex Elder vxattr = ceph_match_vxattr(inode, name); 1044355da1ebSSage Weil if (vxattr && vxattr->readonly) 1045355da1ebSSage Weil return -EOPNOTSUPP; 1046355da1ebSSage Weil 1047d421acb1SSage Weil /* pass any unhandled ceph.* xattrs through to the MDS */ 1048d421acb1SSage Weil if (!strncmp(name, XATTR_CEPH_PREFIX, XATTR_CEPH_PREFIX_LEN)) 1049d421acb1SSage Weil goto do_sync_unlocked; 1050d421acb1SSage Weil 105183eb26afSAlex Elder err = -ENOMEM; 1052be655596SSage Weil spin_lock(&ci->i_ceph_lock); 105383eb26afSAlex Elder retry: 1054355da1ebSSage Weil issued = __ceph_caps_issued(ci, NULL); 1055355da1ebSSage Weil dout("removexattr %p issued %s\n", inode, ceph_cap_string(issued)); 1056355da1ebSSage Weil 1057508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || !(issued & CEPH_CAP_XATTR_EXCL)) 1058355da1ebSSage Weil goto do_sync; 105918fa8b3fSAlex Elder __build_xattrs(inode); 1060355da1ebSSage Weil 106183eb26afSAlex Elder required_blob_size = __get_required_blob_size(ci, 0, 0); 106283eb26afSAlex Elder 106383eb26afSAlex Elder if (!ci->i_xattrs.prealloc_blob || 106483eb26afSAlex Elder required_blob_size > ci->i_xattrs.prealloc_blob->alloc_len) { 106583eb26afSAlex Elder struct ceph_buffer *blob; 106683eb26afSAlex Elder 106783eb26afSAlex Elder spin_unlock(&ci->i_ceph_lock); 106883eb26afSAlex Elder dout(" preaallocating new blob size=%d\n", required_blob_size); 106983eb26afSAlex Elder blob = ceph_buffer_new(required_blob_size, GFP_NOFS); 107083eb26afSAlex Elder if (!blob) 107183eb26afSAlex Elder goto out; 107283eb26afSAlex Elder spin_lock(&ci->i_ceph_lock); 107383eb26afSAlex Elder if (ci->i_xattrs.prealloc_blob) 107483eb26afSAlex Elder ceph_buffer_put(ci->i_xattrs.prealloc_blob); 107583eb26afSAlex Elder ci->i_xattrs.prealloc_blob = blob; 107683eb26afSAlex Elder goto retry; 107783eb26afSAlex Elder } 107883eb26afSAlex Elder 1079355da1ebSSage Weil err = __remove_xattr_by_name(ceph_inode(inode), name); 108018fa8b3fSAlex Elder 1081fca65b4aSSage Weil dirty = __ceph_mark_dirty_caps(ci, CEPH_CAP_XATTR_EXCL); 1082355da1ebSSage Weil ci->i_xattrs.dirty = true; 1083355da1ebSSage Weil inode->i_ctime = CURRENT_TIME; 1084be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 1085fca65b4aSSage Weil if (dirty) 1086fca65b4aSSage Weil __mark_inode_dirty(inode, dirty); 1087355da1ebSSage Weil return err; 1088355da1ebSSage Weil do_sync: 1089be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 1090d421acb1SSage Weil do_sync_unlocked: 1091355da1ebSSage Weil err = ceph_send_removexattr(dentry, name); 109283eb26afSAlex Elder out: 1093355da1ebSSage Weil return err; 1094355da1ebSSage Weil } 1095355da1ebSSage Weil 10967221fe4cSGuangliang Zhao int ceph_removexattr(struct dentry *dentry, const char *name) 10977221fe4cSGuangliang Zhao { 10987221fe4cSGuangliang Zhao if (ceph_snap(dentry->d_inode) != CEPH_NOSNAP) 10997221fe4cSGuangliang Zhao return -EROFS; 11007221fe4cSGuangliang Zhao 11017221fe4cSGuangliang Zhao if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN)) 11027221fe4cSGuangliang Zhao return generic_removexattr(dentry, name); 11037221fe4cSGuangliang Zhao 11047221fe4cSGuangliang Zhao return __ceph_removexattr(dentry, name); 11057221fe4cSGuangliang Zhao } 1106