1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0 23d14c5d2SYehuda Sadeh #include <linux/ceph/ceph_debug.h> 325e6bae3SYan, Zheng #include <linux/ceph/pagelist.h> 43d14c5d2SYehuda Sadeh 5355da1ebSSage Weil #include "super.h" 63d14c5d2SYehuda Sadeh #include "mds_client.h" 73d14c5d2SYehuda Sadeh 83d14c5d2SYehuda Sadeh #include <linux/ceph/decode.h> 9355da1ebSSage Weil 10355da1ebSSage Weil #include <linux/xattr.h> 11ac6713ccSYan, Zheng #include <linux/security.h> 124db658eaSLinus Torvalds #include <linux/posix_acl_xattr.h> 135a0e3ad6STejun Heo #include <linux/slab.h> 14355da1ebSSage Weil 1522891907SAlex Elder #define XATTR_CEPH_PREFIX "ceph." 1622891907SAlex Elder #define XATTR_CEPH_PREFIX_LEN (sizeof (XATTR_CEPH_PREFIX) - 1) 1722891907SAlex Elder 18bcdfeb2eSYan, Zheng static int __remove_xattr(struct ceph_inode_info *ci, 19bcdfeb2eSYan, Zheng struct ceph_inode_xattr *xattr); 20bcdfeb2eSYan, Zheng 21355da1ebSSage Weil static bool ceph_is_valid_xattr(const char *name) 22355da1ebSSage Weil { 23b8fe918bSJeff Layton return !strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) || 24b8fe918bSJeff Layton !strncmp(name, XATTR_CEPH_PREFIX, XATTR_CEPH_PREFIX_LEN) || 25355da1ebSSage Weil !strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN) || 26355da1ebSSage Weil !strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN); 27355da1ebSSage Weil } 28355da1ebSSage Weil 29355da1ebSSage Weil /* 30355da1ebSSage Weil * These define virtual xattrs exposing the recursive directory 31355da1ebSSage Weil * statistics and layout metadata. 32355da1ebSSage Weil */ 33881a5fa2SAlex Elder struct ceph_vxattr { 34355da1ebSSage Weil char *name; 353ce6cd12SAlex Elder size_t name_size; /* strlen(name) + 1 (for '\0') */ 36f1d1b51dSJeff Layton ssize_t (*getxattr_cb)(struct ceph_inode_info *ci, char *val, 37355da1ebSSage Weil size_t size); 38f36e4472SSage Weil bool (*exists_cb)(struct ceph_inode_info *ci); 394e9906e7SYan, Zheng unsigned int flags; 40355da1ebSSage Weil }; 41355da1ebSSage Weil 424e9906e7SYan, Zheng #define VXATTR_FLAG_READONLY (1<<0) 434e9906e7SYan, Zheng #define VXATTR_FLAG_HIDDEN (1<<1) 4449a9f4f6SYan, Zheng #define VXATTR_FLAG_RSTAT (1<<2) 4581048c00SJeff Layton #define VXATTR_FLAG_DIRSTAT (1<<3) 464e9906e7SYan, Zheng 4732ab0bd7SSage Weil /* layouts */ 4832ab0bd7SSage Weil 4932ab0bd7SSage Weil static bool ceph_vxattrcb_layout_exists(struct ceph_inode_info *ci) 5032ab0bd7SSage Weil { 51779fe0fbSYan, Zheng struct ceph_file_layout *fl = &ci->i_layout; 52779fe0fbSYan, Zheng return (fl->stripe_unit > 0 || fl->stripe_count > 0 || 53779fe0fbSYan, Zheng fl->object_size > 0 || fl->pool_id >= 0 || 54779fe0fbSYan, Zheng rcu_dereference_raw(fl->pool_ns) != NULL); 5532ab0bd7SSage Weil } 5632ab0bd7SSage Weil 57f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout(struct ceph_inode_info *ci, char *val, 5832ab0bd7SSage Weil size_t size) 5932ab0bd7SSage Weil { 6032ab0bd7SSage Weil struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 6132ab0bd7SSage Weil struct ceph_osd_client *osdc = &fsc->client->osdc; 62779fe0fbSYan, Zheng struct ceph_string *pool_ns; 637627151eSYan, Zheng s64 pool = ci->i_layout.pool_id; 6432ab0bd7SSage Weil const char *pool_name; 65779fe0fbSYan, Zheng const char *ns_field = " pool_namespace="; 661e5c6649SYan, Zheng char buf[128]; 67779fe0fbSYan, Zheng size_t len, total_len = 0; 683b421018SJeff Layton ssize_t ret; 69779fe0fbSYan, Zheng 70779fe0fbSYan, Zheng pool_ns = ceph_try_get_string(ci->i_layout.pool_ns); 7132ab0bd7SSage Weil 7232ab0bd7SSage Weil dout("ceph_vxattrcb_layout %p\n", &ci->vfs_inode); 735aea3dcdSIlya Dryomov down_read(&osdc->lock); 7432ab0bd7SSage Weil pool_name = ceph_pg_pool_name_by_id(osdc->osdmap, pool); 751e5c6649SYan, Zheng if (pool_name) { 76779fe0fbSYan, Zheng len = snprintf(buf, sizeof(buf), 777627151eSYan, Zheng "stripe_unit=%u stripe_count=%u object_size=%u pool=", 787627151eSYan, Zheng ci->i_layout.stripe_unit, ci->i_layout.stripe_count, 797627151eSYan, Zheng ci->i_layout.object_size); 80779fe0fbSYan, Zheng total_len = len + strlen(pool_name); 811e5c6649SYan, Zheng } else { 82779fe0fbSYan, Zheng len = snprintf(buf, sizeof(buf), 837627151eSYan, Zheng "stripe_unit=%u stripe_count=%u object_size=%u pool=%lld", 847627151eSYan, Zheng ci->i_layout.stripe_unit, ci->i_layout.stripe_count, 85f1d1b51dSJeff Layton ci->i_layout.object_size, pool); 86779fe0fbSYan, Zheng total_len = len; 87779fe0fbSYan, Zheng } 88779fe0fbSYan, Zheng 89779fe0fbSYan, Zheng if (pool_ns) 90779fe0fbSYan, Zheng total_len += strlen(ns_field) + pool_ns->len; 91779fe0fbSYan, Zheng 92779fe0fbSYan, Zheng ret = total_len; 933b421018SJeff Layton if (size >= total_len) { 94779fe0fbSYan, Zheng memcpy(val, buf, len); 95779fe0fbSYan, Zheng ret = len; 96779fe0fbSYan, Zheng if (pool_name) { 97779fe0fbSYan, Zheng len = strlen(pool_name); 98779fe0fbSYan, Zheng memcpy(val + ret, pool_name, len); 99779fe0fbSYan, Zheng ret += len; 100779fe0fbSYan, Zheng } 101779fe0fbSYan, Zheng if (pool_ns) { 102779fe0fbSYan, Zheng len = strlen(ns_field); 103779fe0fbSYan, Zheng memcpy(val + ret, ns_field, len); 104779fe0fbSYan, Zheng ret += len; 105779fe0fbSYan, Zheng memcpy(val + ret, pool_ns->str, pool_ns->len); 106779fe0fbSYan, Zheng ret += pool_ns->len; 1071e5c6649SYan, Zheng } 1081e5c6649SYan, Zheng } 1095aea3dcdSIlya Dryomov up_read(&osdc->lock); 110779fe0fbSYan, Zheng ceph_put_string(pool_ns); 11132ab0bd7SSage Weil return ret; 11232ab0bd7SSage Weil } 11332ab0bd7SSage Weil 11426350535SJeff Layton /* 11526350535SJeff Layton * The convention with strings in xattrs is that they should not be NULL 11626350535SJeff Layton * terminated, since we're returning the length with them. snprintf always 11726350535SJeff Layton * NULL terminates however, so call it on a temporary buffer and then memcpy 11826350535SJeff Layton * the result into place. 11926350535SJeff Layton */ 120f6fbdcd9SIlya Dryomov static __printf(3, 4) 121f6fbdcd9SIlya Dryomov int ceph_fmt_xattr(char *val, size_t size, const char *fmt, ...) 12226350535SJeff Layton { 12326350535SJeff Layton int ret; 12426350535SJeff Layton va_list args; 12526350535SJeff Layton char buf[96]; /* NB: reevaluate size if new vxattrs are added */ 12626350535SJeff Layton 12726350535SJeff Layton va_start(args, fmt); 12826350535SJeff Layton ret = vsnprintf(buf, size ? sizeof(buf) : 0, fmt, args); 12926350535SJeff Layton va_end(args); 13026350535SJeff Layton 13126350535SJeff Layton /* Sanity check */ 13226350535SJeff Layton if (size && ret + 1 > sizeof(buf)) { 13326350535SJeff Layton WARN_ONCE(true, "Returned length too big (%d)", ret); 13426350535SJeff Layton return -E2BIG; 13526350535SJeff Layton } 13626350535SJeff Layton 13726350535SJeff Layton if (ret <= size) 13826350535SJeff Layton memcpy(val, buf, ret); 13926350535SJeff Layton return ret; 14026350535SJeff Layton } 14126350535SJeff Layton 142f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_stripe_unit(struct ceph_inode_info *ci, 143695b7119SSage Weil char *val, size_t size) 144695b7119SSage Weil { 14526350535SJeff Layton return ceph_fmt_xattr(val, size, "%u", ci->i_layout.stripe_unit); 146695b7119SSage Weil } 147695b7119SSage Weil 148f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_stripe_count(struct ceph_inode_info *ci, 149695b7119SSage Weil char *val, size_t size) 150695b7119SSage Weil { 15126350535SJeff Layton return ceph_fmt_xattr(val, size, "%u", ci->i_layout.stripe_count); 152695b7119SSage Weil } 153695b7119SSage Weil 154f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_object_size(struct ceph_inode_info *ci, 155695b7119SSage Weil char *val, size_t size) 156695b7119SSage Weil { 15726350535SJeff Layton return ceph_fmt_xattr(val, size, "%u", ci->i_layout.object_size); 158695b7119SSage Weil } 159695b7119SSage Weil 160f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_pool(struct ceph_inode_info *ci, 161695b7119SSage Weil char *val, size_t size) 162695b7119SSage Weil { 163f1d1b51dSJeff Layton ssize_t ret; 164695b7119SSage Weil struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 165695b7119SSage Weil struct ceph_osd_client *osdc = &fsc->client->osdc; 1667627151eSYan, Zheng s64 pool = ci->i_layout.pool_id; 167695b7119SSage Weil const char *pool_name; 168695b7119SSage Weil 1695aea3dcdSIlya Dryomov down_read(&osdc->lock); 170695b7119SSage Weil pool_name = ceph_pg_pool_name_by_id(osdc->osdmap, pool); 17126350535SJeff Layton if (pool_name) { 17226350535SJeff Layton ret = strlen(pool_name); 17326350535SJeff Layton if (ret <= size) 17426350535SJeff Layton memcpy(val, pool_name, ret); 17526350535SJeff Layton } else { 17626350535SJeff Layton ret = ceph_fmt_xattr(val, size, "%lld", pool); 17726350535SJeff Layton } 1785aea3dcdSIlya Dryomov up_read(&osdc->lock); 179695b7119SSage Weil return ret; 180695b7119SSage Weil } 181695b7119SSage Weil 182f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_pool_namespace(struct ceph_inode_info *ci, 183779fe0fbSYan, Zheng char *val, size_t size) 184779fe0fbSYan, Zheng { 18526350535SJeff Layton ssize_t ret = 0; 186779fe0fbSYan, Zheng struct ceph_string *ns = ceph_try_get_string(ci->i_layout.pool_ns); 18726350535SJeff Layton 188779fe0fbSYan, Zheng if (ns) { 18926350535SJeff Layton ret = ns->len; 19026350535SJeff Layton if (ret <= size) 19126350535SJeff Layton memcpy(val, ns->str, ret); 192779fe0fbSYan, Zheng ceph_put_string(ns); 193779fe0fbSYan, Zheng } 194779fe0fbSYan, Zheng return ret; 195779fe0fbSYan, Zheng } 196779fe0fbSYan, Zheng 197355da1ebSSage Weil /* directories */ 198355da1ebSSage Weil 199f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_entries(struct ceph_inode_info *ci, char *val, 200355da1ebSSage Weil size_t size) 201355da1ebSSage Weil { 20226350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_files + ci->i_subdirs); 203355da1ebSSage Weil } 204355da1ebSSage Weil 205f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_files(struct ceph_inode_info *ci, char *val, 206355da1ebSSage Weil size_t size) 207355da1ebSSage Weil { 20826350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_files); 209355da1ebSSage Weil } 210355da1ebSSage Weil 211f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_subdirs(struct ceph_inode_info *ci, char *val, 212355da1ebSSage Weil size_t size) 213355da1ebSSage Weil { 21426350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_subdirs); 215355da1ebSSage Weil } 216355da1ebSSage Weil 217f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rentries(struct ceph_inode_info *ci, char *val, 218355da1ebSSage Weil size_t size) 219355da1ebSSage Weil { 22026350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", 22126350535SJeff Layton ci->i_rfiles + ci->i_rsubdirs); 222355da1ebSSage Weil } 223355da1ebSSage Weil 224f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rfiles(struct ceph_inode_info *ci, char *val, 225355da1ebSSage Weil size_t size) 226355da1ebSSage Weil { 22726350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_rfiles); 228355da1ebSSage Weil } 229355da1ebSSage Weil 230f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rsubdirs(struct ceph_inode_info *ci, char *val, 231355da1ebSSage Weil size_t size) 232355da1ebSSage Weil { 23326350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_rsubdirs); 234355da1ebSSage Weil } 235355da1ebSSage Weil 236e7f72952SYanhu Cao static ssize_t ceph_vxattrcb_dir_rsnaps(struct ceph_inode_info *ci, char *val, 237e7f72952SYanhu Cao size_t size) 238e7f72952SYanhu Cao { 239e7f72952SYanhu Cao return ceph_fmt_xattr(val, size, "%lld", ci->i_rsnaps); 240e7f72952SYanhu Cao } 241e7f72952SYanhu Cao 242f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rbytes(struct ceph_inode_info *ci, char *val, 243355da1ebSSage Weil size_t size) 244355da1ebSSage Weil { 24526350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_rbytes); 246355da1ebSSage Weil } 247355da1ebSSage Weil 248f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rctime(struct ceph_inode_info *ci, char *val, 249355da1ebSSage Weil size_t size) 250355da1ebSSage Weil { 25126350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld.%09ld", ci->i_rctime.tv_sec, 2529bbeab41SArnd Bergmann ci->i_rctime.tv_nsec); 253355da1ebSSage Weil } 254355da1ebSSage Weil 25508796873SYan, Zheng /* dir pin */ 25608796873SYan, Zheng static bool ceph_vxattrcb_dir_pin_exists(struct ceph_inode_info *ci) 25708796873SYan, Zheng { 25808796873SYan, Zheng return ci->i_dir_pin != -ENODATA; 25908796873SYan, Zheng } 260fb18a575SLuis Henriques 261f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_pin(struct ceph_inode_info *ci, char *val, 26208796873SYan, Zheng size_t size) 26308796873SYan, Zheng { 26426350535SJeff Layton return ceph_fmt_xattr(val, size, "%d", (int)ci->i_dir_pin); 26508796873SYan, Zheng } 26608796873SYan, Zheng 26708796873SYan, Zheng /* quotas */ 268fb18a575SLuis Henriques static bool ceph_vxattrcb_quota_exists(struct ceph_inode_info *ci) 269fb18a575SLuis Henriques { 270f1919826SYan, Zheng bool ret = false; 271f1919826SYan, Zheng spin_lock(&ci->i_ceph_lock); 272f1919826SYan, Zheng if ((ci->i_max_files || ci->i_max_bytes) && 273f1919826SYan, Zheng ci->i_vino.snap == CEPH_NOSNAP && 274f1919826SYan, Zheng ci->i_snap_realm && 275f1919826SYan, Zheng ci->i_snap_realm->ino == ci->i_vino.ino) 276f1919826SYan, Zheng ret = true; 277f1919826SYan, Zheng spin_unlock(&ci->i_ceph_lock); 278f1919826SYan, Zheng return ret; 279fb18a575SLuis Henriques } 280fb18a575SLuis Henriques 281f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_quota(struct ceph_inode_info *ci, char *val, 282fb18a575SLuis Henriques size_t size) 283fb18a575SLuis Henriques { 28426350535SJeff Layton return ceph_fmt_xattr(val, size, "max_bytes=%llu max_files=%llu", 285fb18a575SLuis Henriques ci->i_max_bytes, ci->i_max_files); 286fb18a575SLuis Henriques } 287fb18a575SLuis Henriques 288f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_quota_max_bytes(struct ceph_inode_info *ci, 289fb18a575SLuis Henriques char *val, size_t size) 290fb18a575SLuis Henriques { 29126350535SJeff Layton return ceph_fmt_xattr(val, size, "%llu", ci->i_max_bytes); 292fb18a575SLuis Henriques } 293fb18a575SLuis Henriques 294f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_quota_max_files(struct ceph_inode_info *ci, 295fb18a575SLuis Henriques char *val, size_t size) 296fb18a575SLuis Henriques { 29726350535SJeff Layton return ceph_fmt_xattr(val, size, "%llu", ci->i_max_files); 298fb18a575SLuis Henriques } 29932ab0bd7SSage Weil 300100cc610SDavid Disseldorp /* snapshots */ 301100cc610SDavid Disseldorp static bool ceph_vxattrcb_snap_btime_exists(struct ceph_inode_info *ci) 302100cc610SDavid Disseldorp { 303100cc610SDavid Disseldorp return (ci->i_snap_btime.tv_sec != 0 || ci->i_snap_btime.tv_nsec != 0); 304100cc610SDavid Disseldorp } 305100cc610SDavid Disseldorp 306f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_snap_btime(struct ceph_inode_info *ci, char *val, 307100cc610SDavid Disseldorp size_t size) 308100cc610SDavid Disseldorp { 30926350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld.%09ld", ci->i_snap_btime.tv_sec, 310100cc610SDavid Disseldorp ci->i_snap_btime.tv_nsec); 311100cc610SDavid Disseldorp } 312100cc610SDavid Disseldorp 3135a9e2f5dSXiubo Li static ssize_t ceph_vxattrcb_cluster_fsid(struct ceph_inode_info *ci, 3145a9e2f5dSXiubo Li char *val, size_t size) 3155a9e2f5dSXiubo Li { 3165a9e2f5dSXiubo Li struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 3175a9e2f5dSXiubo Li 3185a9e2f5dSXiubo Li return ceph_fmt_xattr(val, size, "%pU", &fsc->client->fsid); 3195a9e2f5dSXiubo Li } 3205a9e2f5dSXiubo Li 3215a9e2f5dSXiubo Li static ssize_t ceph_vxattrcb_client_id(struct ceph_inode_info *ci, 3225a9e2f5dSXiubo Li char *val, size_t size) 3235a9e2f5dSXiubo Li { 3245a9e2f5dSXiubo Li struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 3255a9e2f5dSXiubo Li 3265a9e2f5dSXiubo Li return ceph_fmt_xattr(val, size, "client%lld", 3275a9e2f5dSXiubo Li ceph_client_gid(fsc->client)); 3285a9e2f5dSXiubo Li } 3295a9e2f5dSXiubo Li 330dd980fc0SLuis Henriques static ssize_t ceph_vxattrcb_caps(struct ceph_inode_info *ci, char *val, 331dd980fc0SLuis Henriques size_t size) 332dd980fc0SLuis Henriques { 333dd980fc0SLuis Henriques int issued; 334dd980fc0SLuis Henriques 335dd980fc0SLuis Henriques spin_lock(&ci->i_ceph_lock); 336dd980fc0SLuis Henriques issued = __ceph_caps_issued(ci, NULL); 337dd980fc0SLuis Henriques spin_unlock(&ci->i_ceph_lock); 338dd980fc0SLuis Henriques 339dd980fc0SLuis Henriques return ceph_fmt_xattr(val, size, "%s/0x%x", 340dd980fc0SLuis Henriques ceph_cap_string(issued), issued); 341dd980fc0SLuis Henriques } 342dd980fc0SLuis Henriques 34340e309deSJeff Layton static ssize_t ceph_vxattrcb_auth_mds(struct ceph_inode_info *ci, 34440e309deSJeff Layton char *val, size_t size) 34540e309deSJeff Layton { 34640e309deSJeff Layton int ret; 34740e309deSJeff Layton 34840e309deSJeff Layton spin_lock(&ci->i_ceph_lock); 34940e309deSJeff Layton ret = ceph_fmt_xattr(val, size, "%d", 35040e309deSJeff Layton ci->i_auth_cap ? ci->i_auth_cap->session->s_mds : -1); 35140e309deSJeff Layton spin_unlock(&ci->i_ceph_lock); 35240e309deSJeff Layton return ret; 35340e309deSJeff Layton } 35440e309deSJeff Layton 355eb788084SAlex Elder #define CEPH_XATTR_NAME(_type, _name) XATTR_CEPH_PREFIX #_type "." #_name 356695b7119SSage Weil #define CEPH_XATTR_NAME2(_type, _name, _name2) \ 357695b7119SSage Weil XATTR_CEPH_PREFIX #_type "." #_name "." #_name2 358eb788084SAlex Elder 35949a9f4f6SYan, Zheng #define XATTR_NAME_CEPH(_type, _name, _flags) \ 360eb788084SAlex Elder { \ 361eb788084SAlex Elder .name = CEPH_XATTR_NAME(_type, _name), \ 3623ce6cd12SAlex Elder .name_size = sizeof (CEPH_XATTR_NAME(_type, _name)), \ 363aa4066edSAlex Elder .getxattr_cb = ceph_vxattrcb_ ## _type ## _ ## _name, \ 364f36e4472SSage Weil .exists_cb = NULL, \ 36549a9f4f6SYan, Zheng .flags = (VXATTR_FLAG_READONLY | _flags), \ 366eb788084SAlex Elder } 36749a9f4f6SYan, Zheng #define XATTR_RSTAT_FIELD(_type, _name) \ 36849a9f4f6SYan, Zheng XATTR_NAME_CEPH(_type, _name, VXATTR_FLAG_RSTAT) 369695b7119SSage Weil #define XATTR_LAYOUT_FIELD(_type, _name, _field) \ 370695b7119SSage Weil { \ 371695b7119SSage Weil .name = CEPH_XATTR_NAME2(_type, _name, _field), \ 372695b7119SSage Weil .name_size = sizeof (CEPH_XATTR_NAME2(_type, _name, _field)), \ 373695b7119SSage Weil .getxattr_cb = ceph_vxattrcb_ ## _name ## _ ## _field, \ 374695b7119SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, \ 3754e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, \ 376695b7119SSage Weil } 377fb18a575SLuis Henriques #define XATTR_QUOTA_FIELD(_type, _name) \ 378fb18a575SLuis Henriques { \ 379fb18a575SLuis Henriques .name = CEPH_XATTR_NAME(_type, _name), \ 380fb18a575SLuis Henriques .name_size = sizeof(CEPH_XATTR_NAME(_type, _name)), \ 381fb18a575SLuis Henriques .getxattr_cb = ceph_vxattrcb_ ## _type ## _ ## _name, \ 382fb18a575SLuis Henriques .exists_cb = ceph_vxattrcb_quota_exists, \ 3834e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, \ 384fb18a575SLuis Henriques } 385eb788084SAlex Elder 386881a5fa2SAlex Elder static struct ceph_vxattr ceph_dir_vxattrs[] = { 3871f08f2b0SSage Weil { 3881f08f2b0SSage Weil .name = "ceph.dir.layout", 3891f08f2b0SSage Weil .name_size = sizeof("ceph.dir.layout"), 3901f08f2b0SSage Weil .getxattr_cb = ceph_vxattrcb_layout, 3911f08f2b0SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, 3924e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, 3931f08f2b0SSage Weil }, 394695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, stripe_unit), 395695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, stripe_count), 396695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, object_size), 397695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, pool), 398779fe0fbSYan, Zheng XATTR_LAYOUT_FIELD(dir, layout, pool_namespace), 39981048c00SJeff Layton XATTR_NAME_CEPH(dir, entries, VXATTR_FLAG_DIRSTAT), 40081048c00SJeff Layton XATTR_NAME_CEPH(dir, files, VXATTR_FLAG_DIRSTAT), 40181048c00SJeff Layton XATTR_NAME_CEPH(dir, subdirs, VXATTR_FLAG_DIRSTAT), 40249a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rentries), 40349a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rfiles), 40449a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rsubdirs), 405e7f72952SYanhu Cao XATTR_RSTAT_FIELD(dir, rsnaps), 40649a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rbytes), 40749a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rctime), 408fb18a575SLuis Henriques { 40908796873SYan, Zheng .name = "ceph.dir.pin", 410e1b81439SDavid Disseldorp .name_size = sizeof("ceph.dir.pin"), 41108796873SYan, Zheng .getxattr_cb = ceph_vxattrcb_dir_pin, 41208796873SYan, Zheng .exists_cb = ceph_vxattrcb_dir_pin_exists, 41308796873SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, 41408796873SYan, Zheng }, 41508796873SYan, Zheng { 416fb18a575SLuis Henriques .name = "ceph.quota", 417fb18a575SLuis Henriques .name_size = sizeof("ceph.quota"), 418fb18a575SLuis Henriques .getxattr_cb = ceph_vxattrcb_quota, 419fb18a575SLuis Henriques .exists_cb = ceph_vxattrcb_quota_exists, 4204e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, 421fb18a575SLuis Henriques }, 422fb18a575SLuis Henriques XATTR_QUOTA_FIELD(quota, max_bytes), 423fb18a575SLuis Henriques XATTR_QUOTA_FIELD(quota, max_files), 424100cc610SDavid Disseldorp { 425100cc610SDavid Disseldorp .name = "ceph.snap.btime", 426100cc610SDavid Disseldorp .name_size = sizeof("ceph.snap.btime"), 427100cc610SDavid Disseldorp .getxattr_cb = ceph_vxattrcb_snap_btime, 428100cc610SDavid Disseldorp .exists_cb = ceph_vxattrcb_snap_btime_exists, 429100cc610SDavid Disseldorp .flags = VXATTR_FLAG_READONLY, 430100cc610SDavid Disseldorp }, 431dd980fc0SLuis Henriques { 432dd980fc0SLuis Henriques .name = "ceph.caps", 433dd980fc0SLuis Henriques .name_size = sizeof("ceph.caps"), 434dd980fc0SLuis Henriques .getxattr_cb = ceph_vxattrcb_caps, 435dd980fc0SLuis Henriques .exists_cb = NULL, 436dd980fc0SLuis Henriques .flags = VXATTR_FLAG_HIDDEN, 437dd980fc0SLuis Henriques }, 4382c3dd4ffSAlex Elder { .name = NULL, 0 } /* Required table terminator */ 439355da1ebSSage Weil }; 440355da1ebSSage Weil 441355da1ebSSage Weil /* files */ 442355da1ebSSage Weil 443881a5fa2SAlex Elder static struct ceph_vxattr ceph_file_vxattrs[] = { 44432ab0bd7SSage Weil { 44532ab0bd7SSage Weil .name = "ceph.file.layout", 44632ab0bd7SSage Weil .name_size = sizeof("ceph.file.layout"), 44732ab0bd7SSage Weil .getxattr_cb = ceph_vxattrcb_layout, 44832ab0bd7SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, 4494e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, 45032ab0bd7SSage Weil }, 451695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, stripe_unit), 452695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, stripe_count), 453695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, object_size), 454695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, pool), 455779fe0fbSYan, Zheng XATTR_LAYOUT_FIELD(file, layout, pool_namespace), 456100cc610SDavid Disseldorp { 457100cc610SDavid Disseldorp .name = "ceph.snap.btime", 458100cc610SDavid Disseldorp .name_size = sizeof("ceph.snap.btime"), 459100cc610SDavid Disseldorp .getxattr_cb = ceph_vxattrcb_snap_btime, 460100cc610SDavid Disseldorp .exists_cb = ceph_vxattrcb_snap_btime_exists, 461100cc610SDavid Disseldorp .flags = VXATTR_FLAG_READONLY, 462100cc610SDavid Disseldorp }, 463dd980fc0SLuis Henriques { 464dd980fc0SLuis Henriques .name = "ceph.caps", 465dd980fc0SLuis Henriques .name_size = sizeof("ceph.caps"), 466dd980fc0SLuis Henriques .getxattr_cb = ceph_vxattrcb_caps, 467dd980fc0SLuis Henriques .exists_cb = NULL, 468dd980fc0SLuis Henriques .flags = VXATTR_FLAG_HIDDEN, 469dd980fc0SLuis Henriques }, 4702c3dd4ffSAlex Elder { .name = NULL, 0 } /* Required table terminator */ 471355da1ebSSage Weil }; 472355da1ebSSage Weil 4735a9e2f5dSXiubo Li static struct ceph_vxattr ceph_common_vxattrs[] = { 4745a9e2f5dSXiubo Li { 4755a9e2f5dSXiubo Li .name = "ceph.cluster_fsid", 4765a9e2f5dSXiubo Li .name_size = sizeof("ceph.cluster_fsid"), 4775a9e2f5dSXiubo Li .getxattr_cb = ceph_vxattrcb_cluster_fsid, 4785a9e2f5dSXiubo Li .exists_cb = NULL, 4795a9e2f5dSXiubo Li .flags = VXATTR_FLAG_READONLY, 4805a9e2f5dSXiubo Li }, 4815a9e2f5dSXiubo Li { 4825a9e2f5dSXiubo Li .name = "ceph.client_id", 4835a9e2f5dSXiubo Li .name_size = sizeof("ceph.client_id"), 4845a9e2f5dSXiubo Li .getxattr_cb = ceph_vxattrcb_client_id, 4855a9e2f5dSXiubo Li .exists_cb = NULL, 4865a9e2f5dSXiubo Li .flags = VXATTR_FLAG_READONLY, 4875a9e2f5dSXiubo Li }, 48840e309deSJeff Layton { 48940e309deSJeff Layton .name = "ceph.auth_mds", 49040e309deSJeff Layton .name_size = sizeof("ceph.auth_mds"), 49140e309deSJeff Layton .getxattr_cb = ceph_vxattrcb_auth_mds, 49240e309deSJeff Layton .exists_cb = NULL, 49340e309deSJeff Layton .flags = VXATTR_FLAG_READONLY, 49440e309deSJeff Layton }, 4955a9e2f5dSXiubo Li { .name = NULL, 0 } /* Required table terminator */ 4965a9e2f5dSXiubo Li }; 4975a9e2f5dSXiubo Li 498881a5fa2SAlex Elder static struct ceph_vxattr *ceph_inode_vxattrs(struct inode *inode) 499355da1ebSSage Weil { 500355da1ebSSage Weil if (S_ISDIR(inode->i_mode)) 501355da1ebSSage Weil return ceph_dir_vxattrs; 502355da1ebSSage Weil else if (S_ISREG(inode->i_mode)) 503355da1ebSSage Weil return ceph_file_vxattrs; 504355da1ebSSage Weil return NULL; 505355da1ebSSage Weil } 506355da1ebSSage Weil 507881a5fa2SAlex Elder static struct ceph_vxattr *ceph_match_vxattr(struct inode *inode, 508355da1ebSSage Weil const char *name) 509355da1ebSSage Weil { 510881a5fa2SAlex Elder struct ceph_vxattr *vxattr = ceph_inode_vxattrs(inode); 51106476a69SAlex Elder 51206476a69SAlex Elder if (vxattr) { 51306476a69SAlex Elder while (vxattr->name) { 51406476a69SAlex Elder if (!strcmp(vxattr->name, name)) 515355da1ebSSage Weil return vxattr; 516355da1ebSSage Weil vxattr++; 51706476a69SAlex Elder } 51806476a69SAlex Elder } 51906476a69SAlex Elder 5205a9e2f5dSXiubo Li vxattr = ceph_common_vxattrs; 5215a9e2f5dSXiubo Li while (vxattr->name) { 5225a9e2f5dSXiubo Li if (!strcmp(vxattr->name, name)) 5235a9e2f5dSXiubo Li return vxattr; 5245a9e2f5dSXiubo Li vxattr++; 5255a9e2f5dSXiubo Li } 5265a9e2f5dSXiubo Li 527355da1ebSSage Weil return NULL; 528355da1ebSSage Weil } 529355da1ebSSage Weil 530355da1ebSSage Weil static int __set_xattr(struct ceph_inode_info *ci, 531355da1ebSSage Weil const char *name, int name_len, 532355da1ebSSage Weil const char *val, int val_len, 533fbc0b970SYan, Zheng int flags, int update_xattr, 534355da1ebSSage Weil struct ceph_inode_xattr **newxattr) 535355da1ebSSage Weil { 536355da1ebSSage Weil struct rb_node **p; 537355da1ebSSage Weil struct rb_node *parent = NULL; 538355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 539355da1ebSSage Weil int c; 540355da1ebSSage Weil int new = 0; 541355da1ebSSage Weil 542355da1ebSSage Weil p = &ci->i_xattrs.index.rb_node; 543355da1ebSSage Weil while (*p) { 544355da1ebSSage Weil parent = *p; 545355da1ebSSage Weil xattr = rb_entry(parent, struct ceph_inode_xattr, node); 546355da1ebSSage Weil c = strncmp(name, xattr->name, min(name_len, xattr->name_len)); 547355da1ebSSage Weil if (c < 0) 548355da1ebSSage Weil p = &(*p)->rb_left; 549355da1ebSSage Weil else if (c > 0) 550355da1ebSSage Weil p = &(*p)->rb_right; 551355da1ebSSage Weil else { 552355da1ebSSage Weil if (name_len == xattr->name_len) 553355da1ebSSage Weil break; 554355da1ebSSage Weil else if (name_len < xattr->name_len) 555355da1ebSSage Weil p = &(*p)->rb_left; 556355da1ebSSage Weil else 557355da1ebSSage Weil p = &(*p)->rb_right; 558355da1ebSSage Weil } 559355da1ebSSage Weil xattr = NULL; 560355da1ebSSage Weil } 561355da1ebSSage Weil 562fbc0b970SYan, Zheng if (update_xattr) { 563fbc0b970SYan, Zheng int err = 0; 564eeca958dSLuis Henriques 565fbc0b970SYan, Zheng if (xattr && (flags & XATTR_CREATE)) 566fbc0b970SYan, Zheng err = -EEXIST; 567fbc0b970SYan, Zheng else if (!xattr && (flags & XATTR_REPLACE)) 568fbc0b970SYan, Zheng err = -ENODATA; 569fbc0b970SYan, Zheng if (err) { 570fbc0b970SYan, Zheng kfree(name); 571fbc0b970SYan, Zheng kfree(val); 572eeca958dSLuis Henriques kfree(*newxattr); 573fbc0b970SYan, Zheng return err; 574fbc0b970SYan, Zheng } 575bcdfeb2eSYan, Zheng if (update_xattr < 0) { 576bcdfeb2eSYan, Zheng if (xattr) 577bcdfeb2eSYan, Zheng __remove_xattr(ci, xattr); 578bcdfeb2eSYan, Zheng kfree(name); 579eeca958dSLuis Henriques kfree(*newxattr); 580bcdfeb2eSYan, Zheng return 0; 581bcdfeb2eSYan, Zheng } 582fbc0b970SYan, Zheng } 583fbc0b970SYan, Zheng 584355da1ebSSage Weil if (!xattr) { 585355da1ebSSage Weil new = 1; 586355da1ebSSage Weil xattr = *newxattr; 587355da1ebSSage Weil xattr->name = name; 588355da1ebSSage Weil xattr->name_len = name_len; 589fbc0b970SYan, Zheng xattr->should_free_name = update_xattr; 590355da1ebSSage Weil 591355da1ebSSage Weil ci->i_xattrs.count++; 592355da1ebSSage Weil dout("__set_xattr count=%d\n", ci->i_xattrs.count); 593355da1ebSSage Weil } else { 594355da1ebSSage Weil kfree(*newxattr); 595355da1ebSSage Weil *newxattr = NULL; 596355da1ebSSage Weil if (xattr->should_free_val) 597c00e4522SXu Wang kfree(xattr->val); 598355da1ebSSage Weil 599fbc0b970SYan, Zheng if (update_xattr) { 600c00e4522SXu Wang kfree(name); 601355da1ebSSage Weil name = xattr->name; 602355da1ebSSage Weil } 603355da1ebSSage Weil ci->i_xattrs.names_size -= xattr->name_len; 604355da1ebSSage Weil ci->i_xattrs.vals_size -= xattr->val_len; 605355da1ebSSage Weil } 606355da1ebSSage Weil ci->i_xattrs.names_size += name_len; 607355da1ebSSage Weil ci->i_xattrs.vals_size += val_len; 608355da1ebSSage Weil if (val) 609355da1ebSSage Weil xattr->val = val; 610355da1ebSSage Weil else 611355da1ebSSage Weil xattr->val = ""; 612355da1ebSSage Weil 613355da1ebSSage Weil xattr->val_len = val_len; 614fbc0b970SYan, Zheng xattr->dirty = update_xattr; 615fbc0b970SYan, Zheng xattr->should_free_val = (val && update_xattr); 616355da1ebSSage Weil 617355da1ebSSage Weil if (new) { 618355da1ebSSage Weil rb_link_node(&xattr->node, parent, p); 619355da1ebSSage Weil rb_insert_color(&xattr->node, &ci->i_xattrs.index); 620355da1ebSSage Weil dout("__set_xattr_val p=%p\n", p); 621355da1ebSSage Weil } 622355da1ebSSage Weil 62305729781SYan, Zheng dout("__set_xattr_val added %llx.%llx xattr %p %.*s=%.*s\n", 62405729781SYan, Zheng ceph_vinop(&ci->vfs_inode), xattr, name_len, name, val_len, val); 625355da1ebSSage Weil 626355da1ebSSage Weil return 0; 627355da1ebSSage Weil } 628355da1ebSSage Weil 629355da1ebSSage Weil static struct ceph_inode_xattr *__get_xattr(struct ceph_inode_info *ci, 630355da1ebSSage Weil const char *name) 631355da1ebSSage Weil { 632355da1ebSSage Weil struct rb_node **p; 633355da1ebSSage Weil struct rb_node *parent = NULL; 634355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 63517db143fSSage Weil int name_len = strlen(name); 636355da1ebSSage Weil int c; 637355da1ebSSage Weil 638355da1ebSSage Weil p = &ci->i_xattrs.index.rb_node; 639355da1ebSSage Weil while (*p) { 640355da1ebSSage Weil parent = *p; 641355da1ebSSage Weil xattr = rb_entry(parent, struct ceph_inode_xattr, node); 642355da1ebSSage Weil c = strncmp(name, xattr->name, xattr->name_len); 64317db143fSSage Weil if (c == 0 && name_len > xattr->name_len) 64417db143fSSage Weil c = 1; 645355da1ebSSage Weil if (c < 0) 646355da1ebSSage Weil p = &(*p)->rb_left; 647355da1ebSSage Weil else if (c > 0) 648355da1ebSSage Weil p = &(*p)->rb_right; 649355da1ebSSage Weil else { 650355da1ebSSage Weil dout("__get_xattr %s: found %.*s\n", name, 651355da1ebSSage Weil xattr->val_len, xattr->val); 652355da1ebSSage Weil return xattr; 653355da1ebSSage Weil } 654355da1ebSSage Weil } 655355da1ebSSage Weil 656355da1ebSSage Weil dout("__get_xattr %s: not found\n", name); 657355da1ebSSage Weil 658355da1ebSSage Weil return NULL; 659355da1ebSSage Weil } 660355da1ebSSage Weil 661355da1ebSSage Weil static void __free_xattr(struct ceph_inode_xattr *xattr) 662355da1ebSSage Weil { 663355da1ebSSage Weil BUG_ON(!xattr); 664355da1ebSSage Weil 665355da1ebSSage Weil if (xattr->should_free_name) 666c00e4522SXu Wang kfree(xattr->name); 667355da1ebSSage Weil if (xattr->should_free_val) 668c00e4522SXu Wang kfree(xattr->val); 669355da1ebSSage Weil 670355da1ebSSage Weil kfree(xattr); 671355da1ebSSage Weil } 672355da1ebSSage Weil 673355da1ebSSage Weil static int __remove_xattr(struct ceph_inode_info *ci, 674355da1ebSSage Weil struct ceph_inode_xattr *xattr) 675355da1ebSSage Weil { 676355da1ebSSage Weil if (!xattr) 677524186acSYan, Zheng return -ENODATA; 678355da1ebSSage Weil 679355da1ebSSage Weil rb_erase(&xattr->node, &ci->i_xattrs.index); 680355da1ebSSage Weil 681355da1ebSSage Weil if (xattr->should_free_name) 682c00e4522SXu Wang kfree(xattr->name); 683355da1ebSSage Weil if (xattr->should_free_val) 684c00e4522SXu Wang kfree(xattr->val); 685355da1ebSSage Weil 686355da1ebSSage Weil ci->i_xattrs.names_size -= xattr->name_len; 687355da1ebSSage Weil ci->i_xattrs.vals_size -= xattr->val_len; 688355da1ebSSage Weil ci->i_xattrs.count--; 689355da1ebSSage Weil kfree(xattr); 690355da1ebSSage Weil 691355da1ebSSage Weil return 0; 692355da1ebSSage Weil } 693355da1ebSSage Weil 694355da1ebSSage Weil static char *__copy_xattr_names(struct ceph_inode_info *ci, 695355da1ebSSage Weil char *dest) 696355da1ebSSage Weil { 697355da1ebSSage Weil struct rb_node *p; 698355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 699355da1ebSSage Weil 700355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 701355da1ebSSage Weil dout("__copy_xattr_names count=%d\n", ci->i_xattrs.count); 702355da1ebSSage Weil 703355da1ebSSage Weil while (p) { 704355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 705355da1ebSSage Weil memcpy(dest, xattr->name, xattr->name_len); 706355da1ebSSage Weil dest[xattr->name_len] = '\0'; 707355da1ebSSage Weil 708355da1ebSSage Weil dout("dest=%s %p (%s) (%d/%d)\n", dest, xattr, xattr->name, 709355da1ebSSage Weil xattr->name_len, ci->i_xattrs.names_size); 710355da1ebSSage Weil 711355da1ebSSage Weil dest += xattr->name_len + 1; 712355da1ebSSage Weil p = rb_next(p); 713355da1ebSSage Weil } 714355da1ebSSage Weil 715355da1ebSSage Weil return dest; 716355da1ebSSage Weil } 717355da1ebSSage Weil 718355da1ebSSage Weil void __ceph_destroy_xattrs(struct ceph_inode_info *ci) 719355da1ebSSage Weil { 720355da1ebSSage Weil struct rb_node *p, *tmp; 721355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 722355da1ebSSage Weil 723355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 724355da1ebSSage Weil 725355da1ebSSage Weil dout("__ceph_destroy_xattrs p=%p\n", p); 726355da1ebSSage Weil 727355da1ebSSage Weil while (p) { 728355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 729355da1ebSSage Weil tmp = p; 730355da1ebSSage Weil p = rb_next(tmp); 731355da1ebSSage Weil dout("__ceph_destroy_xattrs next p=%p (%.*s)\n", p, 732355da1ebSSage Weil xattr->name_len, xattr->name); 733355da1ebSSage Weil rb_erase(tmp, &ci->i_xattrs.index); 734355da1ebSSage Weil 735355da1ebSSage Weil __free_xattr(xattr); 736355da1ebSSage Weil } 737355da1ebSSage Weil 738355da1ebSSage Weil ci->i_xattrs.names_size = 0; 739355da1ebSSage Weil ci->i_xattrs.vals_size = 0; 740355da1ebSSage Weil ci->i_xattrs.index_version = 0; 741355da1ebSSage Weil ci->i_xattrs.count = 0; 742355da1ebSSage Weil ci->i_xattrs.index = RB_ROOT; 743355da1ebSSage Weil } 744355da1ebSSage Weil 745355da1ebSSage Weil static int __build_xattrs(struct inode *inode) 746be655596SSage Weil __releases(ci->i_ceph_lock) 747be655596SSage Weil __acquires(ci->i_ceph_lock) 748355da1ebSSage Weil { 749355da1ebSSage Weil u32 namelen; 750355da1ebSSage Weil u32 numattr = 0; 751355da1ebSSage Weil void *p, *end; 752355da1ebSSage Weil u32 len; 753355da1ebSSage Weil const char *name, *val; 754355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 7550eb30853SXiubo Li u64 xattr_version; 756355da1ebSSage Weil struct ceph_inode_xattr **xattrs = NULL; 75763ff78b2SSage Weil int err = 0; 758355da1ebSSage Weil int i; 759355da1ebSSage Weil 760355da1ebSSage Weil dout("__build_xattrs() len=%d\n", 761355da1ebSSage Weil ci->i_xattrs.blob ? (int)ci->i_xattrs.blob->vec.iov_len : 0); 762355da1ebSSage Weil 763355da1ebSSage Weil if (ci->i_xattrs.index_version >= ci->i_xattrs.version) 764355da1ebSSage Weil return 0; /* already built */ 765355da1ebSSage Weil 766355da1ebSSage Weil __ceph_destroy_xattrs(ci); 767355da1ebSSage Weil 768355da1ebSSage Weil start: 769355da1ebSSage Weil /* updated internal xattr rb tree */ 770355da1ebSSage Weil if (ci->i_xattrs.blob && ci->i_xattrs.blob->vec.iov_len > 4) { 771355da1ebSSage Weil p = ci->i_xattrs.blob->vec.iov_base; 772355da1ebSSage Weil end = p + ci->i_xattrs.blob->vec.iov_len; 773355da1ebSSage Weil ceph_decode_32_safe(&p, end, numattr, bad); 774355da1ebSSage Weil xattr_version = ci->i_xattrs.version; 775be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 776355da1ebSSage Weil 7777e8a2952SIlya Dryomov xattrs = kcalloc(numattr, sizeof(struct ceph_inode_xattr *), 778355da1ebSSage Weil GFP_NOFS); 779355da1ebSSage Weil err = -ENOMEM; 780355da1ebSSage Weil if (!xattrs) 781355da1ebSSage Weil goto bad_lock; 7821a295bd8SIlya Dryomov 783355da1ebSSage Weil for (i = 0; i < numattr; i++) { 784355da1ebSSage Weil xattrs[i] = kmalloc(sizeof(struct ceph_inode_xattr), 785355da1ebSSage Weil GFP_NOFS); 786355da1ebSSage Weil if (!xattrs[i]) 787355da1ebSSage Weil goto bad_lock; 788355da1ebSSage Weil } 789355da1ebSSage Weil 790be655596SSage Weil spin_lock(&ci->i_ceph_lock); 791355da1ebSSage Weil if (ci->i_xattrs.version != xattr_version) { 792355da1ebSSage Weil /* lost a race, retry */ 793355da1ebSSage Weil for (i = 0; i < numattr; i++) 794355da1ebSSage Weil kfree(xattrs[i]); 795355da1ebSSage Weil kfree(xattrs); 79621ec6ffaSAlan Cox xattrs = NULL; 797355da1ebSSage Weil goto start; 798355da1ebSSage Weil } 799355da1ebSSage Weil err = -EIO; 800355da1ebSSage Weil while (numattr--) { 801355da1ebSSage Weil ceph_decode_32_safe(&p, end, len, bad); 802355da1ebSSage Weil namelen = len; 803355da1ebSSage Weil name = p; 804355da1ebSSage Weil p += len; 805355da1ebSSage Weil ceph_decode_32_safe(&p, end, len, bad); 806355da1ebSSage Weil val = p; 807355da1ebSSage Weil p += len; 808355da1ebSSage Weil 809355da1ebSSage Weil err = __set_xattr(ci, name, namelen, val, len, 810fbc0b970SYan, Zheng 0, 0, &xattrs[numattr]); 811355da1ebSSage Weil 812355da1ebSSage Weil if (err < 0) 813355da1ebSSage Weil goto bad; 814355da1ebSSage Weil } 815355da1ebSSage Weil kfree(xattrs); 816355da1ebSSage Weil } 817355da1ebSSage Weil ci->i_xattrs.index_version = ci->i_xattrs.version; 818355da1ebSSage Weil ci->i_xattrs.dirty = false; 819355da1ebSSage Weil 820355da1ebSSage Weil return err; 821355da1ebSSage Weil bad_lock: 822be655596SSage Weil spin_lock(&ci->i_ceph_lock); 823355da1ebSSage Weil bad: 824355da1ebSSage Weil if (xattrs) { 825355da1ebSSage Weil for (i = 0; i < numattr; i++) 826355da1ebSSage Weil kfree(xattrs[i]); 827355da1ebSSage Weil kfree(xattrs); 828355da1ebSSage Weil } 829355da1ebSSage Weil ci->i_xattrs.names_size = 0; 830355da1ebSSage Weil return err; 831355da1ebSSage Weil } 832355da1ebSSage Weil 833355da1ebSSage Weil static int __get_required_blob_size(struct ceph_inode_info *ci, int name_size, 834355da1ebSSage Weil int val_size) 835355da1ebSSage Weil { 836355da1ebSSage Weil /* 837355da1ebSSage Weil * 4 bytes for the length, and additional 4 bytes per each xattr name, 838355da1ebSSage Weil * 4 bytes per each value 839355da1ebSSage Weil */ 840355da1ebSSage Weil int size = 4 + ci->i_xattrs.count*(4 + 4) + 841355da1ebSSage Weil ci->i_xattrs.names_size + 842355da1ebSSage Weil ci->i_xattrs.vals_size; 843355da1ebSSage Weil dout("__get_required_blob_size c=%d names.size=%d vals.size=%d\n", 844355da1ebSSage Weil ci->i_xattrs.count, ci->i_xattrs.names_size, 845355da1ebSSage Weil ci->i_xattrs.vals_size); 846355da1ebSSage Weil 847355da1ebSSage Weil if (name_size) 848355da1ebSSage Weil size += 4 + 4 + name_size + val_size; 849355da1ebSSage Weil 850355da1ebSSage Weil return size; 851355da1ebSSage Weil } 852355da1ebSSage Weil 853355da1ebSSage Weil /* 854355da1ebSSage Weil * If there are dirty xattrs, reencode xattrs into the prealloc_blob 85512fe3ddaSLuis Henriques * and swap into place. It returns the old i_xattrs.blob (or NULL) so 85612fe3ddaSLuis Henriques * that it can be freed by the caller as the i_ceph_lock is likely to be 85712fe3ddaSLuis Henriques * held. 858355da1ebSSage Weil */ 85912fe3ddaSLuis Henriques struct ceph_buffer *__ceph_build_xattrs_blob(struct ceph_inode_info *ci) 860355da1ebSSage Weil { 861355da1ebSSage Weil struct rb_node *p; 862355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 86312fe3ddaSLuis Henriques struct ceph_buffer *old_blob = NULL; 864355da1ebSSage Weil void *dest; 865355da1ebSSage Weil 866355da1ebSSage Weil dout("__build_xattrs_blob %p\n", &ci->vfs_inode); 867355da1ebSSage Weil if (ci->i_xattrs.dirty) { 868355da1ebSSage Weil int need = __get_required_blob_size(ci, 0, 0); 869355da1ebSSage Weil 870355da1ebSSage Weil BUG_ON(need > ci->i_xattrs.prealloc_blob->alloc_len); 871355da1ebSSage Weil 872355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 873355da1ebSSage Weil dest = ci->i_xattrs.prealloc_blob->vec.iov_base; 874355da1ebSSage Weil 875355da1ebSSage Weil ceph_encode_32(&dest, ci->i_xattrs.count); 876355da1ebSSage Weil while (p) { 877355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 878355da1ebSSage Weil 879355da1ebSSage Weil ceph_encode_32(&dest, xattr->name_len); 880355da1ebSSage Weil memcpy(dest, xattr->name, xattr->name_len); 881355da1ebSSage Weil dest += xattr->name_len; 882355da1ebSSage Weil ceph_encode_32(&dest, xattr->val_len); 883355da1ebSSage Weil memcpy(dest, xattr->val, xattr->val_len); 884355da1ebSSage Weil dest += xattr->val_len; 885355da1ebSSage Weil 886355da1ebSSage Weil p = rb_next(p); 887355da1ebSSage Weil } 888355da1ebSSage Weil 889355da1ebSSage Weil /* adjust buffer len; it may be larger than we need */ 890355da1ebSSage Weil ci->i_xattrs.prealloc_blob->vec.iov_len = 891355da1ebSSage Weil dest - ci->i_xattrs.prealloc_blob->vec.iov_base; 892355da1ebSSage Weil 893b6c1d5b8SSage Weil if (ci->i_xattrs.blob) 89412fe3ddaSLuis Henriques old_blob = ci->i_xattrs.blob; 895355da1ebSSage Weil ci->i_xattrs.blob = ci->i_xattrs.prealloc_blob; 896355da1ebSSage Weil ci->i_xattrs.prealloc_blob = NULL; 897355da1ebSSage Weil ci->i_xattrs.dirty = false; 8984a625be4SSage Weil ci->i_xattrs.version++; 899355da1ebSSage Weil } 90012fe3ddaSLuis Henriques 90112fe3ddaSLuis Henriques return old_blob; 902355da1ebSSage Weil } 903355da1ebSSage Weil 904315f2408SYan, Zheng static inline int __get_request_mask(struct inode *in) { 905315f2408SYan, Zheng struct ceph_mds_request *req = current->journal_info; 906315f2408SYan, Zheng int mask = 0; 907315f2408SYan, Zheng if (req && req->r_target_inode == in) { 908315f2408SYan, Zheng if (req->r_op == CEPH_MDS_OP_LOOKUP || 909315f2408SYan, Zheng req->r_op == CEPH_MDS_OP_LOOKUPINO || 910315f2408SYan, Zheng req->r_op == CEPH_MDS_OP_LOOKUPPARENT || 911315f2408SYan, Zheng req->r_op == CEPH_MDS_OP_GETATTR) { 912315f2408SYan, Zheng mask = le32_to_cpu(req->r_args.getattr.mask); 913315f2408SYan, Zheng } else if (req->r_op == CEPH_MDS_OP_OPEN || 914315f2408SYan, Zheng req->r_op == CEPH_MDS_OP_CREATE) { 915315f2408SYan, Zheng mask = le32_to_cpu(req->r_args.open.mask); 916315f2408SYan, Zheng } 917315f2408SYan, Zheng } 918315f2408SYan, Zheng return mask; 919315f2408SYan, Zheng } 920315f2408SYan, Zheng 9217221fe4cSGuangliang Zhao ssize_t __ceph_getxattr(struct inode *inode, const char *name, void *value, 922355da1ebSSage Weil size_t size) 923355da1ebSSage Weil { 924355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 925355da1ebSSage Weil struct ceph_inode_xattr *xattr; 926*6ddf5f16SMilind Changire struct ceph_vxattr *vxattr; 927315f2408SYan, Zheng int req_mask; 928f1d1b51dSJeff Layton ssize_t err; 929355da1ebSSage Weil 930*6ddf5f16SMilind Changire if (strncmp(name, XATTR_CEPH_PREFIX, XATTR_CEPH_PREFIX_LEN)) 931*6ddf5f16SMilind Changire goto handle_non_vxattrs; 932*6ddf5f16SMilind Changire 9330bee82fbSSage Weil /* let's see if a virtual xattr was requested */ 9340bee82fbSSage Weil vxattr = ceph_match_vxattr(inode, name); 93529dccfa5SYan, Zheng if (vxattr) { 93649a9f4f6SYan, Zheng int mask = 0; 93749a9f4f6SYan, Zheng if (vxattr->flags & VXATTR_FLAG_RSTAT) 93849a9f4f6SYan, Zheng mask |= CEPH_STAT_RSTAT; 93981048c00SJeff Layton if (vxattr->flags & VXATTR_FLAG_DIRSTAT) 94081048c00SJeff Layton mask |= CEPH_CAP_FILE_SHARED; 94149a9f4f6SYan, Zheng err = ceph_do_getattr(inode, mask, true); 9421684dd03SYan, Zheng if (err) 9431684dd03SYan, Zheng return err; 94429dccfa5SYan, Zheng err = -ENODATA; 9453b421018SJeff Layton if (!(vxattr->exists_cb && !vxattr->exists_cb(ci))) { 9460bee82fbSSage Weil err = vxattr->getxattr_cb(ci, value, size); 9473b421018SJeff Layton if (size && size < err) 9483b421018SJeff Layton err = -ERANGE; 9493b421018SJeff Layton } 950a1dc1937Smajianpeng return err; 951*6ddf5f16SMilind Changire } else { 952*6ddf5f16SMilind Changire err = ceph_do_getvxattr(inode, name, value, size); 953*6ddf5f16SMilind Changire /* this would happen with a new client and old server combo */ 954*6ddf5f16SMilind Changire if (err == -EOPNOTSUPP) 955*6ddf5f16SMilind Changire err = -ENODATA; 956*6ddf5f16SMilind Changire return err; 9570bee82fbSSage Weil } 958*6ddf5f16SMilind Changire handle_non_vxattrs: 959315f2408SYan, Zheng req_mask = __get_request_mask(inode); 960315f2408SYan, Zheng 961a1dc1937Smajianpeng spin_lock(&ci->i_ceph_lock); 962d36e0b62SJeff Layton dout("getxattr %p name '%s' ver=%lld index_ver=%lld\n", inode, name, 963a1dc1937Smajianpeng ci->i_xattrs.version, ci->i_xattrs.index_version); 964a1dc1937Smajianpeng 965508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || 966315f2408SYan, Zheng !((req_mask & CEPH_CAP_XATTR_SHARED) || 9671af16d54SXiubo Li __ceph_caps_issued_mask_metric(ci, CEPH_CAP_XATTR_SHARED, 1))) { 968be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 969315f2408SYan, Zheng 970315f2408SYan, Zheng /* security module gets xattr while filling trace */ 971d37b1d99SMarkus Elfring if (current->journal_info) { 972315f2408SYan, Zheng pr_warn_ratelimited("sync getxattr %p " 973315f2408SYan, Zheng "during filling trace\n", inode); 974315f2408SYan, Zheng return -EBUSY; 975315f2408SYan, Zheng } 976315f2408SYan, Zheng 977355da1ebSSage Weil /* get xattrs from mds (if we don't already have them) */ 978508b32d8SYan, Zheng err = ceph_do_getattr(inode, CEPH_STAT_CAP_XATTR, true); 979355da1ebSSage Weil if (err) 980355da1ebSSage Weil return err; 981be655596SSage Weil spin_lock(&ci->i_ceph_lock); 982508b32d8SYan, Zheng } 983355da1ebSSage Weil 984355da1ebSSage Weil err = __build_xattrs(inode); 985355da1ebSSage Weil if (err < 0) 986355da1ebSSage Weil goto out; 987355da1ebSSage Weil 988355da1ebSSage Weil err = -ENODATA; /* == ENOATTR */ 989355da1ebSSage Weil xattr = __get_xattr(ci, name); 9900bee82fbSSage Weil if (!xattr) 991355da1ebSSage Weil goto out; 992355da1ebSSage Weil 993355da1ebSSage Weil err = -ERANGE; 994355da1ebSSage Weil if (size && size < xattr->val_len) 995355da1ebSSage Weil goto out; 996355da1ebSSage Weil 997355da1ebSSage Weil err = xattr->val_len; 998355da1ebSSage Weil if (size == 0) 999355da1ebSSage Weil goto out; 1000355da1ebSSage Weil 1001355da1ebSSage Weil memcpy(value, xattr->val, xattr->val_len); 1002355da1ebSSage Weil 1003d37b1d99SMarkus Elfring if (current->journal_info && 1004026105ebSJeff Layton !strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) && 1005026105ebSJeff Layton security_ismaclabel(name + XATTR_SECURITY_PREFIX_LEN)) 1006315f2408SYan, Zheng ci->i_ceph_flags |= CEPH_I_SEC_INITED; 1007355da1ebSSage Weil out: 1008be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 1009355da1ebSSage Weil return err; 1010355da1ebSSage Weil } 1011355da1ebSSage Weil 1012355da1ebSSage Weil ssize_t ceph_listxattr(struct dentry *dentry, char *names, size_t size) 1013355da1ebSSage Weil { 10142b0143b5SDavid Howells struct inode *inode = d_inode(dentry); 1015355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 10162b2abcacSDavid Disseldorp bool len_only = (size == 0); 1017355da1ebSSage Weil u32 namelen; 1018355da1ebSSage Weil int err; 1019355da1ebSSage Weil 1020be655596SSage Weil spin_lock(&ci->i_ceph_lock); 1021355da1ebSSage Weil dout("listxattr %p ver=%lld index_ver=%lld\n", inode, 1022355da1ebSSage Weil ci->i_xattrs.version, ci->i_xattrs.index_version); 1023355da1ebSSage Weil 1024508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || 10251af16d54SXiubo Li !__ceph_caps_issued_mask_metric(ci, CEPH_CAP_XATTR_SHARED, 1)) { 1026be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 1027508b32d8SYan, Zheng err = ceph_do_getattr(inode, CEPH_STAT_CAP_XATTR, true); 1028355da1ebSSage Weil if (err) 1029355da1ebSSage Weil return err; 1030be655596SSage Weil spin_lock(&ci->i_ceph_lock); 1031508b32d8SYan, Zheng } 1032355da1ebSSage Weil 1033355da1ebSSage Weil err = __build_xattrs(inode); 1034355da1ebSSage Weil if (err < 0) 1035355da1ebSSage Weil goto out; 10363ce6cd12SAlex Elder 10372b2abcacSDavid Disseldorp /* add 1 byte for each xattr due to the null termination */ 1038b65917ddSSage Weil namelen = ci->i_xattrs.names_size + ci->i_xattrs.count; 10392b2abcacSDavid Disseldorp if (!len_only) { 10402b2abcacSDavid Disseldorp if (namelen > size) { 1041355da1ebSSage Weil err = -ERANGE; 1042355da1ebSSage Weil goto out; 10432b2abcacSDavid Disseldorp } 1044355da1ebSSage Weil names = __copy_xattr_names(ci, names); 10452b2abcacSDavid Disseldorp size -= namelen; 10462b2abcacSDavid Disseldorp } 10472b2abcacSDavid Disseldorp err = namelen; 1048355da1ebSSage Weil out: 1049be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 1050355da1ebSSage Weil return err; 1051355da1ebSSage Weil } 1052355da1ebSSage Weil 1053a26feccaSAndreas Gruenbacher static int ceph_sync_setxattr(struct inode *inode, const char *name, 1054355da1ebSSage Weil const char *value, size_t size, int flags) 1055355da1ebSSage Weil { 1056a26feccaSAndreas Gruenbacher struct ceph_fs_client *fsc = ceph_sb_to_client(inode->i_sb); 1057355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 1058355da1ebSSage Weil struct ceph_mds_request *req; 10593d14c5d2SYehuda Sadeh struct ceph_mds_client *mdsc = fsc->mdsc; 1060968cd14eSXiubo Li struct ceph_osd_client *osdc = &fsc->client->osdc; 106125e6bae3SYan, Zheng struct ceph_pagelist *pagelist = NULL; 106204303d8aSYan, Zheng int op = CEPH_MDS_OP_SETXATTR; 1063355da1ebSSage Weil int err; 1064355da1ebSSage Weil 10650aeff37aSYan, Zheng if (size > 0) { 106625e6bae3SYan, Zheng /* copy value into pagelist */ 106733165d47SIlya Dryomov pagelist = ceph_pagelist_alloc(GFP_NOFS); 106825e6bae3SYan, Zheng if (!pagelist) 1069355da1ebSSage Weil return -ENOMEM; 107025e6bae3SYan, Zheng 107125e6bae3SYan, Zheng err = ceph_pagelist_append(pagelist, value, size); 107225e6bae3SYan, Zheng if (err) 1073355da1ebSSage Weil goto out; 10740aeff37aSYan, Zheng } else if (!value) { 107504303d8aSYan, Zheng if (flags & CEPH_XATTR_REPLACE) 107604303d8aSYan, Zheng op = CEPH_MDS_OP_RMXATTR; 107704303d8aSYan, Zheng else 107825e6bae3SYan, Zheng flags |= CEPH_XATTR_REMOVE; 1079355da1ebSSage Weil } 1080355da1ebSSage Weil 1081355da1ebSSage Weil dout("setxattr value=%.*s\n", (int)size, value); 1082355da1ebSSage Weil 1083355da1ebSSage Weil /* do request */ 108404303d8aSYan, Zheng req = ceph_mdsc_create_request(mdsc, op, USE_AUTH_MDS); 108560d87733SJulia Lawall if (IS_ERR(req)) { 108660d87733SJulia Lawall err = PTR_ERR(req); 108760d87733SJulia Lawall goto out; 108860d87733SJulia Lawall } 1089a149bb9aSSanidhya Kashyap 1090355da1ebSSage Weil req->r_path2 = kstrdup(name, GFP_NOFS); 1091a149bb9aSSanidhya Kashyap if (!req->r_path2) { 1092a149bb9aSSanidhya Kashyap ceph_mdsc_put_request(req); 1093a149bb9aSSanidhya Kashyap err = -ENOMEM; 1094a149bb9aSSanidhya Kashyap goto out; 1095a149bb9aSSanidhya Kashyap } 1096355da1ebSSage Weil 109704303d8aSYan, Zheng if (op == CEPH_MDS_OP_SETXATTR) { 109804303d8aSYan, Zheng req->r_args.setxattr.flags = cpu_to_le32(flags); 1099968cd14eSXiubo Li req->r_args.setxattr.osdmap_epoch = 1100968cd14eSXiubo Li cpu_to_le32(osdc->osdmap->epoch); 110125e6bae3SYan, Zheng req->r_pagelist = pagelist; 110225e6bae3SYan, Zheng pagelist = NULL; 110304303d8aSYan, Zheng } 1104355da1ebSSage Weil 1105a149bb9aSSanidhya Kashyap req->r_inode = inode; 1106a149bb9aSSanidhya Kashyap ihold(inode); 1107a149bb9aSSanidhya Kashyap req->r_num_caps = 1; 1108a149bb9aSSanidhya Kashyap req->r_inode_drop = CEPH_CAP_XATTR_SHARED; 1109a149bb9aSSanidhya Kashyap 1110355da1ebSSage Weil dout("xattr.ver (before): %lld\n", ci->i_xattrs.version); 1111752c8bdcSSage Weil err = ceph_mdsc_do_request(mdsc, NULL, req); 1112355da1ebSSage Weil ceph_mdsc_put_request(req); 1113355da1ebSSage Weil dout("xattr.ver (after): %lld\n", ci->i_xattrs.version); 1114355da1ebSSage Weil 1115355da1ebSSage Weil out: 111625e6bae3SYan, Zheng if (pagelist) 111725e6bae3SYan, Zheng ceph_pagelist_release(pagelist); 1118355da1ebSSage Weil return err; 1119355da1ebSSage Weil } 1120355da1ebSSage Weil 1121a26feccaSAndreas Gruenbacher int __ceph_setxattr(struct inode *inode, const char *name, 1122355da1ebSSage Weil const void *value, size_t size, int flags) 1123355da1ebSSage Weil { 1124881a5fa2SAlex Elder struct ceph_vxattr *vxattr; 1125355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 1126a26feccaSAndreas Gruenbacher struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; 1127f66fd9f0SYan, Zheng struct ceph_cap_flush *prealloc_cf = NULL; 112886968ef2SLuis Henriques struct ceph_buffer *old_blob = NULL; 112918fa8b3fSAlex Elder int issued; 1130355da1ebSSage Weil int err; 1131fbc0b970SYan, Zheng int dirty = 0; 1132355da1ebSSage Weil int name_len = strlen(name); 1133355da1ebSSage Weil int val_len = size; 1134355da1ebSSage Weil char *newname = NULL; 1135355da1ebSSage Weil char *newval = NULL; 1136355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 1137355da1ebSSage Weil int required_blob_size; 1138f1919826SYan, Zheng bool check_realm = false; 1139604d1b02SYan, Zheng bool lock_snap_rwsem = false; 1140355da1ebSSage Weil 11412cdeb1e4SAndreas Gruenbacher if (ceph_snap(inode) != CEPH_NOSNAP) 11422cdeb1e4SAndreas Gruenbacher return -EROFS; 1143355da1ebSSage Weil 114406476a69SAlex Elder vxattr = ceph_match_vxattr(inode, name); 1145f1919826SYan, Zheng if (vxattr) { 11464e9906e7SYan, Zheng if (vxattr->flags & VXATTR_FLAG_READONLY) 1147355da1ebSSage Weil return -EOPNOTSUPP; 1148f1919826SYan, Zheng if (value && !strncmp(vxattr->name, "ceph.quota", 10)) 1149f1919826SYan, Zheng check_realm = true; 1150f1919826SYan, Zheng } 1151355da1ebSSage Weil 11523adf654dSSage Weil /* pass any unhandled ceph.* xattrs through to the MDS */ 11533adf654dSSage Weil if (!strncmp(name, XATTR_CEPH_PREFIX, XATTR_CEPH_PREFIX_LEN)) 11543adf654dSSage Weil goto do_sync_unlocked; 11553adf654dSSage Weil 1156355da1ebSSage Weil /* preallocate memory for xattr name, value, index node */ 1157355da1ebSSage Weil err = -ENOMEM; 115861413c2fSJulia Lawall newname = kmemdup(name, name_len + 1, GFP_NOFS); 1159355da1ebSSage Weil if (!newname) 1160355da1ebSSage Weil goto out; 1161355da1ebSSage Weil 1162355da1ebSSage Weil if (val_len) { 1163b829c195SAlex Elder newval = kmemdup(value, val_len, GFP_NOFS); 1164355da1ebSSage Weil if (!newval) 1165355da1ebSSage Weil goto out; 1166355da1ebSSage Weil } 1167355da1ebSSage Weil 1168355da1ebSSage Weil xattr = kmalloc(sizeof(struct ceph_inode_xattr), GFP_NOFS); 1169355da1ebSSage Weil if (!xattr) 1170355da1ebSSage Weil goto out; 1171355da1ebSSage Weil 1172f66fd9f0SYan, Zheng prealloc_cf = ceph_alloc_cap_flush(); 1173f66fd9f0SYan, Zheng if (!prealloc_cf) 1174f66fd9f0SYan, Zheng goto out; 1175f66fd9f0SYan, Zheng 1176be655596SSage Weil spin_lock(&ci->i_ceph_lock); 1177355da1ebSSage Weil retry: 1178355da1ebSSage Weil issued = __ceph_caps_issued(ci, NULL); 1179508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || !(issued & CEPH_CAP_XATTR_EXCL)) 1180355da1ebSSage Weil goto do_sync; 1181604d1b02SYan, Zheng 1182604d1b02SYan, Zheng if (!lock_snap_rwsem && !ci->i_head_snapc) { 1183604d1b02SYan, Zheng lock_snap_rwsem = true; 1184604d1b02SYan, Zheng if (!down_read_trylock(&mdsc->snap_rwsem)) { 1185604d1b02SYan, Zheng spin_unlock(&ci->i_ceph_lock); 1186604d1b02SYan, Zheng down_read(&mdsc->snap_rwsem); 1187604d1b02SYan, Zheng spin_lock(&ci->i_ceph_lock); 1188604d1b02SYan, Zheng goto retry; 1189604d1b02SYan, Zheng } 1190604d1b02SYan, Zheng } 1191604d1b02SYan, Zheng 1192d36e0b62SJeff Layton dout("setxattr %p name '%s' issued %s\n", inode, name, 1193d36e0b62SJeff Layton ceph_cap_string(issued)); 1194355da1ebSSage Weil __build_xattrs(inode); 1195355da1ebSSage Weil 1196355da1ebSSage Weil required_blob_size = __get_required_blob_size(ci, name_len, val_len); 1197355da1ebSSage Weil 1198355da1ebSSage Weil if (!ci->i_xattrs.prealloc_blob || 1199355da1ebSSage Weil required_blob_size > ci->i_xattrs.prealloc_blob->alloc_len) { 120018fa8b3fSAlex Elder struct ceph_buffer *blob; 1201355da1ebSSage Weil 1202be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 120386968ef2SLuis Henriques ceph_buffer_put(old_blob); /* Shouldn't be required */ 120486968ef2SLuis Henriques dout(" pre-allocating new blob size=%d\n", required_blob_size); 1205b6c1d5b8SSage Weil blob = ceph_buffer_new(required_blob_size, GFP_NOFS); 1206355da1ebSSage Weil if (!blob) 1207604d1b02SYan, Zheng goto do_sync_unlocked; 1208be655596SSage Weil spin_lock(&ci->i_ceph_lock); 120986968ef2SLuis Henriques /* prealloc_blob can't be released while holding i_ceph_lock */ 1210b6c1d5b8SSage Weil if (ci->i_xattrs.prealloc_blob) 121186968ef2SLuis Henriques old_blob = ci->i_xattrs.prealloc_blob; 1212355da1ebSSage Weil ci->i_xattrs.prealloc_blob = blob; 1213355da1ebSSage Weil goto retry; 1214355da1ebSSage Weil } 1215355da1ebSSage Weil 1216bcdfeb2eSYan, Zheng err = __set_xattr(ci, newname, name_len, newval, val_len, 1217bcdfeb2eSYan, Zheng flags, value ? 1 : -1, &xattr); 121818fa8b3fSAlex Elder 1219fbc0b970SYan, Zheng if (!err) { 1220f66fd9f0SYan, Zheng dirty = __ceph_mark_dirty_caps(ci, CEPH_CAP_XATTR_EXCL, 1221f66fd9f0SYan, Zheng &prealloc_cf); 1222355da1ebSSage Weil ci->i_xattrs.dirty = true; 1223c2050a45SDeepa Dinamani inode->i_ctime = current_time(inode); 1224fbc0b970SYan, Zheng } 122518fa8b3fSAlex Elder 1226be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 122786968ef2SLuis Henriques ceph_buffer_put(old_blob); 1228604d1b02SYan, Zheng if (lock_snap_rwsem) 1229604d1b02SYan, Zheng up_read(&mdsc->snap_rwsem); 1230fca65b4aSSage Weil if (dirty) 1231fca65b4aSSage Weil __mark_inode_dirty(inode, dirty); 1232f66fd9f0SYan, Zheng ceph_free_cap_flush(prealloc_cf); 1233355da1ebSSage Weil return err; 1234355da1ebSSage Weil 1235355da1ebSSage Weil do_sync: 1236be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 12373adf654dSSage Weil do_sync_unlocked: 1238604d1b02SYan, Zheng if (lock_snap_rwsem) 1239604d1b02SYan, Zheng up_read(&mdsc->snap_rwsem); 1240315f2408SYan, Zheng 1241315f2408SYan, Zheng /* security module set xattr while filling trace */ 1242d37b1d99SMarkus Elfring if (current->journal_info) { 1243315f2408SYan, Zheng pr_warn_ratelimited("sync setxattr %p " 1244315f2408SYan, Zheng "during filling trace\n", inode); 1245315f2408SYan, Zheng err = -EBUSY; 1246315f2408SYan, Zheng } else { 1247a26feccaSAndreas Gruenbacher err = ceph_sync_setxattr(inode, name, value, size, flags); 1248f1919826SYan, Zheng if (err >= 0 && check_realm) { 1249f1919826SYan, Zheng /* check if snaprealm was created for quota inode */ 1250f1919826SYan, Zheng spin_lock(&ci->i_ceph_lock); 1251f1919826SYan, Zheng if ((ci->i_max_files || ci->i_max_bytes) && 1252f1919826SYan, Zheng !(ci->i_snap_realm && 1253f1919826SYan, Zheng ci->i_snap_realm->ino == ci->i_vino.ino)) 1254f1919826SYan, Zheng err = -EOPNOTSUPP; 1255f1919826SYan, Zheng spin_unlock(&ci->i_ceph_lock); 1256f1919826SYan, Zheng } 1257315f2408SYan, Zheng } 1258355da1ebSSage Weil out: 1259f66fd9f0SYan, Zheng ceph_free_cap_flush(prealloc_cf); 1260355da1ebSSage Weil kfree(newname); 1261355da1ebSSage Weil kfree(newval); 1262355da1ebSSage Weil kfree(xattr); 1263355da1ebSSage Weil return err; 1264355da1ebSSage Weil } 1265355da1ebSSage Weil 12662cdeb1e4SAndreas Gruenbacher static int ceph_get_xattr_handler(const struct xattr_handler *handler, 12672cdeb1e4SAndreas Gruenbacher struct dentry *dentry, struct inode *inode, 12682cdeb1e4SAndreas Gruenbacher const char *name, void *value, size_t size) 12697221fe4cSGuangliang Zhao { 12702cdeb1e4SAndreas Gruenbacher if (!ceph_is_valid_xattr(name)) 12712cdeb1e4SAndreas Gruenbacher return -EOPNOTSUPP; 12722cdeb1e4SAndreas Gruenbacher return __ceph_getxattr(inode, name, value, size); 12737221fe4cSGuangliang Zhao } 1274315f2408SYan, Zheng 12752cdeb1e4SAndreas Gruenbacher static int ceph_set_xattr_handler(const struct xattr_handler *handler, 1276e65ce2a5SChristian Brauner struct user_namespace *mnt_userns, 127759301226SAl Viro struct dentry *unused, struct inode *inode, 127859301226SAl Viro const char *name, const void *value, 127959301226SAl Viro size_t size, int flags) 12802cdeb1e4SAndreas Gruenbacher { 12812cdeb1e4SAndreas Gruenbacher if (!ceph_is_valid_xattr(name)) 12822cdeb1e4SAndreas Gruenbacher return -EOPNOTSUPP; 128359301226SAl Viro return __ceph_setxattr(inode, name, value, size, flags); 12842cdeb1e4SAndreas Gruenbacher } 12852cdeb1e4SAndreas Gruenbacher 12865130cceaSWei Yongjun static const struct xattr_handler ceph_other_xattr_handler = { 12872cdeb1e4SAndreas Gruenbacher .prefix = "", /* match any name => handlers called with full name */ 12882cdeb1e4SAndreas Gruenbacher .get = ceph_get_xattr_handler, 12892cdeb1e4SAndreas Gruenbacher .set = ceph_set_xattr_handler, 12902cdeb1e4SAndreas Gruenbacher }; 12912cdeb1e4SAndreas Gruenbacher 1292315f2408SYan, Zheng #ifdef CONFIG_SECURITY 1293315f2408SYan, Zheng bool ceph_security_xattr_wanted(struct inode *in) 1294315f2408SYan, Zheng { 1295315f2408SYan, Zheng return in->i_security != NULL; 1296315f2408SYan, Zheng } 1297315f2408SYan, Zheng 1298315f2408SYan, Zheng bool ceph_security_xattr_deadlock(struct inode *in) 1299315f2408SYan, Zheng { 1300315f2408SYan, Zheng struct ceph_inode_info *ci; 1301315f2408SYan, Zheng bool ret; 1302d37b1d99SMarkus Elfring if (!in->i_security) 1303315f2408SYan, Zheng return false; 1304315f2408SYan, Zheng ci = ceph_inode(in); 1305315f2408SYan, Zheng spin_lock(&ci->i_ceph_lock); 1306315f2408SYan, Zheng ret = !(ci->i_ceph_flags & CEPH_I_SEC_INITED) && 1307315f2408SYan, Zheng !(ci->i_xattrs.version > 0 && 1308315f2408SYan, Zheng __ceph_caps_issued_mask(ci, CEPH_CAP_XATTR_SHARED, 0)); 1309315f2408SYan, Zheng spin_unlock(&ci->i_ceph_lock); 1310315f2408SYan, Zheng return ret; 1311315f2408SYan, Zheng } 1312ac6713ccSYan, Zheng 1313ac6713ccSYan, Zheng #ifdef CONFIG_CEPH_FS_SECURITY_LABEL 1314ac6713ccSYan, Zheng int ceph_security_init_secctx(struct dentry *dentry, umode_t mode, 1315ac6713ccSYan, Zheng struct ceph_acl_sec_ctx *as_ctx) 1316ac6713ccSYan, Zheng { 1317ac6713ccSYan, Zheng struct ceph_pagelist *pagelist = as_ctx->pagelist; 1318ac6713ccSYan, Zheng const char *name; 1319ac6713ccSYan, Zheng size_t name_len; 1320ac6713ccSYan, Zheng int err; 1321ac6713ccSYan, Zheng 1322ac6713ccSYan, Zheng err = security_dentry_init_security(dentry, mode, &dentry->d_name, 132315bf3239SVivek Goyal &name, &as_ctx->sec_ctx, 1324ac6713ccSYan, Zheng &as_ctx->sec_ctxlen); 1325ac6713ccSYan, Zheng if (err < 0) { 1326ac6713ccSYan, Zheng WARN_ON_ONCE(err != -EOPNOTSUPP); 1327ac6713ccSYan, Zheng err = 0; /* do nothing */ 1328ac6713ccSYan, Zheng goto out; 1329ac6713ccSYan, Zheng } 1330ac6713ccSYan, Zheng 1331ac6713ccSYan, Zheng err = -ENOMEM; 1332ac6713ccSYan, Zheng if (!pagelist) { 1333ac6713ccSYan, Zheng pagelist = ceph_pagelist_alloc(GFP_KERNEL); 1334ac6713ccSYan, Zheng if (!pagelist) 1335ac6713ccSYan, Zheng goto out; 1336ac6713ccSYan, Zheng err = ceph_pagelist_reserve(pagelist, PAGE_SIZE); 1337ac6713ccSYan, Zheng if (err) 1338ac6713ccSYan, Zheng goto out; 1339ac6713ccSYan, Zheng ceph_pagelist_encode_32(pagelist, 1); 1340ac6713ccSYan, Zheng } 1341ac6713ccSYan, Zheng 1342ac6713ccSYan, Zheng /* 1343ac6713ccSYan, Zheng * FIXME: Make security_dentry_init_security() generic. Currently 1344ac6713ccSYan, Zheng * It only supports single security module and only selinux has 1345ac6713ccSYan, Zheng * dentry_init_security hook. 1346ac6713ccSYan, Zheng */ 1347ac6713ccSYan, Zheng name_len = strlen(name); 1348ac6713ccSYan, Zheng err = ceph_pagelist_reserve(pagelist, 1349ac6713ccSYan, Zheng 4 * 2 + name_len + as_ctx->sec_ctxlen); 1350ac6713ccSYan, Zheng if (err) 1351ac6713ccSYan, Zheng goto out; 1352ac6713ccSYan, Zheng 1353ac6713ccSYan, Zheng if (as_ctx->pagelist) { 1354ac6713ccSYan, Zheng /* update count of KV pairs */ 1355ac6713ccSYan, Zheng BUG_ON(pagelist->length <= sizeof(__le32)); 1356ac6713ccSYan, Zheng if (list_is_singular(&pagelist->head)) { 1357ac6713ccSYan, Zheng le32_add_cpu((__le32*)pagelist->mapped_tail, 1); 1358ac6713ccSYan, Zheng } else { 1359ac6713ccSYan, Zheng struct page *page = list_first_entry(&pagelist->head, 1360ac6713ccSYan, Zheng struct page, lru); 1361ac6713ccSYan, Zheng void *addr = kmap_atomic(page); 1362ac6713ccSYan, Zheng le32_add_cpu((__le32*)addr, 1); 1363ac6713ccSYan, Zheng kunmap_atomic(addr); 1364ac6713ccSYan, Zheng } 1365ac6713ccSYan, Zheng } else { 1366ac6713ccSYan, Zheng as_ctx->pagelist = pagelist; 1367ac6713ccSYan, Zheng } 1368ac6713ccSYan, Zheng 1369ac6713ccSYan, Zheng ceph_pagelist_encode_32(pagelist, name_len); 1370ac6713ccSYan, Zheng ceph_pagelist_append(pagelist, name, name_len); 1371ac6713ccSYan, Zheng 1372ac6713ccSYan, Zheng ceph_pagelist_encode_32(pagelist, as_ctx->sec_ctxlen); 1373ac6713ccSYan, Zheng ceph_pagelist_append(pagelist, as_ctx->sec_ctx, as_ctx->sec_ctxlen); 1374ac6713ccSYan, Zheng 1375ac6713ccSYan, Zheng err = 0; 1376ac6713ccSYan, Zheng out: 1377ac6713ccSYan, Zheng if (pagelist && !as_ctx->pagelist) 1378ac6713ccSYan, Zheng ceph_pagelist_release(pagelist); 1379ac6713ccSYan, Zheng return err; 1380ac6713ccSYan, Zheng } 1381668959a5SJeff Layton #endif /* CONFIG_CEPH_FS_SECURITY_LABEL */ 1382668959a5SJeff Layton #endif /* CONFIG_SECURITY */ 13835c31e92dSYan, Zheng 13845c31e92dSYan, Zheng void ceph_release_acl_sec_ctx(struct ceph_acl_sec_ctx *as_ctx) 13855c31e92dSYan, Zheng { 13865c31e92dSYan, Zheng #ifdef CONFIG_CEPH_FS_POSIX_ACL 13875c31e92dSYan, Zheng posix_acl_release(as_ctx->acl); 13885c31e92dSYan, Zheng posix_acl_release(as_ctx->default_acl); 13895c31e92dSYan, Zheng #endif 1390ac6713ccSYan, Zheng #ifdef CONFIG_CEPH_FS_SECURITY_LABEL 1391ac6713ccSYan, Zheng security_release_secctx(as_ctx->sec_ctx, as_ctx->sec_ctxlen); 1392ac6713ccSYan, Zheng #endif 13935c31e92dSYan, Zheng if (as_ctx->pagelist) 13945c31e92dSYan, Zheng ceph_pagelist_release(as_ctx->pagelist); 13955c31e92dSYan, Zheng } 1396ac6713ccSYan, Zheng 1397ac6713ccSYan, Zheng /* 1398ac6713ccSYan, Zheng * List of handlers for synthetic system.* attributes. Other 1399ac6713ccSYan, Zheng * attributes are handled directly. 1400ac6713ccSYan, Zheng */ 1401ac6713ccSYan, Zheng const struct xattr_handler *ceph_xattr_handlers[] = { 1402ac6713ccSYan, Zheng #ifdef CONFIG_CEPH_FS_POSIX_ACL 1403ac6713ccSYan, Zheng &posix_acl_access_xattr_handler, 1404ac6713ccSYan, Zheng &posix_acl_default_xattr_handler, 1405ac6713ccSYan, Zheng #endif 1406ac6713ccSYan, Zheng &ceph_other_xattr_handler, 1407ac6713ccSYan, Zheng NULL, 1408ac6713ccSYan, Zheng }; 1409