1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0 23d14c5d2SYehuda Sadeh #include <linux/ceph/ceph_debug.h> 325e6bae3SYan, Zheng #include <linux/ceph/pagelist.h> 43d14c5d2SYehuda Sadeh 5355da1ebSSage Weil #include "super.h" 63d14c5d2SYehuda Sadeh #include "mds_client.h" 73d14c5d2SYehuda Sadeh 83d14c5d2SYehuda Sadeh #include <linux/ceph/decode.h> 9355da1ebSSage Weil 10355da1ebSSage Weil #include <linux/xattr.h> 11ac6713ccSYan, Zheng #include <linux/security.h> 124db658eaSLinus Torvalds #include <linux/posix_acl_xattr.h> 135a0e3ad6STejun Heo #include <linux/slab.h> 14355da1ebSSage Weil 1522891907SAlex Elder #define XATTR_CEPH_PREFIX "ceph." 1622891907SAlex Elder #define XATTR_CEPH_PREFIX_LEN (sizeof (XATTR_CEPH_PREFIX) - 1) 1722891907SAlex Elder 18bcdfeb2eSYan, Zheng static int __remove_xattr(struct ceph_inode_info *ci, 19bcdfeb2eSYan, Zheng struct ceph_inode_xattr *xattr); 20bcdfeb2eSYan, Zheng 21355da1ebSSage Weil static bool ceph_is_valid_xattr(const char *name) 22355da1ebSSage Weil { 23b8fe918bSJeff Layton return !strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) || 24b8fe918bSJeff Layton !strncmp(name, XATTR_CEPH_PREFIX, XATTR_CEPH_PREFIX_LEN) || 25355da1ebSSage Weil !strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN) || 26355da1ebSSage Weil !strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN); 27355da1ebSSage Weil } 28355da1ebSSage Weil 29355da1ebSSage Weil /* 30355da1ebSSage Weil * These define virtual xattrs exposing the recursive directory 31355da1ebSSage Weil * statistics and layout metadata. 32355da1ebSSage Weil */ 33881a5fa2SAlex Elder struct ceph_vxattr { 34355da1ebSSage Weil char *name; 353ce6cd12SAlex Elder size_t name_size; /* strlen(name) + 1 (for '\0') */ 36f1d1b51dSJeff Layton ssize_t (*getxattr_cb)(struct ceph_inode_info *ci, char *val, 37355da1ebSSage Weil size_t size); 38f36e4472SSage Weil bool (*exists_cb)(struct ceph_inode_info *ci); 394e9906e7SYan, Zheng unsigned int flags; 40355da1ebSSage Weil }; 41355da1ebSSage Weil 424e9906e7SYan, Zheng #define VXATTR_FLAG_READONLY (1<<0) 434e9906e7SYan, Zheng #define VXATTR_FLAG_HIDDEN (1<<1) 4449a9f4f6SYan, Zheng #define VXATTR_FLAG_RSTAT (1<<2) 4581048c00SJeff Layton #define VXATTR_FLAG_DIRSTAT (1<<3) 464e9906e7SYan, Zheng 4732ab0bd7SSage Weil /* layouts */ 4832ab0bd7SSage Weil 4932ab0bd7SSage Weil static bool ceph_vxattrcb_layout_exists(struct ceph_inode_info *ci) 5032ab0bd7SSage Weil { 51779fe0fbSYan, Zheng struct ceph_file_layout *fl = &ci->i_layout; 52779fe0fbSYan, Zheng return (fl->stripe_unit > 0 || fl->stripe_count > 0 || 53779fe0fbSYan, Zheng fl->object_size > 0 || fl->pool_id >= 0 || 54779fe0fbSYan, Zheng rcu_dereference_raw(fl->pool_ns) != NULL); 5532ab0bd7SSage Weil } 5632ab0bd7SSage Weil 57f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout(struct ceph_inode_info *ci, char *val, 5832ab0bd7SSage Weil size_t size) 5932ab0bd7SSage Weil { 6032ab0bd7SSage Weil struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 6132ab0bd7SSage Weil struct ceph_osd_client *osdc = &fsc->client->osdc; 62779fe0fbSYan, Zheng struct ceph_string *pool_ns; 637627151eSYan, Zheng s64 pool = ci->i_layout.pool_id; 6432ab0bd7SSage Weil const char *pool_name; 65779fe0fbSYan, Zheng const char *ns_field = " pool_namespace="; 661e5c6649SYan, Zheng char buf[128]; 67779fe0fbSYan, Zheng size_t len, total_len = 0; 683b421018SJeff Layton ssize_t ret; 69779fe0fbSYan, Zheng 70779fe0fbSYan, Zheng pool_ns = ceph_try_get_string(ci->i_layout.pool_ns); 7132ab0bd7SSage Weil 7232ab0bd7SSage Weil dout("ceph_vxattrcb_layout %p\n", &ci->vfs_inode); 735aea3dcdSIlya Dryomov down_read(&osdc->lock); 7432ab0bd7SSage Weil pool_name = ceph_pg_pool_name_by_id(osdc->osdmap, pool); 751e5c6649SYan, Zheng if (pool_name) { 76779fe0fbSYan, Zheng len = snprintf(buf, sizeof(buf), 777627151eSYan, Zheng "stripe_unit=%u stripe_count=%u object_size=%u pool=", 787627151eSYan, Zheng ci->i_layout.stripe_unit, ci->i_layout.stripe_count, 797627151eSYan, Zheng ci->i_layout.object_size); 80779fe0fbSYan, Zheng total_len = len + strlen(pool_name); 811e5c6649SYan, Zheng } else { 82779fe0fbSYan, Zheng len = snprintf(buf, sizeof(buf), 837627151eSYan, Zheng "stripe_unit=%u stripe_count=%u object_size=%u pool=%lld", 847627151eSYan, Zheng ci->i_layout.stripe_unit, ci->i_layout.stripe_count, 85f1d1b51dSJeff Layton ci->i_layout.object_size, pool); 86779fe0fbSYan, Zheng total_len = len; 87779fe0fbSYan, Zheng } 88779fe0fbSYan, Zheng 89779fe0fbSYan, Zheng if (pool_ns) 90779fe0fbSYan, Zheng total_len += strlen(ns_field) + pool_ns->len; 91779fe0fbSYan, Zheng 92779fe0fbSYan, Zheng ret = total_len; 933b421018SJeff Layton if (size >= total_len) { 94779fe0fbSYan, Zheng memcpy(val, buf, len); 95779fe0fbSYan, Zheng ret = len; 96779fe0fbSYan, Zheng if (pool_name) { 97779fe0fbSYan, Zheng len = strlen(pool_name); 98779fe0fbSYan, Zheng memcpy(val + ret, pool_name, len); 99779fe0fbSYan, Zheng ret += len; 100779fe0fbSYan, Zheng } 101779fe0fbSYan, Zheng if (pool_ns) { 102779fe0fbSYan, Zheng len = strlen(ns_field); 103779fe0fbSYan, Zheng memcpy(val + ret, ns_field, len); 104779fe0fbSYan, Zheng ret += len; 105779fe0fbSYan, Zheng memcpy(val + ret, pool_ns->str, pool_ns->len); 106779fe0fbSYan, Zheng ret += pool_ns->len; 1071e5c6649SYan, Zheng } 1081e5c6649SYan, Zheng } 1095aea3dcdSIlya Dryomov up_read(&osdc->lock); 110779fe0fbSYan, Zheng ceph_put_string(pool_ns); 11132ab0bd7SSage Weil return ret; 11232ab0bd7SSage Weil } 11332ab0bd7SSage Weil 11426350535SJeff Layton /* 11526350535SJeff Layton * The convention with strings in xattrs is that they should not be NULL 11626350535SJeff Layton * terminated, since we're returning the length with them. snprintf always 11726350535SJeff Layton * NULL terminates however, so call it on a temporary buffer and then memcpy 11826350535SJeff Layton * the result into place. 11926350535SJeff Layton */ 120f6fbdcd9SIlya Dryomov static __printf(3, 4) 121f6fbdcd9SIlya Dryomov int ceph_fmt_xattr(char *val, size_t size, const char *fmt, ...) 12226350535SJeff Layton { 12326350535SJeff Layton int ret; 12426350535SJeff Layton va_list args; 12526350535SJeff Layton char buf[96]; /* NB: reevaluate size if new vxattrs are added */ 12626350535SJeff Layton 12726350535SJeff Layton va_start(args, fmt); 12826350535SJeff Layton ret = vsnprintf(buf, size ? sizeof(buf) : 0, fmt, args); 12926350535SJeff Layton va_end(args); 13026350535SJeff Layton 13126350535SJeff Layton /* Sanity check */ 13226350535SJeff Layton if (size && ret + 1 > sizeof(buf)) { 13326350535SJeff Layton WARN_ONCE(true, "Returned length too big (%d)", ret); 13426350535SJeff Layton return -E2BIG; 13526350535SJeff Layton } 13626350535SJeff Layton 13726350535SJeff Layton if (ret <= size) 13826350535SJeff Layton memcpy(val, buf, ret); 13926350535SJeff Layton return ret; 14026350535SJeff Layton } 14126350535SJeff Layton 142f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_stripe_unit(struct ceph_inode_info *ci, 143695b7119SSage Weil char *val, size_t size) 144695b7119SSage Weil { 14526350535SJeff Layton return ceph_fmt_xattr(val, size, "%u", ci->i_layout.stripe_unit); 146695b7119SSage Weil } 147695b7119SSage Weil 148f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_stripe_count(struct ceph_inode_info *ci, 149695b7119SSage Weil char *val, size_t size) 150695b7119SSage Weil { 15126350535SJeff Layton return ceph_fmt_xattr(val, size, "%u", ci->i_layout.stripe_count); 152695b7119SSage Weil } 153695b7119SSage Weil 154f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_object_size(struct ceph_inode_info *ci, 155695b7119SSage Weil char *val, size_t size) 156695b7119SSage Weil { 15726350535SJeff Layton return ceph_fmt_xattr(val, size, "%u", ci->i_layout.object_size); 158695b7119SSage Weil } 159695b7119SSage Weil 160f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_pool(struct ceph_inode_info *ci, 161695b7119SSage Weil char *val, size_t size) 162695b7119SSage Weil { 163f1d1b51dSJeff Layton ssize_t ret; 164695b7119SSage Weil struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 165695b7119SSage Weil struct ceph_osd_client *osdc = &fsc->client->osdc; 1667627151eSYan, Zheng s64 pool = ci->i_layout.pool_id; 167695b7119SSage Weil const char *pool_name; 168695b7119SSage Weil 1695aea3dcdSIlya Dryomov down_read(&osdc->lock); 170695b7119SSage Weil pool_name = ceph_pg_pool_name_by_id(osdc->osdmap, pool); 17126350535SJeff Layton if (pool_name) { 17226350535SJeff Layton ret = strlen(pool_name); 17326350535SJeff Layton if (ret <= size) 17426350535SJeff Layton memcpy(val, pool_name, ret); 17526350535SJeff Layton } else { 17626350535SJeff Layton ret = ceph_fmt_xattr(val, size, "%lld", pool); 17726350535SJeff Layton } 1785aea3dcdSIlya Dryomov up_read(&osdc->lock); 179695b7119SSage Weil return ret; 180695b7119SSage Weil } 181695b7119SSage Weil 182f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_layout_pool_namespace(struct ceph_inode_info *ci, 183779fe0fbSYan, Zheng char *val, size_t size) 184779fe0fbSYan, Zheng { 18526350535SJeff Layton ssize_t ret = 0; 186779fe0fbSYan, Zheng struct ceph_string *ns = ceph_try_get_string(ci->i_layout.pool_ns); 18726350535SJeff Layton 188779fe0fbSYan, Zheng if (ns) { 18926350535SJeff Layton ret = ns->len; 19026350535SJeff Layton if (ret <= size) 19126350535SJeff Layton memcpy(val, ns->str, ret); 192779fe0fbSYan, Zheng ceph_put_string(ns); 193779fe0fbSYan, Zheng } 194779fe0fbSYan, Zheng return ret; 195779fe0fbSYan, Zheng } 196779fe0fbSYan, Zheng 197355da1ebSSage Weil /* directories */ 198355da1ebSSage Weil 199f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_entries(struct ceph_inode_info *ci, char *val, 200355da1ebSSage Weil size_t size) 201355da1ebSSage Weil { 20226350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_files + ci->i_subdirs); 203355da1ebSSage Weil } 204355da1ebSSage Weil 205f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_files(struct ceph_inode_info *ci, char *val, 206355da1ebSSage Weil size_t size) 207355da1ebSSage Weil { 20826350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_files); 209355da1ebSSage Weil } 210355da1ebSSage Weil 211f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_subdirs(struct ceph_inode_info *ci, char *val, 212355da1ebSSage Weil size_t size) 213355da1ebSSage Weil { 21426350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_subdirs); 215355da1ebSSage Weil } 216355da1ebSSage Weil 217f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rentries(struct ceph_inode_info *ci, char *val, 218355da1ebSSage Weil size_t size) 219355da1ebSSage Weil { 22026350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", 22126350535SJeff Layton ci->i_rfiles + ci->i_rsubdirs); 222355da1ebSSage Weil } 223355da1ebSSage Weil 224f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rfiles(struct ceph_inode_info *ci, char *val, 225355da1ebSSage Weil size_t size) 226355da1ebSSage Weil { 22726350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_rfiles); 228355da1ebSSage Weil } 229355da1ebSSage Weil 230f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rsubdirs(struct ceph_inode_info *ci, char *val, 231355da1ebSSage Weil size_t size) 232355da1ebSSage Weil { 23326350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_rsubdirs); 234355da1ebSSage Weil } 235355da1ebSSage Weil 236f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rbytes(struct ceph_inode_info *ci, char *val, 237355da1ebSSage Weil size_t size) 238355da1ebSSage Weil { 23926350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld", ci->i_rbytes); 240355da1ebSSage Weil } 241355da1ebSSage Weil 242f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_rctime(struct ceph_inode_info *ci, char *val, 243355da1ebSSage Weil size_t size) 244355da1ebSSage Weil { 24526350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld.%09ld", ci->i_rctime.tv_sec, 2469bbeab41SArnd Bergmann ci->i_rctime.tv_nsec); 247355da1ebSSage Weil } 248355da1ebSSage Weil 24908796873SYan, Zheng /* dir pin */ 25008796873SYan, Zheng static bool ceph_vxattrcb_dir_pin_exists(struct ceph_inode_info *ci) 25108796873SYan, Zheng { 25208796873SYan, Zheng return ci->i_dir_pin != -ENODATA; 25308796873SYan, Zheng } 254fb18a575SLuis Henriques 255f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_dir_pin(struct ceph_inode_info *ci, char *val, 25608796873SYan, Zheng size_t size) 25708796873SYan, Zheng { 25826350535SJeff Layton return ceph_fmt_xattr(val, size, "%d", (int)ci->i_dir_pin); 25908796873SYan, Zheng } 26008796873SYan, Zheng 26108796873SYan, Zheng /* quotas */ 262fb18a575SLuis Henriques static bool ceph_vxattrcb_quota_exists(struct ceph_inode_info *ci) 263fb18a575SLuis Henriques { 264f1919826SYan, Zheng bool ret = false; 265f1919826SYan, Zheng spin_lock(&ci->i_ceph_lock); 266f1919826SYan, Zheng if ((ci->i_max_files || ci->i_max_bytes) && 267f1919826SYan, Zheng ci->i_vino.snap == CEPH_NOSNAP && 268f1919826SYan, Zheng ci->i_snap_realm && 269f1919826SYan, Zheng ci->i_snap_realm->ino == ci->i_vino.ino) 270f1919826SYan, Zheng ret = true; 271f1919826SYan, Zheng spin_unlock(&ci->i_ceph_lock); 272f1919826SYan, Zheng return ret; 273fb18a575SLuis Henriques } 274fb18a575SLuis Henriques 275f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_quota(struct ceph_inode_info *ci, char *val, 276fb18a575SLuis Henriques size_t size) 277fb18a575SLuis Henriques { 27826350535SJeff Layton return ceph_fmt_xattr(val, size, "max_bytes=%llu max_files=%llu", 279fb18a575SLuis Henriques ci->i_max_bytes, ci->i_max_files); 280fb18a575SLuis Henriques } 281fb18a575SLuis Henriques 282f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_quota_max_bytes(struct ceph_inode_info *ci, 283fb18a575SLuis Henriques char *val, size_t size) 284fb18a575SLuis Henriques { 28526350535SJeff Layton return ceph_fmt_xattr(val, size, "%llu", ci->i_max_bytes); 286fb18a575SLuis Henriques } 287fb18a575SLuis Henriques 288f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_quota_max_files(struct ceph_inode_info *ci, 289fb18a575SLuis Henriques char *val, size_t size) 290fb18a575SLuis Henriques { 29126350535SJeff Layton return ceph_fmt_xattr(val, size, "%llu", ci->i_max_files); 292fb18a575SLuis Henriques } 29332ab0bd7SSage Weil 294100cc610SDavid Disseldorp /* snapshots */ 295100cc610SDavid Disseldorp static bool ceph_vxattrcb_snap_btime_exists(struct ceph_inode_info *ci) 296100cc610SDavid Disseldorp { 297100cc610SDavid Disseldorp return (ci->i_snap_btime.tv_sec != 0 || ci->i_snap_btime.tv_nsec != 0); 298100cc610SDavid Disseldorp } 299100cc610SDavid Disseldorp 300f1d1b51dSJeff Layton static ssize_t ceph_vxattrcb_snap_btime(struct ceph_inode_info *ci, char *val, 301100cc610SDavid Disseldorp size_t size) 302100cc610SDavid Disseldorp { 30326350535SJeff Layton return ceph_fmt_xattr(val, size, "%lld.%09ld", ci->i_snap_btime.tv_sec, 304100cc610SDavid Disseldorp ci->i_snap_btime.tv_nsec); 305100cc610SDavid Disseldorp } 306100cc610SDavid Disseldorp 307*5a9e2f5dSXiubo Li static ssize_t ceph_vxattrcb_cluster_fsid(struct ceph_inode_info *ci, 308*5a9e2f5dSXiubo Li char *val, size_t size) 309*5a9e2f5dSXiubo Li { 310*5a9e2f5dSXiubo Li struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 311*5a9e2f5dSXiubo Li 312*5a9e2f5dSXiubo Li return ceph_fmt_xattr(val, size, "%pU", &fsc->client->fsid); 313*5a9e2f5dSXiubo Li } 314*5a9e2f5dSXiubo Li 315*5a9e2f5dSXiubo Li static ssize_t ceph_vxattrcb_client_id(struct ceph_inode_info *ci, 316*5a9e2f5dSXiubo Li char *val, size_t size) 317*5a9e2f5dSXiubo Li { 318*5a9e2f5dSXiubo Li struct ceph_fs_client *fsc = ceph_sb_to_client(ci->vfs_inode.i_sb); 319*5a9e2f5dSXiubo Li 320*5a9e2f5dSXiubo Li return ceph_fmt_xattr(val, size, "client%lld", 321*5a9e2f5dSXiubo Li ceph_client_gid(fsc->client)); 322*5a9e2f5dSXiubo Li } 323*5a9e2f5dSXiubo Li 324eb788084SAlex Elder #define CEPH_XATTR_NAME(_type, _name) XATTR_CEPH_PREFIX #_type "." #_name 325695b7119SSage Weil #define CEPH_XATTR_NAME2(_type, _name, _name2) \ 326695b7119SSage Weil XATTR_CEPH_PREFIX #_type "." #_name "." #_name2 327eb788084SAlex Elder 32849a9f4f6SYan, Zheng #define XATTR_NAME_CEPH(_type, _name, _flags) \ 329eb788084SAlex Elder { \ 330eb788084SAlex Elder .name = CEPH_XATTR_NAME(_type, _name), \ 3313ce6cd12SAlex Elder .name_size = sizeof (CEPH_XATTR_NAME(_type, _name)), \ 332aa4066edSAlex Elder .getxattr_cb = ceph_vxattrcb_ ## _type ## _ ## _name, \ 333f36e4472SSage Weil .exists_cb = NULL, \ 33449a9f4f6SYan, Zheng .flags = (VXATTR_FLAG_READONLY | _flags), \ 335eb788084SAlex Elder } 33649a9f4f6SYan, Zheng #define XATTR_RSTAT_FIELD(_type, _name) \ 33749a9f4f6SYan, Zheng XATTR_NAME_CEPH(_type, _name, VXATTR_FLAG_RSTAT) 338695b7119SSage Weil #define XATTR_LAYOUT_FIELD(_type, _name, _field) \ 339695b7119SSage Weil { \ 340695b7119SSage Weil .name = CEPH_XATTR_NAME2(_type, _name, _field), \ 341695b7119SSage Weil .name_size = sizeof (CEPH_XATTR_NAME2(_type, _name, _field)), \ 342695b7119SSage Weil .getxattr_cb = ceph_vxattrcb_ ## _name ## _ ## _field, \ 343695b7119SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, \ 3444e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, \ 345695b7119SSage Weil } 346fb18a575SLuis Henriques #define XATTR_QUOTA_FIELD(_type, _name) \ 347fb18a575SLuis Henriques { \ 348fb18a575SLuis Henriques .name = CEPH_XATTR_NAME(_type, _name), \ 349fb18a575SLuis Henriques .name_size = sizeof(CEPH_XATTR_NAME(_type, _name)), \ 350fb18a575SLuis Henriques .getxattr_cb = ceph_vxattrcb_ ## _type ## _ ## _name, \ 351fb18a575SLuis Henriques .exists_cb = ceph_vxattrcb_quota_exists, \ 3524e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, \ 353fb18a575SLuis Henriques } 354eb788084SAlex Elder 355881a5fa2SAlex Elder static struct ceph_vxattr ceph_dir_vxattrs[] = { 3561f08f2b0SSage Weil { 3571f08f2b0SSage Weil .name = "ceph.dir.layout", 3581f08f2b0SSage Weil .name_size = sizeof("ceph.dir.layout"), 3591f08f2b0SSage Weil .getxattr_cb = ceph_vxattrcb_layout, 3601f08f2b0SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, 3614e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, 3621f08f2b0SSage Weil }, 363695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, stripe_unit), 364695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, stripe_count), 365695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, object_size), 366695b7119SSage Weil XATTR_LAYOUT_FIELD(dir, layout, pool), 367779fe0fbSYan, Zheng XATTR_LAYOUT_FIELD(dir, layout, pool_namespace), 36881048c00SJeff Layton XATTR_NAME_CEPH(dir, entries, VXATTR_FLAG_DIRSTAT), 36981048c00SJeff Layton XATTR_NAME_CEPH(dir, files, VXATTR_FLAG_DIRSTAT), 37081048c00SJeff Layton XATTR_NAME_CEPH(dir, subdirs, VXATTR_FLAG_DIRSTAT), 37149a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rentries), 37249a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rfiles), 37349a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rsubdirs), 37449a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rbytes), 37549a9f4f6SYan, Zheng XATTR_RSTAT_FIELD(dir, rctime), 376fb18a575SLuis Henriques { 37708796873SYan, Zheng .name = "ceph.dir.pin", 378e1b81439SDavid Disseldorp .name_size = sizeof("ceph.dir.pin"), 37908796873SYan, Zheng .getxattr_cb = ceph_vxattrcb_dir_pin, 38008796873SYan, Zheng .exists_cb = ceph_vxattrcb_dir_pin_exists, 38108796873SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, 38208796873SYan, Zheng }, 38308796873SYan, Zheng { 384fb18a575SLuis Henriques .name = "ceph.quota", 385fb18a575SLuis Henriques .name_size = sizeof("ceph.quota"), 386fb18a575SLuis Henriques .getxattr_cb = ceph_vxattrcb_quota, 387fb18a575SLuis Henriques .exists_cb = ceph_vxattrcb_quota_exists, 3884e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, 389fb18a575SLuis Henriques }, 390fb18a575SLuis Henriques XATTR_QUOTA_FIELD(quota, max_bytes), 391fb18a575SLuis Henriques XATTR_QUOTA_FIELD(quota, max_files), 392100cc610SDavid Disseldorp { 393100cc610SDavid Disseldorp .name = "ceph.snap.btime", 394100cc610SDavid Disseldorp .name_size = sizeof("ceph.snap.btime"), 395100cc610SDavid Disseldorp .getxattr_cb = ceph_vxattrcb_snap_btime, 396100cc610SDavid Disseldorp .exists_cb = ceph_vxattrcb_snap_btime_exists, 397100cc610SDavid Disseldorp .flags = VXATTR_FLAG_READONLY, 398100cc610SDavid Disseldorp }, 3992c3dd4ffSAlex Elder { .name = NULL, 0 } /* Required table terminator */ 400355da1ebSSage Weil }; 401355da1ebSSage Weil 402355da1ebSSage Weil /* files */ 403355da1ebSSage Weil 404881a5fa2SAlex Elder static struct ceph_vxattr ceph_file_vxattrs[] = { 40532ab0bd7SSage Weil { 40632ab0bd7SSage Weil .name = "ceph.file.layout", 40732ab0bd7SSage Weil .name_size = sizeof("ceph.file.layout"), 40832ab0bd7SSage Weil .getxattr_cb = ceph_vxattrcb_layout, 40932ab0bd7SSage Weil .exists_cb = ceph_vxattrcb_layout_exists, 4104e9906e7SYan, Zheng .flags = VXATTR_FLAG_HIDDEN, 41132ab0bd7SSage Weil }, 412695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, stripe_unit), 413695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, stripe_count), 414695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, object_size), 415695b7119SSage Weil XATTR_LAYOUT_FIELD(file, layout, pool), 416779fe0fbSYan, Zheng XATTR_LAYOUT_FIELD(file, layout, pool_namespace), 417100cc610SDavid Disseldorp { 418100cc610SDavid Disseldorp .name = "ceph.snap.btime", 419100cc610SDavid Disseldorp .name_size = sizeof("ceph.snap.btime"), 420100cc610SDavid Disseldorp .getxattr_cb = ceph_vxattrcb_snap_btime, 421100cc610SDavid Disseldorp .exists_cb = ceph_vxattrcb_snap_btime_exists, 422100cc610SDavid Disseldorp .flags = VXATTR_FLAG_READONLY, 423100cc610SDavid Disseldorp }, 4242c3dd4ffSAlex Elder { .name = NULL, 0 } /* Required table terminator */ 425355da1ebSSage Weil }; 426355da1ebSSage Weil 427*5a9e2f5dSXiubo Li static struct ceph_vxattr ceph_common_vxattrs[] = { 428*5a9e2f5dSXiubo Li { 429*5a9e2f5dSXiubo Li .name = "ceph.cluster_fsid", 430*5a9e2f5dSXiubo Li .name_size = sizeof("ceph.cluster_fsid"), 431*5a9e2f5dSXiubo Li .getxattr_cb = ceph_vxattrcb_cluster_fsid, 432*5a9e2f5dSXiubo Li .exists_cb = NULL, 433*5a9e2f5dSXiubo Li .flags = VXATTR_FLAG_READONLY, 434*5a9e2f5dSXiubo Li }, 435*5a9e2f5dSXiubo Li { 436*5a9e2f5dSXiubo Li .name = "ceph.client_id", 437*5a9e2f5dSXiubo Li .name_size = sizeof("ceph.client_id"), 438*5a9e2f5dSXiubo Li .getxattr_cb = ceph_vxattrcb_client_id, 439*5a9e2f5dSXiubo Li .exists_cb = NULL, 440*5a9e2f5dSXiubo Li .flags = VXATTR_FLAG_READONLY, 441*5a9e2f5dSXiubo Li }, 442*5a9e2f5dSXiubo Li { .name = NULL, 0 } /* Required table terminator */ 443*5a9e2f5dSXiubo Li }; 444*5a9e2f5dSXiubo Li 445881a5fa2SAlex Elder static struct ceph_vxattr *ceph_inode_vxattrs(struct inode *inode) 446355da1ebSSage Weil { 447355da1ebSSage Weil if (S_ISDIR(inode->i_mode)) 448355da1ebSSage Weil return ceph_dir_vxattrs; 449355da1ebSSage Weil else if (S_ISREG(inode->i_mode)) 450355da1ebSSage Weil return ceph_file_vxattrs; 451355da1ebSSage Weil return NULL; 452355da1ebSSage Weil } 453355da1ebSSage Weil 454881a5fa2SAlex Elder static struct ceph_vxattr *ceph_match_vxattr(struct inode *inode, 455355da1ebSSage Weil const char *name) 456355da1ebSSage Weil { 457881a5fa2SAlex Elder struct ceph_vxattr *vxattr = ceph_inode_vxattrs(inode); 45806476a69SAlex Elder 45906476a69SAlex Elder if (vxattr) { 46006476a69SAlex Elder while (vxattr->name) { 46106476a69SAlex Elder if (!strcmp(vxattr->name, name)) 462355da1ebSSage Weil return vxattr; 463355da1ebSSage Weil vxattr++; 46406476a69SAlex Elder } 46506476a69SAlex Elder } 46606476a69SAlex Elder 467*5a9e2f5dSXiubo Li vxattr = ceph_common_vxattrs; 468*5a9e2f5dSXiubo Li while (vxattr->name) { 469*5a9e2f5dSXiubo Li if (!strcmp(vxattr->name, name)) 470*5a9e2f5dSXiubo Li return vxattr; 471*5a9e2f5dSXiubo Li vxattr++; 472*5a9e2f5dSXiubo Li } 473*5a9e2f5dSXiubo Li 474355da1ebSSage Weil return NULL; 475355da1ebSSage Weil } 476355da1ebSSage Weil 477355da1ebSSage Weil static int __set_xattr(struct ceph_inode_info *ci, 478355da1ebSSage Weil const char *name, int name_len, 479355da1ebSSage Weil const char *val, int val_len, 480fbc0b970SYan, Zheng int flags, int update_xattr, 481355da1ebSSage Weil struct ceph_inode_xattr **newxattr) 482355da1ebSSage Weil { 483355da1ebSSage Weil struct rb_node **p; 484355da1ebSSage Weil struct rb_node *parent = NULL; 485355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 486355da1ebSSage Weil int c; 487355da1ebSSage Weil int new = 0; 488355da1ebSSage Weil 489355da1ebSSage Weil p = &ci->i_xattrs.index.rb_node; 490355da1ebSSage Weil while (*p) { 491355da1ebSSage Weil parent = *p; 492355da1ebSSage Weil xattr = rb_entry(parent, struct ceph_inode_xattr, node); 493355da1ebSSage Weil c = strncmp(name, xattr->name, min(name_len, xattr->name_len)); 494355da1ebSSage Weil if (c < 0) 495355da1ebSSage Weil p = &(*p)->rb_left; 496355da1ebSSage Weil else if (c > 0) 497355da1ebSSage Weil p = &(*p)->rb_right; 498355da1ebSSage Weil else { 499355da1ebSSage Weil if (name_len == xattr->name_len) 500355da1ebSSage Weil break; 501355da1ebSSage Weil else if (name_len < xattr->name_len) 502355da1ebSSage Weil p = &(*p)->rb_left; 503355da1ebSSage Weil else 504355da1ebSSage Weil p = &(*p)->rb_right; 505355da1ebSSage Weil } 506355da1ebSSage Weil xattr = NULL; 507355da1ebSSage Weil } 508355da1ebSSage Weil 509fbc0b970SYan, Zheng if (update_xattr) { 510fbc0b970SYan, Zheng int err = 0; 511eeca958dSLuis Henriques 512fbc0b970SYan, Zheng if (xattr && (flags & XATTR_CREATE)) 513fbc0b970SYan, Zheng err = -EEXIST; 514fbc0b970SYan, Zheng else if (!xattr && (flags & XATTR_REPLACE)) 515fbc0b970SYan, Zheng err = -ENODATA; 516fbc0b970SYan, Zheng if (err) { 517fbc0b970SYan, Zheng kfree(name); 518fbc0b970SYan, Zheng kfree(val); 519eeca958dSLuis Henriques kfree(*newxattr); 520fbc0b970SYan, Zheng return err; 521fbc0b970SYan, Zheng } 522bcdfeb2eSYan, Zheng if (update_xattr < 0) { 523bcdfeb2eSYan, Zheng if (xattr) 524bcdfeb2eSYan, Zheng __remove_xattr(ci, xattr); 525bcdfeb2eSYan, Zheng kfree(name); 526eeca958dSLuis Henriques kfree(*newxattr); 527bcdfeb2eSYan, Zheng return 0; 528bcdfeb2eSYan, Zheng } 529fbc0b970SYan, Zheng } 530fbc0b970SYan, Zheng 531355da1ebSSage Weil if (!xattr) { 532355da1ebSSage Weil new = 1; 533355da1ebSSage Weil xattr = *newxattr; 534355da1ebSSage Weil xattr->name = name; 535355da1ebSSage Weil xattr->name_len = name_len; 536fbc0b970SYan, Zheng xattr->should_free_name = update_xattr; 537355da1ebSSage Weil 538355da1ebSSage Weil ci->i_xattrs.count++; 539355da1ebSSage Weil dout("__set_xattr count=%d\n", ci->i_xattrs.count); 540355da1ebSSage Weil } else { 541355da1ebSSage Weil kfree(*newxattr); 542355da1ebSSage Weil *newxattr = NULL; 543355da1ebSSage Weil if (xattr->should_free_val) 544c00e4522SXu Wang kfree(xattr->val); 545355da1ebSSage Weil 546fbc0b970SYan, Zheng if (update_xattr) { 547c00e4522SXu Wang kfree(name); 548355da1ebSSage Weil name = xattr->name; 549355da1ebSSage Weil } 550355da1ebSSage Weil ci->i_xattrs.names_size -= xattr->name_len; 551355da1ebSSage Weil ci->i_xattrs.vals_size -= xattr->val_len; 552355da1ebSSage Weil } 553355da1ebSSage Weil ci->i_xattrs.names_size += name_len; 554355da1ebSSage Weil ci->i_xattrs.vals_size += val_len; 555355da1ebSSage Weil if (val) 556355da1ebSSage Weil xattr->val = val; 557355da1ebSSage Weil else 558355da1ebSSage Weil xattr->val = ""; 559355da1ebSSage Weil 560355da1ebSSage Weil xattr->val_len = val_len; 561fbc0b970SYan, Zheng xattr->dirty = update_xattr; 562fbc0b970SYan, Zheng xattr->should_free_val = (val && update_xattr); 563355da1ebSSage Weil 564355da1ebSSage Weil if (new) { 565355da1ebSSage Weil rb_link_node(&xattr->node, parent, p); 566355da1ebSSage Weil rb_insert_color(&xattr->node, &ci->i_xattrs.index); 567355da1ebSSage Weil dout("__set_xattr_val p=%p\n", p); 568355da1ebSSage Weil } 569355da1ebSSage Weil 57005729781SYan, Zheng dout("__set_xattr_val added %llx.%llx xattr %p %.*s=%.*s\n", 57105729781SYan, Zheng ceph_vinop(&ci->vfs_inode), xattr, name_len, name, val_len, val); 572355da1ebSSage Weil 573355da1ebSSage Weil return 0; 574355da1ebSSage Weil } 575355da1ebSSage Weil 576355da1ebSSage Weil static struct ceph_inode_xattr *__get_xattr(struct ceph_inode_info *ci, 577355da1ebSSage Weil const char *name) 578355da1ebSSage Weil { 579355da1ebSSage Weil struct rb_node **p; 580355da1ebSSage Weil struct rb_node *parent = NULL; 581355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 58217db143fSSage Weil int name_len = strlen(name); 583355da1ebSSage Weil int c; 584355da1ebSSage Weil 585355da1ebSSage Weil p = &ci->i_xattrs.index.rb_node; 586355da1ebSSage Weil while (*p) { 587355da1ebSSage Weil parent = *p; 588355da1ebSSage Weil xattr = rb_entry(parent, struct ceph_inode_xattr, node); 589355da1ebSSage Weil c = strncmp(name, xattr->name, xattr->name_len); 59017db143fSSage Weil if (c == 0 && name_len > xattr->name_len) 59117db143fSSage Weil c = 1; 592355da1ebSSage Weil if (c < 0) 593355da1ebSSage Weil p = &(*p)->rb_left; 594355da1ebSSage Weil else if (c > 0) 595355da1ebSSage Weil p = &(*p)->rb_right; 596355da1ebSSage Weil else { 597355da1ebSSage Weil dout("__get_xattr %s: found %.*s\n", name, 598355da1ebSSage Weil xattr->val_len, xattr->val); 599355da1ebSSage Weil return xattr; 600355da1ebSSage Weil } 601355da1ebSSage Weil } 602355da1ebSSage Weil 603355da1ebSSage Weil dout("__get_xattr %s: not found\n", name); 604355da1ebSSage Weil 605355da1ebSSage Weil return NULL; 606355da1ebSSage Weil } 607355da1ebSSage Weil 608355da1ebSSage Weil static void __free_xattr(struct ceph_inode_xattr *xattr) 609355da1ebSSage Weil { 610355da1ebSSage Weil BUG_ON(!xattr); 611355da1ebSSage Weil 612355da1ebSSage Weil if (xattr->should_free_name) 613c00e4522SXu Wang kfree(xattr->name); 614355da1ebSSage Weil if (xattr->should_free_val) 615c00e4522SXu Wang kfree(xattr->val); 616355da1ebSSage Weil 617355da1ebSSage Weil kfree(xattr); 618355da1ebSSage Weil } 619355da1ebSSage Weil 620355da1ebSSage Weil static int __remove_xattr(struct ceph_inode_info *ci, 621355da1ebSSage Weil struct ceph_inode_xattr *xattr) 622355da1ebSSage Weil { 623355da1ebSSage Weil if (!xattr) 624524186acSYan, Zheng return -ENODATA; 625355da1ebSSage Weil 626355da1ebSSage Weil rb_erase(&xattr->node, &ci->i_xattrs.index); 627355da1ebSSage Weil 628355da1ebSSage Weil if (xattr->should_free_name) 629c00e4522SXu Wang kfree(xattr->name); 630355da1ebSSage Weil if (xattr->should_free_val) 631c00e4522SXu Wang kfree(xattr->val); 632355da1ebSSage Weil 633355da1ebSSage Weil ci->i_xattrs.names_size -= xattr->name_len; 634355da1ebSSage Weil ci->i_xattrs.vals_size -= xattr->val_len; 635355da1ebSSage Weil ci->i_xattrs.count--; 636355da1ebSSage Weil kfree(xattr); 637355da1ebSSage Weil 638355da1ebSSage Weil return 0; 639355da1ebSSage Weil } 640355da1ebSSage Weil 641355da1ebSSage Weil static char *__copy_xattr_names(struct ceph_inode_info *ci, 642355da1ebSSage Weil char *dest) 643355da1ebSSage Weil { 644355da1ebSSage Weil struct rb_node *p; 645355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 646355da1ebSSage Weil 647355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 648355da1ebSSage Weil dout("__copy_xattr_names count=%d\n", ci->i_xattrs.count); 649355da1ebSSage Weil 650355da1ebSSage Weil while (p) { 651355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 652355da1ebSSage Weil memcpy(dest, xattr->name, xattr->name_len); 653355da1ebSSage Weil dest[xattr->name_len] = '\0'; 654355da1ebSSage Weil 655355da1ebSSage Weil dout("dest=%s %p (%s) (%d/%d)\n", dest, xattr, xattr->name, 656355da1ebSSage Weil xattr->name_len, ci->i_xattrs.names_size); 657355da1ebSSage Weil 658355da1ebSSage Weil dest += xattr->name_len + 1; 659355da1ebSSage Weil p = rb_next(p); 660355da1ebSSage Weil } 661355da1ebSSage Weil 662355da1ebSSage Weil return dest; 663355da1ebSSage Weil } 664355da1ebSSage Weil 665355da1ebSSage Weil void __ceph_destroy_xattrs(struct ceph_inode_info *ci) 666355da1ebSSage Weil { 667355da1ebSSage Weil struct rb_node *p, *tmp; 668355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 669355da1ebSSage Weil 670355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 671355da1ebSSage Weil 672355da1ebSSage Weil dout("__ceph_destroy_xattrs p=%p\n", p); 673355da1ebSSage Weil 674355da1ebSSage Weil while (p) { 675355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 676355da1ebSSage Weil tmp = p; 677355da1ebSSage Weil p = rb_next(tmp); 678355da1ebSSage Weil dout("__ceph_destroy_xattrs next p=%p (%.*s)\n", p, 679355da1ebSSage Weil xattr->name_len, xattr->name); 680355da1ebSSage Weil rb_erase(tmp, &ci->i_xattrs.index); 681355da1ebSSage Weil 682355da1ebSSage Weil __free_xattr(xattr); 683355da1ebSSage Weil } 684355da1ebSSage Weil 685355da1ebSSage Weil ci->i_xattrs.names_size = 0; 686355da1ebSSage Weil ci->i_xattrs.vals_size = 0; 687355da1ebSSage Weil ci->i_xattrs.index_version = 0; 688355da1ebSSage Weil ci->i_xattrs.count = 0; 689355da1ebSSage Weil ci->i_xattrs.index = RB_ROOT; 690355da1ebSSage Weil } 691355da1ebSSage Weil 692355da1ebSSage Weil static int __build_xattrs(struct inode *inode) 693be655596SSage Weil __releases(ci->i_ceph_lock) 694be655596SSage Weil __acquires(ci->i_ceph_lock) 695355da1ebSSage Weil { 696355da1ebSSage Weil u32 namelen; 697355da1ebSSage Weil u32 numattr = 0; 698355da1ebSSage Weil void *p, *end; 699355da1ebSSage Weil u32 len; 700355da1ebSSage Weil const char *name, *val; 701355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 7020eb30853SXiubo Li u64 xattr_version; 703355da1ebSSage Weil struct ceph_inode_xattr **xattrs = NULL; 70463ff78b2SSage Weil int err = 0; 705355da1ebSSage Weil int i; 706355da1ebSSage Weil 707355da1ebSSage Weil dout("__build_xattrs() len=%d\n", 708355da1ebSSage Weil ci->i_xattrs.blob ? (int)ci->i_xattrs.blob->vec.iov_len : 0); 709355da1ebSSage Weil 710355da1ebSSage Weil if (ci->i_xattrs.index_version >= ci->i_xattrs.version) 711355da1ebSSage Weil return 0; /* already built */ 712355da1ebSSage Weil 713355da1ebSSage Weil __ceph_destroy_xattrs(ci); 714355da1ebSSage Weil 715355da1ebSSage Weil start: 716355da1ebSSage Weil /* updated internal xattr rb tree */ 717355da1ebSSage Weil if (ci->i_xattrs.blob && ci->i_xattrs.blob->vec.iov_len > 4) { 718355da1ebSSage Weil p = ci->i_xattrs.blob->vec.iov_base; 719355da1ebSSage Weil end = p + ci->i_xattrs.blob->vec.iov_len; 720355da1ebSSage Weil ceph_decode_32_safe(&p, end, numattr, bad); 721355da1ebSSage Weil xattr_version = ci->i_xattrs.version; 722be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 723355da1ebSSage Weil 7247e8a2952SIlya Dryomov xattrs = kcalloc(numattr, sizeof(struct ceph_inode_xattr *), 725355da1ebSSage Weil GFP_NOFS); 726355da1ebSSage Weil err = -ENOMEM; 727355da1ebSSage Weil if (!xattrs) 728355da1ebSSage Weil goto bad_lock; 7291a295bd8SIlya Dryomov 730355da1ebSSage Weil for (i = 0; i < numattr; i++) { 731355da1ebSSage Weil xattrs[i] = kmalloc(sizeof(struct ceph_inode_xattr), 732355da1ebSSage Weil GFP_NOFS); 733355da1ebSSage Weil if (!xattrs[i]) 734355da1ebSSage Weil goto bad_lock; 735355da1ebSSage Weil } 736355da1ebSSage Weil 737be655596SSage Weil spin_lock(&ci->i_ceph_lock); 738355da1ebSSage Weil if (ci->i_xattrs.version != xattr_version) { 739355da1ebSSage Weil /* lost a race, retry */ 740355da1ebSSage Weil for (i = 0; i < numattr; i++) 741355da1ebSSage Weil kfree(xattrs[i]); 742355da1ebSSage Weil kfree(xattrs); 74321ec6ffaSAlan Cox xattrs = NULL; 744355da1ebSSage Weil goto start; 745355da1ebSSage Weil } 746355da1ebSSage Weil err = -EIO; 747355da1ebSSage Weil while (numattr--) { 748355da1ebSSage Weil ceph_decode_32_safe(&p, end, len, bad); 749355da1ebSSage Weil namelen = len; 750355da1ebSSage Weil name = p; 751355da1ebSSage Weil p += len; 752355da1ebSSage Weil ceph_decode_32_safe(&p, end, len, bad); 753355da1ebSSage Weil val = p; 754355da1ebSSage Weil p += len; 755355da1ebSSage Weil 756355da1ebSSage Weil err = __set_xattr(ci, name, namelen, val, len, 757fbc0b970SYan, Zheng 0, 0, &xattrs[numattr]); 758355da1ebSSage Weil 759355da1ebSSage Weil if (err < 0) 760355da1ebSSage Weil goto bad; 761355da1ebSSage Weil } 762355da1ebSSage Weil kfree(xattrs); 763355da1ebSSage Weil } 764355da1ebSSage Weil ci->i_xattrs.index_version = ci->i_xattrs.version; 765355da1ebSSage Weil ci->i_xattrs.dirty = false; 766355da1ebSSage Weil 767355da1ebSSage Weil return err; 768355da1ebSSage Weil bad_lock: 769be655596SSage Weil spin_lock(&ci->i_ceph_lock); 770355da1ebSSage Weil bad: 771355da1ebSSage Weil if (xattrs) { 772355da1ebSSage Weil for (i = 0; i < numattr; i++) 773355da1ebSSage Weil kfree(xattrs[i]); 774355da1ebSSage Weil kfree(xattrs); 775355da1ebSSage Weil } 776355da1ebSSage Weil ci->i_xattrs.names_size = 0; 777355da1ebSSage Weil return err; 778355da1ebSSage Weil } 779355da1ebSSage Weil 780355da1ebSSage Weil static int __get_required_blob_size(struct ceph_inode_info *ci, int name_size, 781355da1ebSSage Weil int val_size) 782355da1ebSSage Weil { 783355da1ebSSage Weil /* 784355da1ebSSage Weil * 4 bytes for the length, and additional 4 bytes per each xattr name, 785355da1ebSSage Weil * 4 bytes per each value 786355da1ebSSage Weil */ 787355da1ebSSage Weil int size = 4 + ci->i_xattrs.count*(4 + 4) + 788355da1ebSSage Weil ci->i_xattrs.names_size + 789355da1ebSSage Weil ci->i_xattrs.vals_size; 790355da1ebSSage Weil dout("__get_required_blob_size c=%d names.size=%d vals.size=%d\n", 791355da1ebSSage Weil ci->i_xattrs.count, ci->i_xattrs.names_size, 792355da1ebSSage Weil ci->i_xattrs.vals_size); 793355da1ebSSage Weil 794355da1ebSSage Weil if (name_size) 795355da1ebSSage Weil size += 4 + 4 + name_size + val_size; 796355da1ebSSage Weil 797355da1ebSSage Weil return size; 798355da1ebSSage Weil } 799355da1ebSSage Weil 800355da1ebSSage Weil /* 801355da1ebSSage Weil * If there are dirty xattrs, reencode xattrs into the prealloc_blob 80212fe3ddaSLuis Henriques * and swap into place. It returns the old i_xattrs.blob (or NULL) so 80312fe3ddaSLuis Henriques * that it can be freed by the caller as the i_ceph_lock is likely to be 80412fe3ddaSLuis Henriques * held. 805355da1ebSSage Weil */ 80612fe3ddaSLuis Henriques struct ceph_buffer *__ceph_build_xattrs_blob(struct ceph_inode_info *ci) 807355da1ebSSage Weil { 808355da1ebSSage Weil struct rb_node *p; 809355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 81012fe3ddaSLuis Henriques struct ceph_buffer *old_blob = NULL; 811355da1ebSSage Weil void *dest; 812355da1ebSSage Weil 813355da1ebSSage Weil dout("__build_xattrs_blob %p\n", &ci->vfs_inode); 814355da1ebSSage Weil if (ci->i_xattrs.dirty) { 815355da1ebSSage Weil int need = __get_required_blob_size(ci, 0, 0); 816355da1ebSSage Weil 817355da1ebSSage Weil BUG_ON(need > ci->i_xattrs.prealloc_blob->alloc_len); 818355da1ebSSage Weil 819355da1ebSSage Weil p = rb_first(&ci->i_xattrs.index); 820355da1ebSSage Weil dest = ci->i_xattrs.prealloc_blob->vec.iov_base; 821355da1ebSSage Weil 822355da1ebSSage Weil ceph_encode_32(&dest, ci->i_xattrs.count); 823355da1ebSSage Weil while (p) { 824355da1ebSSage Weil xattr = rb_entry(p, struct ceph_inode_xattr, node); 825355da1ebSSage Weil 826355da1ebSSage Weil ceph_encode_32(&dest, xattr->name_len); 827355da1ebSSage Weil memcpy(dest, xattr->name, xattr->name_len); 828355da1ebSSage Weil dest += xattr->name_len; 829355da1ebSSage Weil ceph_encode_32(&dest, xattr->val_len); 830355da1ebSSage Weil memcpy(dest, xattr->val, xattr->val_len); 831355da1ebSSage Weil dest += xattr->val_len; 832355da1ebSSage Weil 833355da1ebSSage Weil p = rb_next(p); 834355da1ebSSage Weil } 835355da1ebSSage Weil 836355da1ebSSage Weil /* adjust buffer len; it may be larger than we need */ 837355da1ebSSage Weil ci->i_xattrs.prealloc_blob->vec.iov_len = 838355da1ebSSage Weil dest - ci->i_xattrs.prealloc_blob->vec.iov_base; 839355da1ebSSage Weil 840b6c1d5b8SSage Weil if (ci->i_xattrs.blob) 84112fe3ddaSLuis Henriques old_blob = ci->i_xattrs.blob; 842355da1ebSSage Weil ci->i_xattrs.blob = ci->i_xattrs.prealloc_blob; 843355da1ebSSage Weil ci->i_xattrs.prealloc_blob = NULL; 844355da1ebSSage Weil ci->i_xattrs.dirty = false; 8454a625be4SSage Weil ci->i_xattrs.version++; 846355da1ebSSage Weil } 84712fe3ddaSLuis Henriques 84812fe3ddaSLuis Henriques return old_blob; 849355da1ebSSage Weil } 850355da1ebSSage Weil 851315f2408SYan, Zheng static inline int __get_request_mask(struct inode *in) { 852315f2408SYan, Zheng struct ceph_mds_request *req = current->journal_info; 853315f2408SYan, Zheng int mask = 0; 854315f2408SYan, Zheng if (req && req->r_target_inode == in) { 855315f2408SYan, Zheng if (req->r_op == CEPH_MDS_OP_LOOKUP || 856315f2408SYan, Zheng req->r_op == CEPH_MDS_OP_LOOKUPINO || 857315f2408SYan, Zheng req->r_op == CEPH_MDS_OP_LOOKUPPARENT || 858315f2408SYan, Zheng req->r_op == CEPH_MDS_OP_GETATTR) { 859315f2408SYan, Zheng mask = le32_to_cpu(req->r_args.getattr.mask); 860315f2408SYan, Zheng } else if (req->r_op == CEPH_MDS_OP_OPEN || 861315f2408SYan, Zheng req->r_op == CEPH_MDS_OP_CREATE) { 862315f2408SYan, Zheng mask = le32_to_cpu(req->r_args.open.mask); 863315f2408SYan, Zheng } 864315f2408SYan, Zheng } 865315f2408SYan, Zheng return mask; 866315f2408SYan, Zheng } 867315f2408SYan, Zheng 8687221fe4cSGuangliang Zhao ssize_t __ceph_getxattr(struct inode *inode, const char *name, void *value, 869355da1ebSSage Weil size_t size) 870355da1ebSSage Weil { 871355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 872355da1ebSSage Weil struct ceph_inode_xattr *xattr; 873881a5fa2SAlex Elder struct ceph_vxattr *vxattr = NULL; 874315f2408SYan, Zheng int req_mask; 875f1d1b51dSJeff Layton ssize_t err; 876355da1ebSSage Weil 8770bee82fbSSage Weil /* let's see if a virtual xattr was requested */ 8780bee82fbSSage Weil vxattr = ceph_match_vxattr(inode, name); 87929dccfa5SYan, Zheng if (vxattr) { 88049a9f4f6SYan, Zheng int mask = 0; 88149a9f4f6SYan, Zheng if (vxattr->flags & VXATTR_FLAG_RSTAT) 88249a9f4f6SYan, Zheng mask |= CEPH_STAT_RSTAT; 88381048c00SJeff Layton if (vxattr->flags & VXATTR_FLAG_DIRSTAT) 88481048c00SJeff Layton mask |= CEPH_CAP_FILE_SHARED; 88549a9f4f6SYan, Zheng err = ceph_do_getattr(inode, mask, true); 8861684dd03SYan, Zheng if (err) 8871684dd03SYan, Zheng return err; 88829dccfa5SYan, Zheng err = -ENODATA; 8893b421018SJeff Layton if (!(vxattr->exists_cb && !vxattr->exists_cb(ci))) { 8900bee82fbSSage Weil err = vxattr->getxattr_cb(ci, value, size); 8913b421018SJeff Layton if (size && size < err) 8923b421018SJeff Layton err = -ERANGE; 8933b421018SJeff Layton } 894a1dc1937Smajianpeng return err; 8950bee82fbSSage Weil } 8960bee82fbSSage Weil 897315f2408SYan, Zheng req_mask = __get_request_mask(inode); 898315f2408SYan, Zheng 899a1dc1937Smajianpeng spin_lock(&ci->i_ceph_lock); 900d36e0b62SJeff Layton dout("getxattr %p name '%s' ver=%lld index_ver=%lld\n", inode, name, 901a1dc1937Smajianpeng ci->i_xattrs.version, ci->i_xattrs.index_version); 902a1dc1937Smajianpeng 903508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || 904315f2408SYan, Zheng !((req_mask & CEPH_CAP_XATTR_SHARED) || 9051af16d54SXiubo Li __ceph_caps_issued_mask_metric(ci, CEPH_CAP_XATTR_SHARED, 1))) { 906be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 907315f2408SYan, Zheng 908315f2408SYan, Zheng /* security module gets xattr while filling trace */ 909d37b1d99SMarkus Elfring if (current->journal_info) { 910315f2408SYan, Zheng pr_warn_ratelimited("sync getxattr %p " 911315f2408SYan, Zheng "during filling trace\n", inode); 912315f2408SYan, Zheng return -EBUSY; 913315f2408SYan, Zheng } 914315f2408SYan, Zheng 915355da1ebSSage Weil /* get xattrs from mds (if we don't already have them) */ 916508b32d8SYan, Zheng err = ceph_do_getattr(inode, CEPH_STAT_CAP_XATTR, true); 917355da1ebSSage Weil if (err) 918355da1ebSSage Weil return err; 919be655596SSage Weil spin_lock(&ci->i_ceph_lock); 920508b32d8SYan, Zheng } 921355da1ebSSage Weil 922355da1ebSSage Weil err = __build_xattrs(inode); 923355da1ebSSage Weil if (err < 0) 924355da1ebSSage Weil goto out; 925355da1ebSSage Weil 926355da1ebSSage Weil err = -ENODATA; /* == ENOATTR */ 927355da1ebSSage Weil xattr = __get_xattr(ci, name); 9280bee82fbSSage Weil if (!xattr) 929355da1ebSSage Weil goto out; 930355da1ebSSage Weil 931355da1ebSSage Weil err = -ERANGE; 932355da1ebSSage Weil if (size && size < xattr->val_len) 933355da1ebSSage Weil goto out; 934355da1ebSSage Weil 935355da1ebSSage Weil err = xattr->val_len; 936355da1ebSSage Weil if (size == 0) 937355da1ebSSage Weil goto out; 938355da1ebSSage Weil 939355da1ebSSage Weil memcpy(value, xattr->val, xattr->val_len); 940355da1ebSSage Weil 941d37b1d99SMarkus Elfring if (current->journal_info && 942026105ebSJeff Layton !strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) && 943026105ebSJeff Layton security_ismaclabel(name + XATTR_SECURITY_PREFIX_LEN)) 944315f2408SYan, Zheng ci->i_ceph_flags |= CEPH_I_SEC_INITED; 945355da1ebSSage Weil out: 946be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 947355da1ebSSage Weil return err; 948355da1ebSSage Weil } 949355da1ebSSage Weil 950355da1ebSSage Weil ssize_t ceph_listxattr(struct dentry *dentry, char *names, size_t size) 951355da1ebSSage Weil { 9522b0143b5SDavid Howells struct inode *inode = d_inode(dentry); 953355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 9542b2abcacSDavid Disseldorp bool len_only = (size == 0); 955355da1ebSSage Weil u32 namelen; 956355da1ebSSage Weil int err; 957355da1ebSSage Weil 958be655596SSage Weil spin_lock(&ci->i_ceph_lock); 959355da1ebSSage Weil dout("listxattr %p ver=%lld index_ver=%lld\n", inode, 960355da1ebSSage Weil ci->i_xattrs.version, ci->i_xattrs.index_version); 961355da1ebSSage Weil 962508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || 9631af16d54SXiubo Li !__ceph_caps_issued_mask_metric(ci, CEPH_CAP_XATTR_SHARED, 1)) { 964be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 965508b32d8SYan, Zheng err = ceph_do_getattr(inode, CEPH_STAT_CAP_XATTR, true); 966355da1ebSSage Weil if (err) 967355da1ebSSage Weil return err; 968be655596SSage Weil spin_lock(&ci->i_ceph_lock); 969508b32d8SYan, Zheng } 970355da1ebSSage Weil 971355da1ebSSage Weil err = __build_xattrs(inode); 972355da1ebSSage Weil if (err < 0) 973355da1ebSSage Weil goto out; 9743ce6cd12SAlex Elder 9752b2abcacSDavid Disseldorp /* add 1 byte for each xattr due to the null termination */ 976b65917ddSSage Weil namelen = ci->i_xattrs.names_size + ci->i_xattrs.count; 9772b2abcacSDavid Disseldorp if (!len_only) { 9782b2abcacSDavid Disseldorp if (namelen > size) { 979355da1ebSSage Weil err = -ERANGE; 980355da1ebSSage Weil goto out; 9812b2abcacSDavid Disseldorp } 982355da1ebSSage Weil names = __copy_xattr_names(ci, names); 9832b2abcacSDavid Disseldorp size -= namelen; 9842b2abcacSDavid Disseldorp } 9852b2abcacSDavid Disseldorp err = namelen; 986355da1ebSSage Weil out: 987be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 988355da1ebSSage Weil return err; 989355da1ebSSage Weil } 990355da1ebSSage Weil 991a26feccaSAndreas Gruenbacher static int ceph_sync_setxattr(struct inode *inode, const char *name, 992355da1ebSSage Weil const char *value, size_t size, int flags) 993355da1ebSSage Weil { 994a26feccaSAndreas Gruenbacher struct ceph_fs_client *fsc = ceph_sb_to_client(inode->i_sb); 995355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 996355da1ebSSage Weil struct ceph_mds_request *req; 9973d14c5d2SYehuda Sadeh struct ceph_mds_client *mdsc = fsc->mdsc; 99825e6bae3SYan, Zheng struct ceph_pagelist *pagelist = NULL; 99904303d8aSYan, Zheng int op = CEPH_MDS_OP_SETXATTR; 1000355da1ebSSage Weil int err; 1001355da1ebSSage Weil 10020aeff37aSYan, Zheng if (size > 0) { 100325e6bae3SYan, Zheng /* copy value into pagelist */ 100433165d47SIlya Dryomov pagelist = ceph_pagelist_alloc(GFP_NOFS); 100525e6bae3SYan, Zheng if (!pagelist) 1006355da1ebSSage Weil return -ENOMEM; 100725e6bae3SYan, Zheng 100825e6bae3SYan, Zheng err = ceph_pagelist_append(pagelist, value, size); 100925e6bae3SYan, Zheng if (err) 1010355da1ebSSage Weil goto out; 10110aeff37aSYan, Zheng } else if (!value) { 101204303d8aSYan, Zheng if (flags & CEPH_XATTR_REPLACE) 101304303d8aSYan, Zheng op = CEPH_MDS_OP_RMXATTR; 101404303d8aSYan, Zheng else 101525e6bae3SYan, Zheng flags |= CEPH_XATTR_REMOVE; 1016355da1ebSSage Weil } 1017355da1ebSSage Weil 1018355da1ebSSage Weil dout("setxattr value=%.*s\n", (int)size, value); 1019355da1ebSSage Weil 1020355da1ebSSage Weil /* do request */ 102104303d8aSYan, Zheng req = ceph_mdsc_create_request(mdsc, op, USE_AUTH_MDS); 102260d87733SJulia Lawall if (IS_ERR(req)) { 102360d87733SJulia Lawall err = PTR_ERR(req); 102460d87733SJulia Lawall goto out; 102560d87733SJulia Lawall } 1026a149bb9aSSanidhya Kashyap 1027355da1ebSSage Weil req->r_path2 = kstrdup(name, GFP_NOFS); 1028a149bb9aSSanidhya Kashyap if (!req->r_path2) { 1029a149bb9aSSanidhya Kashyap ceph_mdsc_put_request(req); 1030a149bb9aSSanidhya Kashyap err = -ENOMEM; 1031a149bb9aSSanidhya Kashyap goto out; 1032a149bb9aSSanidhya Kashyap } 1033355da1ebSSage Weil 103404303d8aSYan, Zheng if (op == CEPH_MDS_OP_SETXATTR) { 103504303d8aSYan, Zheng req->r_args.setxattr.flags = cpu_to_le32(flags); 103625e6bae3SYan, Zheng req->r_pagelist = pagelist; 103725e6bae3SYan, Zheng pagelist = NULL; 103804303d8aSYan, Zheng } 1039355da1ebSSage Weil 1040a149bb9aSSanidhya Kashyap req->r_inode = inode; 1041a149bb9aSSanidhya Kashyap ihold(inode); 1042a149bb9aSSanidhya Kashyap req->r_num_caps = 1; 1043a149bb9aSSanidhya Kashyap req->r_inode_drop = CEPH_CAP_XATTR_SHARED; 1044a149bb9aSSanidhya Kashyap 1045355da1ebSSage Weil dout("xattr.ver (before): %lld\n", ci->i_xattrs.version); 1046752c8bdcSSage Weil err = ceph_mdsc_do_request(mdsc, NULL, req); 1047355da1ebSSage Weil ceph_mdsc_put_request(req); 1048355da1ebSSage Weil dout("xattr.ver (after): %lld\n", ci->i_xattrs.version); 1049355da1ebSSage Weil 1050355da1ebSSage Weil out: 105125e6bae3SYan, Zheng if (pagelist) 105225e6bae3SYan, Zheng ceph_pagelist_release(pagelist); 1053355da1ebSSage Weil return err; 1054355da1ebSSage Weil } 1055355da1ebSSage Weil 1056a26feccaSAndreas Gruenbacher int __ceph_setxattr(struct inode *inode, const char *name, 1057355da1ebSSage Weil const void *value, size_t size, int flags) 1058355da1ebSSage Weil { 1059881a5fa2SAlex Elder struct ceph_vxattr *vxattr; 1060355da1ebSSage Weil struct ceph_inode_info *ci = ceph_inode(inode); 1061a26feccaSAndreas Gruenbacher struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; 1062f66fd9f0SYan, Zheng struct ceph_cap_flush *prealloc_cf = NULL; 106386968ef2SLuis Henriques struct ceph_buffer *old_blob = NULL; 106418fa8b3fSAlex Elder int issued; 1065355da1ebSSage Weil int err; 1066fbc0b970SYan, Zheng int dirty = 0; 1067355da1ebSSage Weil int name_len = strlen(name); 1068355da1ebSSage Weil int val_len = size; 1069355da1ebSSage Weil char *newname = NULL; 1070355da1ebSSage Weil char *newval = NULL; 1071355da1ebSSage Weil struct ceph_inode_xattr *xattr = NULL; 1072355da1ebSSage Weil int required_blob_size; 1073f1919826SYan, Zheng bool check_realm = false; 1074604d1b02SYan, Zheng bool lock_snap_rwsem = false; 1075355da1ebSSage Weil 10762cdeb1e4SAndreas Gruenbacher if (ceph_snap(inode) != CEPH_NOSNAP) 10772cdeb1e4SAndreas Gruenbacher return -EROFS; 1078355da1ebSSage Weil 107906476a69SAlex Elder vxattr = ceph_match_vxattr(inode, name); 1080f1919826SYan, Zheng if (vxattr) { 10814e9906e7SYan, Zheng if (vxattr->flags & VXATTR_FLAG_READONLY) 1082355da1ebSSage Weil return -EOPNOTSUPP; 1083f1919826SYan, Zheng if (value && !strncmp(vxattr->name, "ceph.quota", 10)) 1084f1919826SYan, Zheng check_realm = true; 1085f1919826SYan, Zheng } 1086355da1ebSSage Weil 10873adf654dSSage Weil /* pass any unhandled ceph.* xattrs through to the MDS */ 10883adf654dSSage Weil if (!strncmp(name, XATTR_CEPH_PREFIX, XATTR_CEPH_PREFIX_LEN)) 10893adf654dSSage Weil goto do_sync_unlocked; 10903adf654dSSage Weil 1091355da1ebSSage Weil /* preallocate memory for xattr name, value, index node */ 1092355da1ebSSage Weil err = -ENOMEM; 109361413c2fSJulia Lawall newname = kmemdup(name, name_len + 1, GFP_NOFS); 1094355da1ebSSage Weil if (!newname) 1095355da1ebSSage Weil goto out; 1096355da1ebSSage Weil 1097355da1ebSSage Weil if (val_len) { 1098b829c195SAlex Elder newval = kmemdup(value, val_len, GFP_NOFS); 1099355da1ebSSage Weil if (!newval) 1100355da1ebSSage Weil goto out; 1101355da1ebSSage Weil } 1102355da1ebSSage Weil 1103355da1ebSSage Weil xattr = kmalloc(sizeof(struct ceph_inode_xattr), GFP_NOFS); 1104355da1ebSSage Weil if (!xattr) 1105355da1ebSSage Weil goto out; 1106355da1ebSSage Weil 1107f66fd9f0SYan, Zheng prealloc_cf = ceph_alloc_cap_flush(); 1108f66fd9f0SYan, Zheng if (!prealloc_cf) 1109f66fd9f0SYan, Zheng goto out; 1110f66fd9f0SYan, Zheng 1111be655596SSage Weil spin_lock(&ci->i_ceph_lock); 1112355da1ebSSage Weil retry: 1113355da1ebSSage Weil issued = __ceph_caps_issued(ci, NULL); 1114508b32d8SYan, Zheng if (ci->i_xattrs.version == 0 || !(issued & CEPH_CAP_XATTR_EXCL)) 1115355da1ebSSage Weil goto do_sync; 1116604d1b02SYan, Zheng 1117604d1b02SYan, Zheng if (!lock_snap_rwsem && !ci->i_head_snapc) { 1118604d1b02SYan, Zheng lock_snap_rwsem = true; 1119604d1b02SYan, Zheng if (!down_read_trylock(&mdsc->snap_rwsem)) { 1120604d1b02SYan, Zheng spin_unlock(&ci->i_ceph_lock); 1121604d1b02SYan, Zheng down_read(&mdsc->snap_rwsem); 1122604d1b02SYan, Zheng spin_lock(&ci->i_ceph_lock); 1123604d1b02SYan, Zheng goto retry; 1124604d1b02SYan, Zheng } 1125604d1b02SYan, Zheng } 1126604d1b02SYan, Zheng 1127d36e0b62SJeff Layton dout("setxattr %p name '%s' issued %s\n", inode, name, 1128d36e0b62SJeff Layton ceph_cap_string(issued)); 1129355da1ebSSage Weil __build_xattrs(inode); 1130355da1ebSSage Weil 1131355da1ebSSage Weil required_blob_size = __get_required_blob_size(ci, name_len, val_len); 1132355da1ebSSage Weil 1133355da1ebSSage Weil if (!ci->i_xattrs.prealloc_blob || 1134355da1ebSSage Weil required_blob_size > ci->i_xattrs.prealloc_blob->alloc_len) { 113518fa8b3fSAlex Elder struct ceph_buffer *blob; 1136355da1ebSSage Weil 1137be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 113886968ef2SLuis Henriques ceph_buffer_put(old_blob); /* Shouldn't be required */ 113986968ef2SLuis Henriques dout(" pre-allocating new blob size=%d\n", required_blob_size); 1140b6c1d5b8SSage Weil blob = ceph_buffer_new(required_blob_size, GFP_NOFS); 1141355da1ebSSage Weil if (!blob) 1142604d1b02SYan, Zheng goto do_sync_unlocked; 1143be655596SSage Weil spin_lock(&ci->i_ceph_lock); 114486968ef2SLuis Henriques /* prealloc_blob can't be released while holding i_ceph_lock */ 1145b6c1d5b8SSage Weil if (ci->i_xattrs.prealloc_blob) 114686968ef2SLuis Henriques old_blob = ci->i_xattrs.prealloc_blob; 1147355da1ebSSage Weil ci->i_xattrs.prealloc_blob = blob; 1148355da1ebSSage Weil goto retry; 1149355da1ebSSage Weil } 1150355da1ebSSage Weil 1151bcdfeb2eSYan, Zheng err = __set_xattr(ci, newname, name_len, newval, val_len, 1152bcdfeb2eSYan, Zheng flags, value ? 1 : -1, &xattr); 115318fa8b3fSAlex Elder 1154fbc0b970SYan, Zheng if (!err) { 1155f66fd9f0SYan, Zheng dirty = __ceph_mark_dirty_caps(ci, CEPH_CAP_XATTR_EXCL, 1156f66fd9f0SYan, Zheng &prealloc_cf); 1157355da1ebSSage Weil ci->i_xattrs.dirty = true; 1158c2050a45SDeepa Dinamani inode->i_ctime = current_time(inode); 1159fbc0b970SYan, Zheng } 116018fa8b3fSAlex Elder 1161be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 116286968ef2SLuis Henriques ceph_buffer_put(old_blob); 1163604d1b02SYan, Zheng if (lock_snap_rwsem) 1164604d1b02SYan, Zheng up_read(&mdsc->snap_rwsem); 1165fca65b4aSSage Weil if (dirty) 1166fca65b4aSSage Weil __mark_inode_dirty(inode, dirty); 1167f66fd9f0SYan, Zheng ceph_free_cap_flush(prealloc_cf); 1168355da1ebSSage Weil return err; 1169355da1ebSSage Weil 1170355da1ebSSage Weil do_sync: 1171be655596SSage Weil spin_unlock(&ci->i_ceph_lock); 11723adf654dSSage Weil do_sync_unlocked: 1173604d1b02SYan, Zheng if (lock_snap_rwsem) 1174604d1b02SYan, Zheng up_read(&mdsc->snap_rwsem); 1175315f2408SYan, Zheng 1176315f2408SYan, Zheng /* security module set xattr while filling trace */ 1177d37b1d99SMarkus Elfring if (current->journal_info) { 1178315f2408SYan, Zheng pr_warn_ratelimited("sync setxattr %p " 1179315f2408SYan, Zheng "during filling trace\n", inode); 1180315f2408SYan, Zheng err = -EBUSY; 1181315f2408SYan, Zheng } else { 1182a26feccaSAndreas Gruenbacher err = ceph_sync_setxattr(inode, name, value, size, flags); 1183f1919826SYan, Zheng if (err >= 0 && check_realm) { 1184f1919826SYan, Zheng /* check if snaprealm was created for quota inode */ 1185f1919826SYan, Zheng spin_lock(&ci->i_ceph_lock); 1186f1919826SYan, Zheng if ((ci->i_max_files || ci->i_max_bytes) && 1187f1919826SYan, Zheng !(ci->i_snap_realm && 1188f1919826SYan, Zheng ci->i_snap_realm->ino == ci->i_vino.ino)) 1189f1919826SYan, Zheng err = -EOPNOTSUPP; 1190f1919826SYan, Zheng spin_unlock(&ci->i_ceph_lock); 1191f1919826SYan, Zheng } 1192315f2408SYan, Zheng } 1193355da1ebSSage Weil out: 1194f66fd9f0SYan, Zheng ceph_free_cap_flush(prealloc_cf); 1195355da1ebSSage Weil kfree(newname); 1196355da1ebSSage Weil kfree(newval); 1197355da1ebSSage Weil kfree(xattr); 1198355da1ebSSage Weil return err; 1199355da1ebSSage Weil } 1200355da1ebSSage Weil 12012cdeb1e4SAndreas Gruenbacher static int ceph_get_xattr_handler(const struct xattr_handler *handler, 12022cdeb1e4SAndreas Gruenbacher struct dentry *dentry, struct inode *inode, 12032cdeb1e4SAndreas Gruenbacher const char *name, void *value, size_t size) 12047221fe4cSGuangliang Zhao { 12052cdeb1e4SAndreas Gruenbacher if (!ceph_is_valid_xattr(name)) 12062cdeb1e4SAndreas Gruenbacher return -EOPNOTSUPP; 12072cdeb1e4SAndreas Gruenbacher return __ceph_getxattr(inode, name, value, size); 12087221fe4cSGuangliang Zhao } 1209315f2408SYan, Zheng 12102cdeb1e4SAndreas Gruenbacher static int ceph_set_xattr_handler(const struct xattr_handler *handler, 121159301226SAl Viro struct dentry *unused, struct inode *inode, 121259301226SAl Viro const char *name, const void *value, 121359301226SAl Viro size_t size, int flags) 12142cdeb1e4SAndreas Gruenbacher { 12152cdeb1e4SAndreas Gruenbacher if (!ceph_is_valid_xattr(name)) 12162cdeb1e4SAndreas Gruenbacher return -EOPNOTSUPP; 121759301226SAl Viro return __ceph_setxattr(inode, name, value, size, flags); 12182cdeb1e4SAndreas Gruenbacher } 12192cdeb1e4SAndreas Gruenbacher 12205130cceaSWei Yongjun static const struct xattr_handler ceph_other_xattr_handler = { 12212cdeb1e4SAndreas Gruenbacher .prefix = "", /* match any name => handlers called with full name */ 12222cdeb1e4SAndreas Gruenbacher .get = ceph_get_xattr_handler, 12232cdeb1e4SAndreas Gruenbacher .set = ceph_set_xattr_handler, 12242cdeb1e4SAndreas Gruenbacher }; 12252cdeb1e4SAndreas Gruenbacher 1226315f2408SYan, Zheng #ifdef CONFIG_SECURITY 1227315f2408SYan, Zheng bool ceph_security_xattr_wanted(struct inode *in) 1228315f2408SYan, Zheng { 1229315f2408SYan, Zheng return in->i_security != NULL; 1230315f2408SYan, Zheng } 1231315f2408SYan, Zheng 1232315f2408SYan, Zheng bool ceph_security_xattr_deadlock(struct inode *in) 1233315f2408SYan, Zheng { 1234315f2408SYan, Zheng struct ceph_inode_info *ci; 1235315f2408SYan, Zheng bool ret; 1236d37b1d99SMarkus Elfring if (!in->i_security) 1237315f2408SYan, Zheng return false; 1238315f2408SYan, Zheng ci = ceph_inode(in); 1239315f2408SYan, Zheng spin_lock(&ci->i_ceph_lock); 1240315f2408SYan, Zheng ret = !(ci->i_ceph_flags & CEPH_I_SEC_INITED) && 1241315f2408SYan, Zheng !(ci->i_xattrs.version > 0 && 1242315f2408SYan, Zheng __ceph_caps_issued_mask(ci, CEPH_CAP_XATTR_SHARED, 0)); 1243315f2408SYan, Zheng spin_unlock(&ci->i_ceph_lock); 1244315f2408SYan, Zheng return ret; 1245315f2408SYan, Zheng } 1246ac6713ccSYan, Zheng 1247ac6713ccSYan, Zheng #ifdef CONFIG_CEPH_FS_SECURITY_LABEL 1248ac6713ccSYan, Zheng int ceph_security_init_secctx(struct dentry *dentry, umode_t mode, 1249ac6713ccSYan, Zheng struct ceph_acl_sec_ctx *as_ctx) 1250ac6713ccSYan, Zheng { 1251ac6713ccSYan, Zheng struct ceph_pagelist *pagelist = as_ctx->pagelist; 1252ac6713ccSYan, Zheng const char *name; 1253ac6713ccSYan, Zheng size_t name_len; 1254ac6713ccSYan, Zheng int err; 1255ac6713ccSYan, Zheng 1256ac6713ccSYan, Zheng err = security_dentry_init_security(dentry, mode, &dentry->d_name, 1257ac6713ccSYan, Zheng &as_ctx->sec_ctx, 1258ac6713ccSYan, Zheng &as_ctx->sec_ctxlen); 1259ac6713ccSYan, Zheng if (err < 0) { 1260ac6713ccSYan, Zheng WARN_ON_ONCE(err != -EOPNOTSUPP); 1261ac6713ccSYan, Zheng err = 0; /* do nothing */ 1262ac6713ccSYan, Zheng goto out; 1263ac6713ccSYan, Zheng } 1264ac6713ccSYan, Zheng 1265ac6713ccSYan, Zheng err = -ENOMEM; 1266ac6713ccSYan, Zheng if (!pagelist) { 1267ac6713ccSYan, Zheng pagelist = ceph_pagelist_alloc(GFP_KERNEL); 1268ac6713ccSYan, Zheng if (!pagelist) 1269ac6713ccSYan, Zheng goto out; 1270ac6713ccSYan, Zheng err = ceph_pagelist_reserve(pagelist, PAGE_SIZE); 1271ac6713ccSYan, Zheng if (err) 1272ac6713ccSYan, Zheng goto out; 1273ac6713ccSYan, Zheng ceph_pagelist_encode_32(pagelist, 1); 1274ac6713ccSYan, Zheng } 1275ac6713ccSYan, Zheng 1276ac6713ccSYan, Zheng /* 1277ac6713ccSYan, Zheng * FIXME: Make security_dentry_init_security() generic. Currently 1278ac6713ccSYan, Zheng * It only supports single security module and only selinux has 1279ac6713ccSYan, Zheng * dentry_init_security hook. 1280ac6713ccSYan, Zheng */ 1281ac6713ccSYan, Zheng name = XATTR_NAME_SELINUX; 1282ac6713ccSYan, Zheng name_len = strlen(name); 1283ac6713ccSYan, Zheng err = ceph_pagelist_reserve(pagelist, 1284ac6713ccSYan, Zheng 4 * 2 + name_len + as_ctx->sec_ctxlen); 1285ac6713ccSYan, Zheng if (err) 1286ac6713ccSYan, Zheng goto out; 1287ac6713ccSYan, Zheng 1288ac6713ccSYan, Zheng if (as_ctx->pagelist) { 1289ac6713ccSYan, Zheng /* update count of KV pairs */ 1290ac6713ccSYan, Zheng BUG_ON(pagelist->length <= sizeof(__le32)); 1291ac6713ccSYan, Zheng if (list_is_singular(&pagelist->head)) { 1292ac6713ccSYan, Zheng le32_add_cpu((__le32*)pagelist->mapped_tail, 1); 1293ac6713ccSYan, Zheng } else { 1294ac6713ccSYan, Zheng struct page *page = list_first_entry(&pagelist->head, 1295ac6713ccSYan, Zheng struct page, lru); 1296ac6713ccSYan, Zheng void *addr = kmap_atomic(page); 1297ac6713ccSYan, Zheng le32_add_cpu((__le32*)addr, 1); 1298ac6713ccSYan, Zheng kunmap_atomic(addr); 1299ac6713ccSYan, Zheng } 1300ac6713ccSYan, Zheng } else { 1301ac6713ccSYan, Zheng as_ctx->pagelist = pagelist; 1302ac6713ccSYan, Zheng } 1303ac6713ccSYan, Zheng 1304ac6713ccSYan, Zheng ceph_pagelist_encode_32(pagelist, name_len); 1305ac6713ccSYan, Zheng ceph_pagelist_append(pagelist, name, name_len); 1306ac6713ccSYan, Zheng 1307ac6713ccSYan, Zheng ceph_pagelist_encode_32(pagelist, as_ctx->sec_ctxlen); 1308ac6713ccSYan, Zheng ceph_pagelist_append(pagelist, as_ctx->sec_ctx, as_ctx->sec_ctxlen); 1309ac6713ccSYan, Zheng 1310ac6713ccSYan, Zheng err = 0; 1311ac6713ccSYan, Zheng out: 1312ac6713ccSYan, Zheng if (pagelist && !as_ctx->pagelist) 1313ac6713ccSYan, Zheng ceph_pagelist_release(pagelist); 1314ac6713ccSYan, Zheng return err; 1315ac6713ccSYan, Zheng } 1316668959a5SJeff Layton #endif /* CONFIG_CEPH_FS_SECURITY_LABEL */ 1317668959a5SJeff Layton #endif /* CONFIG_SECURITY */ 13185c31e92dSYan, Zheng 13195c31e92dSYan, Zheng void ceph_release_acl_sec_ctx(struct ceph_acl_sec_ctx *as_ctx) 13205c31e92dSYan, Zheng { 13215c31e92dSYan, Zheng #ifdef CONFIG_CEPH_FS_POSIX_ACL 13225c31e92dSYan, Zheng posix_acl_release(as_ctx->acl); 13235c31e92dSYan, Zheng posix_acl_release(as_ctx->default_acl); 13245c31e92dSYan, Zheng #endif 1325ac6713ccSYan, Zheng #ifdef CONFIG_CEPH_FS_SECURITY_LABEL 1326ac6713ccSYan, Zheng security_release_secctx(as_ctx->sec_ctx, as_ctx->sec_ctxlen); 1327ac6713ccSYan, Zheng #endif 13285c31e92dSYan, Zheng if (as_ctx->pagelist) 13295c31e92dSYan, Zheng ceph_pagelist_release(as_ctx->pagelist); 13305c31e92dSYan, Zheng } 1331ac6713ccSYan, Zheng 1332ac6713ccSYan, Zheng /* 1333ac6713ccSYan, Zheng * List of handlers for synthetic system.* attributes. Other 1334ac6713ccSYan, Zheng * attributes are handled directly. 1335ac6713ccSYan, Zheng */ 1336ac6713ccSYan, Zheng const struct xattr_handler *ceph_xattr_handlers[] = { 1337ac6713ccSYan, Zheng #ifdef CONFIG_CEPH_FS_POSIX_ACL 1338ac6713ccSYan, Zheng &posix_acl_access_xattr_handler, 1339ac6713ccSYan, Zheng &posix_acl_default_xattr_handler, 1340ac6713ccSYan, Zheng #endif 1341ac6713ccSYan, Zheng &ceph_other_xattr_handler, 1342ac6713ccSYan, Zheng NULL, 1343ac6713ccSYan, Zheng }; 1344