xref: /openbmc/linux/fs/ext4/xattr.c (revision 0f7bfd6f)
1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0
2ac27a0ecSDave Kleikamp /*
3617ba13bSMingming Cao  * linux/fs/ext4/xattr.c
4ac27a0ecSDave Kleikamp  *
5ac27a0ecSDave Kleikamp  * Copyright (C) 2001-2003 Andreas Gruenbacher, <agruen@suse.de>
6ac27a0ecSDave Kleikamp  *
7ac27a0ecSDave Kleikamp  * Fix by Harrison Xing <harrison@mountainviewdata.com>.
8617ba13bSMingming Cao  * Ext4 code with a lot of help from Eric Jarman <ejarman@acm.org>.
9ac27a0ecSDave Kleikamp  * Extended attributes for symlinks and special files added per
10ac27a0ecSDave Kleikamp  *  suggestion of Luka Renko <luka.renko@hermes.si>.
11ac27a0ecSDave Kleikamp  * xattr consolidation Copyright (c) 2004 James Morris <jmorris@redhat.com>,
12ac27a0ecSDave Kleikamp  *  Red Hat Inc.
13ac27a0ecSDave Kleikamp  * ea-in-inode support by Alex Tomas <alex@clusterfs.com> aka bzzz
14ac27a0ecSDave Kleikamp  *  and Andreas Gruenbacher <agruen@suse.de>.
15ac27a0ecSDave Kleikamp  */
16ac27a0ecSDave Kleikamp 
17ac27a0ecSDave Kleikamp /*
18ac27a0ecSDave Kleikamp  * Extended attributes are stored directly in inodes (on file systems with
19ac27a0ecSDave Kleikamp  * inodes bigger than 128 bytes) and on additional disk blocks. The i_file_acl
20ac27a0ecSDave Kleikamp  * field contains the block number if an inode uses an additional block. All
21ac27a0ecSDave Kleikamp  * attributes must fit in the inode and one additional block. Blocks that
22ac27a0ecSDave Kleikamp  * contain the identical set of attributes may be shared among several inodes.
23ac27a0ecSDave Kleikamp  * Identical blocks are detected by keeping a cache of blocks that have
24ac27a0ecSDave Kleikamp  * recently been accessed.
25ac27a0ecSDave Kleikamp  *
26ac27a0ecSDave Kleikamp  * The attributes in inodes and on blocks have a different header; the entries
27ac27a0ecSDave Kleikamp  * are stored in the same format:
28ac27a0ecSDave Kleikamp  *
29ac27a0ecSDave Kleikamp  *   +------------------+
30ac27a0ecSDave Kleikamp  *   | header           |
31ac27a0ecSDave Kleikamp  *   | entry 1          | |
32ac27a0ecSDave Kleikamp  *   | entry 2          | | growing downwards
33ac27a0ecSDave Kleikamp  *   | entry 3          | v
34ac27a0ecSDave Kleikamp  *   | four null bytes  |
35ac27a0ecSDave Kleikamp  *   | . . .            |
36ac27a0ecSDave Kleikamp  *   | value 1          | ^
37ac27a0ecSDave Kleikamp  *   | value 3          | | growing upwards
38ac27a0ecSDave Kleikamp  *   | value 2          | |
39ac27a0ecSDave Kleikamp  *   +------------------+
40ac27a0ecSDave Kleikamp  *
41ac27a0ecSDave Kleikamp  * The header is followed by multiple entry descriptors. In disk blocks, the
42ac27a0ecSDave Kleikamp  * entry descriptors are kept sorted. In inodes, they are unsorted. The
43ac27a0ecSDave Kleikamp  * attribute values are aligned to the end of the block in no specific order.
44ac27a0ecSDave Kleikamp  *
45ac27a0ecSDave Kleikamp  * Locking strategy
46ac27a0ecSDave Kleikamp  * ----------------
47617ba13bSMingming Cao  * EXT4_I(inode)->i_file_acl is protected by EXT4_I(inode)->xattr_sem.
48ac27a0ecSDave Kleikamp  * EA blocks are only changed if they are exclusive to an inode, so
49ac27a0ecSDave Kleikamp  * holding xattr_sem also means that nothing but the EA block's reference
50ac27a0ecSDave Kleikamp  * count can change. Multiple writers to the same block are synchronized
51ac27a0ecSDave Kleikamp  * by the buffer lock.
52ac27a0ecSDave Kleikamp  */
53ac27a0ecSDave Kleikamp 
54ac27a0ecSDave Kleikamp #include <linux/init.h>
55ac27a0ecSDave Kleikamp #include <linux/fs.h>
56ac27a0ecSDave Kleikamp #include <linux/slab.h>
577a2508e1SJan Kara #include <linux/mbcache.h>
58ac27a0ecSDave Kleikamp #include <linux/quotaops.h>
59ee73f9a5SJeff Layton #include <linux/iversion.h>
603dcf5451SChristoph Hellwig #include "ext4_jbd2.h"
613dcf5451SChristoph Hellwig #include "ext4.h"
62ac27a0ecSDave Kleikamp #include "xattr.h"
63ac27a0ecSDave Kleikamp #include "acl.h"
64ac27a0ecSDave Kleikamp 
/*
 * Debug tracing helpers.
 *
 * With EXT4_XATTR_DEBUG defined, ea_idebug() prints a KERN_DEBUG message
 * prefixed with the inode's superblock id and inode number, and ea_bdebug()
 * prints one prefixed with the buffer's block device and block number.
 * Otherwise both expand to no_printk(fmt, ...) and the inode/bh argument is
 * not referenced at all.
 *
 * The object arguments are parenthesized in the expansion so that any
 * pointer-valued expression (for example "*pinode") can be passed.
 */
#ifdef EXT4_XATTR_DEBUG
# define ea_idebug(inode, fmt, ...)					\
	printk(KERN_DEBUG "inode %s:%lu: " fmt "\n",			\
	       (inode)->i_sb->s_id, (inode)->i_ino, ##__VA_ARGS__)
# define ea_bdebug(bh, fmt, ...)					\
	printk(KERN_DEBUG "block %pg:%lu: " fmt "\n",			\
	       (bh)->b_bdev, (unsigned long)(bh)->b_blocknr, ##__VA_ARGS__)
#else
# define ea_idebug(inode, fmt, ...)	no_printk(fmt, ##__VA_ARGS__)
# define ea_bdebug(bh, fmt, ...)	no_printk(fmt, ##__VA_ARGS__)
#endif
76ac27a0ecSDave Kleikamp 
7747387409STahsin Erdogan static void ext4_xattr_block_cache_insert(struct mb_cache *,
7847387409STahsin Erdogan 					  struct buffer_head *);
7947387409STahsin Erdogan static struct buffer_head *
8047387409STahsin Erdogan ext4_xattr_block_cache_find(struct inode *, struct ext4_xattr_header *,
817a2508e1SJan Kara 			    struct mb_cache_entry **);
82b9fc761eSTahsin Erdogan static __le32 ext4_xattr_hash_entry(char *name, size_t name_len, __le32 *value,
83b9fc761eSTahsin Erdogan 				    size_t value_count);
84f3bbac32SLinus Torvalds static __le32 ext4_xattr_hash_entry_signed(char *name, size_t name_len, __le32 *value,
85f3bbac32SLinus Torvalds 				    size_t value_count);
86daf83281STahsin Erdogan static void ext4_xattr_rehash(struct ext4_xattr_header *);
87ac27a0ecSDave Kleikamp 
/*
 * Handler lookup table indexed by xattr name index (EXT4_XATTR_INDEX_*).
 * Slots that have no initializer here -- including the POSIX ACL and
 * security slots when their config option is disabled -- are NULL.
 * Read through ext4_xattr_handler(), which bounds-checks the index.
 */
static const struct xattr_handler * const ext4_xattr_handler_map[] = {
	[EXT4_XATTR_INDEX_USER]		     = &ext4_xattr_user_handler,
#ifdef CONFIG_EXT4_FS_POSIX_ACL
	[EXT4_XATTR_INDEX_POSIX_ACL_ACCESS]  = &posix_acl_access_xattr_handler,
	[EXT4_XATTR_INDEX_POSIX_ACL_DEFAULT] = &posix_acl_default_xattr_handler,
#endif
	[EXT4_XATTR_INDEX_TRUSTED]	     = &ext4_xattr_trusted_handler,
#ifdef CONFIG_EXT4_FS_SECURITY
	[EXT4_XATTR_INDEX_SECURITY]	     = &ext4_xattr_security_handler,
#endif
	[EXT4_XATTR_INDEX_HURD]		     = &ext4_xattr_hurd_handler,
};
100ac27a0ecSDave Kleikamp 
/*
 * NULL-terminated list of the xattr handlers ext4 provides. The ACL and
 * security handlers are only listed when the matching config option is
 * enabled. The array has external linkage; NOTE(review): where it gets
 * installed is not visible in this part of the file.
 */
const struct xattr_handler *ext4_xattr_handlers[] = {
	&ext4_xattr_user_handler,
	&ext4_xattr_trusted_handler,
#ifdef CONFIG_EXT4_FS_POSIX_ACL
	&posix_acl_access_xattr_handler,
	&posix_acl_default_xattr_handler,
#endif
#ifdef CONFIG_EXT4_FS_SECURITY
	&ext4_xattr_security_handler,
#endif
	&ext4_xattr_hurd_handler,
	NULL
};
114ac27a0ecSDave Kleikamp 
/*
 * Accessors for the per-superblock caches stored in struct ext4_sb_info:
 * EA_BLOCK_CACHE() yields s_ea_block_cache and EA_INODE_CACHE() yields
 * s_ea_inode_cache, both reached through inode->i_sb->s_fs_info.
 *
 * @inode is parenthesized in the expansion so that expressions such as
 * "*pinode" or "&obj" can be passed, not only plain identifiers.
 */
#define EA_BLOCK_CACHE(inode)	(((struct ext4_sb_info *) \
				(inode)->i_sb->s_fs_info)->s_ea_block_cache)

#define EA_INODE_CACHE(inode)	(((struct ext4_sb_info *) \
				(inode)->i_sb->s_fs_info)->s_ea_inode_cache)
120dec214d0STahsin Erdogan 
/*
 * Prototype only; the definition is not within this part of the file.
 * NOTE(review): judging by the name and signature this records @inode in
 * *@ea_inode_array, growing it as needed -- confirm against the definition.
 */
static int
ext4_expand_inode_array(struct ext4_xattr_inode_array **ea_inode_array,
			struct inode *inode);
12430a7eb97STahsin Erdogan 
#ifdef CONFIG_LOCKDEP
/*
 * Assign lockdep subclass 1 to the i_rwsem of @ea_inode. Only built when
 * CONFIG_LOCKDEP is enabled. Called from ext4_xattr_inode_iget() on every
 * EA inode it returns.
 */
void ext4_xattr_inode_set_class(struct inode *ea_inode)
{
	lockdep_set_subclass(&ea_inode->i_rwsem, 1);
}
#endif
13133d201e0STahsin Erdogan 
132cc8e94fdSDarrick J. Wong static __le32 ext4_xattr_block_csum(struct inode *inode,
133cc8e94fdSDarrick J. Wong 				    sector_t block_nr,
134cc8e94fdSDarrick J. Wong 				    struct ext4_xattr_header *hdr)
135cc8e94fdSDarrick J. Wong {
136cc8e94fdSDarrick J. Wong 	struct ext4_sb_info *sbi = EXT4_SB(inode->i_sb);
137d6a77105STheodore Ts'o 	__u32 csum;
138d6a77105STheodore Ts'o 	__le64 dsk_block_nr = cpu_to_le64(block_nr);
139b47820edSDaeho Jeong 	__u32 dummy_csum = 0;
140b47820edSDaeho Jeong 	int offset = offsetof(struct ext4_xattr_header, h_checksum);
141cc8e94fdSDarrick J. Wong 
142d6a77105STheodore Ts'o 	csum = ext4_chksum(sbi, sbi->s_csum_seed, (__u8 *)&dsk_block_nr,
143d6a77105STheodore Ts'o 			   sizeof(dsk_block_nr));
144b47820edSDaeho Jeong 	csum = ext4_chksum(sbi, csum, (__u8 *)hdr, offset);
145b47820edSDaeho Jeong 	csum = ext4_chksum(sbi, csum, (__u8 *)&dummy_csum, sizeof(dummy_csum));
146b47820edSDaeho Jeong 	offset += sizeof(dummy_csum);
147b47820edSDaeho Jeong 	csum = ext4_chksum(sbi, csum, (__u8 *)hdr + offset,
148b47820edSDaeho Jeong 			   EXT4_BLOCK_SIZE(inode->i_sb) - offset);
14941eb70ddSTao Ma 
150cc8e94fdSDarrick J. Wong 	return cpu_to_le32(csum);
151cc8e94fdSDarrick J. Wong }
152cc8e94fdSDarrick J. Wong 
153cc8e94fdSDarrick J. Wong static int ext4_xattr_block_csum_verify(struct inode *inode,
154dac7a4b4STheodore Ts'o 					struct buffer_head *bh)
155cc8e94fdSDarrick J. Wong {
156dac7a4b4STheodore Ts'o 	struct ext4_xattr_header *hdr = BHDR(bh);
157dac7a4b4STheodore Ts'o 	int ret = 1;
158dac7a4b4STheodore Ts'o 
159dac7a4b4STheodore Ts'o 	if (ext4_has_metadata_csum(inode->i_sb)) {
160dac7a4b4STheodore Ts'o 		lock_buffer(bh);
161dac7a4b4STheodore Ts'o 		ret = (hdr->h_checksum == ext4_xattr_block_csum(inode,
162dac7a4b4STheodore Ts'o 							bh->b_blocknr, hdr));
163dac7a4b4STheodore Ts'o 		unlock_buffer(bh);
164dac7a4b4STheodore Ts'o 	}
165dac7a4b4STheodore Ts'o 	return ret;
166cc8e94fdSDarrick J. Wong }
167cc8e94fdSDarrick J. Wong 
168cc8e94fdSDarrick J. Wong static void ext4_xattr_block_csum_set(struct inode *inode,
169cc8e94fdSDarrick J. Wong 				      struct buffer_head *bh)
170cc8e94fdSDarrick J. Wong {
171dac7a4b4STheodore Ts'o 	if (ext4_has_metadata_csum(inode->i_sb))
172dac7a4b4STheodore Ts'o 		BHDR(bh)->h_checksum = ext4_xattr_block_csum(inode,
173dac7a4b4STheodore Ts'o 						bh->b_blocknr, BHDR(bh));
174cc8e94fdSDarrick J. Wong }
175cc8e94fdSDarrick J. Wong 
17611e27528SStephen Hemminger static inline const struct xattr_handler *
177617ba13bSMingming Cao ext4_xattr_handler(int name_index)
178ac27a0ecSDave Kleikamp {
17911e27528SStephen Hemminger 	const struct xattr_handler *handler = NULL;
180ac27a0ecSDave Kleikamp 
181617ba13bSMingming Cao 	if (name_index > 0 && name_index < ARRAY_SIZE(ext4_xattr_handler_map))
182617ba13bSMingming Cao 		handler = ext4_xattr_handler_map[name_index];
183ac27a0ecSDave Kleikamp 	return handler;
184ac27a0ecSDave Kleikamp }
185ac27a0ecSDave Kleikamp 
186ac27a0ecSDave Kleikamp static int
1873478c83cSTheodore Ts'o check_xattrs(struct inode *inode, struct buffer_head *bh,
1883478c83cSTheodore Ts'o 	     struct ext4_xattr_entry *entry, void *end, void *value_start,
1893478c83cSTheodore Ts'o 	     const char *function, unsigned int line)
190ac27a0ecSDave Kleikamp {
191a0626e75SDarrick J. Wong 	struct ext4_xattr_entry *e = entry;
1923478c83cSTheodore Ts'o 	int err = -EFSCORRUPTED;
1933478c83cSTheodore Ts'o 	char *err_str;
1943478c83cSTheodore Ts'o 
1953478c83cSTheodore Ts'o 	if (bh) {
1963478c83cSTheodore Ts'o 		if (BHDR(bh)->h_magic != cpu_to_le32(EXT4_XATTR_MAGIC) ||
1973478c83cSTheodore Ts'o 		    BHDR(bh)->h_blocks != cpu_to_le32(1)) {
1983478c83cSTheodore Ts'o 			err_str = "invalid header";
1993478c83cSTheodore Ts'o 			goto errout;
2003478c83cSTheodore Ts'o 		}
2013478c83cSTheodore Ts'o 		if (buffer_verified(bh))
2023478c83cSTheodore Ts'o 			return 0;
2033478c83cSTheodore Ts'o 		if (!ext4_xattr_block_csum_verify(inode, bh)) {
2043478c83cSTheodore Ts'o 			err = -EFSBADCRC;
2053478c83cSTheodore Ts'o 			err_str = "invalid checksum";
2063478c83cSTheodore Ts'o 			goto errout;
2073478c83cSTheodore Ts'o 		}
2083478c83cSTheodore Ts'o 	} else {
2093478c83cSTheodore Ts'o 		struct ext4_xattr_ibody_header *header = value_start;
2103478c83cSTheodore Ts'o 
2113478c83cSTheodore Ts'o 		header -= 1;
2123478c83cSTheodore Ts'o 		if (end - (void *)header < sizeof(*header) + sizeof(u32)) {
2133478c83cSTheodore Ts'o 			err_str = "in-inode xattr block too small";
2143478c83cSTheodore Ts'o 			goto errout;
2153478c83cSTheodore Ts'o 		}
2163478c83cSTheodore Ts'o 		if (header->h_magic != cpu_to_le32(EXT4_XATTR_MAGIC)) {
2173478c83cSTheodore Ts'o 			err_str = "bad magic number in in-inode xattr";
2183478c83cSTheodore Ts'o 			goto errout;
2193478c83cSTheodore Ts'o 		}
2203478c83cSTheodore Ts'o 	}
221a0626e75SDarrick J. Wong 
222d7614cc1SEric Biggers 	/* Find the end of the names list */
223a0626e75SDarrick J. Wong 	while (!IS_LAST_ENTRY(e)) {
224a0626e75SDarrick J. Wong 		struct ext4_xattr_entry *next = EXT4_XATTR_NEXT(e);
2253478c83cSTheodore Ts'o 		if ((void *)next >= end) {
2263478c83cSTheodore Ts'o 			err_str = "e_name out of bounds";
2273478c83cSTheodore Ts'o 			goto errout;
2283478c83cSTheodore Ts'o 		}
2293478c83cSTheodore Ts'o 		if (strnlen(e->e_name, e->e_name_len) != e->e_name_len) {
2303478c83cSTheodore Ts'o 			err_str = "bad e_name length";
2313478c83cSTheodore Ts'o 			goto errout;
2323478c83cSTheodore Ts'o 		}
233a0626e75SDarrick J. Wong 		e = next;
234ac27a0ecSDave Kleikamp 	}
235a0626e75SDarrick J. Wong 
236d7614cc1SEric Biggers 	/* Check the values */
237a0626e75SDarrick J. Wong 	while (!IS_LAST_ENTRY(entry)) {
238d7614cc1SEric Biggers 		u32 size = le32_to_cpu(entry->e_value_size);
2393478c83cSTheodore Ts'o 		unsigned long ea_ino = le32_to_cpu(entry->e_value_inum);
240ce3fd194SEric Biggers 
2413478c83cSTheodore Ts'o 		if (!ext4_has_feature_ea_inode(inode->i_sb) && ea_ino) {
2423478c83cSTheodore Ts'o 			err_str = "ea_inode specified without ea_inode feature enabled";
2433478c83cSTheodore Ts'o 			goto errout;
2443478c83cSTheodore Ts'o 		}
2453478c83cSTheodore Ts'o 		if (ea_ino && ((ea_ino == EXT4_ROOT_INO) ||
2463478c83cSTheodore Ts'o 			       !ext4_valid_inum(inode->i_sb, ea_ino))) {
2473478c83cSTheodore Ts'o 			err_str = "invalid ea_ino";
2483478c83cSTheodore Ts'o 			goto errout;
2493478c83cSTheodore Ts'o 		}
2503478c83cSTheodore Ts'o 		if (size > EXT4_XATTR_SIZE_MAX) {
2513478c83cSTheodore Ts'o 			err_str = "e_value size too large";
2523478c83cSTheodore Ts'o 			goto errout;
2533478c83cSTheodore Ts'o 		}
254ce3fd194SEric Biggers 
255ce3fd194SEric Biggers 		if (size != 0 && entry->e_value_inum == 0) {
256ce3fd194SEric Biggers 			u16 offs = le16_to_cpu(entry->e_value_offs);
257d7614cc1SEric Biggers 			void *value;
258d7614cc1SEric Biggers 
259d7614cc1SEric Biggers 			/*
260d7614cc1SEric Biggers 			 * The value cannot overlap the names, and the value
261d7614cc1SEric Biggers 			 * with padding cannot extend beyond 'end'.  Check both
262d7614cc1SEric Biggers 			 * the padded and unpadded sizes, since the size may
263d7614cc1SEric Biggers 			 * overflow to 0 when adding padding.
264d7614cc1SEric Biggers 			 */
2653478c83cSTheodore Ts'o 			if (offs > end - value_start) {
2663478c83cSTheodore Ts'o 				err_str = "e_value out of bounds";
2673478c83cSTheodore Ts'o 				goto errout;
2683478c83cSTheodore Ts'o 			}
269d7614cc1SEric Biggers 			value = value_start + offs;
270d7614cc1SEric Biggers 			if (value < (void *)e + sizeof(u32) ||
271d7614cc1SEric Biggers 			    size > end - value ||
2723478c83cSTheodore Ts'o 			    EXT4_XATTR_SIZE(size) > end - value) {
2733478c83cSTheodore Ts'o 				err_str = "overlapping e_value ";
2743478c83cSTheodore Ts'o 				goto errout;
2753478c83cSTheodore Ts'o 			}
276d7614cc1SEric Biggers 		}
277a0626e75SDarrick J. Wong 		entry = EXT4_XATTR_NEXT(entry);
278a0626e75SDarrick J. Wong 	}
2793478c83cSTheodore Ts'o 	if (bh)
2803478c83cSTheodore Ts'o 		set_buffer_verified(bh);
281ac27a0ecSDave Kleikamp 	return 0;
2823478c83cSTheodore Ts'o 
2833478c83cSTheodore Ts'o errout:
2843478c83cSTheodore Ts'o 	if (bh)
2853478c83cSTheodore Ts'o 		__ext4_error_inode(inode, function, line, 0, -err,
2863478c83cSTheodore Ts'o 				   "corrupted xattr block %llu: %s",
2873478c83cSTheodore Ts'o 				   (unsigned long long) bh->b_blocknr,
2883478c83cSTheodore Ts'o 				   err_str);
2893478c83cSTheodore Ts'o 	else
2903478c83cSTheodore Ts'o 		__ext4_error_inode(inode, function, line, 0, -err,
2913478c83cSTheodore Ts'o 				   "corrupted in-inode xattr: %s", err_str);
2923478c83cSTheodore Ts'o 	return err;
293ac27a0ecSDave Kleikamp }
294ac27a0ecSDave Kleikamp 
295ac27a0ecSDave Kleikamp static inline int
296de05ca85STheodore Ts'o __ext4_xattr_check_block(struct inode *inode, struct buffer_head *bh,
297de05ca85STheodore Ts'o 			 const char *function, unsigned int line)
298ac27a0ecSDave Kleikamp {
2993478c83cSTheodore Ts'o 	return check_xattrs(inode, bh, BFIRST(bh), bh->b_data + bh->b_size,
3003478c83cSTheodore Ts'o 			    bh->b_data, function, line);
301ac27a0ecSDave Kleikamp }
302ac27a0ecSDave Kleikamp 
303de05ca85STheodore Ts'o #define ext4_xattr_check_block(inode, bh) \
304de05ca85STheodore Ts'o 	__ext4_xattr_check_block((inode), (bh),  __func__, __LINE__)
305de05ca85STheodore Ts'o 
306de05ca85STheodore Ts'o 
3073478c83cSTheodore Ts'o static inline int
3089e92f48cSTheodore Ts'o __xattr_check_inode(struct inode *inode, struct ext4_xattr_ibody_header *header,
3099e92f48cSTheodore Ts'o 			 void *end, const char *function, unsigned int line)
3109e92f48cSTheodore Ts'o {
3113478c83cSTheodore Ts'o 	return check_xattrs(inode, NULL, IFIRST(header), end, IFIRST(header),
3123478c83cSTheodore Ts'o 			    function, line);
3139e92f48cSTheodore Ts'o }
3149e92f48cSTheodore Ts'o 
3159e92f48cSTheodore Ts'o #define xattr_check_inode(inode, header, end) \
3169e92f48cSTheodore Ts'o 	__xattr_check_inode((inode), (header), (end), __func__, __LINE__)
3179e92f48cSTheodore Ts'o 
318ac27a0ecSDave Kleikamp static int
3199496005dSTheodore Ts'o xattr_find_entry(struct inode *inode, struct ext4_xattr_entry **pentry,
3209496005dSTheodore Ts'o 		 void *end, int name_index, const char *name, int sorted)
321ac27a0ecSDave Kleikamp {
3229496005dSTheodore Ts'o 	struct ext4_xattr_entry *entry, *next;
323ac27a0ecSDave Kleikamp 	size_t name_len;
324ac27a0ecSDave Kleikamp 	int cmp = 1;
325ac27a0ecSDave Kleikamp 
326ac27a0ecSDave Kleikamp 	if (name == NULL)
327ac27a0ecSDave Kleikamp 		return -EINVAL;
328ac27a0ecSDave Kleikamp 	name_len = strlen(name);
3299496005dSTheodore Ts'o 	for (entry = *pentry; !IS_LAST_ENTRY(entry); entry = next) {
3309496005dSTheodore Ts'o 		next = EXT4_XATTR_NEXT(entry);
3319496005dSTheodore Ts'o 		if ((void *) next >= end) {
3329496005dSTheodore Ts'o 			EXT4_ERROR_INODE(inode, "corrupted xattr entries");
3339496005dSTheodore Ts'o 			return -EFSCORRUPTED;
3349496005dSTheodore Ts'o 		}
335ac27a0ecSDave Kleikamp 		cmp = name_index - entry->e_name_index;
336ac27a0ecSDave Kleikamp 		if (!cmp)
337ac27a0ecSDave Kleikamp 			cmp = name_len - entry->e_name_len;
338ac27a0ecSDave Kleikamp 		if (!cmp)
339ac27a0ecSDave Kleikamp 			cmp = memcmp(name, entry->e_name, name_len);
340ac27a0ecSDave Kleikamp 		if (cmp <= 0 && (sorted || cmp == 0))
341ac27a0ecSDave Kleikamp 			break;
342ac27a0ecSDave Kleikamp 	}
343ac27a0ecSDave Kleikamp 	*pentry = entry;
344ac27a0ecSDave Kleikamp 	return cmp ? -ENODATA : 0;
345ac27a0ecSDave Kleikamp }
346ac27a0ecSDave Kleikamp 
347dec214d0STahsin Erdogan static u32
348dec214d0STahsin Erdogan ext4_xattr_inode_hash(struct ext4_sb_info *sbi, const void *buffer, size_t size)
349dec214d0STahsin Erdogan {
350dec214d0STahsin Erdogan 	return ext4_chksum(sbi, sbi->s_csum_seed, buffer, size);
351dec214d0STahsin Erdogan }
352dec214d0STahsin Erdogan 
353dec214d0STahsin Erdogan static u64 ext4_xattr_inode_get_ref(struct inode *ea_inode)
354dec214d0STahsin Erdogan {
355dec214d0STahsin Erdogan 	return ((u64)ea_inode->i_ctime.tv_sec << 32) |
356ee73f9a5SJeff Layton 		(u32) inode_peek_iversion_raw(ea_inode);
357dec214d0STahsin Erdogan }
358dec214d0STahsin Erdogan 
359dec214d0STahsin Erdogan static void ext4_xattr_inode_set_ref(struct inode *ea_inode, u64 ref_count)
360dec214d0STahsin Erdogan {
361dec214d0STahsin Erdogan 	ea_inode->i_ctime.tv_sec = (u32)(ref_count >> 32);
362ee73f9a5SJeff Layton 	inode_set_iversion_raw(ea_inode, ref_count & 0xffffffff);
363dec214d0STahsin Erdogan }
364dec214d0STahsin Erdogan 
365dec214d0STahsin Erdogan static u32 ext4_xattr_inode_get_hash(struct inode *ea_inode)
366dec214d0STahsin Erdogan {
367dec214d0STahsin Erdogan 	return (u32)ea_inode->i_atime.tv_sec;
368dec214d0STahsin Erdogan }
369dec214d0STahsin Erdogan 
/*
 * Record @hash in an EA inode by storing it in i_atime.tv_sec;
 * ext4_xattr_inode_get_hash() reads it back.
 */
static void ext4_xattr_inode_set_hash(struct inode *ea_inode, u32 hash)
{
	ea_inode->i_atime.tv_sec = hash;
}
374dec214d0STahsin Erdogan 
375e50e5129SAndreas Dilger /*
376e50e5129SAndreas Dilger  * Read the EA value from an inode.
377e50e5129SAndreas Dilger  */
37890966693STahsin Erdogan static int ext4_xattr_inode_read(struct inode *ea_inode, void *buf, size_t size)
379e50e5129SAndreas Dilger {
3809699d4f9STahsin Erdogan 	int blocksize = 1 << ea_inode->i_blkbits;
3819699d4f9STahsin Erdogan 	int bh_count = (size + blocksize - 1) >> ea_inode->i_blkbits;
3829699d4f9STahsin Erdogan 	int tail_size = (size % blocksize) ?: blocksize;
3839699d4f9STahsin Erdogan 	struct buffer_head *bhs_inline[8];
3849699d4f9STahsin Erdogan 	struct buffer_head **bhs = bhs_inline;
3859699d4f9STahsin Erdogan 	int i, ret;
386e50e5129SAndreas Dilger 
3879699d4f9STahsin Erdogan 	if (bh_count > ARRAY_SIZE(bhs_inline)) {
3889699d4f9STahsin Erdogan 		bhs = kmalloc_array(bh_count, sizeof(*bhs), GFP_NOFS);
3899699d4f9STahsin Erdogan 		if (!bhs)
3909699d4f9STahsin Erdogan 			return -ENOMEM;
391e50e5129SAndreas Dilger 	}
3929699d4f9STahsin Erdogan 
3939699d4f9STahsin Erdogan 	ret = ext4_bread_batch(ea_inode, 0 /* block */, bh_count,
3949699d4f9STahsin Erdogan 			       true /* wait */, bhs);
3959699d4f9STahsin Erdogan 	if (ret)
3969699d4f9STahsin Erdogan 		goto free_bhs;
3979699d4f9STahsin Erdogan 
3989699d4f9STahsin Erdogan 	for (i = 0; i < bh_count; i++) {
3999699d4f9STahsin Erdogan 		/* There shouldn't be any holes in ea_inode. */
4009699d4f9STahsin Erdogan 		if (!bhs[i]) {
4019699d4f9STahsin Erdogan 			ret = -EFSCORRUPTED;
4029699d4f9STahsin Erdogan 			goto put_bhs;
4039699d4f9STahsin Erdogan 		}
4049699d4f9STahsin Erdogan 		memcpy((char *)buf + blocksize * i, bhs[i]->b_data,
4059699d4f9STahsin Erdogan 		       i < bh_count - 1 ? blocksize : tail_size);
4069699d4f9STahsin Erdogan 	}
4079699d4f9STahsin Erdogan 	ret = 0;
4089699d4f9STahsin Erdogan put_bhs:
4099699d4f9STahsin Erdogan 	for (i = 0; i < bh_count; i++)
4109699d4f9STahsin Erdogan 		brelse(bhs[i]);
4119699d4f9STahsin Erdogan free_bhs:
4129699d4f9STahsin Erdogan 	if (bhs != bhs_inline)
4139699d4f9STahsin Erdogan 		kfree(bhs);
4149699d4f9STahsin Erdogan 	return ret;
415e50e5129SAndreas Dilger }
416e50e5129SAndreas Dilger 
417a6d05676STahsin Erdogan #define EXT4_XATTR_INODE_GET_PARENT(inode) ((__u32)(inode)->i_mtime.tv_sec)
418a6d05676STahsin Erdogan 
419bab79b04STahsin Erdogan static int ext4_xattr_inode_iget(struct inode *parent, unsigned long ea_ino,
420a6d05676STahsin Erdogan 				 u32 ea_inode_hash, struct inode **ea_inode)
421e50e5129SAndreas Dilger {
422bab79b04STahsin Erdogan 	struct inode *inode;
423bab79b04STahsin Erdogan 	int err;
424e50e5129SAndreas Dilger 
425*0f7bfd6fSBaokun Li 	/*
426*0f7bfd6fSBaokun Li 	 * We have to check for this corruption early as otherwise
427*0f7bfd6fSBaokun Li 	 * iget_locked() could wait indefinitely for the state of our
428*0f7bfd6fSBaokun Li 	 * parent inode.
429*0f7bfd6fSBaokun Li 	 */
430*0f7bfd6fSBaokun Li 	if (parent->i_ino == ea_ino) {
431*0f7bfd6fSBaokun Li 		ext4_error(parent->i_sb,
432*0f7bfd6fSBaokun Li 			   "Parent and EA inode have the same ino %lu", ea_ino);
433*0f7bfd6fSBaokun Li 		return -EFSCORRUPTED;
434*0f7bfd6fSBaokun Li 	}
435*0f7bfd6fSBaokun Li 
4368a363970STheodore Ts'o 	inode = ext4_iget(parent->i_sb, ea_ino, EXT4_IGET_NORMAL);
437bab79b04STahsin Erdogan 	if (IS_ERR(inode)) {
438bab79b04STahsin Erdogan 		err = PTR_ERR(inode);
439dec214d0STahsin Erdogan 		ext4_error(parent->i_sb,
440dec214d0STahsin Erdogan 			   "error while reading EA inode %lu err=%d", ea_ino,
441dec214d0STahsin Erdogan 			   err);
442bab79b04STahsin Erdogan 		return err;
443e50e5129SAndreas Dilger 	}
444e50e5129SAndreas Dilger 
445bab79b04STahsin Erdogan 	if (is_bad_inode(inode)) {
446dec214d0STahsin Erdogan 		ext4_error(parent->i_sb,
447dec214d0STahsin Erdogan 			   "error while reading EA inode %lu is_bad_inode",
448dec214d0STahsin Erdogan 			   ea_ino);
449bab79b04STahsin Erdogan 		err = -EIO;
450e50e5129SAndreas Dilger 		goto error;
451e50e5129SAndreas Dilger 	}
452e50e5129SAndreas Dilger 
453bab79b04STahsin Erdogan 	if (!(EXT4_I(inode)->i_flags & EXT4_EA_INODE_FL)) {
454dec214d0STahsin Erdogan 		ext4_error(parent->i_sb,
455dec214d0STahsin Erdogan 			   "EA inode %lu does not have EXT4_EA_INODE_FL flag",
456dec214d0STahsin Erdogan 			    ea_ino);
457bab79b04STahsin Erdogan 		err = -EINVAL;
458e50e5129SAndreas Dilger 		goto error;
459e50e5129SAndreas Dilger 	}
460e50e5129SAndreas Dilger 
461a6d05676STahsin Erdogan 	ext4_xattr_inode_set_class(inode);
462a6d05676STahsin Erdogan 
463a6d05676STahsin Erdogan 	/*
464a6d05676STahsin Erdogan 	 * Check whether this is an old Lustre-style xattr inode. Lustre
465a6d05676STahsin Erdogan 	 * implementation does not have hash validation, rather it has a
466a6d05676STahsin Erdogan 	 * backpointer from ea_inode to the parent inode.
467a6d05676STahsin Erdogan 	 */
468a6d05676STahsin Erdogan 	if (ea_inode_hash != ext4_xattr_inode_get_hash(inode) &&
469a6d05676STahsin Erdogan 	    EXT4_XATTR_INODE_GET_PARENT(inode) == parent->i_ino &&
470a6d05676STahsin Erdogan 	    inode->i_generation == parent->i_generation) {
471a6d05676STahsin Erdogan 		ext4_set_inode_state(inode, EXT4_STATE_LUSTRE_EA_INODE);
472a6d05676STahsin Erdogan 		ext4_xattr_inode_set_ref(inode, 1);
473a6d05676STahsin Erdogan 	} else {
474a6d05676STahsin Erdogan 		inode_lock(inode);
475a6d05676STahsin Erdogan 		inode->i_flags |= S_NOQUOTA;
476a6d05676STahsin Erdogan 		inode_unlock(inode);
477a6d05676STahsin Erdogan 	}
478a6d05676STahsin Erdogan 
479bab79b04STahsin Erdogan 	*ea_inode = inode;
480bab79b04STahsin Erdogan 	return 0;
481e50e5129SAndreas Dilger error:
482bab79b04STahsin Erdogan 	iput(inode);
483bab79b04STahsin Erdogan 	return err;
484e50e5129SAndreas Dilger }
485e50e5129SAndreas Dilger 
4866bc0d63dSJan Kara /* Remove entry from mbcache when EA inode is getting evicted */
4876bc0d63dSJan Kara void ext4_evict_ea_inode(struct inode *inode)
4886bc0d63dSJan Kara {
48965f8b800SJan Kara 	struct mb_cache_entry *oe;
49065f8b800SJan Kara 
49165f8b800SJan Kara 	if (!EA_INODE_CACHE(inode))
49265f8b800SJan Kara 		return;
49365f8b800SJan Kara 	/* Wait for entry to get unused so that we can remove it */
49465f8b800SJan Kara 	while ((oe = mb_cache_entry_delete_or_get(EA_INODE_CACHE(inode),
49565f8b800SJan Kara 			ext4_xattr_inode_get_hash(inode), inode->i_ino))) {
49665f8b800SJan Kara 		mb_cache_entry_wait_unused(oe);
49765f8b800SJan Kara 		mb_cache_entry_put(EA_INODE_CACHE(inode), oe);
49865f8b800SJan Kara 	}
4996bc0d63dSJan Kara }
5006bc0d63dSJan Kara 
501dec214d0STahsin Erdogan static int
502b9fc761eSTahsin Erdogan ext4_xattr_inode_verify_hashes(struct inode *ea_inode,
503b9fc761eSTahsin Erdogan 			       struct ext4_xattr_entry *entry, void *buffer,
504b9fc761eSTahsin Erdogan 			       size_t size)
505dec214d0STahsin Erdogan {
506dec214d0STahsin Erdogan 	u32 hash;
507dec214d0STahsin Erdogan 
508dec214d0STahsin Erdogan 	/* Verify stored hash matches calculated hash. */
509dec214d0STahsin Erdogan 	hash = ext4_xattr_inode_hash(EXT4_SB(ea_inode->i_sb), buffer, size);
510dec214d0STahsin Erdogan 	if (hash != ext4_xattr_inode_get_hash(ea_inode))
511dec214d0STahsin Erdogan 		return -EFSCORRUPTED;
512b9fc761eSTahsin Erdogan 
513b9fc761eSTahsin Erdogan 	if (entry) {
514b9fc761eSTahsin Erdogan 		__le32 e_hash, tmp_data;
515b9fc761eSTahsin Erdogan 
516b9fc761eSTahsin Erdogan 		/* Verify entry hash. */
517b9fc761eSTahsin Erdogan 		tmp_data = cpu_to_le32(hash);
518b9fc761eSTahsin Erdogan 		e_hash = ext4_xattr_hash_entry(entry->e_name, entry->e_name_len,
519b9fc761eSTahsin Erdogan 					       &tmp_data, 1);
520f3bbac32SLinus Torvalds 		/* All good? */
521f3bbac32SLinus Torvalds 		if (e_hash == entry->e_hash)
522f3bbac32SLinus Torvalds 			return 0;
523f3bbac32SLinus Torvalds 
524f3bbac32SLinus Torvalds 		/*
525f3bbac32SLinus Torvalds 		 * Not good. Maybe the entry hash was calculated
526f3bbac32SLinus Torvalds 		 * using the buggy signed char version?
527f3bbac32SLinus Torvalds 		 */
528f3bbac32SLinus Torvalds 		e_hash = ext4_xattr_hash_entry_signed(entry->e_name, entry->e_name_len,
529f3bbac32SLinus Torvalds 							&tmp_data, 1);
530f3bbac32SLinus Torvalds 		if (e_hash == entry->e_hash)
531f3bbac32SLinus Torvalds 			return 0;
532f3bbac32SLinus Torvalds 
533f3bbac32SLinus Torvalds 		/* Still no match - bad */
534b9fc761eSTahsin Erdogan 		return -EFSCORRUPTED;
535b9fc761eSTahsin Erdogan 	}
536dec214d0STahsin Erdogan 	return 0;
537dec214d0STahsin Erdogan }
538dec214d0STahsin Erdogan 
539e50e5129SAndreas Dilger /*
540b9fc761eSTahsin Erdogan  * Read xattr value from the EA inode.
541e50e5129SAndreas Dilger  */
542e50e5129SAndreas Dilger static int
543b9fc761eSTahsin Erdogan ext4_xattr_inode_get(struct inode *inode, struct ext4_xattr_entry *entry,
544b9fc761eSTahsin Erdogan 		     void *buffer, size_t size)
545e50e5129SAndreas Dilger {
546dec214d0STahsin Erdogan 	struct mb_cache *ea_inode_cache = EA_INODE_CACHE(inode);
547bab79b04STahsin Erdogan 	struct inode *ea_inode;
548dec214d0STahsin Erdogan 	int err;
549e50e5129SAndreas Dilger 
550b9fc761eSTahsin Erdogan 	err = ext4_xattr_inode_iget(inode, le32_to_cpu(entry->e_value_inum),
551a6d05676STahsin Erdogan 				    le32_to_cpu(entry->e_hash), &ea_inode);
552dec214d0STahsin Erdogan 	if (err) {
553dec214d0STahsin Erdogan 		ea_inode = NULL;
554dec214d0STahsin Erdogan 		goto out;
555dec214d0STahsin Erdogan 	}
556e50e5129SAndreas Dilger 
557dec214d0STahsin Erdogan 	if (i_size_read(ea_inode) != size) {
558dec214d0STahsin Erdogan 		ext4_warning_inode(ea_inode,
559dec214d0STahsin Erdogan 				   "ea_inode file size=%llu entry size=%zu",
560dec214d0STahsin Erdogan 				   i_size_read(ea_inode), size);
561dec214d0STahsin Erdogan 		err = -EFSCORRUPTED;
562dec214d0STahsin Erdogan 		goto out;
563dec214d0STahsin Erdogan 	}
564dec214d0STahsin Erdogan 
565dec214d0STahsin Erdogan 	err = ext4_xattr_inode_read(ea_inode, buffer, size);
566dec214d0STahsin Erdogan 	if (err)
567dec214d0STahsin Erdogan 		goto out;
568dec214d0STahsin Erdogan 
569a6d05676STahsin Erdogan 	if (!ext4_test_inode_state(ea_inode, EXT4_STATE_LUSTRE_EA_INODE)) {
570a6d05676STahsin Erdogan 		err = ext4_xattr_inode_verify_hashes(ea_inode, entry, buffer,
571a6d05676STahsin Erdogan 						     size);
572a6d05676STahsin Erdogan 		if (err) {
573dec214d0STahsin Erdogan 			ext4_warning_inode(ea_inode,
574dec214d0STahsin Erdogan 					   "EA inode hash validation failed");
575dec214d0STahsin Erdogan 			goto out;
576dec214d0STahsin Erdogan 		}
577dec214d0STahsin Erdogan 
578dec214d0STahsin Erdogan 		if (ea_inode_cache)
579dec214d0STahsin Erdogan 			mb_cache_entry_create(ea_inode_cache, GFP_NOFS,
580dec214d0STahsin Erdogan 					ext4_xattr_inode_get_hash(ea_inode),
581dec214d0STahsin Erdogan 					ea_inode->i_ino, true /* reusable */);
582a6d05676STahsin Erdogan 	}
583dec214d0STahsin Erdogan out:
584e50e5129SAndreas Dilger 	iput(ea_inode);
585dec214d0STahsin Erdogan 	return err;
586e50e5129SAndreas Dilger }
587e50e5129SAndreas Dilger 
588ac27a0ecSDave Kleikamp static int
589617ba13bSMingming Cao ext4_xattr_block_get(struct inode *inode, int name_index, const char *name,
590ac27a0ecSDave Kleikamp 		     void *buffer, size_t buffer_size)
591ac27a0ecSDave Kleikamp {
592ac27a0ecSDave Kleikamp 	struct buffer_head *bh = NULL;
593617ba13bSMingming Cao 	struct ext4_xattr_entry *entry;
594ac27a0ecSDave Kleikamp 	size_t size;
5959496005dSTheodore Ts'o 	void *end;
596ac27a0ecSDave Kleikamp 	int error;
59747387409STahsin Erdogan 	struct mb_cache *ea_block_cache = EA_BLOCK_CACHE(inode);
598ac27a0ecSDave Kleikamp 
599ac27a0ecSDave Kleikamp 	ea_idebug(inode, "name=%d.%s, buffer=%p, buffer_size=%ld",
600ac27a0ecSDave Kleikamp 		  name_index, name, buffer, (long)buffer_size);
601ac27a0ecSDave Kleikamp 
602617ba13bSMingming Cao 	if (!EXT4_I(inode)->i_file_acl)
603fb265c9cSTheodore Ts'o 		return -ENODATA;
604ace36ad4SJoe Perches 	ea_idebug(inode, "reading block %llu",
605ace36ad4SJoe Perches 		  (unsigned long long)EXT4_I(inode)->i_file_acl);
606fb265c9cSTheodore Ts'o 	bh = ext4_sb_bread(inode->i_sb, EXT4_I(inode)->i_file_acl, REQ_PRIO);
607fb265c9cSTheodore Ts'o 	if (IS_ERR(bh))
608fb265c9cSTheodore Ts'o 		return PTR_ERR(bh);
609ac27a0ecSDave Kleikamp 	ea_bdebug(bh, "b_count=%d, refcount=%d",
610ac27a0ecSDave Kleikamp 		atomic_read(&(bh->b_count)), le32_to_cpu(BHDR(bh)->h_refcount));
611de05ca85STheodore Ts'o 	error = ext4_xattr_check_block(inode, bh);
612de05ca85STheodore Ts'o 	if (error)
613ac27a0ecSDave Kleikamp 		goto cleanup;
61447387409STahsin Erdogan 	ext4_xattr_block_cache_insert(ea_block_cache, bh);
615ac27a0ecSDave Kleikamp 	entry = BFIRST(bh);
6169496005dSTheodore Ts'o 	end = bh->b_data + bh->b_size;
6179496005dSTheodore Ts'o 	error = xattr_find_entry(inode, &entry, end, name_index, name, 1);
618ac27a0ecSDave Kleikamp 	if (error)
619ac27a0ecSDave Kleikamp 		goto cleanup;
620ac27a0ecSDave Kleikamp 	size = le32_to_cpu(entry->e_value_size);
621ac27a0ecSDave Kleikamp 	error = -ERANGE;
62254dd0e0aSTheodore Ts'o 	if (unlikely(size > EXT4_XATTR_SIZE_MAX))
62354dd0e0aSTheodore Ts'o 		goto cleanup;
62454dd0e0aSTheodore Ts'o 	if (buffer) {
625ac27a0ecSDave Kleikamp 		if (size > buffer_size)
626ac27a0ecSDave Kleikamp 			goto cleanup;
627e50e5129SAndreas Dilger 		if (entry->e_value_inum) {
628b9fc761eSTahsin Erdogan 			error = ext4_xattr_inode_get(inode, entry, buffer,
629b9fc761eSTahsin Erdogan 						     size);
630e50e5129SAndreas Dilger 			if (error)
631e50e5129SAndreas Dilger 				goto cleanup;
632e50e5129SAndreas Dilger 		} else {
63354dd0e0aSTheodore Ts'o 			u16 offset = le16_to_cpu(entry->e_value_offs);
63454dd0e0aSTheodore Ts'o 			void *p = bh->b_data + offset;
63554dd0e0aSTheodore Ts'o 
63654dd0e0aSTheodore Ts'o 			if (unlikely(p + size > end))
63754dd0e0aSTheodore Ts'o 				goto cleanup;
63854dd0e0aSTheodore Ts'o 			memcpy(buffer, p, size);
639e50e5129SAndreas Dilger 		}
640ac27a0ecSDave Kleikamp 	}
641ac27a0ecSDave Kleikamp 	error = size;
642ac27a0ecSDave Kleikamp 
643ac27a0ecSDave Kleikamp cleanup:
644ac27a0ecSDave Kleikamp 	brelse(bh);
645ac27a0ecSDave Kleikamp 	return error;
646ac27a0ecSDave Kleikamp }
647ac27a0ecSDave Kleikamp 
648879b3825STao Ma int
649617ba13bSMingming Cao ext4_xattr_ibody_get(struct inode *inode, int name_index, const char *name,
650ac27a0ecSDave Kleikamp 		     void *buffer, size_t buffer_size)
651ac27a0ecSDave Kleikamp {
652617ba13bSMingming Cao 	struct ext4_xattr_ibody_header *header;
653617ba13bSMingming Cao 	struct ext4_xattr_entry *entry;
654617ba13bSMingming Cao 	struct ext4_inode *raw_inode;
655617ba13bSMingming Cao 	struct ext4_iloc iloc;
656ac27a0ecSDave Kleikamp 	size_t size;
657ac27a0ecSDave Kleikamp 	void *end;
658ac27a0ecSDave Kleikamp 	int error;
659ac27a0ecSDave Kleikamp 
66019f5fb7aSTheodore Ts'o 	if (!ext4_test_inode_state(inode, EXT4_STATE_XATTR))
661ac27a0ecSDave Kleikamp 		return -ENODATA;
662617ba13bSMingming Cao 	error = ext4_get_inode_loc(inode, &iloc);
663ac27a0ecSDave Kleikamp 	if (error)
664ac27a0ecSDave Kleikamp 		return error;
665617ba13bSMingming Cao 	raw_inode = ext4_raw_inode(&iloc);
666ac27a0ecSDave Kleikamp 	header = IHDR(inode, raw_inode);
667617ba13bSMingming Cao 	end = (void *)raw_inode + EXT4_SB(inode->i_sb)->s_inode_size;
6689e92f48cSTheodore Ts'o 	error = xattr_check_inode(inode, header, end);
669ac27a0ecSDave Kleikamp 	if (error)
670ac27a0ecSDave Kleikamp 		goto cleanup;
6716ba644b9SEric Biggers 	entry = IFIRST(header);
6729496005dSTheodore Ts'o 	error = xattr_find_entry(inode, &entry, end, name_index, name, 0);
673ac27a0ecSDave Kleikamp 	if (error)
674ac27a0ecSDave Kleikamp 		goto cleanup;
675ac27a0ecSDave Kleikamp 	size = le32_to_cpu(entry->e_value_size);
676ac27a0ecSDave Kleikamp 	error = -ERANGE;
67754dd0e0aSTheodore Ts'o 	if (unlikely(size > EXT4_XATTR_SIZE_MAX))
67854dd0e0aSTheodore Ts'o 		goto cleanup;
67954dd0e0aSTheodore Ts'o 	if (buffer) {
680ac27a0ecSDave Kleikamp 		if (size > buffer_size)
681ac27a0ecSDave Kleikamp 			goto cleanup;
682e50e5129SAndreas Dilger 		if (entry->e_value_inum) {
683b9fc761eSTahsin Erdogan 			error = ext4_xattr_inode_get(inode, entry, buffer,
684b9fc761eSTahsin Erdogan 						     size);
685e50e5129SAndreas Dilger 			if (error)
686e50e5129SAndreas Dilger 				goto cleanup;
687e50e5129SAndreas Dilger 		} else {
68854dd0e0aSTheodore Ts'o 			u16 offset = le16_to_cpu(entry->e_value_offs);
68954dd0e0aSTheodore Ts'o 			void *p = (void *)IFIRST(header) + offset;
69054dd0e0aSTheodore Ts'o 
69154dd0e0aSTheodore Ts'o 			if (unlikely(p + size > end))
69254dd0e0aSTheodore Ts'o 				goto cleanup;
69354dd0e0aSTheodore Ts'o 			memcpy(buffer, p, size);
694ac27a0ecSDave Kleikamp 		}
695e50e5129SAndreas Dilger 	}
696ac27a0ecSDave Kleikamp 	error = size;
697ac27a0ecSDave Kleikamp 
698ac27a0ecSDave Kleikamp cleanup:
699ac27a0ecSDave Kleikamp 	brelse(iloc.bh);
700ac27a0ecSDave Kleikamp 	return error;
701ac27a0ecSDave Kleikamp }
702ac27a0ecSDave Kleikamp 
703ac27a0ecSDave Kleikamp /*
704617ba13bSMingming Cao  * ext4_xattr_get()
705ac27a0ecSDave Kleikamp  *
706ac27a0ecSDave Kleikamp  * Copy an extended attribute into the buffer
707ac27a0ecSDave Kleikamp  * provided, or compute the buffer size required.
708ac27a0ecSDave Kleikamp  * Buffer is NULL to compute the size of the buffer required.
709ac27a0ecSDave Kleikamp  *
710ac27a0ecSDave Kleikamp  * Returns a negative error number on failure, or the number of bytes
711ac27a0ecSDave Kleikamp  * used / required on success.
712ac27a0ecSDave Kleikamp  */
713ac27a0ecSDave Kleikamp int
714617ba13bSMingming Cao ext4_xattr_get(struct inode *inode, int name_index, const char *name,
715ac27a0ecSDave Kleikamp 	       void *buffer, size_t buffer_size)
716ac27a0ecSDave Kleikamp {
717ac27a0ecSDave Kleikamp 	int error;
718ac27a0ecSDave Kleikamp 
7190db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
7200db1ff22STheodore Ts'o 		return -EIO;
7210db1ff22STheodore Ts'o 
722230b8c1aSZhang Zhen 	if (strlen(name) > 255)
723230b8c1aSZhang Zhen 		return -ERANGE;
724230b8c1aSZhang Zhen 
725617ba13bSMingming Cao 	down_read(&EXT4_I(inode)->xattr_sem);
726617ba13bSMingming Cao 	error = ext4_xattr_ibody_get(inode, name_index, name, buffer,
727ac27a0ecSDave Kleikamp 				     buffer_size);
728ac27a0ecSDave Kleikamp 	if (error == -ENODATA)
729617ba13bSMingming Cao 		error = ext4_xattr_block_get(inode, name_index, name, buffer,
730ac27a0ecSDave Kleikamp 					     buffer_size);
731617ba13bSMingming Cao 	up_read(&EXT4_I(inode)->xattr_sem);
732ac27a0ecSDave Kleikamp 	return error;
733ac27a0ecSDave Kleikamp }
734ac27a0ecSDave Kleikamp 
735ac27a0ecSDave Kleikamp static int
736431547b3SChristoph Hellwig ext4_xattr_list_entries(struct dentry *dentry, struct ext4_xattr_entry *entry,
737ac27a0ecSDave Kleikamp 			char *buffer, size_t buffer_size)
738ac27a0ecSDave Kleikamp {
739ac27a0ecSDave Kleikamp 	size_t rest = buffer_size;
740ac27a0ecSDave Kleikamp 
741617ba13bSMingming Cao 	for (; !IS_LAST_ENTRY(entry); entry = EXT4_XATTR_NEXT(entry)) {
74211e27528SStephen Hemminger 		const struct xattr_handler *handler =
743617ba13bSMingming Cao 			ext4_xattr_handler(entry->e_name_index);
744ac27a0ecSDave Kleikamp 
745764a5c6bSAndreas Gruenbacher 		if (handler && (!handler->list || handler->list(dentry))) {
746764a5c6bSAndreas Gruenbacher 			const char *prefix = handler->prefix ?: handler->name;
747764a5c6bSAndreas Gruenbacher 			size_t prefix_len = strlen(prefix);
748764a5c6bSAndreas Gruenbacher 			size_t size = prefix_len + entry->e_name_len + 1;
749764a5c6bSAndreas Gruenbacher 
750ac27a0ecSDave Kleikamp 			if (buffer) {
751ac27a0ecSDave Kleikamp 				if (size > rest)
752ac27a0ecSDave Kleikamp 					return -ERANGE;
753764a5c6bSAndreas Gruenbacher 				memcpy(buffer, prefix, prefix_len);
754764a5c6bSAndreas Gruenbacher 				buffer += prefix_len;
755764a5c6bSAndreas Gruenbacher 				memcpy(buffer, entry->e_name, entry->e_name_len);
756764a5c6bSAndreas Gruenbacher 				buffer += entry->e_name_len;
757764a5c6bSAndreas Gruenbacher 				*buffer++ = 0;
758ac27a0ecSDave Kleikamp 			}
759ac27a0ecSDave Kleikamp 			rest -= size;
760ac27a0ecSDave Kleikamp 		}
761ac27a0ecSDave Kleikamp 	}
762764a5c6bSAndreas Gruenbacher 	return buffer_size - rest;  /* total size */
763ac27a0ecSDave Kleikamp }
764ac27a0ecSDave Kleikamp 
765ac27a0ecSDave Kleikamp static int
766431547b3SChristoph Hellwig ext4_xattr_block_list(struct dentry *dentry, char *buffer, size_t buffer_size)
767ac27a0ecSDave Kleikamp {
7682b0143b5SDavid Howells 	struct inode *inode = d_inode(dentry);
769ac27a0ecSDave Kleikamp 	struct buffer_head *bh = NULL;
770ac27a0ecSDave Kleikamp 	int error;
771ac27a0ecSDave Kleikamp 
772ac27a0ecSDave Kleikamp 	ea_idebug(inode, "buffer=%p, buffer_size=%ld",
773ac27a0ecSDave Kleikamp 		  buffer, (long)buffer_size);
774ac27a0ecSDave Kleikamp 
775617ba13bSMingming Cao 	if (!EXT4_I(inode)->i_file_acl)
776fb265c9cSTheodore Ts'o 		return 0;
777ace36ad4SJoe Perches 	ea_idebug(inode, "reading block %llu",
778ace36ad4SJoe Perches 		  (unsigned long long)EXT4_I(inode)->i_file_acl);
779fb265c9cSTheodore Ts'o 	bh = ext4_sb_bread(inode->i_sb, EXT4_I(inode)->i_file_acl, REQ_PRIO);
780fb265c9cSTheodore Ts'o 	if (IS_ERR(bh))
781fb265c9cSTheodore Ts'o 		return PTR_ERR(bh);
782ac27a0ecSDave Kleikamp 	ea_bdebug(bh, "b_count=%d, refcount=%d",
783ac27a0ecSDave Kleikamp 		atomic_read(&(bh->b_count)), le32_to_cpu(BHDR(bh)->h_refcount));
784de05ca85STheodore Ts'o 	error = ext4_xattr_check_block(inode, bh);
785de05ca85STheodore Ts'o 	if (error)
786ac27a0ecSDave Kleikamp 		goto cleanup;
78747387409STahsin Erdogan 	ext4_xattr_block_cache_insert(EA_BLOCK_CACHE(inode), bh);
788fb265c9cSTheodore Ts'o 	error = ext4_xattr_list_entries(dentry, BFIRST(bh), buffer,
789fb265c9cSTheodore Ts'o 					buffer_size);
790ac27a0ecSDave Kleikamp cleanup:
791ac27a0ecSDave Kleikamp 	brelse(bh);
792ac27a0ecSDave Kleikamp 	return error;
793ac27a0ecSDave Kleikamp }
794ac27a0ecSDave Kleikamp 
795ac27a0ecSDave Kleikamp static int
796431547b3SChristoph Hellwig ext4_xattr_ibody_list(struct dentry *dentry, char *buffer, size_t buffer_size)
797ac27a0ecSDave Kleikamp {
7982b0143b5SDavid Howells 	struct inode *inode = d_inode(dentry);
799617ba13bSMingming Cao 	struct ext4_xattr_ibody_header *header;
800617ba13bSMingming Cao 	struct ext4_inode *raw_inode;
801617ba13bSMingming Cao 	struct ext4_iloc iloc;
802ac27a0ecSDave Kleikamp 	void *end;
803ac27a0ecSDave Kleikamp 	int error;
804ac27a0ecSDave Kleikamp 
80519f5fb7aSTheodore Ts'o 	if (!ext4_test_inode_state(inode, EXT4_STATE_XATTR))
806ac27a0ecSDave Kleikamp 		return 0;
807617ba13bSMingming Cao 	error = ext4_get_inode_loc(inode, &iloc);
808ac27a0ecSDave Kleikamp 	if (error)
809ac27a0ecSDave Kleikamp 		return error;
810617ba13bSMingming Cao 	raw_inode = ext4_raw_inode(&iloc);
811ac27a0ecSDave Kleikamp 	header = IHDR(inode, raw_inode);
812617ba13bSMingming Cao 	end = (void *)raw_inode + EXT4_SB(inode->i_sb)->s_inode_size;
8139e92f48cSTheodore Ts'o 	error = xattr_check_inode(inode, header, end);
814ac27a0ecSDave Kleikamp 	if (error)
815ac27a0ecSDave Kleikamp 		goto cleanup;
816431547b3SChristoph Hellwig 	error = ext4_xattr_list_entries(dentry, IFIRST(header),
817ac27a0ecSDave Kleikamp 					buffer, buffer_size);
818ac27a0ecSDave Kleikamp 
819ac27a0ecSDave Kleikamp cleanup:
820ac27a0ecSDave Kleikamp 	brelse(iloc.bh);
821ac27a0ecSDave Kleikamp 	return error;
822ac27a0ecSDave Kleikamp }
823ac27a0ecSDave Kleikamp 
824ac27a0ecSDave Kleikamp /*
825ba7ea1d8SEric Biggers  * Inode operation listxattr()
826ba7ea1d8SEric Biggers  *
827ba7ea1d8SEric Biggers  * d_inode(dentry)->i_rwsem: don't care
828ac27a0ecSDave Kleikamp  *
829ac27a0ecSDave Kleikamp  * Copy a list of attribute names into the buffer
830ac27a0ecSDave Kleikamp  * provided, or compute the buffer size required.
831ac27a0ecSDave Kleikamp  * Buffer is NULL to compute the size of the buffer required.
832ac27a0ecSDave Kleikamp  *
833ac27a0ecSDave Kleikamp  * Returns a negative error number on failure, or the number of bytes
834ac27a0ecSDave Kleikamp  * used / required on success.
835ac27a0ecSDave Kleikamp  */
836ba7ea1d8SEric Biggers ssize_t
837ba7ea1d8SEric Biggers ext4_listxattr(struct dentry *dentry, char *buffer, size_t buffer_size)
838ac27a0ecSDave Kleikamp {
839eaeef867STheodore Ts'o 	int ret, ret2;
840ac27a0ecSDave Kleikamp 
8412b0143b5SDavid Howells 	down_read(&EXT4_I(d_inode(dentry))->xattr_sem);
842eaeef867STheodore Ts'o 	ret = ret2 = ext4_xattr_ibody_list(dentry, buffer, buffer_size);
843eaeef867STheodore Ts'o 	if (ret < 0)
844eaeef867STheodore Ts'o 		goto errout;
845ac27a0ecSDave Kleikamp 	if (buffer) {
846eaeef867STheodore Ts'o 		buffer += ret;
847eaeef867STheodore Ts'o 		buffer_size -= ret;
848ac27a0ecSDave Kleikamp 	}
849eaeef867STheodore Ts'o 	ret = ext4_xattr_block_list(dentry, buffer, buffer_size);
850eaeef867STheodore Ts'o 	if (ret < 0)
851eaeef867STheodore Ts'o 		goto errout;
852eaeef867STheodore Ts'o 	ret += ret2;
853eaeef867STheodore Ts'o errout:
8542b0143b5SDavid Howells 	up_read(&EXT4_I(d_inode(dentry))->xattr_sem);
855eaeef867STheodore Ts'o 	return ret;
856ac27a0ecSDave Kleikamp }
857ac27a0ecSDave Kleikamp 
858ac27a0ecSDave Kleikamp /*
859617ba13bSMingming Cao  * If the EXT4_FEATURE_COMPAT_EXT_ATTR feature of this file system is
860ac27a0ecSDave Kleikamp  * not set, set it.
861ac27a0ecSDave Kleikamp  */
862617ba13bSMingming Cao static void ext4_xattr_update_super_block(handle_t *handle,
863ac27a0ecSDave Kleikamp 					  struct super_block *sb)
864ac27a0ecSDave Kleikamp {
865e2b911c5SDarrick J. Wong 	if (ext4_has_feature_xattr(sb))
866ac27a0ecSDave Kleikamp 		return;
867ac27a0ecSDave Kleikamp 
8685d601255Sliang xie 	BUFFER_TRACE(EXT4_SB(sb)->s_sbh, "get_write_access");
869188c299eSJan Kara 	if (ext4_journal_get_write_access(handle, sb, EXT4_SB(sb)->s_sbh,
870188c299eSJan Kara 					  EXT4_JTR_NONE) == 0) {
87105c2c00fSJan Kara 		lock_buffer(EXT4_SB(sb)->s_sbh);
872e2b911c5SDarrick J. Wong 		ext4_set_feature_xattr(sb);
87305c2c00fSJan Kara 		ext4_superblock_csum_set(sb);
87405c2c00fSJan Kara 		unlock_buffer(EXT4_SB(sb)->s_sbh);
875a3f5cf14SJan Kara 		ext4_handle_dirty_metadata(handle, NULL, EXT4_SB(sb)->s_sbh);
876ac27a0ecSDave Kleikamp 	}
877ac27a0ecSDave Kleikamp }
878ac27a0ecSDave Kleikamp 
8797a9ca53aSTahsin Erdogan int ext4_get_inode_usage(struct inode *inode, qsize_t *usage)
8807a9ca53aSTahsin Erdogan {
8817a9ca53aSTahsin Erdogan 	struct ext4_iloc iloc = { .bh = NULL };
8827a9ca53aSTahsin Erdogan 	struct buffer_head *bh = NULL;
8837a9ca53aSTahsin Erdogan 	struct ext4_inode *raw_inode;
8847a9ca53aSTahsin Erdogan 	struct ext4_xattr_ibody_header *header;
8857a9ca53aSTahsin Erdogan 	struct ext4_xattr_entry *entry;
8867a9ca53aSTahsin Erdogan 	qsize_t ea_inode_refs = 0;
8877a9ca53aSTahsin Erdogan 	void *end;
8887a9ca53aSTahsin Erdogan 	int ret;
8897a9ca53aSTahsin Erdogan 
8907a9ca53aSTahsin Erdogan 	lockdep_assert_held_read(&EXT4_I(inode)->xattr_sem);
8917a9ca53aSTahsin Erdogan 
8927a9ca53aSTahsin Erdogan 	if (ext4_test_inode_state(inode, EXT4_STATE_XATTR)) {
8937a9ca53aSTahsin Erdogan 		ret = ext4_get_inode_loc(inode, &iloc);
8947a9ca53aSTahsin Erdogan 		if (ret)
8957a9ca53aSTahsin Erdogan 			goto out;
8967a9ca53aSTahsin Erdogan 		raw_inode = ext4_raw_inode(&iloc);
8977a9ca53aSTahsin Erdogan 		header = IHDR(inode, raw_inode);
8987a9ca53aSTahsin Erdogan 		end = (void *)raw_inode + EXT4_SB(inode->i_sb)->s_inode_size;
8997a9ca53aSTahsin Erdogan 		ret = xattr_check_inode(inode, header, end);
9007a9ca53aSTahsin Erdogan 		if (ret)
9017a9ca53aSTahsin Erdogan 			goto out;
9027a9ca53aSTahsin Erdogan 
9037a9ca53aSTahsin Erdogan 		for (entry = IFIRST(header); !IS_LAST_ENTRY(entry);
9047a9ca53aSTahsin Erdogan 		     entry = EXT4_XATTR_NEXT(entry))
9057a9ca53aSTahsin Erdogan 			if (entry->e_value_inum)
9067a9ca53aSTahsin Erdogan 				ea_inode_refs++;
9077a9ca53aSTahsin Erdogan 	}
9087a9ca53aSTahsin Erdogan 
9097a9ca53aSTahsin Erdogan 	if (EXT4_I(inode)->i_file_acl) {
910fb265c9cSTheodore Ts'o 		bh = ext4_sb_bread(inode->i_sb, EXT4_I(inode)->i_file_acl, REQ_PRIO);
911fb265c9cSTheodore Ts'o 		if (IS_ERR(bh)) {
912fb265c9cSTheodore Ts'o 			ret = PTR_ERR(bh);
9137159a986SDan Carpenter 			bh = NULL;
9147a9ca53aSTahsin Erdogan 			goto out;
9157a9ca53aSTahsin Erdogan 		}
9167a9ca53aSTahsin Erdogan 
917de05ca85STheodore Ts'o 		ret = ext4_xattr_check_block(inode, bh);
918de05ca85STheodore Ts'o 		if (ret)
9197a9ca53aSTahsin Erdogan 			goto out;
9207a9ca53aSTahsin Erdogan 
9217a9ca53aSTahsin Erdogan 		for (entry = BFIRST(bh); !IS_LAST_ENTRY(entry);
9227a9ca53aSTahsin Erdogan 		     entry = EXT4_XATTR_NEXT(entry))
9237a9ca53aSTahsin Erdogan 			if (entry->e_value_inum)
9247a9ca53aSTahsin Erdogan 				ea_inode_refs++;
9257a9ca53aSTahsin Erdogan 	}
9267a9ca53aSTahsin Erdogan 	*usage = ea_inode_refs + 1;
9277a9ca53aSTahsin Erdogan 	ret = 0;
9287a9ca53aSTahsin Erdogan out:
9297a9ca53aSTahsin Erdogan 	brelse(iloc.bh);
9307a9ca53aSTahsin Erdogan 	brelse(bh);
9317a9ca53aSTahsin Erdogan 	return ret;
9327a9ca53aSTahsin Erdogan }
9337a9ca53aSTahsin Erdogan 
934dec214d0STahsin Erdogan static inline size_t round_up_cluster(struct inode *inode, size_t length)
935dec214d0STahsin Erdogan {
936dec214d0STahsin Erdogan 	struct super_block *sb = inode->i_sb;
937dec214d0STahsin Erdogan 	size_t cluster_size = 1 << (EXT4_SB(sb)->s_cluster_bits +
938dec214d0STahsin Erdogan 				    inode->i_blkbits);
939dec214d0STahsin Erdogan 	size_t mask = ~(cluster_size - 1);
940dec214d0STahsin Erdogan 
941dec214d0STahsin Erdogan 	return (length + cluster_size - 1) & mask;
942dec214d0STahsin Erdogan }
943dec214d0STahsin Erdogan 
944dec214d0STahsin Erdogan static int ext4_xattr_inode_alloc_quota(struct inode *inode, size_t len)
945dec214d0STahsin Erdogan {
946dec214d0STahsin Erdogan 	int err;
947dec214d0STahsin Erdogan 
948dec214d0STahsin Erdogan 	err = dquot_alloc_inode(inode);
949dec214d0STahsin Erdogan 	if (err)
950dec214d0STahsin Erdogan 		return err;
951dec214d0STahsin Erdogan 	err = dquot_alloc_space_nodirty(inode, round_up_cluster(inode, len));
952dec214d0STahsin Erdogan 	if (err)
953dec214d0STahsin Erdogan 		dquot_free_inode(inode);
954dec214d0STahsin Erdogan 	return err;
955dec214d0STahsin Erdogan }
956dec214d0STahsin Erdogan 
957a6d05676STahsin Erdogan static void ext4_xattr_inode_free_quota(struct inode *parent,
958a6d05676STahsin Erdogan 					struct inode *ea_inode,
959a6d05676STahsin Erdogan 					size_t len)
960dec214d0STahsin Erdogan {
961a6d05676STahsin Erdogan 	if (ea_inode &&
962a6d05676STahsin Erdogan 	    ext4_test_inode_state(ea_inode, EXT4_STATE_LUSTRE_EA_INODE))
963a6d05676STahsin Erdogan 		return;
964a6d05676STahsin Erdogan 	dquot_free_space_nodirty(parent, round_up_cluster(parent, len));
965a6d05676STahsin Erdogan 	dquot_free_inode(parent);
966dec214d0STahsin Erdogan }
967dec214d0STahsin Erdogan 
968af65207cSTahsin Erdogan int __ext4_xattr_set_credits(struct super_block *sb, struct inode *inode,
969af65207cSTahsin Erdogan 			     struct buffer_head *block_bh, size_t value_len,
970af65207cSTahsin Erdogan 			     bool is_create)
971dec214d0STahsin Erdogan {
972dec214d0STahsin Erdogan 	int credits;
973dec214d0STahsin Erdogan 	int blocks;
974dec214d0STahsin Erdogan 
975dec214d0STahsin Erdogan 	/*
976dec214d0STahsin Erdogan 	 * 1) Owner inode update
977dec214d0STahsin Erdogan 	 * 2) Ref count update on old xattr block
978dec214d0STahsin Erdogan 	 * 3) new xattr block
979dec214d0STahsin Erdogan 	 * 4) block bitmap update for new xattr block
980dec214d0STahsin Erdogan 	 * 5) group descriptor for new xattr block
981dec214d0STahsin Erdogan 	 * 6) block bitmap update for old xattr block
982dec214d0STahsin Erdogan 	 * 7) group descriptor for old block
983dec214d0STahsin Erdogan 	 *
984dec214d0STahsin Erdogan 	 * 6 & 7 can happen if we have two racing threads T_a and T_b
985dec214d0STahsin Erdogan 	 * which are each trying to set an xattr on inodes I_a and I_b
986dec214d0STahsin Erdogan 	 * which were both initially sharing an xattr block.
987dec214d0STahsin Erdogan 	 */
988dec214d0STahsin Erdogan 	credits = 7;
989dec214d0STahsin Erdogan 
990dec214d0STahsin Erdogan 	/* Quota updates. */
991dec214d0STahsin Erdogan 	credits += EXT4_MAXQUOTAS_TRANS_BLOCKS(sb);
992dec214d0STahsin Erdogan 
993dec214d0STahsin Erdogan 	/*
994dec214d0STahsin Erdogan 	 * In case of inline data, we may push out the data to a block,
995dec214d0STahsin Erdogan 	 * so we need to reserve credits for this eventuality
996dec214d0STahsin Erdogan 	 */
997af65207cSTahsin Erdogan 	if (inode && ext4_has_inline_data(inode))
998dec214d0STahsin Erdogan 		credits += ext4_writepage_trans_blocks(inode) + 1;
999dec214d0STahsin Erdogan 
1000dec214d0STahsin Erdogan 	/* We are done if ea_inode feature is not enabled. */
1001dec214d0STahsin Erdogan 	if (!ext4_has_feature_ea_inode(sb))
1002dec214d0STahsin Erdogan 		return credits;
1003dec214d0STahsin Erdogan 
1004dec214d0STahsin Erdogan 	/* New ea_inode, inode map, block bitmap, group descriptor. */
1005dec214d0STahsin Erdogan 	credits += 4;
1006dec214d0STahsin Erdogan 
1007dec214d0STahsin Erdogan 	/* Data blocks. */
1008dec214d0STahsin Erdogan 	blocks = (value_len + sb->s_blocksize - 1) >> sb->s_blocksize_bits;
1009dec214d0STahsin Erdogan 
1010dec214d0STahsin Erdogan 	/* Indirection block or one level of extent tree. */
1011dec214d0STahsin Erdogan 	blocks += 1;
1012dec214d0STahsin Erdogan 
1013dec214d0STahsin Erdogan 	/* Block bitmap and group descriptor updates for each block. */
1014dec214d0STahsin Erdogan 	credits += blocks * 2;
1015dec214d0STahsin Erdogan 
1016dec214d0STahsin Erdogan 	/* Blocks themselves. */
1017dec214d0STahsin Erdogan 	credits += blocks;
1018dec214d0STahsin Erdogan 
1019af65207cSTahsin Erdogan 	if (!is_create) {
1020dec214d0STahsin Erdogan 		/* Dereference ea_inode holding old xattr value.
1021dec214d0STahsin Erdogan 		 * Old ea_inode, inode map, block bitmap, group descriptor.
1022dec214d0STahsin Erdogan 		 */
1023dec214d0STahsin Erdogan 		credits += 4;
1024dec214d0STahsin Erdogan 
1025dec214d0STahsin Erdogan 		/* Data blocks for old ea_inode. */
1026dec214d0STahsin Erdogan 		blocks = XATTR_SIZE_MAX >> sb->s_blocksize_bits;
1027dec214d0STahsin Erdogan 
1028af65207cSTahsin Erdogan 		/* Indirection block or one level of extent tree for old
1029af65207cSTahsin Erdogan 		 * ea_inode.
1030af65207cSTahsin Erdogan 		 */
1031dec214d0STahsin Erdogan 		blocks += 1;
1032dec214d0STahsin Erdogan 
1033dec214d0STahsin Erdogan 		/* Block bitmap and group descriptor updates for each block. */
1034dec214d0STahsin Erdogan 		credits += blocks * 2;
1035af65207cSTahsin Erdogan 	}
1036dec214d0STahsin Erdogan 
1037dec214d0STahsin Erdogan 	/* We may need to clone the existing xattr block in which case we need
1038dec214d0STahsin Erdogan 	 * to increment ref counts for existing ea_inodes referenced by it.
1039dec214d0STahsin Erdogan 	 */
1040dec214d0STahsin Erdogan 	if (block_bh) {
1041dec214d0STahsin Erdogan 		struct ext4_xattr_entry *entry = BFIRST(block_bh);
1042dec214d0STahsin Erdogan 
1043dec214d0STahsin Erdogan 		for (; !IS_LAST_ENTRY(entry); entry = EXT4_XATTR_NEXT(entry))
1044dec214d0STahsin Erdogan 			if (entry->e_value_inum)
1045dec214d0STahsin Erdogan 				/* Ref count update on ea_inode. */
1046dec214d0STahsin Erdogan 				credits += 1;
1047dec214d0STahsin Erdogan 	}
1048dec214d0STahsin Erdogan 	return credits;
1049dec214d0STahsin Erdogan }
1050dec214d0STahsin Erdogan 
1051dec214d0STahsin Erdogan static int ext4_xattr_inode_update_ref(handle_t *handle, struct inode *ea_inode,
1052dec214d0STahsin Erdogan 				       int ref_change)
1053dec214d0STahsin Erdogan {
1054dec214d0STahsin Erdogan 	struct ext4_iloc iloc;
1055dec214d0STahsin Erdogan 	s64 ref_count;
1056dec214d0STahsin Erdogan 	int ret;
1057dec214d0STahsin Erdogan 
1058dec214d0STahsin Erdogan 	inode_lock(ea_inode);
1059dec214d0STahsin Erdogan 
1060dec214d0STahsin Erdogan 	ret = ext4_reserve_inode_write(handle, ea_inode, &iloc);
10611bfc204dSVasily Averin 	if (ret)
1062dec214d0STahsin Erdogan 		goto out;
1063dec214d0STahsin Erdogan 
1064dec214d0STahsin Erdogan 	ref_count = ext4_xattr_inode_get_ref(ea_inode);
1065dec214d0STahsin Erdogan 	ref_count += ref_change;
1066dec214d0STahsin Erdogan 	ext4_xattr_inode_set_ref(ea_inode, ref_count);
1067dec214d0STahsin Erdogan 
1068dec214d0STahsin Erdogan 	if (ref_change > 0) {
1069dec214d0STahsin Erdogan 		WARN_ONCE(ref_count <= 0, "EA inode %lu ref_count=%lld",
1070dec214d0STahsin Erdogan 			  ea_inode->i_ino, ref_count);
1071dec214d0STahsin Erdogan 
1072dec214d0STahsin Erdogan 		if (ref_count == 1) {
1073dec214d0STahsin Erdogan 			WARN_ONCE(ea_inode->i_nlink, "EA inode %lu i_nlink=%u",
1074dec214d0STahsin Erdogan 				  ea_inode->i_ino, ea_inode->i_nlink);
1075dec214d0STahsin Erdogan 
1076dec214d0STahsin Erdogan 			set_nlink(ea_inode, 1);
1077dec214d0STahsin Erdogan 			ext4_orphan_del(handle, ea_inode);
1078cdb7ee4cSTahsin Erdogan 		}
1079dec214d0STahsin Erdogan 	} else {
1080dec214d0STahsin Erdogan 		WARN_ONCE(ref_count < 0, "EA inode %lu ref_count=%lld",
1081dec214d0STahsin Erdogan 			  ea_inode->i_ino, ref_count);
1082dec214d0STahsin Erdogan 
1083dec214d0STahsin Erdogan 		if (ref_count == 0) {
1084dec214d0STahsin Erdogan 			WARN_ONCE(ea_inode->i_nlink != 1,
1085dec214d0STahsin Erdogan 				  "EA inode %lu i_nlink=%u",
1086dec214d0STahsin Erdogan 				  ea_inode->i_ino, ea_inode->i_nlink);
1087dec214d0STahsin Erdogan 
1088dec214d0STahsin Erdogan 			clear_nlink(ea_inode);
1089dec214d0STahsin Erdogan 			ext4_orphan_add(handle, ea_inode);
1090dec214d0STahsin Erdogan 		}
1091cdb7ee4cSTahsin Erdogan 	}
1092dec214d0STahsin Erdogan 
1093dec214d0STahsin Erdogan 	ret = ext4_mark_iloc_dirty(handle, ea_inode, &iloc);
1094dec214d0STahsin Erdogan 	if (ret)
1095dec214d0STahsin Erdogan 		ext4_warning_inode(ea_inode,
1096dec214d0STahsin Erdogan 				   "ext4_mark_iloc_dirty() failed ret=%d", ret);
1097dec214d0STahsin Erdogan out:
1098dec214d0STahsin Erdogan 	inode_unlock(ea_inode);
1099dec214d0STahsin Erdogan 	return ret;
1100dec214d0STahsin Erdogan }
1101dec214d0STahsin Erdogan 
1102dec214d0STahsin Erdogan static int ext4_xattr_inode_inc_ref(handle_t *handle, struct inode *ea_inode)
1103dec214d0STahsin Erdogan {
1104dec214d0STahsin Erdogan 	return ext4_xattr_inode_update_ref(handle, ea_inode, 1);
1105dec214d0STahsin Erdogan }
1106dec214d0STahsin Erdogan 
1107dec214d0STahsin Erdogan static int ext4_xattr_inode_dec_ref(handle_t *handle, struct inode *ea_inode)
1108dec214d0STahsin Erdogan {
1109dec214d0STahsin Erdogan 	return ext4_xattr_inode_update_ref(handle, ea_inode, -1);
1110dec214d0STahsin Erdogan }
1111dec214d0STahsin Erdogan 
1112dec214d0STahsin Erdogan static int ext4_xattr_inode_inc_ref_all(handle_t *handle, struct inode *parent,
1113dec214d0STahsin Erdogan 					struct ext4_xattr_entry *first)
1114dec214d0STahsin Erdogan {
1115dec214d0STahsin Erdogan 	struct inode *ea_inode;
1116dec214d0STahsin Erdogan 	struct ext4_xattr_entry *entry;
1117dec214d0STahsin Erdogan 	struct ext4_xattr_entry *failed_entry;
1118dec214d0STahsin Erdogan 	unsigned int ea_ino;
1119dec214d0STahsin Erdogan 	int err, saved_err;
1120dec214d0STahsin Erdogan 
1121dec214d0STahsin Erdogan 	for (entry = first; !IS_LAST_ENTRY(entry);
1122dec214d0STahsin Erdogan 	     entry = EXT4_XATTR_NEXT(entry)) {
1123dec214d0STahsin Erdogan 		if (!entry->e_value_inum)
1124dec214d0STahsin Erdogan 			continue;
1125dec214d0STahsin Erdogan 		ea_ino = le32_to_cpu(entry->e_value_inum);
1126a6d05676STahsin Erdogan 		err = ext4_xattr_inode_iget(parent, ea_ino,
1127a6d05676STahsin Erdogan 					    le32_to_cpu(entry->e_hash),
1128a6d05676STahsin Erdogan 					    &ea_inode);
1129dec214d0STahsin Erdogan 		if (err)
1130dec214d0STahsin Erdogan 			goto cleanup;
1131dec214d0STahsin Erdogan 		err = ext4_xattr_inode_inc_ref(handle, ea_inode);
1132dec214d0STahsin Erdogan 		if (err) {
1133dec214d0STahsin Erdogan 			ext4_warning_inode(ea_inode, "inc ref error %d", err);
1134dec214d0STahsin Erdogan 			iput(ea_inode);
1135dec214d0STahsin Erdogan 			goto cleanup;
1136dec214d0STahsin Erdogan 		}
1137dec214d0STahsin Erdogan 		iput(ea_inode);
1138dec214d0STahsin Erdogan 	}
1139dec214d0STahsin Erdogan 	return 0;
1140dec214d0STahsin Erdogan 
1141dec214d0STahsin Erdogan cleanup:
1142dec214d0STahsin Erdogan 	saved_err = err;
1143dec214d0STahsin Erdogan 	failed_entry = entry;
1144dec214d0STahsin Erdogan 
1145dec214d0STahsin Erdogan 	for (entry = first; entry != failed_entry;
1146dec214d0STahsin Erdogan 	     entry = EXT4_XATTR_NEXT(entry)) {
1147dec214d0STahsin Erdogan 		if (!entry->e_value_inum)
1148dec214d0STahsin Erdogan 			continue;
1149dec214d0STahsin Erdogan 		ea_ino = le32_to_cpu(entry->e_value_inum);
1150a6d05676STahsin Erdogan 		err = ext4_xattr_inode_iget(parent, ea_ino,
1151a6d05676STahsin Erdogan 					    le32_to_cpu(entry->e_hash),
1152a6d05676STahsin Erdogan 					    &ea_inode);
1153dec214d0STahsin Erdogan 		if (err) {
1154dec214d0STahsin Erdogan 			ext4_warning(parent->i_sb,
1155dec214d0STahsin Erdogan 				     "cleanup ea_ino %u iget error %d", ea_ino,
1156dec214d0STahsin Erdogan 				     err);
1157dec214d0STahsin Erdogan 			continue;
1158dec214d0STahsin Erdogan 		}
1159dec214d0STahsin Erdogan 		err = ext4_xattr_inode_dec_ref(handle, ea_inode);
1160dec214d0STahsin Erdogan 		if (err)
1161dec214d0STahsin Erdogan 			ext4_warning_inode(ea_inode, "cleanup dec ref error %d",
1162dec214d0STahsin Erdogan 					   err);
1163dec214d0STahsin Erdogan 		iput(ea_inode);
1164dec214d0STahsin Erdogan 	}
1165dec214d0STahsin Erdogan 	return saved_err;
1166dec214d0STahsin Erdogan }
1167dec214d0STahsin Erdogan 
1168a4130367SJan Kara static int ext4_xattr_restart_fn(handle_t *handle, struct inode *inode,
1169a4130367SJan Kara 			struct buffer_head *bh, bool block_csum, bool dirty)
1170a4130367SJan Kara {
1171a4130367SJan Kara 	int error;
1172a4130367SJan Kara 
1173a4130367SJan Kara 	if (bh && dirty) {
1174a4130367SJan Kara 		if (block_csum)
1175a4130367SJan Kara 			ext4_xattr_block_csum_set(inode, bh);
1176a4130367SJan Kara 		error = ext4_handle_dirty_metadata(handle, NULL, bh);
1177a4130367SJan Kara 		if (error) {
1178a4130367SJan Kara 			ext4_warning(inode->i_sb, "Handle metadata (error %d)",
1179a4130367SJan Kara 				     error);
1180a4130367SJan Kara 			return error;
1181a4130367SJan Kara 		}
1182a4130367SJan Kara 	}
1183a4130367SJan Kara 	return 0;
1184a4130367SJan Kara }
1185a4130367SJan Kara 
118630a7eb97STahsin Erdogan static void
1187dec214d0STahsin Erdogan ext4_xattr_inode_dec_ref_all(handle_t *handle, struct inode *parent,
118830a7eb97STahsin Erdogan 			     struct buffer_head *bh,
118930a7eb97STahsin Erdogan 			     struct ext4_xattr_entry *first, bool block_csum,
119030a7eb97STahsin Erdogan 			     struct ext4_xattr_inode_array **ea_inode_array,
1191dec214d0STahsin Erdogan 			     int extra_credits, bool skip_quota)
119230a7eb97STahsin Erdogan {
119330a7eb97STahsin Erdogan 	struct inode *ea_inode;
119430a7eb97STahsin Erdogan 	struct ext4_xattr_entry *entry;
119530a7eb97STahsin Erdogan 	bool dirty = false;
119630a7eb97STahsin Erdogan 	unsigned int ea_ino;
119730a7eb97STahsin Erdogan 	int err;
119830a7eb97STahsin Erdogan 	int credits;
119930a7eb97STahsin Erdogan 
120030a7eb97STahsin Erdogan 	/* One credit for dec ref on ea_inode, one for orphan list addition, */
120130a7eb97STahsin Erdogan 	credits = 2 + extra_credits;
120230a7eb97STahsin Erdogan 
120330a7eb97STahsin Erdogan 	for (entry = first; !IS_LAST_ENTRY(entry);
120430a7eb97STahsin Erdogan 	     entry = EXT4_XATTR_NEXT(entry)) {
120530a7eb97STahsin Erdogan 		if (!entry->e_value_inum)
120630a7eb97STahsin Erdogan 			continue;
120730a7eb97STahsin Erdogan 		ea_ino = le32_to_cpu(entry->e_value_inum);
1208a6d05676STahsin Erdogan 		err = ext4_xattr_inode_iget(parent, ea_ino,
1209a6d05676STahsin Erdogan 					    le32_to_cpu(entry->e_hash),
1210a6d05676STahsin Erdogan 					    &ea_inode);
121130a7eb97STahsin Erdogan 		if (err)
121230a7eb97STahsin Erdogan 			continue;
121330a7eb97STahsin Erdogan 
121430a7eb97STahsin Erdogan 		err = ext4_expand_inode_array(ea_inode_array, ea_inode);
121530a7eb97STahsin Erdogan 		if (err) {
121630a7eb97STahsin Erdogan 			ext4_warning_inode(ea_inode,
121730a7eb97STahsin Erdogan 					   "Expand inode array err=%d", err);
121830a7eb97STahsin Erdogan 			iput(ea_inode);
121930a7eb97STahsin Erdogan 			continue;
122030a7eb97STahsin Erdogan 		}
122130a7eb97STahsin Erdogan 
1222a4130367SJan Kara 		err = ext4_journal_ensure_credits_fn(handle, credits, credits,
122383448bdfSJan Kara 			ext4_free_metadata_revoke_credits(parent->i_sb, 1),
1224a4130367SJan Kara 			ext4_xattr_restart_fn(handle, parent, bh, block_csum,
1225a4130367SJan Kara 					      dirty));
1226a4130367SJan Kara 		if (err < 0) {
122730a7eb97STahsin Erdogan 			ext4_warning_inode(ea_inode, "Ensure credits err=%d",
122830a7eb97STahsin Erdogan 					   err);
122930a7eb97STahsin Erdogan 			continue;
123030a7eb97STahsin Erdogan 		}
1231a4130367SJan Kara 		if (err > 0) {
1232188c299eSJan Kara 			err = ext4_journal_get_write_access(handle,
1233188c299eSJan Kara 					parent->i_sb, bh, EXT4_JTR_NONE);
1234a4130367SJan Kara 			if (err) {
1235a4130367SJan Kara 				ext4_warning_inode(ea_inode,
1236a4130367SJan Kara 						"Re-get write access err=%d",
1237a4130367SJan Kara 						err);
1238a4130367SJan Kara 				continue;
1239a4130367SJan Kara 			}
1240a4130367SJan Kara 		}
124130a7eb97STahsin Erdogan 
1242dec214d0STahsin Erdogan 		err = ext4_xattr_inode_dec_ref(handle, ea_inode);
1243dec214d0STahsin Erdogan 		if (err) {
1244dec214d0STahsin Erdogan 			ext4_warning_inode(ea_inode, "ea_inode dec ref err=%d",
1245dec214d0STahsin Erdogan 					   err);
1246dec214d0STahsin Erdogan 			continue;
1247dec214d0STahsin Erdogan 		}
1248dec214d0STahsin Erdogan 
1249dec214d0STahsin Erdogan 		if (!skip_quota)
1250a6d05676STahsin Erdogan 			ext4_xattr_inode_free_quota(parent, ea_inode,
1251dec214d0STahsin Erdogan 					      le32_to_cpu(entry->e_value_size));
125230a7eb97STahsin Erdogan 
125330a7eb97STahsin Erdogan 		/*
125430a7eb97STahsin Erdogan 		 * Forget about ea_inode within the same transaction that
125530a7eb97STahsin Erdogan 		 * decrements the ref count. This avoids duplicate decrements in
125630a7eb97STahsin Erdogan 		 * case the rest of the work spills over to subsequent
125730a7eb97STahsin Erdogan 		 * transactions.
125830a7eb97STahsin Erdogan 		 */
125930a7eb97STahsin Erdogan 		entry->e_value_inum = 0;
126030a7eb97STahsin Erdogan 		entry->e_value_size = 0;
126130a7eb97STahsin Erdogan 
126230a7eb97STahsin Erdogan 		dirty = true;
126330a7eb97STahsin Erdogan 	}
126430a7eb97STahsin Erdogan 
126530a7eb97STahsin Erdogan 	if (dirty) {
126630a7eb97STahsin Erdogan 		/*
126730a7eb97STahsin Erdogan 		 * Note that we are deliberately skipping csum calculation for
126830a7eb97STahsin Erdogan 		 * the final update because we do not expect any journal
126930a7eb97STahsin Erdogan 		 * restarts until xattr block is freed.
127030a7eb97STahsin Erdogan 		 */
127130a7eb97STahsin Erdogan 
127230a7eb97STahsin Erdogan 		err = ext4_handle_dirty_metadata(handle, NULL, bh);
127330a7eb97STahsin Erdogan 		if (err)
127430a7eb97STahsin Erdogan 			ext4_warning_inode(parent,
127530a7eb97STahsin Erdogan 					   "handle dirty metadata err=%d", err);
127630a7eb97STahsin Erdogan 	}
127730a7eb97STahsin Erdogan }
127830a7eb97STahsin Erdogan 
1279ac27a0ecSDave Kleikamp /*
1280ec4cb1aaSJan Kara  * Release the xattr block BH: If the reference count is > 1, decrement it;
1281ec4cb1aaSJan Kara  * otherwise free the block.
1282ac27a0ecSDave Kleikamp  */
1283ac27a0ecSDave Kleikamp static void
1284617ba13bSMingming Cao ext4_xattr_release_block(handle_t *handle, struct inode *inode,
1285dec214d0STahsin Erdogan 			 struct buffer_head *bh,
1286dec214d0STahsin Erdogan 			 struct ext4_xattr_inode_array **ea_inode_array,
1287dec214d0STahsin Erdogan 			 int extra_credits)
1288ac27a0ecSDave Kleikamp {
128947387409STahsin Erdogan 	struct mb_cache *ea_block_cache = EA_BLOCK_CACHE(inode);
12906048c64bSAndreas Gruenbacher 	u32 hash, ref;
12918a2bfdcbSMingming Cao 	int error = 0;
1292ac27a0ecSDave Kleikamp 
12935d601255Sliang xie 	BUFFER_TRACE(bh, "get_write_access");
1294188c299eSJan Kara 	error = ext4_journal_get_write_access(handle, inode->i_sb, bh,
1295188c299eSJan Kara 					      EXT4_JTR_NONE);
12968a2bfdcbSMingming Cao 	if (error)
12978a2bfdcbSMingming Cao 		goto out;
12988a2bfdcbSMingming Cao 
129965f8b800SJan Kara retry_ref:
13008a2bfdcbSMingming Cao 	lock_buffer(bh);
13016048c64bSAndreas Gruenbacher 	hash = le32_to_cpu(BHDR(bh)->h_hash);
13026048c64bSAndreas Gruenbacher 	ref = le32_to_cpu(BHDR(bh)->h_refcount);
13036048c64bSAndreas Gruenbacher 	if (ref == 1) {
1304ac27a0ecSDave Kleikamp 		ea_bdebug(bh, "refcount now=0; freeing");
130582939d79SJan Kara 		/*
130682939d79SJan Kara 		 * This must happen under buffer lock for
130782939d79SJan Kara 		 * ext4_xattr_block_set() to reliably detect freed block
130882939d79SJan Kara 		 */
130965f8b800SJan Kara 		if (ea_block_cache) {
131065f8b800SJan Kara 			struct mb_cache_entry *oe;
131165f8b800SJan Kara 
131265f8b800SJan Kara 			oe = mb_cache_entry_delete_or_get(ea_block_cache, hash,
1313cdb7ee4cSTahsin Erdogan 							  bh->b_blocknr);
131465f8b800SJan Kara 			if (oe) {
131565f8b800SJan Kara 				unlock_buffer(bh);
131665f8b800SJan Kara 				mb_cache_entry_wait_unused(oe);
131765f8b800SJan Kara 				mb_cache_entry_put(ea_block_cache, oe);
131865f8b800SJan Kara 				goto retry_ref;
131965f8b800SJan Kara 			}
132065f8b800SJan Kara 		}
1321ac27a0ecSDave Kleikamp 		get_bh(bh);
1322ec4cb1aaSJan Kara 		unlock_buffer(bh);
1323dec214d0STahsin Erdogan 
1324dec214d0STahsin Erdogan 		if (ext4_has_feature_ea_inode(inode->i_sb))
1325dec214d0STahsin Erdogan 			ext4_xattr_inode_dec_ref_all(handle, inode, bh,
1326dec214d0STahsin Erdogan 						     BFIRST(bh),
1327dec214d0STahsin Erdogan 						     true /* block_csum */,
1328dec214d0STahsin Erdogan 						     ea_inode_array,
1329dec214d0STahsin Erdogan 						     extra_credits,
1330dec214d0STahsin Erdogan 						     true /* skip_quota */);
1331e6362609STheodore Ts'o 		ext4_free_blocks(handle, inode, bh, 0, 1,
1332e6362609STheodore Ts'o 				 EXT4_FREE_BLOCKS_METADATA |
1333e6362609STheodore Ts'o 				 EXT4_FREE_BLOCKS_FORGET);
1334ac27a0ecSDave Kleikamp 	} else {
13356048c64bSAndreas Gruenbacher 		ref--;
13366048c64bSAndreas Gruenbacher 		BHDR(bh)->h_refcount = cpu_to_le32(ref);
13376048c64bSAndreas Gruenbacher 		if (ref == EXT4_XATTR_REFCOUNT_MAX - 1) {
13386048c64bSAndreas Gruenbacher 			struct mb_cache_entry *ce;
13396048c64bSAndreas Gruenbacher 
1340cdb7ee4cSTahsin Erdogan 			if (ea_block_cache) {
134147387409STahsin Erdogan 				ce = mb_cache_entry_get(ea_block_cache, hash,
13426048c64bSAndreas Gruenbacher 							bh->b_blocknr);
13436048c64bSAndreas Gruenbacher 				if (ce) {
1344a44e84a9SJan Kara 					set_bit(MBE_REUSABLE_B, &ce->e_flags);
134547387409STahsin Erdogan 					mb_cache_entry_put(ea_block_cache, ce);
13466048c64bSAndreas Gruenbacher 				}
13476048c64bSAndreas Gruenbacher 			}
1348cdb7ee4cSTahsin Erdogan 		}
13496048c64bSAndreas Gruenbacher 
1350dac7a4b4STheodore Ts'o 		ext4_xattr_block_csum_set(inode, bh);
1351ec4cb1aaSJan Kara 		/*
1352ec4cb1aaSJan Kara 		 * Beware of this ugliness: Releasing of xattr block references
1353ec4cb1aaSJan Kara 		 * from different inodes can race and so we have to protect
1354ec4cb1aaSJan Kara 		 * from a race where someone else frees the block (and releases
1355ec4cb1aaSJan Kara 		 * its journal_head) before we are done dirtying the buffer. In
1356ec4cb1aaSJan Kara 		 * nojournal mode this race is harmless and we actually cannot
1357dac7a4b4STheodore Ts'o 		 * call ext4_handle_dirty_metadata() with locked buffer as
1358ec4cb1aaSJan Kara 		 * that function can call sync_dirty_buffer() so for that case
1359ec4cb1aaSJan Kara 		 * we handle the dirtying after unlocking the buffer.
1360ec4cb1aaSJan Kara 		 */
1361ec4cb1aaSJan Kara 		if (ext4_handle_valid(handle))
1362dac7a4b4STheodore Ts'o 			error = ext4_handle_dirty_metadata(handle, inode, bh);
1363c1bb05a6SEric Sandeen 		unlock_buffer(bh);
1364ec4cb1aaSJan Kara 		if (!ext4_handle_valid(handle))
1365dac7a4b4STheodore Ts'o 			error = ext4_handle_dirty_metadata(handle, inode, bh);
1366ac27a0ecSDave Kleikamp 		if (IS_SYNC(inode))
13670390131bSFrank Mayhar 			ext4_handle_sync(handle);
13681231b3a1SLukas Czerner 		dquot_free_block(inode, EXT4_C2B(EXT4_SB(inode->i_sb), 1));
1369ac27a0ecSDave Kleikamp 		ea_bdebug(bh, "refcount now=%d; releasing",
1370ac27a0ecSDave Kleikamp 			  le32_to_cpu(BHDR(bh)->h_refcount));
1371ac27a0ecSDave Kleikamp 	}
13728a2bfdcbSMingming Cao out:
13738a2bfdcbSMingming Cao 	ext4_std_error(inode->i_sb, error);
13748a2bfdcbSMingming Cao 	return;
1375ac27a0ecSDave Kleikamp }
1376ac27a0ecSDave Kleikamp 
13776dd4ee7cSKalpak Shah /*
13786dd4ee7cSKalpak Shah  * Find the available free space for EAs. This also returns the total number of
13796dd4ee7cSKalpak Shah  * bytes used by EA entries.
13806dd4ee7cSKalpak Shah  */
13816dd4ee7cSKalpak Shah static size_t ext4_xattr_free_space(struct ext4_xattr_entry *last,
13826dd4ee7cSKalpak Shah 				    size_t *min_offs, void *base, int *total)
13836dd4ee7cSKalpak Shah {
13846dd4ee7cSKalpak Shah 	for (; !IS_LAST_ENTRY(last); last = EXT4_XATTR_NEXT(last)) {
1385e50e5129SAndreas Dilger 		if (!last->e_value_inum && last->e_value_size) {
13866dd4ee7cSKalpak Shah 			size_t offs = le16_to_cpu(last->e_value_offs);
13876dd4ee7cSKalpak Shah 			if (offs < *min_offs)
13886dd4ee7cSKalpak Shah 				*min_offs = offs;
13896dd4ee7cSKalpak Shah 		}
13907b1b2c1bSTheodore Ts'o 		if (total)
13917b1b2c1bSTheodore Ts'o 			*total += EXT4_XATTR_LEN(last->e_name_len);
13926dd4ee7cSKalpak Shah 	}
13936dd4ee7cSKalpak Shah 	return (*min_offs - ((void *)last - base) - sizeof(__u32));
13946dd4ee7cSKalpak Shah }
13956dd4ee7cSKalpak Shah 
1396e50e5129SAndreas Dilger /*
1397e50e5129SAndreas Dilger  * Write the value of the EA in an inode.
1398e50e5129SAndreas Dilger  */
1399e50e5129SAndreas Dilger static int ext4_xattr_inode_write(handle_t *handle, struct inode *ea_inode,
1400e50e5129SAndreas Dilger 				  const void *buf, int bufsize)
1401e50e5129SAndreas Dilger {
1402e50e5129SAndreas Dilger 	struct buffer_head *bh = NULL;
1403e50e5129SAndreas Dilger 	unsigned long block = 0;
1404dec214d0STahsin Erdogan 	int blocksize = ea_inode->i_sb->s_blocksize;
1405dec214d0STahsin Erdogan 	int max_blocks = (bufsize + blocksize - 1) >> ea_inode->i_blkbits;
1406e50e5129SAndreas Dilger 	int csize, wsize = 0;
14074209ae12SHarshad Shirwadkar 	int ret = 0, ret2 = 0;
1408e50e5129SAndreas Dilger 	int retries = 0;
1409e50e5129SAndreas Dilger 
1410e50e5129SAndreas Dilger retry:
1411e50e5129SAndreas Dilger 	while (ret >= 0 && ret < max_blocks) {
1412e50e5129SAndreas Dilger 		struct ext4_map_blocks map;
1413e50e5129SAndreas Dilger 		map.m_lblk = block += ret;
1414e50e5129SAndreas Dilger 		map.m_len = max_blocks -= ret;
1415e50e5129SAndreas Dilger 
1416e50e5129SAndreas Dilger 		ret = ext4_map_blocks(handle, ea_inode, &map,
1417e50e5129SAndreas Dilger 				      EXT4_GET_BLOCKS_CREATE);
1418e50e5129SAndreas Dilger 		if (ret <= 0) {
1419e50e5129SAndreas Dilger 			ext4_mark_inode_dirty(handle, ea_inode);
1420e50e5129SAndreas Dilger 			if (ret == -ENOSPC &&
1421e50e5129SAndreas Dilger 			    ext4_should_retry_alloc(ea_inode->i_sb, &retries)) {
1422e50e5129SAndreas Dilger 				ret = 0;
1423e50e5129SAndreas Dilger 				goto retry;
1424e50e5129SAndreas Dilger 			}
1425e50e5129SAndreas Dilger 			break;
1426e50e5129SAndreas Dilger 		}
1427e50e5129SAndreas Dilger 	}
1428e50e5129SAndreas Dilger 
1429e50e5129SAndreas Dilger 	if (ret < 0)
1430e50e5129SAndreas Dilger 		return ret;
1431e50e5129SAndreas Dilger 
1432e50e5129SAndreas Dilger 	block = 0;
1433e50e5129SAndreas Dilger 	while (wsize < bufsize) {
1434e50e5129SAndreas Dilger 		brelse(bh);
1435e50e5129SAndreas Dilger 		csize = (bufsize - wsize) > blocksize ? blocksize :
1436e50e5129SAndreas Dilger 								bufsize - wsize;
1437e50e5129SAndreas Dilger 		bh = ext4_getblk(handle, ea_inode, block, 0);
1438e50e5129SAndreas Dilger 		if (IS_ERR(bh))
1439e50e5129SAndreas Dilger 			return PTR_ERR(bh);
1440eb6984faSVasily Averin 		if (!bh) {
1441eb6984faSVasily Averin 			WARN_ON_ONCE(1);
1442eb6984faSVasily Averin 			EXT4_ERROR_INODE(ea_inode,
1443eb6984faSVasily Averin 					 "ext4_getblk() return bh = NULL");
1444eb6984faSVasily Averin 			return -EFSCORRUPTED;
1445eb6984faSVasily Averin 		}
1446188c299eSJan Kara 		ret = ext4_journal_get_write_access(handle, ea_inode->i_sb, bh,
1447188c299eSJan Kara 						   EXT4_JTR_NONE);
1448e50e5129SAndreas Dilger 		if (ret)
1449e50e5129SAndreas Dilger 			goto out;
1450e50e5129SAndreas Dilger 
1451e50e5129SAndreas Dilger 		memcpy(bh->b_data, buf, csize);
1452e50e5129SAndreas Dilger 		set_buffer_uptodate(bh);
1453e50e5129SAndreas Dilger 		ext4_handle_dirty_metadata(handle, ea_inode, bh);
1454e50e5129SAndreas Dilger 
1455e50e5129SAndreas Dilger 		buf += csize;
1456e50e5129SAndreas Dilger 		wsize += csize;
1457e50e5129SAndreas Dilger 		block += 1;
1458e50e5129SAndreas Dilger 	}
1459e50e5129SAndreas Dilger 
1460e50e5129SAndreas Dilger 	inode_lock(ea_inode);
1461e50e5129SAndreas Dilger 	i_size_write(ea_inode, wsize);
1462e50e5129SAndreas Dilger 	ext4_update_i_disksize(ea_inode, wsize);
1463e50e5129SAndreas Dilger 	inode_unlock(ea_inode);
1464e50e5129SAndreas Dilger 
14654209ae12SHarshad Shirwadkar 	ret2 = ext4_mark_inode_dirty(handle, ea_inode);
14664209ae12SHarshad Shirwadkar 	if (unlikely(ret2 && !ret))
14674209ae12SHarshad Shirwadkar 		ret = ret2;
1468e50e5129SAndreas Dilger 
1469e50e5129SAndreas Dilger out:
1470e50e5129SAndreas Dilger 	brelse(bh);
1471e50e5129SAndreas Dilger 
1472e50e5129SAndreas Dilger 	return ret;
1473e50e5129SAndreas Dilger }
1474e50e5129SAndreas Dilger 
1475e50e5129SAndreas Dilger /*
1476e50e5129SAndreas Dilger  * Create an inode to store the value of a large EA.
1477e50e5129SAndreas Dilger  */
1478e50e5129SAndreas Dilger static struct inode *ext4_xattr_inode_create(handle_t *handle,
1479dec214d0STahsin Erdogan 					     struct inode *inode, u32 hash)
1480e50e5129SAndreas Dilger {
1481e50e5129SAndreas Dilger 	struct inode *ea_inode = NULL;
14829e1ba001STahsin Erdogan 	uid_t owner[2] = { i_uid_read(inode), i_gid_read(inode) };
1483bd3b963bSTahsin Erdogan 	int err;
1484e50e5129SAndreas Dilger 
1485f31173c1SJun Nie 	if (inode->i_sb->s_root == NULL) {
1486f31173c1SJun Nie 		ext4_warning(inode->i_sb,
1487f31173c1SJun Nie 			     "refuse to create EA inode when umounting");
1488f31173c1SJun Nie 		WARN_ON(1);
1489f31173c1SJun Nie 		return ERR_PTR(-EINVAL);
1490f31173c1SJun Nie 	}
1491f31173c1SJun Nie 
1492e50e5129SAndreas Dilger 	/*
1493e50e5129SAndreas Dilger 	 * Let the next inode be the goal, so we try and allocate the EA inode
1494e50e5129SAndreas Dilger 	 * in the same group, or nearby one.
1495e50e5129SAndreas Dilger 	 */
1496e50e5129SAndreas Dilger 	ea_inode = ext4_new_inode(handle, inode->i_sb->s_root->d_inode,
14979e1ba001STahsin Erdogan 				  S_IFREG | 0600, NULL, inode->i_ino + 1, owner,
14981b917ed8STahsin Erdogan 				  EXT4_EA_INODE_FL);
1499e50e5129SAndreas Dilger 	if (!IS_ERR(ea_inode)) {
1500e50e5129SAndreas Dilger 		ea_inode->i_op = &ext4_file_inode_operations;
1501e50e5129SAndreas Dilger 		ea_inode->i_fop = &ext4_file_operations;
1502e50e5129SAndreas Dilger 		ext4_set_aops(ea_inode);
150333d201e0STahsin Erdogan 		ext4_xattr_inode_set_class(ea_inode);
1504e50e5129SAndreas Dilger 		unlock_new_inode(ea_inode);
1505dec214d0STahsin Erdogan 		ext4_xattr_inode_set_ref(ea_inode, 1);
1506dec214d0STahsin Erdogan 		ext4_xattr_inode_set_hash(ea_inode, hash);
1507dec214d0STahsin Erdogan 		err = ext4_mark_inode_dirty(handle, ea_inode);
1508dec214d0STahsin Erdogan 		if (!err)
1509bd3b963bSTahsin Erdogan 			err = ext4_inode_attach_jinode(ea_inode);
1510bd3b963bSTahsin Erdogan 		if (err) {
1511e4db04f7SYe Bin 			if (ext4_xattr_inode_dec_ref(handle, ea_inode))
1512e4db04f7SYe Bin 				ext4_warning_inode(ea_inode,
1513e4db04f7SYe Bin 					"cleanup dec ref error %d", err);
1514bd3b963bSTahsin Erdogan 			iput(ea_inode);
1515bd3b963bSTahsin Erdogan 			return ERR_PTR(err);
1516bd3b963bSTahsin Erdogan 		}
1517dec214d0STahsin Erdogan 
1518dec214d0STahsin Erdogan 		/*
1519dec214d0STahsin Erdogan 		 * Xattr inodes are shared therefore quota charging is performed
1520dec214d0STahsin Erdogan 		 * at a higher level.
1521dec214d0STahsin Erdogan 		 */
1522dec214d0STahsin Erdogan 		dquot_free_inode(ea_inode);
1523dec214d0STahsin Erdogan 		dquot_drop(ea_inode);
1524dec214d0STahsin Erdogan 		inode_lock(ea_inode);
1525dec214d0STahsin Erdogan 		ea_inode->i_flags |= S_NOQUOTA;
1526dec214d0STahsin Erdogan 		inode_unlock(ea_inode);
1527e50e5129SAndreas Dilger 	}
1528e50e5129SAndreas Dilger 
1529e50e5129SAndreas Dilger 	return ea_inode;
1530e50e5129SAndreas Dilger }
1531e50e5129SAndreas Dilger 
1532dec214d0STahsin Erdogan static struct inode *
1533dec214d0STahsin Erdogan ext4_xattr_inode_cache_find(struct inode *inode, const void *value,
1534dec214d0STahsin Erdogan 			    size_t value_len, u32 hash)
1535e50e5129SAndreas Dilger {
1536dec214d0STahsin Erdogan 	struct inode *ea_inode;
1537dec214d0STahsin Erdogan 	struct mb_cache_entry *ce;
1538dec214d0STahsin Erdogan 	struct mb_cache *ea_inode_cache = EA_INODE_CACHE(inode);
1539dec214d0STahsin Erdogan 	void *ea_data;
1540e50e5129SAndreas Dilger 
1541cdb7ee4cSTahsin Erdogan 	if (!ea_inode_cache)
1542cdb7ee4cSTahsin Erdogan 		return NULL;
1543cdb7ee4cSTahsin Erdogan 
1544dec214d0STahsin Erdogan 	ce = mb_cache_entry_find_first(ea_inode_cache, hash);
1545dec214d0STahsin Erdogan 	if (!ce)
1546dec214d0STahsin Erdogan 		return NULL;
1547e50e5129SAndreas Dilger 
1548163f0ec1SJan Kara 	WARN_ON_ONCE(ext4_handle_valid(journal_current_handle()) &&
1549163f0ec1SJan Kara 		     !(current->flags & PF_MEMALLOC_NOFS));
1550163f0ec1SJan Kara 
155171b565ceSTheodore Ts'o 	ea_data = kvmalloc(value_len, GFP_KERNEL);
1552dec214d0STahsin Erdogan 	if (!ea_data) {
1553dec214d0STahsin Erdogan 		mb_cache_entry_put(ea_inode_cache, ce);
1554dec214d0STahsin Erdogan 		return NULL;
1555dec214d0STahsin Erdogan 	}
1556dec214d0STahsin Erdogan 
1557dec214d0STahsin Erdogan 	while (ce) {
15588a363970STheodore Ts'o 		ea_inode = ext4_iget(inode->i_sb, ce->e_value,
15598a363970STheodore Ts'o 				     EXT4_IGET_NORMAL);
1560dec214d0STahsin Erdogan 		if (!IS_ERR(ea_inode) &&
1561dec214d0STahsin Erdogan 		    !is_bad_inode(ea_inode) &&
1562dec214d0STahsin Erdogan 		    (EXT4_I(ea_inode)->i_flags & EXT4_EA_INODE_FL) &&
1563dec214d0STahsin Erdogan 		    i_size_read(ea_inode) == value_len &&
1564dec214d0STahsin Erdogan 		    !ext4_xattr_inode_read(ea_inode, ea_data, value_len) &&
1565b9fc761eSTahsin Erdogan 		    !ext4_xattr_inode_verify_hashes(ea_inode, NULL, ea_data,
1566dec214d0STahsin Erdogan 						    value_len) &&
1567dec214d0STahsin Erdogan 		    !memcmp(value, ea_data, value_len)) {
1568dec214d0STahsin Erdogan 			mb_cache_entry_touch(ea_inode_cache, ce);
1569dec214d0STahsin Erdogan 			mb_cache_entry_put(ea_inode_cache, ce);
1570dec214d0STahsin Erdogan 			kvfree(ea_data);
1571dec214d0STahsin Erdogan 			return ea_inode;
1572dec214d0STahsin Erdogan 		}
1573dec214d0STahsin Erdogan 
1574dec214d0STahsin Erdogan 		if (!IS_ERR(ea_inode))
1575e50e5129SAndreas Dilger 			iput(ea_inode);
1576dec214d0STahsin Erdogan 		ce = mb_cache_entry_find_next(ea_inode_cache, ce);
1577dec214d0STahsin Erdogan 	}
1578dec214d0STahsin Erdogan 	kvfree(ea_data);
1579dec214d0STahsin Erdogan 	return NULL;
1580e50e5129SAndreas Dilger }
1581e50e5129SAndreas Dilger 
1582e50e5129SAndreas Dilger /*
1583e50e5129SAndreas Dilger  * Add value of the EA in an inode.
1584e50e5129SAndreas Dilger  */
1585dec214d0STahsin Erdogan static int ext4_xattr_inode_lookup_create(handle_t *handle, struct inode *inode,
1586dec214d0STahsin Erdogan 					  const void *value, size_t value_len,
1587dec214d0STahsin Erdogan 					  struct inode **ret_inode)
1588e50e5129SAndreas Dilger {
1589e50e5129SAndreas Dilger 	struct inode *ea_inode;
1590dec214d0STahsin Erdogan 	u32 hash;
1591e50e5129SAndreas Dilger 	int err;
1592e50e5129SAndreas Dilger 
1593dec214d0STahsin Erdogan 	hash = ext4_xattr_inode_hash(EXT4_SB(inode->i_sb), value, value_len);
1594dec214d0STahsin Erdogan 	ea_inode = ext4_xattr_inode_cache_find(inode, value, value_len, hash);
1595dec214d0STahsin Erdogan 	if (ea_inode) {
1596dec214d0STahsin Erdogan 		err = ext4_xattr_inode_inc_ref(handle, ea_inode);
1597dec214d0STahsin Erdogan 		if (err) {
1598dec214d0STahsin Erdogan 			iput(ea_inode);
1599dec214d0STahsin Erdogan 			return err;
1600dec214d0STahsin Erdogan 		}
1601dec214d0STahsin Erdogan 
1602dec214d0STahsin Erdogan 		*ret_inode = ea_inode;
1603dec214d0STahsin Erdogan 		return 0;
1604dec214d0STahsin Erdogan 	}
1605dec214d0STahsin Erdogan 
1606e50e5129SAndreas Dilger 	/* Create an inode for the EA value */
1607dec214d0STahsin Erdogan 	ea_inode = ext4_xattr_inode_create(handle, inode, hash);
1608e50e5129SAndreas Dilger 	if (IS_ERR(ea_inode))
1609e50e5129SAndreas Dilger 		return PTR_ERR(ea_inode);
1610e50e5129SAndreas Dilger 
1611e50e5129SAndreas Dilger 	err = ext4_xattr_inode_write(handle, ea_inode, value, value_len);
1612dec214d0STahsin Erdogan 	if (err) {
161356d0d0b9SLi Zhong 		if (ext4_xattr_inode_dec_ref(handle, ea_inode))
161456d0d0b9SLi Zhong 			ext4_warning_inode(ea_inode, "cleanup dec ref error %d", err);
1615e50e5129SAndreas Dilger 		iput(ea_inode);
1616e50e5129SAndreas Dilger 		return err;
1617e50e5129SAndreas Dilger 	}
1618e50e5129SAndreas Dilger 
1619cdb7ee4cSTahsin Erdogan 	if (EA_INODE_CACHE(inode))
1620dec214d0STahsin Erdogan 		mb_cache_entry_create(EA_INODE_CACHE(inode), GFP_NOFS, hash,
1621dec214d0STahsin Erdogan 				      ea_inode->i_ino, true /* reusable */);
1622dec214d0STahsin Erdogan 
1623dec214d0STahsin Erdogan 	*ret_inode = ea_inode;
1624dec214d0STahsin Erdogan 	return 0;
1625dec214d0STahsin Erdogan }
1626dec214d0STahsin Erdogan 
/*
 * Number of bytes kept back for xattr entries/names when the ea_inode
 * feature is enabled: one eighth of the inode's block size, capped at
 * 1024 bytes.
 */
#define EXT4_XATTR_BLOCK_RESERVE(inode) \
	min(i_blocksize(inode) / 8, 1024U)
16329c6e7853STahsin Erdogan 
1633e50e5129SAndreas Dilger static int ext4_xattr_set_entry(struct ext4_xattr_info *i,
1634e50e5129SAndreas Dilger 				struct ext4_xattr_search *s,
1635daf83281STahsin Erdogan 				handle_t *handle, struct inode *inode,
1636daf83281STahsin Erdogan 				bool is_block)
1637ac27a0ecSDave Kleikamp {
16385369a762STheodore Ts'o 	struct ext4_xattr_entry *last, *next;
1639dec214d0STahsin Erdogan 	struct ext4_xattr_entry *here = s->here;
1640dec214d0STahsin Erdogan 	size_t min_offs = s->end - s->base, name_len = strlen(i->name);
1641e50e5129SAndreas Dilger 	int in_inode = i->in_inode;
1642dec214d0STahsin Erdogan 	struct inode *old_ea_inode = NULL;
1643dec214d0STahsin Erdogan 	struct inode *new_ea_inode = NULL;
1644dec214d0STahsin Erdogan 	size_t old_size, new_size;
1645dec214d0STahsin Erdogan 	int ret;
1646dec214d0STahsin Erdogan 
1647dec214d0STahsin Erdogan 	/* Space used by old and new values. */
1648dec214d0STahsin Erdogan 	old_size = (!s->not_found && !here->e_value_inum) ?
1649dec214d0STahsin Erdogan 			EXT4_XATTR_SIZE(le32_to_cpu(here->e_value_size)) : 0;
1650dec214d0STahsin Erdogan 	new_size = (i->value && !in_inode) ? EXT4_XATTR_SIZE(i->value_len) : 0;
1651dec214d0STahsin Erdogan 
1652dec214d0STahsin Erdogan 	/*
1653dec214d0STahsin Erdogan 	 * Optimization for the simple case when old and new values have the
1654dec214d0STahsin Erdogan 	 * same padded sizes. Not applicable if external inodes are involved.
1655dec214d0STahsin Erdogan 	 */
1656dec214d0STahsin Erdogan 	if (new_size && new_size == old_size) {
1657dec214d0STahsin Erdogan 		size_t offs = le16_to_cpu(here->e_value_offs);
1658dec214d0STahsin Erdogan 		void *val = s->base + offs;
1659dec214d0STahsin Erdogan 
1660dec214d0STahsin Erdogan 		here->e_value_size = cpu_to_le32(i->value_len);
1661dec214d0STahsin Erdogan 		if (i->value == EXT4_ZERO_XATTR_VALUE) {
1662dec214d0STahsin Erdogan 			memset(val, 0, new_size);
1663dec214d0STahsin Erdogan 		} else {
1664dec214d0STahsin Erdogan 			memcpy(val, i->value, i->value_len);
1665dec214d0STahsin Erdogan 			/* Clear padding bytes. */
1666dec214d0STahsin Erdogan 			memset(val + i->value_len, 0, new_size - i->value_len);
1667dec214d0STahsin Erdogan 		}
166832aaf194STahsin Erdogan 		goto update_hash;
1669dec214d0STahsin Erdogan 	}
1670e50e5129SAndreas Dilger 
1671ac27a0ecSDave Kleikamp 	/* Compute min_offs and last. */
1672ac27a0ecSDave Kleikamp 	last = s->first;
16735369a762STheodore Ts'o 	for (; !IS_LAST_ENTRY(last); last = next) {
16745369a762STheodore Ts'o 		next = EXT4_XATTR_NEXT(last);
16755369a762STheodore Ts'o 		if ((void *)next >= s->end) {
16765369a762STheodore Ts'o 			EXT4_ERROR_INODE(inode, "corrupted xattr entries");
16775369a762STheodore Ts'o 			ret = -EFSCORRUPTED;
16785369a762STheodore Ts'o 			goto out;
16795369a762STheodore Ts'o 		}
1680e50e5129SAndreas Dilger 		if (!last->e_value_inum && last->e_value_size) {
1681ac27a0ecSDave Kleikamp 			size_t offs = le16_to_cpu(last->e_value_offs);
1682ac27a0ecSDave Kleikamp 			if (offs < min_offs)
1683ac27a0ecSDave Kleikamp 				min_offs = offs;
1684ac27a0ecSDave Kleikamp 		}
1685ac27a0ecSDave Kleikamp 	}
1686dec214d0STahsin Erdogan 
1687dec214d0STahsin Erdogan 	/* Check whether we have enough space. */
1688ac27a0ecSDave Kleikamp 	if (i->value) {
1689dec214d0STahsin Erdogan 		size_t free;
1690e50e5129SAndreas Dilger 
1691dec214d0STahsin Erdogan 		free = min_offs - ((void *)last - s->base) - sizeof(__u32);
1692dec214d0STahsin Erdogan 		if (!s->not_found)
1693dec214d0STahsin Erdogan 			free += EXT4_XATTR_LEN(name_len) + old_size;
1694e50e5129SAndreas Dilger 
1695dec214d0STahsin Erdogan 		if (free < EXT4_XATTR_LEN(name_len) + new_size) {
1696dec214d0STahsin Erdogan 			ret = -ENOSPC;
1697dec214d0STahsin Erdogan 			goto out;
1698dec214d0STahsin Erdogan 		}
16999c6e7853STahsin Erdogan 
17009c6e7853STahsin Erdogan 		/*
17019c6e7853STahsin Erdogan 		 * If storing the value in an external inode is an option,
17029c6e7853STahsin Erdogan 		 * reserve space for xattr entries/names in the external
17039c6e7853STahsin Erdogan 		 * attribute block so that a long value does not occupy the
17043088e5a5SBhaskar Chowdhury 		 * whole space and prevent further entries being added.
17059c6e7853STahsin Erdogan 		 */
1706daf83281STahsin Erdogan 		if (ext4_has_feature_ea_inode(inode->i_sb) &&
1707daf83281STahsin Erdogan 		    new_size && is_block &&
17089c6e7853STahsin Erdogan 		    (min_offs + old_size - new_size) <
17099c6e7853STahsin Erdogan 					EXT4_XATTR_BLOCK_RESERVE(inode)) {
17109c6e7853STahsin Erdogan 			ret = -ENOSPC;
17119c6e7853STahsin Erdogan 			goto out;
17129c6e7853STahsin Erdogan 		}
1713ac27a0ecSDave Kleikamp 	}
1714ac27a0ecSDave Kleikamp 
1715dec214d0STahsin Erdogan 	/*
1716dec214d0STahsin Erdogan 	 * Getting access to old and new ea inodes is subject to failures.
1717dec214d0STahsin Erdogan 	 * Finish that work before doing any modifications to the xattr data.
1718dec214d0STahsin Erdogan 	 */
1719dec214d0STahsin Erdogan 	if (!s->not_found && here->e_value_inum) {
1720dec214d0STahsin Erdogan 		ret = ext4_xattr_inode_iget(inode,
1721dec214d0STahsin Erdogan 					    le32_to_cpu(here->e_value_inum),
1722a6d05676STahsin Erdogan 					    le32_to_cpu(here->e_hash),
1723dec214d0STahsin Erdogan 					    &old_ea_inode);
1724dec214d0STahsin Erdogan 		if (ret) {
1725dec214d0STahsin Erdogan 			old_ea_inode = NULL;
1726dec214d0STahsin Erdogan 			goto out;
1727bd9926e8STheodore Ts'o 		}
1728dec214d0STahsin Erdogan 	}
1729dec214d0STahsin Erdogan 	if (i->value && in_inode) {
1730dec214d0STahsin Erdogan 		WARN_ON_ONCE(!i->value_len);
1731dec214d0STahsin Erdogan 
1732dec214d0STahsin Erdogan 		ret = ext4_xattr_inode_alloc_quota(inode, i->value_len);
1733dec214d0STahsin Erdogan 		if (ret)
1734dec214d0STahsin Erdogan 			goto out;
1735dec214d0STahsin Erdogan 
1736dec214d0STahsin Erdogan 		ret = ext4_xattr_inode_lookup_create(handle, inode, i->value,
1737dec214d0STahsin Erdogan 						     i->value_len,
1738dec214d0STahsin Erdogan 						     &new_ea_inode);
1739dec214d0STahsin Erdogan 		if (ret) {
1740dec214d0STahsin Erdogan 			new_ea_inode = NULL;
1741a6d05676STahsin Erdogan 			ext4_xattr_inode_free_quota(inode, NULL, i->value_len);
1742dec214d0STahsin Erdogan 			goto out;
1743dec214d0STahsin Erdogan 		}
1744ac27a0ecSDave Kleikamp 	}
1745ac27a0ecSDave Kleikamp 
1746dec214d0STahsin Erdogan 	if (old_ea_inode) {
1747dec214d0STahsin Erdogan 		/* We are ready to release ref count on the old_ea_inode. */
1748dec214d0STahsin Erdogan 		ret = ext4_xattr_inode_dec_ref(handle, old_ea_inode);
1749dec214d0STahsin Erdogan 		if (ret) {
1750dec214d0STahsin Erdogan 			/* Release newly required ref count on new_ea_inode. */
1751dec214d0STahsin Erdogan 			if (new_ea_inode) {
1752dec214d0STahsin Erdogan 				int err;
1753dec214d0STahsin Erdogan 
1754dec214d0STahsin Erdogan 				err = ext4_xattr_inode_dec_ref(handle,
1755dec214d0STahsin Erdogan 							       new_ea_inode);
1756dec214d0STahsin Erdogan 				if (err)
1757dec214d0STahsin Erdogan 					ext4_warning_inode(new_ea_inode,
1758dec214d0STahsin Erdogan 						  "dec ref new_ea_inode err=%d",
1759dec214d0STahsin Erdogan 						  err);
1760a6d05676STahsin Erdogan 				ext4_xattr_inode_free_quota(inode, new_ea_inode,
1761dec214d0STahsin Erdogan 							    i->value_len);
1762dec214d0STahsin Erdogan 			}
1763dec214d0STahsin Erdogan 			goto out;
1764dec214d0STahsin Erdogan 		}
1765dec214d0STahsin Erdogan 
1766a6d05676STahsin Erdogan 		ext4_xattr_inode_free_quota(inode, old_ea_inode,
1767dec214d0STahsin Erdogan 					    le32_to_cpu(here->e_value_size));
1768dec214d0STahsin Erdogan 	}
1769dec214d0STahsin Erdogan 
1770dec214d0STahsin Erdogan 	/* No failures allowed past this point. */
1771dec214d0STahsin Erdogan 
1772e5d01196STheodore Ts'o 	if (!s->not_found && here->e_value_size && !here->e_value_inum) {
1773ac27a0ecSDave Kleikamp 		/* Remove the old value. */
1774dec214d0STahsin Erdogan 		void *first_val = s->base + min_offs;
1775dec214d0STahsin Erdogan 		size_t offs = le16_to_cpu(here->e_value_offs);
1776dec214d0STahsin Erdogan 		void *val = s->base + offs;
1777dec214d0STahsin Erdogan 
1778dec214d0STahsin Erdogan 		memmove(first_val + old_size, first_val, val - first_val);
1779dec214d0STahsin Erdogan 		memset(first_val, 0, old_size);
1780dec214d0STahsin Erdogan 		min_offs += old_size;
1781ac27a0ecSDave Kleikamp 
1782ac27a0ecSDave Kleikamp 		/* Adjust all value offsets. */
1783ac27a0ecSDave Kleikamp 		last = s->first;
1784ac27a0ecSDave Kleikamp 		while (!IS_LAST_ENTRY(last)) {
1785ac27a0ecSDave Kleikamp 			size_t o = le16_to_cpu(last->e_value_offs);
1786dec214d0STahsin Erdogan 
1787e50e5129SAndreas Dilger 			if (!last->e_value_inum &&
1788e50e5129SAndreas Dilger 			    last->e_value_size && o < offs)
1789dec214d0STahsin Erdogan 				last->e_value_offs = cpu_to_le16(o + old_size);
1790617ba13bSMingming Cao 			last = EXT4_XATTR_NEXT(last);
1791ac27a0ecSDave Kleikamp 		}
1792ac27a0ecSDave Kleikamp 	}
1793dec214d0STahsin Erdogan 
1794ac27a0ecSDave Kleikamp 	if (!i->value) {
1795dec214d0STahsin Erdogan 		/* Remove old name. */
1796617ba13bSMingming Cao 		size_t size = EXT4_XATTR_LEN(name_len);
1797dec214d0STahsin Erdogan 
1798ac27a0ecSDave Kleikamp 		last = ENTRY((void *)last - size);
1799dec214d0STahsin Erdogan 		memmove(here, (void *)here + size,
1800dec214d0STahsin Erdogan 			(void *)last - (void *)here + sizeof(__u32));
1801ac27a0ecSDave Kleikamp 		memset(last, 0, size);
1802dec214d0STahsin Erdogan 	} else if (s->not_found) {
1803dec214d0STahsin Erdogan 		/* Insert new name. */
1804dec214d0STahsin Erdogan 		size_t size = EXT4_XATTR_LEN(name_len);
1805dec214d0STahsin Erdogan 		size_t rest = (void *)last - (void *)here + sizeof(__u32);
1806dec214d0STahsin Erdogan 
1807dec214d0STahsin Erdogan 		memmove((void *)here + size, here, rest);
1808dec214d0STahsin Erdogan 		memset(here, 0, size);
1809dec214d0STahsin Erdogan 		here->e_name_index = i->name_index;
1810dec214d0STahsin Erdogan 		here->e_name_len = name_len;
1811dec214d0STahsin Erdogan 		memcpy(here->e_name, i->name, name_len);
1812dec214d0STahsin Erdogan 	} else {
1813dec214d0STahsin Erdogan 		/* This is an update, reset value info. */
1814dec214d0STahsin Erdogan 		here->e_value_inum = 0;
1815dec214d0STahsin Erdogan 		here->e_value_offs = 0;
1816dec214d0STahsin Erdogan 		here->e_value_size = 0;
1817ac27a0ecSDave Kleikamp 	}
1818ac27a0ecSDave Kleikamp 
1819ac27a0ecSDave Kleikamp 	if (i->value) {
1820dec214d0STahsin Erdogan 		/* Insert new value. */
1821e50e5129SAndreas Dilger 		if (in_inode) {
1822dec214d0STahsin Erdogan 			here->e_value_inum = cpu_to_le32(new_ea_inode->i_ino);
1823e50e5129SAndreas Dilger 		} else if (i->value_len) {
1824dec214d0STahsin Erdogan 			void *val = s->base + min_offs - new_size;
1825e50e5129SAndreas Dilger 
1826dec214d0STahsin Erdogan 			here->e_value_offs = cpu_to_le16(min_offs - new_size);
1827dec214d0STahsin Erdogan 			if (i->value == EXT4_ZERO_XATTR_VALUE) {
1828dec214d0STahsin Erdogan 				memset(val, 0, new_size);
1829dec214d0STahsin Erdogan 			} else {
1830dec214d0STahsin Erdogan 				memcpy(val, i->value, i->value_len);
1831dec214d0STahsin Erdogan 				/* Clear padding bytes. */
1832dec214d0STahsin Erdogan 				memset(val + i->value_len, 0,
1833dec214d0STahsin Erdogan 				       new_size - i->value_len);
1834dec214d0STahsin Erdogan 			}
1835dec214d0STahsin Erdogan 		}
1836dec214d0STahsin Erdogan 		here->e_value_size = cpu_to_le32(i->value_len);
1837dec214d0STahsin Erdogan 	}
1838daf83281STahsin Erdogan 
183932aaf194STahsin Erdogan update_hash:
1840b9fc761eSTahsin Erdogan 	if (i->value) {
1841b9fc761eSTahsin Erdogan 		__le32 hash = 0;
1842b9fc761eSTahsin Erdogan 
1843b9fc761eSTahsin Erdogan 		/* Entry hash calculation. */
1844b9fc761eSTahsin Erdogan 		if (in_inode) {
1845b9fc761eSTahsin Erdogan 			__le32 crc32c_hash;
1846b9fc761eSTahsin Erdogan 
1847b9fc761eSTahsin Erdogan 			/*
1848b9fc761eSTahsin Erdogan 			 * Feed crc32c hash instead of the raw value for entry
1849b9fc761eSTahsin Erdogan 			 * hash calculation. This is to avoid walking
1850b9fc761eSTahsin Erdogan 			 * potentially long value buffer again.
1851b9fc761eSTahsin Erdogan 			 */
1852b9fc761eSTahsin Erdogan 			crc32c_hash = cpu_to_le32(
1853b9fc761eSTahsin Erdogan 				       ext4_xattr_inode_get_hash(new_ea_inode));
1854b9fc761eSTahsin Erdogan 			hash = ext4_xattr_hash_entry(here->e_name,
1855b9fc761eSTahsin Erdogan 						     here->e_name_len,
1856b9fc761eSTahsin Erdogan 						     &crc32c_hash, 1);
1857b9fc761eSTahsin Erdogan 		} else if (is_block) {
185832aaf194STahsin Erdogan 			__le32 *value = s->base + le16_to_cpu(
185932aaf194STahsin Erdogan 							here->e_value_offs);
1860b9fc761eSTahsin Erdogan 
1861b9fc761eSTahsin Erdogan 			hash = ext4_xattr_hash_entry(here->e_name,
1862b9fc761eSTahsin Erdogan 						     here->e_name_len, value,
1863b9fc761eSTahsin Erdogan 						     new_size >> 2);
1864daf83281STahsin Erdogan 		}
1865b9fc761eSTahsin Erdogan 		here->e_hash = hash;
1866b9fc761eSTahsin Erdogan 	}
1867b9fc761eSTahsin Erdogan 
1868b9fc761eSTahsin Erdogan 	if (is_block)
1869b9fc761eSTahsin Erdogan 		ext4_xattr_rehash((struct ext4_xattr_header *)s->base);
1870daf83281STahsin Erdogan 
1871dec214d0STahsin Erdogan 	ret = 0;
1872e50e5129SAndreas Dilger out:
1873dec214d0STahsin Erdogan 	iput(old_ea_inode);
1874dec214d0STahsin Erdogan 	iput(new_ea_inode);
1875dec214d0STahsin Erdogan 	return ret;
1876ac27a0ecSDave Kleikamp }
1877ac27a0ecSDave Kleikamp 
/*
 * Search state for the external xattr block: the generic search cursor
 * plus the buffer head of the block it points into.
 */
struct ext4_xattr_block_find {
	/* Cursor (base/first/end/here/not_found) into the block's data. */
	struct ext4_xattr_search s;
	/* Block read by ext4_xattr_block_find(); reset to NULL if the read fails. */
	struct buffer_head *bh;
};
1882ac27a0ecSDave Kleikamp 
1883ac27a0ecSDave Kleikamp static int
1884617ba13bSMingming Cao ext4_xattr_block_find(struct inode *inode, struct ext4_xattr_info *i,
1885617ba13bSMingming Cao 		      struct ext4_xattr_block_find *bs)
1886ac27a0ecSDave Kleikamp {
1887ac27a0ecSDave Kleikamp 	struct super_block *sb = inode->i_sb;
1888ac27a0ecSDave Kleikamp 	int error;
1889ac27a0ecSDave Kleikamp 
1890ac27a0ecSDave Kleikamp 	ea_idebug(inode, "name=%d.%s, value=%p, value_len=%ld",
1891ac27a0ecSDave Kleikamp 		  i->name_index, i->name, i->value, (long)i->value_len);
1892ac27a0ecSDave Kleikamp 
1893617ba13bSMingming Cao 	if (EXT4_I(inode)->i_file_acl) {
1894ac27a0ecSDave Kleikamp 		/* The inode already has an extended attribute block. */
1895fb265c9cSTheodore Ts'o 		bs->bh = ext4_sb_bread(sb, EXT4_I(inode)->i_file_acl, REQ_PRIO);
18968418897fSJeffle Xu 		if (IS_ERR(bs->bh)) {
18978418897fSJeffle Xu 			error = PTR_ERR(bs->bh);
18988418897fSJeffle Xu 			bs->bh = NULL;
18998418897fSJeffle Xu 			return error;
19008418897fSJeffle Xu 		}
1901ac27a0ecSDave Kleikamp 		ea_bdebug(bs->bh, "b_count=%d, refcount=%d",
1902ac27a0ecSDave Kleikamp 			atomic_read(&(bs->bh->b_count)),
1903ac27a0ecSDave Kleikamp 			le32_to_cpu(BHDR(bs->bh)->h_refcount));
1904de05ca85STheodore Ts'o 		error = ext4_xattr_check_block(inode, bs->bh);
1905de05ca85STheodore Ts'o 		if (error)
1906fb265c9cSTheodore Ts'o 			return error;
1907ac27a0ecSDave Kleikamp 		/* Find the named attribute. */
1908ac27a0ecSDave Kleikamp 		bs->s.base = BHDR(bs->bh);
1909ac27a0ecSDave Kleikamp 		bs->s.first = BFIRST(bs->bh);
1910ac27a0ecSDave Kleikamp 		bs->s.end = bs->bh->b_data + bs->bh->b_size;
1911ac27a0ecSDave Kleikamp 		bs->s.here = bs->s.first;
19129496005dSTheodore Ts'o 		error = xattr_find_entry(inode, &bs->s.here, bs->s.end,
19139496005dSTheodore Ts'o 					 i->name_index, i->name, 1);
1914ac27a0ecSDave Kleikamp 		if (error && error != -ENODATA)
1915fb265c9cSTheodore Ts'o 			return error;
1916ac27a0ecSDave Kleikamp 		bs->s.not_found = error;
1917ac27a0ecSDave Kleikamp 	}
1918fb265c9cSTheodore Ts'o 	return 0;
1919ac27a0ecSDave Kleikamp }
1920ac27a0ecSDave Kleikamp 
/*
 * ext4_xattr_block_set()
 *
 * Apply the change described by @i to the inode's external xattr block,
 * starting from the search state that ext4_xattr_block_find() left in @bs.
 * The function works on a private copy of bs->s, so the caller's cursor
 * is not modified.
 *
 * There are three starting cases:
 *  - An existing block with h_refcount == 1 whose mbcache entry is not
 *    handed back by mb_cache_entry_delete_or_get(): it is modified in
 *    place under the buffer lock.
 *  - Any other existing block: it is copied into a kmemdup()'d buffer
 *    (with h_refcount reset to 1) and the copy is modified.
 *  - No block yet: a zeroed, block-sized buffer with a fresh header is
 *    built and the entry is added to it.
 *
 * At "inserted", if the result still contains entries, the function
 * either shares an identical cached block, keeps the block that was
 * modified in place, or allocates a new block and copies the buffer
 * into it.  Finally i_file_acl is updated and the previous block is
 * released if it differs from the new one.
 *
 * Returns 0, or a negative error number on failure.  -EFSCORRUPTED from
 * ext4_xattr_set_entry() is additionally reported via EXT4_ERROR_INODE().
 */
static int
ext4_xattr_block_set(handle_t *handle, struct inode *inode,
		     struct ext4_xattr_info *i,
		     struct ext4_xattr_block_find *bs)
{
	struct super_block *sb = inode->i_sb;
	struct buffer_head *new_bh = NULL;
	/* Private copy: s->base may be redirected to a temporary buffer. */
	struct ext4_xattr_search s_copy = bs->s;
	struct ext4_xattr_search *s = &s_copy;
	struct mb_cache_entry *ce = NULL;
	int error = 0;
	struct mb_cache *ea_block_cache = EA_BLOCK_CACHE(inode);
	struct inode *ea_inode = NULL, *tmp_inode;
	size_t old_ea_inode_quota = 0;
	unsigned int ea_ino;


#define header(x) ((struct ext4_xattr_header *)(x))

	if (s->base) {
		/*
		 * Byte offset of the found entry within the block, so that
		 * s->here can be re-derived if the block gets cloned.
		 */
		int offset = (char *)s->here - bs->bh->b_data;

		BUFFER_TRACE(bs->bh, "get_write_access");
		error = ext4_journal_get_write_access(handle, sb, bs->bh,
						      EXT4_JTR_NONE);
		if (error)
			goto cleanup;
		lock_buffer(bs->bh);

		if (header(s->base)->h_refcount == cpu_to_le32(1)) {
			__u32 hash = le32_to_cpu(BHDR(bs->bh)->h_hash);

			/*
			 * This must happen under buffer lock for
			 * ext4_xattr_block_set() to reliably detect modified
			 * block
			 */
			if (ea_block_cache) {
				struct mb_cache_entry *oe;

				oe = mb_cache_entry_delete_or_get(ea_block_cache,
					hash, bs->bh->b_blocknr);
				if (oe) {
					/*
					 * Xattr block is getting reused. Leave
					 * it alone.
					 */
					mb_cache_entry_put(ea_block_cache, oe);
					goto clone_block;
				}
			}
			ea_bdebug(bs->bh, "modifying in-place");
			error = ext4_xattr_set_entry(i, s, handle, inode,
						     true /* is_block */);
			/*
			 * The checksum is recomputed and the buffer unlocked
			 * before the result of the update is examined.
			 */
			ext4_xattr_block_csum_set(inode, bs->bh);
			unlock_buffer(bs->bh);
			if (error == -EFSCORRUPTED)
				goto bad_block;
			if (!error)
				error = ext4_handle_dirty_metadata(handle,
								   inode,
								   bs->bh);
			if (error)
				goto cleanup;
			goto inserted;
		}
clone_block:
		/* Modify a private copy of the block, not the block itself. */
		unlock_buffer(bs->bh);
		ea_bdebug(bs->bh, "cloning");
		s->base = kmemdup(BHDR(bs->bh), bs->bh->b_size, GFP_NOFS);
		error = -ENOMEM;
		if (s->base == NULL)
			goto cleanup;
		/* Re-point the cursor into the copy. */
		s->first = ENTRY(header(s->base)+1);
		header(s->base)->h_refcount = cpu_to_le32(1);
		s->here = ENTRY(s->base + offset);
		s->end = s->base + bs->bh->b_size;

		/*
		 * If existing entry points to an xattr inode, we need
		 * to prevent ext4_xattr_set_entry() from decrementing
		 * ref count on it because the reference belongs to the
		 * original block. In this case, make the entry look
		 * like it has an empty value.
		 */
		if (!s->not_found && s->here->e_value_inum) {
			ea_ino = le32_to_cpu(s->here->e_value_inum);
			error = ext4_xattr_inode_iget(inode, ea_ino,
				      le32_to_cpu(s->here->e_hash),
				      &tmp_inode);
			if (error)
				goto cleanup;

			if (!ext4_test_inode_state(tmp_inode,
					EXT4_STATE_LUSTRE_EA_INODE)) {
				/*
				 * Defer quota free call for previous
				 * inode until success is guaranteed.
				 */
				old_ea_inode_quota = le32_to_cpu(
						s->here->e_value_size);
			}
			iput(tmp_inode);

			s->here->e_value_inum = 0;
			s->here->e_value_size = 0;
		}
	} else {
		/* Allocate a buffer where we construct the new block. */
		s->base = kzalloc(sb->s_blocksize, GFP_NOFS);
		error = -ENOMEM;
		if (s->base == NULL)
			goto cleanup;
		header(s->base)->h_magic = cpu_to_le32(EXT4_XATTR_MAGIC);
		header(s->base)->h_blocks = cpu_to_le32(1);
		header(s->base)->h_refcount = cpu_to_le32(1);
		/* The buffer has no entries yet: first and here coincide. */
		s->first = ENTRY(header(s->base)+1);
		s->here = ENTRY(header(s->base)+1);
		s->end = s->base + sb->s_blocksize;
	}

	/* Apply the change to the temporary buffer (clone or new block). */
	error = ext4_xattr_set_entry(i, s, handle, inode, true /* is_block */);
	if (error == -EFSCORRUPTED)
		goto bad_block;
	if (error)
		goto cleanup;

	if (i->value && s->here->e_value_inum) {
		/*
		 * A ref count on ea_inode has been taken as part of the call to
		 * ext4_xattr_set_entry() above. We would like to drop this
		 * extra ref but we have to wait until the xattr block is
		 * initialized and has its own ref count on the ea_inode.
		 */
		ea_ino = le32_to_cpu(s->here->e_value_inum);
		error = ext4_xattr_inode_iget(inode, ea_ino,
					      le32_to_cpu(s->here->e_hash),
					      &ea_inode);
		if (error) {
			ea_inode = NULL;
			goto cleanup;
		}
	}

inserted:
	/* A result without entries needs no block: new_bh stays NULL. */
	if (!IS_LAST_ENTRY(s->first)) {
		new_bh = ext4_xattr_block_cache_find(inode, header(s->base),
						     &ce);
		if (new_bh) {
			/* We found an identical block in the cache. */
			if (new_bh == bs->bh)
				ea_bdebug(new_bh, "keeping");
			else {
				u32 ref;

				WARN_ON_ONCE(dquot_initialize_needed(inode));

				/* The old block is released after updating
				   the inode. */
				error = dquot_alloc_block(inode,
						EXT4_C2B(EXT4_SB(sb), 1));
				if (error)
					goto cleanup;
				BUFFER_TRACE(new_bh, "get_write_access");
				error = ext4_journal_get_write_access(
						handle, sb, new_bh,
						EXT4_JTR_NONE);
				if (error)
					goto cleanup_dquot;
				lock_buffer(new_bh);
				/*
				 * We have to be careful about races with
				 * adding references to xattr block. Once we
				 * hold buffer lock xattr block's state is
				 * stable so we can check the additional
				 * reference fits.
				 */
				ref = le32_to_cpu(BHDR(new_bh)->h_refcount) + 1;
				if (ref > EXT4_XATTR_REFCOUNT_MAX) {
					/*
					 * Undo everything and check mbcache
					 * again.
					 */
					unlock_buffer(new_bh);
					dquot_free_block(inode,
							 EXT4_C2B(EXT4_SB(sb),
								  1));
					brelse(new_bh);
					mb_cache_entry_put(ea_block_cache, ce);
					ce = NULL;
					new_bh = NULL;
					goto inserted;
				}
				BHDR(new_bh)->h_refcount = cpu_to_le32(ref);
				/* The refcount is now at its maximum. */
				if (ref == EXT4_XATTR_REFCOUNT_MAX)
					clear_bit(MBE_REUSABLE_B, &ce->e_flags);
				ea_bdebug(new_bh, "reusing; refcount now=%d",
					  ref);
				ext4_xattr_block_csum_set(inode, new_bh);
				unlock_buffer(new_bh);
				error = ext4_handle_dirty_metadata(handle,
								   inode,
								   new_bh);
				if (error)
					goto cleanup_dquot;
			}
			mb_cache_entry_touch(ea_block_cache, ce);
			mb_cache_entry_put(ea_block_cache, ce);
			ce = NULL;
		} else if (bs->bh && s->base == bs->bh->b_data) {
			/* We were modifying this block in-place. */
			ea_bdebug(bs->bh, "keeping this block");
			ext4_xattr_block_cache_insert(ea_block_cache, bs->bh);
			new_bh = bs->bh;
			/* Extra reference, dropped by brelse(new_bh) at cleanup. */
			get_bh(new_bh);
		} else {
			/* We need to allocate a new block */
			ext4_fsblk_t goal, block;

			WARN_ON_ONCE(dquot_initialize_needed(inode));

			goal = ext4_group_first_block_no(sb,
						EXT4_I(inode)->i_block_group);
			block = ext4_new_meta_blocks(handle, inode, goal, 0,
						     NULL, &error);
			if (error)
				goto cleanup;

			ea_idebug(inode, "creating block %llu",
				  (unsigned long long)block);

			new_bh = sb_getblk(sb, block);
			if (unlikely(!new_bh)) {
				error = -ENOMEM;
				/*
				 * Also the target of the gotos below: free
				 * the block allocated above, then clean up.
				 */
getblk_failed:
				ext4_free_blocks(handle, inode, NULL, block, 1,
						 EXT4_FREE_BLOCKS_METADATA);
				goto cleanup;
			}
			error = ext4_xattr_inode_inc_ref_all(handle, inode,
						      ENTRY(header(s->base)+1));
			if (error)
				goto getblk_failed;
			if (ea_inode) {
				/* Drop the extra ref on ea_inode. */
				error = ext4_xattr_inode_dec_ref(handle,
								 ea_inode);
				if (error)
					ext4_warning_inode(ea_inode,
							   "dec ref error=%d",
							   error);
				iput(ea_inode);
				ea_inode = NULL;
			}

			lock_buffer(new_bh);
			error = ext4_journal_get_create_access(handle, sb,
							new_bh, EXT4_JTR_NONE);
			if (error) {
				unlock_buffer(new_bh);
				/* The original error code is replaced by -EIO. */
				error = -EIO;
				goto getblk_failed;
			}
			/* Copy the temporary buffer into the new block. */
			memcpy(new_bh->b_data, s->base, new_bh->b_size);
			ext4_xattr_block_csum_set(inode, new_bh);
			set_buffer_uptodate(new_bh);
			unlock_buffer(new_bh);
			ext4_xattr_block_cache_insert(ea_block_cache, new_bh);
			error = ext4_handle_dirty_metadata(handle, inode,
							   new_bh);
			if (error)
				goto cleanup;
		}
	}

	/* The quota release deferred in the clone path happens only now. */
	if (old_ea_inode_quota)
		ext4_xattr_inode_free_quota(inode, NULL, old_ea_inode_quota);

	/* Update the inode. */
	EXT4_I(inode)->i_file_acl = new_bh ? new_bh->b_blocknr : 0;

	/* Drop the previous xattr block. */
	if (bs->bh && bs->bh != new_bh) {
		struct ext4_xattr_inode_array *ea_inode_array = NULL;

		ext4_xattr_release_block(handle, inode, bs->bh,
					 &ea_inode_array,
					 0 /* extra_credits */);
		ext4_xattr_inode_array_free(ea_inode_array);
	}
	error = 0;

cleanup:
	/* Reached on success and on failure; 'error' tells which. */
	if (ea_inode) {
		int error2;

		error2 = ext4_xattr_inode_dec_ref(handle, ea_inode);
		if (error2)
			ext4_warning_inode(ea_inode, "dec ref error=%d",
					   error2);

		/* If there was an error, revert the quota charge. */
		if (error)
			ext4_xattr_inode_free_quota(inode, ea_inode,
						    i_size_read(ea_inode));
		iput(ea_inode);
	}
	if (ce)
		mb_cache_entry_put(ea_block_cache, ce);
	brelse(new_bh);
	/*
	 * s->base is a temporary buffer unless it still points at the
	 * data of bs->bh (the in-place case); only the former is freed.
	 */
	if (!(bs->bh && s->base == bs->bh->b_data))
		kfree(s->base);

	return error;

cleanup_dquot:
	/* Undo the dquot_alloc_block() done before sharing a cached block. */
	dquot_free_block(inode, EXT4_C2B(EXT4_SB(sb), 1));
	goto cleanup;

bad_block:
	EXT4_ERROR_INODE(inode, "bad block %llu",
			 EXT4_I(inode)->i_file_acl);
	goto cleanup;

#undef header
}
2247ac27a0ecSDave Kleikamp 
2248879b3825STao Ma int ext4_xattr_ibody_find(struct inode *inode, struct ext4_xattr_info *i,
2249617ba13bSMingming Cao 			  struct ext4_xattr_ibody_find *is)
2250ac27a0ecSDave Kleikamp {
2251617ba13bSMingming Cao 	struct ext4_xattr_ibody_header *header;
2252617ba13bSMingming Cao 	struct ext4_inode *raw_inode;
2253ac27a0ecSDave Kleikamp 	int error;
2254ac27a0ecSDave Kleikamp 
225567d7d8adSBaokun Li 	if (!EXT4_INODE_HAS_XATTR_SPACE(inode))
2256ac27a0ecSDave Kleikamp 		return 0;
225767d7d8adSBaokun Li 
2258617ba13bSMingming Cao 	raw_inode = ext4_raw_inode(&is->iloc);
2259ac27a0ecSDave Kleikamp 	header = IHDR(inode, raw_inode);
2260ac27a0ecSDave Kleikamp 	is->s.base = is->s.first = IFIRST(header);
2261ac27a0ecSDave Kleikamp 	is->s.here = is->s.first;
2262617ba13bSMingming Cao 	is->s.end = (void *)raw_inode + EXT4_SB(inode->i_sb)->s_inode_size;
226319f5fb7aSTheodore Ts'o 	if (ext4_test_inode_state(inode, EXT4_STATE_XATTR)) {
22649e92f48cSTheodore Ts'o 		error = xattr_check_inode(inode, header, is->s.end);
2265ac27a0ecSDave Kleikamp 		if (error)
2266ac27a0ecSDave Kleikamp 			return error;
2267ac27a0ecSDave Kleikamp 		/* Find the named attribute. */
22689496005dSTheodore Ts'o 		error = xattr_find_entry(inode, &is->s.here, is->s.end,
22699496005dSTheodore Ts'o 					 i->name_index, i->name, 0);
2270ac27a0ecSDave Kleikamp 		if (error && error != -ENODATA)
2271ac27a0ecSDave Kleikamp 			return error;
2272ac27a0ecSDave Kleikamp 		is->s.not_found = error;
2273ac27a0ecSDave Kleikamp 	}
2274ac27a0ecSDave Kleikamp 	return 0;
2275ac27a0ecSDave Kleikamp }
2276ac27a0ecSDave Kleikamp 
2277310c097cSRitesh Harjani int ext4_xattr_ibody_set(handle_t *handle, struct inode *inode,
2278617ba13bSMingming Cao 				struct ext4_xattr_info *i,
2279617ba13bSMingming Cao 				struct ext4_xattr_ibody_find *is)
2280ac27a0ecSDave Kleikamp {
2281617ba13bSMingming Cao 	struct ext4_xattr_ibody_header *header;
2282617ba13bSMingming Cao 	struct ext4_xattr_search *s = &is->s;
2283ac27a0ecSDave Kleikamp 	int error;
2284ac27a0ecSDave Kleikamp 
228567d7d8adSBaokun Li 	if (!EXT4_INODE_HAS_XATTR_SPACE(inode))
2286ac27a0ecSDave Kleikamp 		return -ENOSPC;
228767d7d8adSBaokun Li 
2288daf83281STahsin Erdogan 	error = ext4_xattr_set_entry(i, s, handle, inode, false /* is_block */);
2289ac27a0ecSDave Kleikamp 	if (error)
2290ac27a0ecSDave Kleikamp 		return error;
2291617ba13bSMingming Cao 	header = IHDR(inode, ext4_raw_inode(&is->iloc));
2292ac27a0ecSDave Kleikamp 	if (!IS_LAST_ENTRY(s->first)) {
2293617ba13bSMingming Cao 		header->h_magic = cpu_to_le32(EXT4_XATTR_MAGIC);
229419f5fb7aSTheodore Ts'o 		ext4_set_inode_state(inode, EXT4_STATE_XATTR);
2295ac27a0ecSDave Kleikamp 	} else {
2296ac27a0ecSDave Kleikamp 		header->h_magic = cpu_to_le32(0);
229719f5fb7aSTheodore Ts'o 		ext4_clear_inode_state(inode, EXT4_STATE_XATTR);
2298ac27a0ecSDave Kleikamp 	}
2299ac27a0ecSDave Kleikamp 	return 0;
2300ac27a0ecSDave Kleikamp }
2301ac27a0ecSDave Kleikamp 
23023fd16462SJan Kara static int ext4_xattr_value_same(struct ext4_xattr_search *s,
23033fd16462SJan Kara 				 struct ext4_xattr_info *i)
23043fd16462SJan Kara {
23053fd16462SJan Kara 	void *value;
23063fd16462SJan Kara 
23070bd454c0STahsin Erdogan 	/* When e_value_inum is set the value is stored externally. */
23080bd454c0STahsin Erdogan 	if (s->here->e_value_inum)
23090bd454c0STahsin Erdogan 		return 0;
23103fd16462SJan Kara 	if (le32_to_cpu(s->here->e_value_size) != i->value_len)
23113fd16462SJan Kara 		return 0;
23123fd16462SJan Kara 	value = ((void *)s->base) + le16_to_cpu(s->here->e_value_offs);
23133fd16462SJan Kara 	return !memcmp(value, i->value, i->value_len);
23143fd16462SJan Kara }
23153fd16462SJan Kara 
2316dec214d0STahsin Erdogan static struct buffer_head *ext4_xattr_get_block(struct inode *inode)
2317dec214d0STahsin Erdogan {
2318dec214d0STahsin Erdogan 	struct buffer_head *bh;
2319dec214d0STahsin Erdogan 	int error;
2320dec214d0STahsin Erdogan 
2321dec214d0STahsin Erdogan 	if (!EXT4_I(inode)->i_file_acl)
2322dec214d0STahsin Erdogan 		return NULL;
2323fb265c9cSTheodore Ts'o 	bh = ext4_sb_bread(inode->i_sb, EXT4_I(inode)->i_file_acl, REQ_PRIO);
2324fb265c9cSTheodore Ts'o 	if (IS_ERR(bh))
2325fb265c9cSTheodore Ts'o 		return bh;
2326dec214d0STahsin Erdogan 	error = ext4_xattr_check_block(inode, bh);
2327ecaaf408SVasily Averin 	if (error) {
2328ecaaf408SVasily Averin 		brelse(bh);
2329dec214d0STahsin Erdogan 		return ERR_PTR(error);
2330ecaaf408SVasily Averin 	}
2331dec214d0STahsin Erdogan 	return bh;
2332dec214d0STahsin Erdogan }
2333dec214d0STahsin Erdogan 
2334ac27a0ecSDave Kleikamp /*
2335617ba13bSMingming Cao  * ext4_xattr_set_handle()
2336ac27a0ecSDave Kleikamp  *
23376e9510b0SWang Sheng-Hui  * Create, replace or remove an extended attribute for this inode.  Value
2338ac27a0ecSDave Kleikamp  * is NULL to remove an existing extended attribute, and non-NULL to
2339ac27a0ecSDave Kleikamp  * either replace an existing extended attribute, or create a new extended
2340ac27a0ecSDave Kleikamp  * attribute. The flags XATTR_REPLACE and XATTR_CREATE
2341ac27a0ecSDave Kleikamp  * specify that an extended attribute must exist and must not exist
2342ac27a0ecSDave Kleikamp  * previous to the call, respectively.
2343ac27a0ecSDave Kleikamp  *
2344ac27a0ecSDave Kleikamp  * Returns 0, or a negative error number on failure.
2345ac27a0ecSDave Kleikamp  */
2346ac27a0ecSDave Kleikamp int
2347617ba13bSMingming Cao ext4_xattr_set_handle(handle_t *handle, struct inode *inode, int name_index,
2348ac27a0ecSDave Kleikamp 		      const char *name, const void *value, size_t value_len,
2349ac27a0ecSDave Kleikamp 		      int flags)
2350ac27a0ecSDave Kleikamp {
2351617ba13bSMingming Cao 	struct ext4_xattr_info i = {
2352ac27a0ecSDave Kleikamp 		.name_index = name_index,
2353ac27a0ecSDave Kleikamp 		.name = name,
2354ac27a0ecSDave Kleikamp 		.value = value,
2355ac27a0ecSDave Kleikamp 		.value_len = value_len,
2356e50e5129SAndreas Dilger 		.in_inode = 0,
2357ac27a0ecSDave Kleikamp 	};
2358617ba13bSMingming Cao 	struct ext4_xattr_ibody_find is = {
2359ac27a0ecSDave Kleikamp 		.s = { .not_found = -ENODATA, },
2360ac27a0ecSDave Kleikamp 	};
2361617ba13bSMingming Cao 	struct ext4_xattr_block_find bs = {
2362ac27a0ecSDave Kleikamp 		.s = { .not_found = -ENODATA, },
2363ac27a0ecSDave Kleikamp 	};
2364c755e251STheodore Ts'o 	int no_expand;
2365ac27a0ecSDave Kleikamp 	int error;
2366ac27a0ecSDave Kleikamp 
2367ac27a0ecSDave Kleikamp 	if (!name)
2368ac27a0ecSDave Kleikamp 		return -EINVAL;
2369ac27a0ecSDave Kleikamp 	if (strlen(name) > 255)
2370ac27a0ecSDave Kleikamp 		return -ERANGE;
2371b8cb5a54STahsin Erdogan 
2372c755e251STheodore Ts'o 	ext4_write_lock_xattr(inode, &no_expand);
23734d20c685SKalpak Shah 
2374c1a5d5f6STahsin Erdogan 	/* Check journal credits under write lock. */
2375c1a5d5f6STahsin Erdogan 	if (ext4_handle_valid(handle)) {
2376dec214d0STahsin Erdogan 		struct buffer_head *bh;
2377c1a5d5f6STahsin Erdogan 		int credits;
2378c1a5d5f6STahsin Erdogan 
2379dec214d0STahsin Erdogan 		bh = ext4_xattr_get_block(inode);
2380dec214d0STahsin Erdogan 		if (IS_ERR(bh)) {
2381dec214d0STahsin Erdogan 			error = PTR_ERR(bh);
2382dec214d0STahsin Erdogan 			goto cleanup;
2383dec214d0STahsin Erdogan 		}
2384dec214d0STahsin Erdogan 
2385af65207cSTahsin Erdogan 		credits = __ext4_xattr_set_credits(inode->i_sb, inode, bh,
2386af65207cSTahsin Erdogan 						   value_len,
2387af65207cSTahsin Erdogan 						   flags & XATTR_CREATE);
2388dec214d0STahsin Erdogan 		brelse(bh);
2389dec214d0STahsin Erdogan 
2390a9a8344eSJan Kara 		if (jbd2_handle_buffer_credits(handle) < credits) {
2391c1a5d5f6STahsin Erdogan 			error = -ENOSPC;
2392c1a5d5f6STahsin Erdogan 			goto cleanup;
2393c1a5d5f6STahsin Erdogan 		}
2394163f0ec1SJan Kara 		WARN_ON_ONCE(!(current->flags & PF_MEMALLOC_NOFS));
2395c1a5d5f6STahsin Erdogan 	}
2396c1a5d5f6STahsin Erdogan 
239766543617SEric Sandeen 	error = ext4_reserve_inode_write(handle, inode, &is.iloc);
239886ebfd08SEric Sandeen 	if (error)
239986ebfd08SEric Sandeen 		goto cleanup;
240086ebfd08SEric Sandeen 
240119f5fb7aSTheodore Ts'o 	if (ext4_test_inode_state(inode, EXT4_STATE_NEW)) {
2402617ba13bSMingming Cao 		struct ext4_inode *raw_inode = ext4_raw_inode(&is.iloc);
2403617ba13bSMingming Cao 		memset(raw_inode, 0, EXT4_SB(inode->i_sb)->s_inode_size);
240419f5fb7aSTheodore Ts'o 		ext4_clear_inode_state(inode, EXT4_STATE_NEW);
2405ac27a0ecSDave Kleikamp 	}
2406ac27a0ecSDave Kleikamp 
2407617ba13bSMingming Cao 	error = ext4_xattr_ibody_find(inode, &i, &is);
2408ac27a0ecSDave Kleikamp 	if (error)
2409ac27a0ecSDave Kleikamp 		goto cleanup;
2410ac27a0ecSDave Kleikamp 	if (is.s.not_found)
2411617ba13bSMingming Cao 		error = ext4_xattr_block_find(inode, &i, &bs);
2412ac27a0ecSDave Kleikamp 	if (error)
2413ac27a0ecSDave Kleikamp 		goto cleanup;
2414ac27a0ecSDave Kleikamp 	if (is.s.not_found && bs.s.not_found) {
2415ac27a0ecSDave Kleikamp 		error = -ENODATA;
2416ac27a0ecSDave Kleikamp 		if (flags & XATTR_REPLACE)
2417ac27a0ecSDave Kleikamp 			goto cleanup;
2418ac27a0ecSDave Kleikamp 		error = 0;
2419ac27a0ecSDave Kleikamp 		if (!value)
2420ac27a0ecSDave Kleikamp 			goto cleanup;
2421ac27a0ecSDave Kleikamp 	} else {
2422ac27a0ecSDave Kleikamp 		error = -EEXIST;
2423ac27a0ecSDave Kleikamp 		if (flags & XATTR_CREATE)
2424ac27a0ecSDave Kleikamp 			goto cleanup;
2425ac27a0ecSDave Kleikamp 	}
2426dec214d0STahsin Erdogan 
2427ac27a0ecSDave Kleikamp 	if (!value) {
2428ac27a0ecSDave Kleikamp 		if (!is.s.not_found)
2429e50e5129SAndreas Dilger 			error = ext4_xattr_ibody_set(handle, inode, &i, &is);
2430ac27a0ecSDave Kleikamp 		else if (!bs.s.not_found)
2431617ba13bSMingming Cao 			error = ext4_xattr_block_set(handle, inode, &i, &bs);
2432ac27a0ecSDave Kleikamp 	} else {
24333fd16462SJan Kara 		error = 0;
24343fd16462SJan Kara 		/* Xattr value did not change? Save us some work and bail out */
24353fd16462SJan Kara 		if (!is.s.not_found && ext4_xattr_value_same(&is.s, &i))
24363fd16462SJan Kara 			goto cleanup;
24373fd16462SJan Kara 		if (!bs.s.not_found && ext4_xattr_value_same(&bs.s, &i))
24383fd16462SJan Kara 			goto cleanup;
24393fd16462SJan Kara 
2440b347e2bcSTahsin Erdogan 		if (ext4_has_feature_ea_inode(inode->i_sb) &&
2441b347e2bcSTahsin Erdogan 		    (EXT4_XATTR_SIZE(i.value_len) >
2442b347e2bcSTahsin Erdogan 			EXT4_XATTR_MIN_LARGE_EA_SIZE(inode->i_sb->s_blocksize)))
2443b347e2bcSTahsin Erdogan 			i.in_inode = 1;
2444b347e2bcSTahsin Erdogan retry_inode:
2445e50e5129SAndreas Dilger 		error = ext4_xattr_ibody_set(handle, inode, &i, &is);
2446ac27a0ecSDave Kleikamp 		if (!error && !bs.s.not_found) {
2447ac27a0ecSDave Kleikamp 			i.value = NULL;
2448617ba13bSMingming Cao 			error = ext4_xattr_block_set(handle, inode, &i, &bs);
2449ac27a0ecSDave Kleikamp 		} else if (error == -ENOSPC) {
24507e01c8e5STiger Yang 			if (EXT4_I(inode)->i_file_acl && !bs.s.base) {
245145ae932dSVasily Averin 				brelse(bs.bh);
245245ae932dSVasily Averin 				bs.bh = NULL;
24537e01c8e5STiger Yang 				error = ext4_xattr_block_find(inode, &i, &bs);
24547e01c8e5STiger Yang 				if (error)
24557e01c8e5STiger Yang 					goto cleanup;
24567e01c8e5STiger Yang 			}
2457617ba13bSMingming Cao 			error = ext4_xattr_block_set(handle, inode, &i, &bs);
2458b347e2bcSTahsin Erdogan 			if (!error && !is.s.not_found) {
2459ac27a0ecSDave Kleikamp 				i.value = NULL;
2460e50e5129SAndreas Dilger 				error = ext4_xattr_ibody_set(handle, inode, &i,
2461e50e5129SAndreas Dilger 							     &is);
2462b347e2bcSTahsin Erdogan 			} else if (error == -ENOSPC) {
2463b347e2bcSTahsin Erdogan 				/*
2464b347e2bcSTahsin Erdogan 				 * Xattr does not fit in the block, store at
2465b347e2bcSTahsin Erdogan 				 * external inode if possible.
2466b347e2bcSTahsin Erdogan 				 */
2467b347e2bcSTahsin Erdogan 				if (ext4_has_feature_ea_inode(inode->i_sb) &&
24686b224899Szhangyi (F) 				    i.value_len && !i.in_inode) {
2469b347e2bcSTahsin Erdogan 					i.in_inode = 1;
2470b347e2bcSTahsin Erdogan 					goto retry_inode;
2471b347e2bcSTahsin Erdogan 				}
2472ac27a0ecSDave Kleikamp 			}
2473ac27a0ecSDave Kleikamp 		}
2474ac27a0ecSDave Kleikamp 	}
2475ac27a0ecSDave Kleikamp 	if (!error) {
2476617ba13bSMingming Cao 		ext4_xattr_update_super_block(handle, inode->i_sb);
2477eeca7ea1SDeepa Dinamani 		inode->i_ctime = current_time(inode);
2478a642c2c0SJeff Layton 		inode_inc_iversion(inode);
24796dd4ee7cSKalpak Shah 		if (!value)
2480c755e251STheodore Ts'o 			no_expand = 0;
2481617ba13bSMingming Cao 		error = ext4_mark_iloc_dirty(handle, inode, &is.iloc);
2482ac27a0ecSDave Kleikamp 		/*
2483617ba13bSMingming Cao 		 * The bh is consumed by ext4_mark_iloc_dirty, even with
2484ac27a0ecSDave Kleikamp 		 * error != 0.
2485ac27a0ecSDave Kleikamp 		 */
2486ac27a0ecSDave Kleikamp 		is.iloc.bh = NULL;
2487ac27a0ecSDave Kleikamp 		if (IS_SYNC(inode))
24880390131bSFrank Mayhar 			ext4_handle_sync(handle);
2489ac27a0ecSDave Kleikamp 	}
2490e85c81baSXin Yin 	ext4_fc_mark_ineligible(inode->i_sb, EXT4_FC_REASON_XATTR, handle);
2491ac27a0ecSDave Kleikamp 
2492ac27a0ecSDave Kleikamp cleanup:
2493ac27a0ecSDave Kleikamp 	brelse(is.iloc.bh);
2494ac27a0ecSDave Kleikamp 	brelse(bs.bh);
2495c755e251STheodore Ts'o 	ext4_write_unlock_xattr(inode, &no_expand);
2496ac27a0ecSDave Kleikamp 	return error;
2497ac27a0ecSDave Kleikamp }
2498ac27a0ecSDave Kleikamp 
2499af65207cSTahsin Erdogan int ext4_xattr_set_credits(struct inode *inode, size_t value_len,
2500af65207cSTahsin Erdogan 			   bool is_create, int *credits)
2501c1a5d5f6STahsin Erdogan {
2502dec214d0STahsin Erdogan 	struct buffer_head *bh;
2503dec214d0STahsin Erdogan 	int err;
2504c1a5d5f6STahsin Erdogan 
2505dec214d0STahsin Erdogan 	*credits = 0;
2506dec214d0STahsin Erdogan 
2507dec214d0STahsin Erdogan 	if (!EXT4_SB(inode->i_sb)->s_journal)
2508c1a5d5f6STahsin Erdogan 		return 0;
2509c1a5d5f6STahsin Erdogan 
2510dec214d0STahsin Erdogan 	down_read(&EXT4_I(inode)->xattr_sem);
2511c1a5d5f6STahsin Erdogan 
2512dec214d0STahsin Erdogan 	bh = ext4_xattr_get_block(inode);
2513dec214d0STahsin Erdogan 	if (IS_ERR(bh)) {
2514dec214d0STahsin Erdogan 		err = PTR_ERR(bh);
2515dec214d0STahsin Erdogan 	} else {
2516af65207cSTahsin Erdogan 		*credits = __ext4_xattr_set_credits(inode->i_sb, inode, bh,
2517af65207cSTahsin Erdogan 						    value_len, is_create);
2518dec214d0STahsin Erdogan 		brelse(bh);
2519dec214d0STahsin Erdogan 		err = 0;
2520c1a5d5f6STahsin Erdogan 	}
2521dec214d0STahsin Erdogan 
2522dec214d0STahsin Erdogan 	up_read(&EXT4_I(inode)->xattr_sem);
2523dec214d0STahsin Erdogan 	return err;
2524c1a5d5f6STahsin Erdogan }
2525c1a5d5f6STahsin Erdogan 
2526ac27a0ecSDave Kleikamp /*
2527617ba13bSMingming Cao  * ext4_xattr_set()
2528ac27a0ecSDave Kleikamp  *
2529617ba13bSMingming Cao  * Like ext4_xattr_set_handle, but start from an inode. This extended
2530ac27a0ecSDave Kleikamp  * attribute modification is a filesystem transaction by itself.
2531ac27a0ecSDave Kleikamp  *
2532ac27a0ecSDave Kleikamp  * Returns 0, or a negative error number on failure.
2533ac27a0ecSDave Kleikamp  */
2534ac27a0ecSDave Kleikamp int
2535617ba13bSMingming Cao ext4_xattr_set(struct inode *inode, int name_index, const char *name,
2536ac27a0ecSDave Kleikamp 	       const void *value, size_t value_len, int flags)
2537ac27a0ecSDave Kleikamp {
2538ac27a0ecSDave Kleikamp 	handle_t *handle;
2539e50e5129SAndreas Dilger 	struct super_block *sb = inode->i_sb;
2540ac27a0ecSDave Kleikamp 	int error, retries = 0;
2541c1a5d5f6STahsin Erdogan 	int credits;
2542ac27a0ecSDave Kleikamp 
2543b8cb5a54STahsin Erdogan 	error = dquot_initialize(inode);
2544b8cb5a54STahsin Erdogan 	if (error)
2545b8cb5a54STahsin Erdogan 		return error;
2546e50e5129SAndreas Dilger 
2547ac27a0ecSDave Kleikamp retry:
2548af65207cSTahsin Erdogan 	error = ext4_xattr_set_credits(inode, value_len, flags & XATTR_CREATE,
2549af65207cSTahsin Erdogan 				       &credits);
2550dec214d0STahsin Erdogan 	if (error)
2551dec214d0STahsin Erdogan 		return error;
2552dec214d0STahsin Erdogan 
25539924a92aSTheodore Ts'o 	handle = ext4_journal_start(inode, EXT4_HT_XATTR, credits);
2554ac27a0ecSDave Kleikamp 	if (IS_ERR(handle)) {
2555ac27a0ecSDave Kleikamp 		error = PTR_ERR(handle);
2556ac27a0ecSDave Kleikamp 	} else {
2557ac27a0ecSDave Kleikamp 		int error2;
2558ac27a0ecSDave Kleikamp 
2559617ba13bSMingming Cao 		error = ext4_xattr_set_handle(handle, inode, name_index, name,
2560ac27a0ecSDave Kleikamp 					      value, value_len, flags);
2561617ba13bSMingming Cao 		error2 = ext4_journal_stop(handle);
2562ac27a0ecSDave Kleikamp 		if (error == -ENOSPC &&
2563e50e5129SAndreas Dilger 		    ext4_should_retry_alloc(sb, &retries))
2564ac27a0ecSDave Kleikamp 			goto retry;
2565ac27a0ecSDave Kleikamp 		if (error == 0)
2566ac27a0ecSDave Kleikamp 			error = error2;
2567ac27a0ecSDave Kleikamp 	}
2568e85c81baSXin Yin 	ext4_fc_mark_ineligible(inode->i_sb, EXT4_FC_REASON_XATTR, NULL);
2569ac27a0ecSDave Kleikamp 
2570ac27a0ecSDave Kleikamp 	return error;
2571ac27a0ecSDave Kleikamp }
2572ac27a0ecSDave Kleikamp 
2573ac27a0ecSDave Kleikamp /*
25746dd4ee7cSKalpak Shah  * Shift the EA entries in the inode to create space for the increased
25756dd4ee7cSKalpak Shah  * i_extra_isize.
25766dd4ee7cSKalpak Shah  */
25776dd4ee7cSKalpak Shah static void ext4_xattr_shift_entries(struct ext4_xattr_entry *entry,
25786dd4ee7cSKalpak Shah 				     int value_offs_shift, void *to,
257994405713SJan Kara 				     void *from, size_t n)
25806dd4ee7cSKalpak Shah {
25816dd4ee7cSKalpak Shah 	struct ext4_xattr_entry *last = entry;
25826dd4ee7cSKalpak Shah 	int new_offs;
25836dd4ee7cSKalpak Shah 
258494405713SJan Kara 	/* We always shift xattr headers further thus offsets get lower */
258594405713SJan Kara 	BUG_ON(value_offs_shift > 0);
258694405713SJan Kara 
25876dd4ee7cSKalpak Shah 	/* Adjust the value offsets of the entries */
25886dd4ee7cSKalpak Shah 	for (; !IS_LAST_ENTRY(last); last = EXT4_XATTR_NEXT(last)) {
2589e50e5129SAndreas Dilger 		if (!last->e_value_inum && last->e_value_size) {
25906dd4ee7cSKalpak Shah 			new_offs = le16_to_cpu(last->e_value_offs) +
25916dd4ee7cSKalpak Shah 							value_offs_shift;
25926dd4ee7cSKalpak Shah 			last->e_value_offs = cpu_to_le16(new_offs);
25936dd4ee7cSKalpak Shah 		}
25946dd4ee7cSKalpak Shah 	}
25956dd4ee7cSKalpak Shah 	/* Shift the entries by n bytes */
25966dd4ee7cSKalpak Shah 	memmove(to, from, n);
25976dd4ee7cSKalpak Shah }
25986dd4ee7cSKalpak Shah 
25996dd4ee7cSKalpak Shah /*
26003f2571c1SJan Kara  * Move xattr pointed to by 'entry' from inode into external xattr block
26013f2571c1SJan Kara  */
26023f2571c1SJan Kara static int ext4_xattr_move_to_block(handle_t *handle, struct inode *inode,
26033f2571c1SJan Kara 				    struct ext4_inode *raw_inode,
26043f2571c1SJan Kara 				    struct ext4_xattr_entry *entry)
26053f2571c1SJan Kara {
26063f2571c1SJan Kara 	struct ext4_xattr_ibody_find *is = NULL;
26073f2571c1SJan Kara 	struct ext4_xattr_block_find *bs = NULL;
26083f2571c1SJan Kara 	char *buffer = NULL, *b_entry_name = NULL;
2609f6109100STahsin Erdogan 	size_t value_size = le32_to_cpu(entry->e_value_size);
26103f2571c1SJan Kara 	struct ext4_xattr_info i = {
26113f2571c1SJan Kara 		.value = NULL,
26123f2571c1SJan Kara 		.value_len = 0,
26133f2571c1SJan Kara 		.name_index = entry->e_name_index,
2614f6109100STahsin Erdogan 		.in_inode = !!entry->e_value_inum,
26153f2571c1SJan Kara 	};
26163f2571c1SJan Kara 	struct ext4_xattr_ibody_header *header = IHDR(inode, raw_inode);
26173f2571c1SJan Kara 	int error;
26183f2571c1SJan Kara 
26193f2571c1SJan Kara 	is = kzalloc(sizeof(struct ext4_xattr_ibody_find), GFP_NOFS);
26203f2571c1SJan Kara 	bs = kzalloc(sizeof(struct ext4_xattr_block_find), GFP_NOFS);
26213f2571c1SJan Kara 	b_entry_name = kmalloc(entry->e_name_len + 1, GFP_NOFS);
26221e9d62d2SJun Nie 	if (!is || !bs || !b_entry_name) {
26233f2571c1SJan Kara 		error = -ENOMEM;
26243f2571c1SJan Kara 		goto out;
26253f2571c1SJan Kara 	}
26263f2571c1SJan Kara 
26273f2571c1SJan Kara 	is->s.not_found = -ENODATA;
26283f2571c1SJan Kara 	bs->s.not_found = -ENODATA;
26293f2571c1SJan Kara 	is->iloc.bh = NULL;
26303f2571c1SJan Kara 	bs->bh = NULL;
26313f2571c1SJan Kara 
26323f2571c1SJan Kara 	/* Save the entry name and the entry value */
2633f6109100STahsin Erdogan 	if (entry->e_value_inum) {
26341e9d62d2SJun Nie 		buffer = kvmalloc(value_size, GFP_NOFS);
26351e9d62d2SJun Nie 		if (!buffer) {
26361e9d62d2SJun Nie 			error = -ENOMEM;
26371e9d62d2SJun Nie 			goto out;
26381e9d62d2SJun Nie 		}
26391e9d62d2SJun Nie 
2640b9fc761eSTahsin Erdogan 		error = ext4_xattr_inode_get(inode, entry, buffer, value_size);
2641f6109100STahsin Erdogan 		if (error)
2642f6109100STahsin Erdogan 			goto out;
2643f6109100STahsin Erdogan 	} else {
2644f6109100STahsin Erdogan 		size_t value_offs = le16_to_cpu(entry->e_value_offs);
26451e9d62d2SJun Nie 		buffer = (void *)IFIRST(header) + value_offs;
2646f6109100STahsin Erdogan 	}
2647f6109100STahsin Erdogan 
26483f2571c1SJan Kara 	memcpy(b_entry_name, entry->e_name, entry->e_name_len);
26493f2571c1SJan Kara 	b_entry_name[entry->e_name_len] = '\0';
26503f2571c1SJan Kara 	i.name = b_entry_name;
26513f2571c1SJan Kara 
26523f2571c1SJan Kara 	error = ext4_get_inode_loc(inode, &is->iloc);
26533f2571c1SJan Kara 	if (error)
26543f2571c1SJan Kara 		goto out;
26553f2571c1SJan Kara 
26563f2571c1SJan Kara 	error = ext4_xattr_ibody_find(inode, &i, is);
26573f2571c1SJan Kara 	if (error)
26583f2571c1SJan Kara 		goto out;
26593f2571c1SJan Kara 
26603f2571c1SJan Kara 	i.value = buffer;
26613f2571c1SJan Kara 	i.value_len = value_size;
26623f2571c1SJan Kara 	error = ext4_xattr_block_find(inode, &i, bs);
26633f2571c1SJan Kara 	if (error)
26643f2571c1SJan Kara 		goto out;
26653f2571c1SJan Kara 
26661e9d62d2SJun Nie 	/* Move ea entry from the inode into the block */
26673f2571c1SJan Kara 	error = ext4_xattr_block_set(handle, inode, &i, bs);
26683f2571c1SJan Kara 	if (error)
26693f2571c1SJan Kara 		goto out;
26701e9d62d2SJun Nie 
26711e9d62d2SJun Nie 	/* Remove the chosen entry from the inode */
26721e9d62d2SJun Nie 	i.value = NULL;
26731e9d62d2SJun Nie 	i.value_len = 0;
26741e9d62d2SJun Nie 	error = ext4_xattr_ibody_set(handle, inode, &i, is);
26751e9d62d2SJun Nie 
26763f2571c1SJan Kara out:
26773f2571c1SJan Kara 	kfree(b_entry_name);
26781e9d62d2SJun Nie 	if (entry->e_value_inum && buffer)
2679cc12a6f2SYe Bin 		kvfree(buffer);
26803f2571c1SJan Kara 	if (is)
26813f2571c1SJan Kara 		brelse(is->iloc.bh);
26826bdc9977SVasily Averin 	if (bs)
26836bdc9977SVasily Averin 		brelse(bs->bh);
26843f2571c1SJan Kara 	kfree(is);
26853f2571c1SJan Kara 	kfree(bs);
26863f2571c1SJan Kara 
26873f2571c1SJan Kara 	return error;
26883f2571c1SJan Kara }
26893f2571c1SJan Kara 
2690dfa2064bSJan Kara static int ext4_xattr_make_inode_space(handle_t *handle, struct inode *inode,
2691dfa2064bSJan Kara 				       struct ext4_inode *raw_inode,
2692dfa2064bSJan Kara 				       int isize_diff, size_t ifree,
2693dfa2064bSJan Kara 				       size_t bfree, int *total_ino)
2694dfa2064bSJan Kara {
2695dfa2064bSJan Kara 	struct ext4_xattr_ibody_header *header = IHDR(inode, raw_inode);
2696dfa2064bSJan Kara 	struct ext4_xattr_entry *small_entry;
2697dfa2064bSJan Kara 	struct ext4_xattr_entry *entry;
2698dfa2064bSJan Kara 	struct ext4_xattr_entry *last;
2699dfa2064bSJan Kara 	unsigned int entry_size;	/* EA entry size */
2700dfa2064bSJan Kara 	unsigned int total_size;	/* EA entry size + value size */
2701dfa2064bSJan Kara 	unsigned int min_total_size;
2702dfa2064bSJan Kara 	int error;
2703dfa2064bSJan Kara 
2704dfa2064bSJan Kara 	while (isize_diff > ifree) {
2705dfa2064bSJan Kara 		entry = NULL;
2706dfa2064bSJan Kara 		small_entry = NULL;
2707dfa2064bSJan Kara 		min_total_size = ~0U;
2708dfa2064bSJan Kara 		last = IFIRST(header);
2709dfa2064bSJan Kara 		/* Find the entry best suited to be pushed into EA block */
2710dfa2064bSJan Kara 		for (; !IS_LAST_ENTRY(last); last = EXT4_XATTR_NEXT(last)) {
27118cdb5240STheodore Ts'o 			/* never move system.data out of the inode */
27128cdb5240STheodore Ts'o 			if ((last->e_name_len == 4) &&
27138cdb5240STheodore Ts'o 			    (last->e_name_index == EXT4_XATTR_INDEX_SYSTEM) &&
27148cdb5240STheodore Ts'o 			    !memcmp(last->e_name, "data", 4))
27158cdb5240STheodore Ts'o 				continue;
27169bb21cedSTahsin Erdogan 			total_size = EXT4_XATTR_LEN(last->e_name_len);
27179bb21cedSTahsin Erdogan 			if (!last->e_value_inum)
27189bb21cedSTahsin Erdogan 				total_size += EXT4_XATTR_SIZE(
27199bb21cedSTahsin Erdogan 					       le32_to_cpu(last->e_value_size));
2720dfa2064bSJan Kara 			if (total_size <= bfree &&
2721dfa2064bSJan Kara 			    total_size < min_total_size) {
2722dfa2064bSJan Kara 				if (total_size + ifree < isize_diff) {
2723dfa2064bSJan Kara 					small_entry = last;
2724dfa2064bSJan Kara 				} else {
2725dfa2064bSJan Kara 					entry = last;
2726dfa2064bSJan Kara 					min_total_size = total_size;
2727dfa2064bSJan Kara 				}
2728dfa2064bSJan Kara 			}
2729dfa2064bSJan Kara 		}
2730dfa2064bSJan Kara 
2731dfa2064bSJan Kara 		if (entry == NULL) {
2732dfa2064bSJan Kara 			if (small_entry == NULL)
2733dfa2064bSJan Kara 				return -ENOSPC;
2734dfa2064bSJan Kara 			entry = small_entry;
2735dfa2064bSJan Kara 		}
2736dfa2064bSJan Kara 
2737dfa2064bSJan Kara 		entry_size = EXT4_XATTR_LEN(entry->e_name_len);
27389bb21cedSTahsin Erdogan 		total_size = entry_size;
27399bb21cedSTahsin Erdogan 		if (!entry->e_value_inum)
27409bb21cedSTahsin Erdogan 			total_size += EXT4_XATTR_SIZE(
27419bb21cedSTahsin Erdogan 					      le32_to_cpu(entry->e_value_size));
2742dfa2064bSJan Kara 		error = ext4_xattr_move_to_block(handle, inode, raw_inode,
2743dfa2064bSJan Kara 						 entry);
2744dfa2064bSJan Kara 		if (error)
2745dfa2064bSJan Kara 			return error;
2746dfa2064bSJan Kara 
2747dfa2064bSJan Kara 		*total_ino -= entry_size;
2748dfa2064bSJan Kara 		ifree += total_size;
2749dfa2064bSJan Kara 		bfree -= total_size;
2750dfa2064bSJan Kara 	}
2751dfa2064bSJan Kara 
2752dfa2064bSJan Kara 	return 0;
2753dfa2064bSJan Kara }
2754dfa2064bSJan Kara 
27553f2571c1SJan Kara /*
27566dd4ee7cSKalpak Shah  * Expand an inode by new_extra_isize bytes when EAs are present.
27576dd4ee7cSKalpak Shah  * Returns 0 on success or negative error number on failure.
27586dd4ee7cSKalpak Shah  */
27596dd4ee7cSKalpak Shah int ext4_expand_extra_isize_ea(struct inode *inode, int new_extra_isize,
27606dd4ee7cSKalpak Shah 			       struct ext4_inode *raw_inode, handle_t *handle)
27616dd4ee7cSKalpak Shah {
27626dd4ee7cSKalpak Shah 	struct ext4_xattr_ibody_header *header;
2763cf0a5e81SMiao Xie 	struct ext4_sb_info *sbi = EXT4_SB(inode->i_sb);
2764cf0a5e81SMiao Xie 	static unsigned int mnt_count;
2765e3014d14SJan Kara 	size_t min_offs;
2766e3014d14SJan Kara 	size_t ifree, bfree;
27677b1b2c1bSTheodore Ts'o 	int total_ino;
27686e0cd088SJan Kara 	void *base, *end;
2769d0141191SJan Kara 	int error = 0, tried_min_extra_isize = 0;
2770cf0a5e81SMiao Xie 	int s_min_extra_isize = le16_to_cpu(sbi->s_es->s_min_extra_isize);
2771d0141191SJan Kara 	int isize_diff;	/* How much do we need to grow i_extra_isize */
2772c755e251STheodore Ts'o 
27736dd4ee7cSKalpak Shah retry:
2774d0141191SJan Kara 	isize_diff = new_extra_isize - EXT4_I(inode)->i_extra_isize;
27752e81a4eeSJan Kara 	if (EXT4_I(inode)->i_extra_isize >= new_extra_isize)
2776b640b2c5SMiao Xie 		return 0;
27776dd4ee7cSKalpak Shah 
27786dd4ee7cSKalpak Shah 	header = IHDR(inode, raw_inode);
27796dd4ee7cSKalpak Shah 
27806dd4ee7cSKalpak Shah 	/*
27816dd4ee7cSKalpak Shah 	 * Check if enough free space is available in the inode to shift the
27826dd4ee7cSKalpak Shah 	 * entries ahead by new_extra_isize.
27836dd4ee7cSKalpak Shah 	 */
27846dd4ee7cSKalpak Shah 
27856e0cd088SJan Kara 	base = IFIRST(header);
27866dd4ee7cSKalpak Shah 	end = (void *)raw_inode + EXT4_SB(inode->i_sb)->s_inode_size;
27876dd4ee7cSKalpak Shah 	min_offs = end - base;
2788a805622aSTheodore Ts'o 	total_ino = sizeof(struct ext4_xattr_ibody_header) + sizeof(u32);
27896dd4ee7cSKalpak Shah 
27909e92f48cSTheodore Ts'o 	error = xattr_check_inode(inode, header, end);
27919e92f48cSTheodore Ts'o 	if (error)
27929e92f48cSTheodore Ts'o 		goto cleanup;
27939e92f48cSTheodore Ts'o 
27946e0cd088SJan Kara 	ifree = ext4_xattr_free_space(base, &min_offs, base, &total_ino);
2795e3014d14SJan Kara 	if (ifree >= isize_diff)
2796e3014d14SJan Kara 		goto shift;
27976dd4ee7cSKalpak Shah 
27986dd4ee7cSKalpak Shah 	/*
27996dd4ee7cSKalpak Shah 	 * Enough free space isn't available in the inode, check if
28006dd4ee7cSKalpak Shah 	 * EA block can hold new_extra_isize bytes.
28016dd4ee7cSKalpak Shah 	 */
28026dd4ee7cSKalpak Shah 	if (EXT4_I(inode)->i_file_acl) {
280353692ec0SVasily Averin 		struct buffer_head *bh;
280453692ec0SVasily Averin 
2805fb265c9cSTheodore Ts'o 		bh = ext4_sb_bread(inode->i_sb, EXT4_I(inode)->i_file_acl, REQ_PRIO);
2806fb265c9cSTheodore Ts'o 		if (IS_ERR(bh)) {
2807fb265c9cSTheodore Ts'o 			error = PTR_ERR(bh);
28086dd4ee7cSKalpak Shah 			goto cleanup;
2809fb265c9cSTheodore Ts'o 		}
2810de05ca85STheodore Ts'o 		error = ext4_xattr_check_block(inode, bh);
281153692ec0SVasily Averin 		if (error) {
281253692ec0SVasily Averin 			brelse(bh);
28136dd4ee7cSKalpak Shah 			goto cleanup;
281453692ec0SVasily Averin 		}
28156dd4ee7cSKalpak Shah 		base = BHDR(bh);
28166dd4ee7cSKalpak Shah 		end = bh->b_data + bh->b_size;
28176dd4ee7cSKalpak Shah 		min_offs = end - base;
28186e0cd088SJan Kara 		bfree = ext4_xattr_free_space(BFIRST(bh), &min_offs, base,
28196e0cd088SJan Kara 					      NULL);
2820b640b2c5SMiao Xie 		brelse(bh);
2821e3014d14SJan Kara 		if (bfree + ifree < isize_diff) {
28226dd4ee7cSKalpak Shah 			if (!tried_min_extra_isize && s_min_extra_isize) {
28236dd4ee7cSKalpak Shah 				tried_min_extra_isize++;
28246dd4ee7cSKalpak Shah 				new_extra_isize = s_min_extra_isize;
28256dd4ee7cSKalpak Shah 				goto retry;
28266dd4ee7cSKalpak Shah 			}
2827dfa2064bSJan Kara 			error = -ENOSPC;
28286dd4ee7cSKalpak Shah 			goto cleanup;
28296dd4ee7cSKalpak Shah 		}
28306dd4ee7cSKalpak Shah 	} else {
2831e3014d14SJan Kara 		bfree = inode->i_sb->s_blocksize;
28326dd4ee7cSKalpak Shah 	}
28336dd4ee7cSKalpak Shah 
2834dfa2064bSJan Kara 	error = ext4_xattr_make_inode_space(handle, inode, raw_inode,
2835dfa2064bSJan Kara 					    isize_diff, ifree, bfree,
2836dfa2064bSJan Kara 					    &total_ino);
2837dfa2064bSJan Kara 	if (error) {
2838dfa2064bSJan Kara 		if (error == -ENOSPC && !tried_min_extra_isize &&
28396dd4ee7cSKalpak Shah 		    s_min_extra_isize) {
28406dd4ee7cSKalpak Shah 			tried_min_extra_isize++;
28416dd4ee7cSKalpak Shah 			new_extra_isize = s_min_extra_isize;
28426dd4ee7cSKalpak Shah 			goto retry;
28436dd4ee7cSKalpak Shah 		}
28446dd4ee7cSKalpak Shah 		goto cleanup;
28456dd4ee7cSKalpak Shah 	}
2846e3014d14SJan Kara shift:
2847e3014d14SJan Kara 	/* Adjust the offsets and shift the remaining entries ahead */
28486e0cd088SJan Kara 	ext4_xattr_shift_entries(IFIRST(header), EXT4_I(inode)->i_extra_isize
2849e3014d14SJan Kara 			- new_extra_isize, (void *)raw_inode +
2850e3014d14SJan Kara 			EXT4_GOOD_OLD_INODE_SIZE + new_extra_isize,
285194405713SJan Kara 			(void *)header, total_ino);
2852e3014d14SJan Kara 	EXT4_I(inode)->i_extra_isize = new_extra_isize;
28536dd4ee7cSKalpak Shah 
28546dd4ee7cSKalpak Shah cleanup:
2855b640b2c5SMiao Xie 	if (error && (mnt_count != le16_to_cpu(sbi->s_es->s_mnt_count))) {
2856cf0a5e81SMiao Xie 		ext4_warning(inode->i_sb, "Unable to expand inode %lu. Delete some EAs or run e2fsck.",
2857cf0a5e81SMiao Xie 			     inode->i_ino);
2858cf0a5e81SMiao Xie 		mnt_count = le16_to_cpu(sbi->s_es->s_mnt_count);
2859cf0a5e81SMiao Xie 	}
28606dd4ee7cSKalpak Shah 	return error;
28616dd4ee7cSKalpak Shah }
28626dd4ee7cSKalpak Shah 
2863e50e5129SAndreas Dilger #define EIA_INCR 16 /* must be 2^n */
2864e50e5129SAndreas Dilger #define EIA_MASK (EIA_INCR - 1)
2865dec214d0STahsin Erdogan 
2866dec214d0STahsin Erdogan /* Add the large xattr @inode into @ea_inode_array for deferred iput().
28670421a189STahsin Erdogan  * If @ea_inode_array is new or full it will be grown and the old
2868e50e5129SAndreas Dilger  * contents copied over.
2869e50e5129SAndreas Dilger  */
2870e50e5129SAndreas Dilger static int
28710421a189STahsin Erdogan ext4_expand_inode_array(struct ext4_xattr_inode_array **ea_inode_array,
28720421a189STahsin Erdogan 			struct inode *inode)
2873e50e5129SAndreas Dilger {
28740421a189STahsin Erdogan 	if (*ea_inode_array == NULL) {
2875e50e5129SAndreas Dilger 		/*
2876e50e5129SAndreas Dilger 		 * Start with 15 inodes, so it fits into a power-of-two size.
28770421a189STahsin Erdogan 		 * If *ea_inode_array is NULL, this is essentially offsetof()
2878e50e5129SAndreas Dilger 		 */
28790421a189STahsin Erdogan 		(*ea_inode_array) =
28800421a189STahsin Erdogan 			kmalloc(offsetof(struct ext4_xattr_inode_array,
28810421a189STahsin Erdogan 					 inodes[EIA_MASK]),
2882e50e5129SAndreas Dilger 				GFP_NOFS);
28830421a189STahsin Erdogan 		if (*ea_inode_array == NULL)
2884e50e5129SAndreas Dilger 			return -ENOMEM;
28850421a189STahsin Erdogan 		(*ea_inode_array)->count = 0;
28860421a189STahsin Erdogan 	} else if (((*ea_inode_array)->count & EIA_MASK) == EIA_MASK) {
2887e50e5129SAndreas Dilger 		/* expand the array once all 15 + n * 16 slots are full */
28880421a189STahsin Erdogan 		struct ext4_xattr_inode_array *new_array = NULL;
28890421a189STahsin Erdogan 		int count = (*ea_inode_array)->count;
2890e50e5129SAndreas Dilger 
2891e50e5129SAndreas Dilger 		/* if new_array is NULL, this is essentially offsetof() */
2892e50e5129SAndreas Dilger 		new_array = kmalloc(
28930421a189STahsin Erdogan 				offsetof(struct ext4_xattr_inode_array,
28940421a189STahsin Erdogan 					 inodes[count + EIA_INCR]),
2895e50e5129SAndreas Dilger 				GFP_NOFS);
2896e50e5129SAndreas Dilger 		if (new_array == NULL)
2897e50e5129SAndreas Dilger 			return -ENOMEM;
28980421a189STahsin Erdogan 		memcpy(new_array, *ea_inode_array,
28990421a189STahsin Erdogan 		       offsetof(struct ext4_xattr_inode_array, inodes[count]));
29000421a189STahsin Erdogan 		kfree(*ea_inode_array);
29010421a189STahsin Erdogan 		*ea_inode_array = new_array;
2902e50e5129SAndreas Dilger 	}
29030421a189STahsin Erdogan 	(*ea_inode_array)->inodes[(*ea_inode_array)->count++] = inode;
2904e50e5129SAndreas Dilger 	return 0;
2905e50e5129SAndreas Dilger }
2906e50e5129SAndreas Dilger 
29076dd4ee7cSKalpak Shah /*
2908617ba13bSMingming Cao  * ext4_xattr_delete_inode()
2909ac27a0ecSDave Kleikamp  *
2910e50e5129SAndreas Dilger  * Free extended attribute resources associated with this inode. Traverse
2911dec214d0STahsin Erdogan  * all entries and decrement reference on any xattr inodes associated with this
2912dec214d0STahsin Erdogan  * inode. This is called immediately before an inode is freed. We have exclusive
2913dec214d0STahsin Erdogan  * access to the inode. If an orphan inode is deleted it will also release its
2914dec214d0STahsin Erdogan  * references on xattr block and xattr inodes.
2915ac27a0ecSDave Kleikamp  */
2916dec214d0STahsin Erdogan int ext4_xattr_delete_inode(handle_t *handle, struct inode *inode,
291730a7eb97STahsin Erdogan 			    struct ext4_xattr_inode_array **ea_inode_array,
291830a7eb97STahsin Erdogan 			    int extra_credits)
2919ac27a0ecSDave Kleikamp {
2920ac27a0ecSDave Kleikamp 	struct buffer_head *bh = NULL;
2921e50e5129SAndreas Dilger 	struct ext4_xattr_ibody_header *header;
292230a7eb97STahsin Erdogan 	struct ext4_iloc iloc = { .bh = NULL };
2923dec214d0STahsin Erdogan 	struct ext4_xattr_entry *entry;
2924a6d05676STahsin Erdogan 	struct inode *ea_inode;
292530a7eb97STahsin Erdogan 	int error;
292630a7eb97STahsin Erdogan 
292783448bdfSJan Kara 	error = ext4_journal_ensure_credits(handle, extra_credits,
292883448bdfSJan Kara 			ext4_free_metadata_revoke_credits(inode->i_sb, 1));
2929a4130367SJan Kara 	if (error < 0) {
293030a7eb97STahsin Erdogan 		EXT4_ERROR_INODE(inode, "ensure credits (error %d)", error);
293130a7eb97STahsin Erdogan 		goto cleanup;
293230a7eb97STahsin Erdogan 	}
2933ac27a0ecSDave Kleikamp 
2934dec214d0STahsin Erdogan 	if (ext4_has_feature_ea_inode(inode->i_sb) &&
2935dec214d0STahsin Erdogan 	    ext4_test_inode_state(inode, EXT4_STATE_XATTR)) {
2936e50e5129SAndreas Dilger 
2937e50e5129SAndreas Dilger 		error = ext4_get_inode_loc(inode, &iloc);
2938dec214d0STahsin Erdogan 		if (error) {
2939dec214d0STahsin Erdogan 			EXT4_ERROR_INODE(inode, "inode loc (error %d)", error);
2940e50e5129SAndreas Dilger 			goto cleanup;
2941e50e5129SAndreas Dilger 		}
2942dec214d0STahsin Erdogan 
2943188c299eSJan Kara 		error = ext4_journal_get_write_access(handle, inode->i_sb,
2944188c299eSJan Kara 						iloc.bh, EXT4_JTR_NONE);
2945dec214d0STahsin Erdogan 		if (error) {
2946dec214d0STahsin Erdogan 			EXT4_ERROR_INODE(inode, "write access (error %d)",
2947dec214d0STahsin Erdogan 					 error);
2948dec214d0STahsin Erdogan 			goto cleanup;
2949dec214d0STahsin Erdogan 		}
2950dec214d0STahsin Erdogan 
2951dec214d0STahsin Erdogan 		header = IHDR(inode, ext4_raw_inode(&iloc));
2952dec214d0STahsin Erdogan 		if (header->h_magic == cpu_to_le32(EXT4_XATTR_MAGIC))
2953dec214d0STahsin Erdogan 			ext4_xattr_inode_dec_ref_all(handle, inode, iloc.bh,
2954dec214d0STahsin Erdogan 						     IFIRST(header),
2955dec214d0STahsin Erdogan 						     false /* block_csum */,
2956dec214d0STahsin Erdogan 						     ea_inode_array,
2957dec214d0STahsin Erdogan 						     extra_credits,
2958dec214d0STahsin Erdogan 						     false /* skip_quota */);
2959dec214d0STahsin Erdogan 	}
2960dec214d0STahsin Erdogan 
2961dec214d0STahsin Erdogan 	if (EXT4_I(inode)->i_file_acl) {
2962fb265c9cSTheodore Ts'o 		bh = ext4_sb_bread(inode->i_sb, EXT4_I(inode)->i_file_acl, REQ_PRIO);
2963fb265c9cSTheodore Ts'o 		if (IS_ERR(bh)) {
2964fb265c9cSTheodore Ts'o 			error = PTR_ERR(bh);
2965878520acSTheodore Ts'o 			if (error == -EIO) {
296654d3adbcSTheodore Ts'o 				EXT4_ERROR_INODE_ERR(inode, EIO,
296754d3adbcSTheodore Ts'o 						     "block %llu read error",
296824676da4STheodore Ts'o 						     EXT4_I(inode)->i_file_acl);
2969878520acSTheodore Ts'o 			}
29707159a986SDan Carpenter 			bh = NULL;
2971ac27a0ecSDave Kleikamp 			goto cleanup;
2972ac27a0ecSDave Kleikamp 		}
2973dec214d0STahsin Erdogan 		error = ext4_xattr_check_block(inode, bh);
2974de05ca85STheodore Ts'o 		if (error)
2975ac27a0ecSDave Kleikamp 			goto cleanup;
2976e50e5129SAndreas Dilger 
297730a7eb97STahsin Erdogan 		if (ext4_has_feature_ea_inode(inode->i_sb)) {
2978dec214d0STahsin Erdogan 			for (entry = BFIRST(bh); !IS_LAST_ENTRY(entry);
2979a6d05676STahsin Erdogan 			     entry = EXT4_XATTR_NEXT(entry)) {
2980a6d05676STahsin Erdogan 				if (!entry->e_value_inum)
2981a6d05676STahsin Erdogan 					continue;
2982a6d05676STahsin Erdogan 				error = ext4_xattr_inode_iget(inode,
2983a6d05676STahsin Erdogan 					      le32_to_cpu(entry->e_value_inum),
2984a6d05676STahsin Erdogan 					      le32_to_cpu(entry->e_hash),
2985a6d05676STahsin Erdogan 					      &ea_inode);
2986a6d05676STahsin Erdogan 				if (error)
2987a6d05676STahsin Erdogan 					continue;
2988a6d05676STahsin Erdogan 				ext4_xattr_inode_free_quota(inode, ea_inode,
2989dec214d0STahsin Erdogan 					      le32_to_cpu(entry->e_value_size));
2990a6d05676STahsin Erdogan 				iput(ea_inode);
2991a6d05676STahsin Erdogan 			}
2992dec214d0STahsin Erdogan 
2993e50e5129SAndreas Dilger 		}
2994e50e5129SAndreas Dilger 
2995dec214d0STahsin Erdogan 		ext4_xattr_release_block(handle, inode, bh, ea_inode_array,
2996dec214d0STahsin Erdogan 					 extra_credits);
2997dec214d0STahsin Erdogan 		/*
2998dec214d0STahsin Erdogan 		 * Update i_file_acl value in the same transaction that releases
2999dec214d0STahsin Erdogan 		 * block.
3000dec214d0STahsin Erdogan 		 */
3001617ba13bSMingming Cao 		EXT4_I(inode)->i_file_acl = 0;
300230a7eb97STahsin Erdogan 		error = ext4_mark_inode_dirty(handle, inode);
300330a7eb97STahsin Erdogan 		if (error) {
300430a7eb97STahsin Erdogan 			EXT4_ERROR_INODE(inode, "mark inode dirty (error %d)",
300530a7eb97STahsin Erdogan 					 error);
300630a7eb97STahsin Erdogan 			goto cleanup;
300730a7eb97STahsin Erdogan 		}
3008e85c81baSXin Yin 		ext4_fc_mark_ineligible(inode->i_sb, EXT4_FC_REASON_XATTR, handle);
3009dec214d0STahsin Erdogan 	}
3010dec214d0STahsin Erdogan 	error = 0;
3011ac27a0ecSDave Kleikamp cleanup:
301230a7eb97STahsin Erdogan 	brelse(iloc.bh);
3013ac27a0ecSDave Kleikamp 	brelse(bh);
3014e50e5129SAndreas Dilger 	return error;
3015e50e5129SAndreas Dilger }
3016e50e5129SAndreas Dilger 
30170421a189STahsin Erdogan void ext4_xattr_inode_array_free(struct ext4_xattr_inode_array *ea_inode_array)
3018e50e5129SAndreas Dilger {
3019dec214d0STahsin Erdogan 	int idx;
3020e50e5129SAndreas Dilger 
30210421a189STahsin Erdogan 	if (ea_inode_array == NULL)
3022e50e5129SAndreas Dilger 		return;
3023e50e5129SAndreas Dilger 
3024dec214d0STahsin Erdogan 	for (idx = 0; idx < ea_inode_array->count; ++idx)
3025dec214d0STahsin Erdogan 		iput(ea_inode_array->inodes[idx]);
30260421a189STahsin Erdogan 	kfree(ea_inode_array);
3027ac27a0ecSDave Kleikamp }
3028ac27a0ecSDave Kleikamp 
3029ac27a0ecSDave Kleikamp /*
303047387409STahsin Erdogan  * ext4_xattr_block_cache_insert()
3031ac27a0ecSDave Kleikamp  *
303247387409STahsin Erdogan  * Create a new entry in the extended attribute block cache, and insert
3033ac27a0ecSDave Kleikamp  * it unless such an entry is already in the cache.
3034ac27a0ecSDave Kleikamp  *
3035ac27a0ecSDave Kleikamp  * Returns 0, or a negative error number on failure.
3036ac27a0ecSDave Kleikamp  */
3037ac27a0ecSDave Kleikamp static void
303847387409STahsin Erdogan ext4_xattr_block_cache_insert(struct mb_cache *ea_block_cache,
303947387409STahsin Erdogan 			      struct buffer_head *bh)
3040ac27a0ecSDave Kleikamp {
30416048c64bSAndreas Gruenbacher 	struct ext4_xattr_header *header = BHDR(bh);
30426048c64bSAndreas Gruenbacher 	__u32 hash = le32_to_cpu(header->h_hash);
30436048c64bSAndreas Gruenbacher 	int reusable = le32_to_cpu(header->h_refcount) <
30446048c64bSAndreas Gruenbacher 		       EXT4_XATTR_REFCOUNT_MAX;
3045ac27a0ecSDave Kleikamp 	int error;
3046ac27a0ecSDave Kleikamp 
3047cdb7ee4cSTahsin Erdogan 	if (!ea_block_cache)
3048cdb7ee4cSTahsin Erdogan 		return;
304947387409STahsin Erdogan 	error = mb_cache_entry_create(ea_block_cache, GFP_NOFS, hash,
30506048c64bSAndreas Gruenbacher 				      bh->b_blocknr, reusable);
3051ac27a0ecSDave Kleikamp 	if (error) {
305282939d79SJan Kara 		if (error == -EBUSY)
3053ac27a0ecSDave Kleikamp 			ea_bdebug(bh, "already in cache");
305482939d79SJan Kara 	} else
3055ac27a0ecSDave Kleikamp 		ea_bdebug(bh, "inserting [%x]", (int)hash);
3056ac27a0ecSDave Kleikamp }
3057ac27a0ecSDave Kleikamp 
3058ac27a0ecSDave Kleikamp /*
3059617ba13bSMingming Cao  * ext4_xattr_cmp()
3060ac27a0ecSDave Kleikamp  *
3061ac27a0ecSDave Kleikamp  * Compare two extended attribute blocks for equality.
3062ac27a0ecSDave Kleikamp  *
3063ac27a0ecSDave Kleikamp  * Returns 0 if the blocks are equal, 1 if they differ, and
3064ac27a0ecSDave Kleikamp  * a negative error number on errors.
3065ac27a0ecSDave Kleikamp  */
3066ac27a0ecSDave Kleikamp static int
3067617ba13bSMingming Cao ext4_xattr_cmp(struct ext4_xattr_header *header1,
3068617ba13bSMingming Cao 	       struct ext4_xattr_header *header2)
3069ac27a0ecSDave Kleikamp {
3070617ba13bSMingming Cao 	struct ext4_xattr_entry *entry1, *entry2;
3071ac27a0ecSDave Kleikamp 
3072ac27a0ecSDave Kleikamp 	entry1 = ENTRY(header1+1);
3073ac27a0ecSDave Kleikamp 	entry2 = ENTRY(header2+1);
3074ac27a0ecSDave Kleikamp 	while (!IS_LAST_ENTRY(entry1)) {
3075ac27a0ecSDave Kleikamp 		if (IS_LAST_ENTRY(entry2))
3076ac27a0ecSDave Kleikamp 			return 1;
3077ac27a0ecSDave Kleikamp 		if (entry1->e_hash != entry2->e_hash ||
3078ac27a0ecSDave Kleikamp 		    entry1->e_name_index != entry2->e_name_index ||
3079ac27a0ecSDave Kleikamp 		    entry1->e_name_len != entry2->e_name_len ||
3080ac27a0ecSDave Kleikamp 		    entry1->e_value_size != entry2->e_value_size ||
3081e50e5129SAndreas Dilger 		    entry1->e_value_inum != entry2->e_value_inum ||
3082ac27a0ecSDave Kleikamp 		    memcmp(entry1->e_name, entry2->e_name, entry1->e_name_len))
3083ac27a0ecSDave Kleikamp 			return 1;
30847cec1918STahsin Erdogan 		if (!entry1->e_value_inum &&
30857cec1918STahsin Erdogan 		    memcmp((char *)header1 + le16_to_cpu(entry1->e_value_offs),
3086ac27a0ecSDave Kleikamp 			   (char *)header2 + le16_to_cpu(entry2->e_value_offs),
3087ac27a0ecSDave Kleikamp 			   le32_to_cpu(entry1->e_value_size)))
3088ac27a0ecSDave Kleikamp 			return 1;
3089ac27a0ecSDave Kleikamp 
3090617ba13bSMingming Cao 		entry1 = EXT4_XATTR_NEXT(entry1);
3091617ba13bSMingming Cao 		entry2 = EXT4_XATTR_NEXT(entry2);
3092ac27a0ecSDave Kleikamp 	}
3093ac27a0ecSDave Kleikamp 	if (!IS_LAST_ENTRY(entry2))
3094ac27a0ecSDave Kleikamp 		return 1;
3095ac27a0ecSDave Kleikamp 	return 0;
3096ac27a0ecSDave Kleikamp }
3097ac27a0ecSDave Kleikamp 
3098ac27a0ecSDave Kleikamp /*
309947387409STahsin Erdogan  * ext4_xattr_block_cache_find()
3100ac27a0ecSDave Kleikamp  *
3101ac27a0ecSDave Kleikamp  * Find an identical extended attribute block.
3102ac27a0ecSDave Kleikamp  *
3103ac27a0ecSDave Kleikamp  * Returns a pointer to the block found, or NULL if such a block was
3104ac27a0ecSDave Kleikamp  * not found or an error occurred.
3105ac27a0ecSDave Kleikamp  */
3106ac27a0ecSDave Kleikamp static struct buffer_head *
310747387409STahsin Erdogan ext4_xattr_block_cache_find(struct inode *inode,
310847387409STahsin Erdogan 			    struct ext4_xattr_header *header,
31097a2508e1SJan Kara 			    struct mb_cache_entry **pce)
3110ac27a0ecSDave Kleikamp {
3111ac27a0ecSDave Kleikamp 	__u32 hash = le32_to_cpu(header->h_hash);
31127a2508e1SJan Kara 	struct mb_cache_entry *ce;
311347387409STahsin Erdogan 	struct mb_cache *ea_block_cache = EA_BLOCK_CACHE(inode);
3114ac27a0ecSDave Kleikamp 
3115cdb7ee4cSTahsin Erdogan 	if (!ea_block_cache)
3116cdb7ee4cSTahsin Erdogan 		return NULL;
3117ac27a0ecSDave Kleikamp 	if (!header->h_hash)
3118ac27a0ecSDave Kleikamp 		return NULL;  /* never share */
3119ac27a0ecSDave Kleikamp 	ea_idebug(inode, "looking for cached blocks [%x]", (int)hash);
312047387409STahsin Erdogan 	ce = mb_cache_entry_find_first(ea_block_cache, hash);
3121ac27a0ecSDave Kleikamp 	while (ce) {
3122ac27a0ecSDave Kleikamp 		struct buffer_head *bh;
3123ac27a0ecSDave Kleikamp 
3124fb265c9cSTheodore Ts'o 		bh = ext4_sb_bread(inode->i_sb, ce->e_value, REQ_PRIO);
3125fb265c9cSTheodore Ts'o 		if (IS_ERR(bh)) {
3126fb265c9cSTheodore Ts'o 			if (PTR_ERR(bh) == -ENOMEM)
3127fb265c9cSTheodore Ts'o 				return NULL;
31287159a986SDan Carpenter 			bh = NULL;
312924676da4STheodore Ts'o 			EXT4_ERROR_INODE(inode, "block %lu read error",
3130c07dfcb4STahsin Erdogan 					 (unsigned long)ce->e_value);
3131617ba13bSMingming Cao 		} else if (ext4_xattr_cmp(header, BHDR(bh)) == 0) {
3132ac27a0ecSDave Kleikamp 			*pce = ce;
3133ac27a0ecSDave Kleikamp 			return bh;
3134ac27a0ecSDave Kleikamp 		}
3135ac27a0ecSDave Kleikamp 		brelse(bh);
313647387409STahsin Erdogan 		ce = mb_cache_entry_find_next(ea_block_cache, ce);
3137ac27a0ecSDave Kleikamp 	}
3138ac27a0ecSDave Kleikamp 	return NULL;
3139ac27a0ecSDave Kleikamp }
3140ac27a0ecSDave Kleikamp 
3141ac27a0ecSDave Kleikamp #define NAME_HASH_SHIFT 5
3142ac27a0ecSDave Kleikamp #define VALUE_HASH_SHIFT 16
3143ac27a0ecSDave Kleikamp 
3144ac27a0ecSDave Kleikamp /*
3145617ba13bSMingming Cao  * ext4_xattr_hash_entry()
3146ac27a0ecSDave Kleikamp  *
3147ac27a0ecSDave Kleikamp  * Compute the hash of an extended attribute.
3148ac27a0ecSDave Kleikamp  */
3149b9fc761eSTahsin Erdogan static __le32 ext4_xattr_hash_entry(char *name, size_t name_len, __le32 *value,
3150b9fc761eSTahsin Erdogan 				    size_t value_count)
3151ac27a0ecSDave Kleikamp {
3152ac27a0ecSDave Kleikamp 	__u32 hash = 0;
3153ac27a0ecSDave Kleikamp 
3154b9fc761eSTahsin Erdogan 	while (name_len--) {
3155ac27a0ecSDave Kleikamp 		hash = (hash << NAME_HASH_SHIFT) ^
3156ac27a0ecSDave Kleikamp 		       (hash >> (8*sizeof(hash) - NAME_HASH_SHIFT)) ^
3157ac27a0ecSDave Kleikamp 		       *name++;
3158ac27a0ecSDave Kleikamp 	}
3159b9fc761eSTahsin Erdogan 	while (value_count--) {
3160ac27a0ecSDave Kleikamp 		hash = (hash << VALUE_HASH_SHIFT) ^
3161ac27a0ecSDave Kleikamp 		       (hash >> (8*sizeof(hash) - VALUE_HASH_SHIFT)) ^
3162ac27a0ecSDave Kleikamp 		       le32_to_cpu(*value++);
3163ac27a0ecSDave Kleikamp 	}
3164b9fc761eSTahsin Erdogan 	return cpu_to_le32(hash);
3165ac27a0ecSDave Kleikamp }
3166ac27a0ecSDave Kleikamp 
3167f3bbac32SLinus Torvalds /*
3168f3bbac32SLinus Torvalds  * ext4_xattr_hash_entry_signed()
3169f3bbac32SLinus Torvalds  *
3170f3bbac32SLinus Torvalds  * Compute the hash of an extended attribute incorrectly.
3171f3bbac32SLinus Torvalds  */
3172f3bbac32SLinus Torvalds static __le32 ext4_xattr_hash_entry_signed(char *name, size_t name_len, __le32 *value, size_t value_count)
3173f3bbac32SLinus Torvalds {
3174f3bbac32SLinus Torvalds 	__u32 hash = 0;
3175f3bbac32SLinus Torvalds 
3176f3bbac32SLinus Torvalds 	while (name_len--) {
3177f3bbac32SLinus Torvalds 		hash = (hash << NAME_HASH_SHIFT) ^
3178f3bbac32SLinus Torvalds 		       (hash >> (8*sizeof(hash) - NAME_HASH_SHIFT)) ^
3179f3bbac32SLinus Torvalds 		       (signed char)*name++;
3180f3bbac32SLinus Torvalds 	}
3181f3bbac32SLinus Torvalds 	while (value_count--) {
3182f3bbac32SLinus Torvalds 		hash = (hash << VALUE_HASH_SHIFT) ^
3183f3bbac32SLinus Torvalds 		       (hash >> (8*sizeof(hash) - VALUE_HASH_SHIFT)) ^
3184f3bbac32SLinus Torvalds 		       le32_to_cpu(*value++);
3185f3bbac32SLinus Torvalds 	}
3186f3bbac32SLinus Torvalds 	return cpu_to_le32(hash);
3187f3bbac32SLinus Torvalds }
3188f3bbac32SLinus Torvalds 
3189ac27a0ecSDave Kleikamp #undef NAME_HASH_SHIFT
3190ac27a0ecSDave Kleikamp #undef VALUE_HASH_SHIFT
3191ac27a0ecSDave Kleikamp 
3192ac27a0ecSDave Kleikamp #define BLOCK_HASH_SHIFT 16
3193ac27a0ecSDave Kleikamp 
3194ac27a0ecSDave Kleikamp /*
3195617ba13bSMingming Cao  * ext4_xattr_rehash()
3196ac27a0ecSDave Kleikamp  *
3197ac27a0ecSDave Kleikamp  * Re-compute the extended attribute hash value after an entry has changed.
3198ac27a0ecSDave Kleikamp  */
3199daf83281STahsin Erdogan static void ext4_xattr_rehash(struct ext4_xattr_header *header)
3200ac27a0ecSDave Kleikamp {
3201617ba13bSMingming Cao 	struct ext4_xattr_entry *here;
3202ac27a0ecSDave Kleikamp 	__u32 hash = 0;
3203ac27a0ecSDave Kleikamp 
3204ac27a0ecSDave Kleikamp 	here = ENTRY(header+1);
3205ac27a0ecSDave Kleikamp 	while (!IS_LAST_ENTRY(here)) {
3206ac27a0ecSDave Kleikamp 		if (!here->e_hash) {
3207ac27a0ecSDave Kleikamp 			/* Block is not shared if an entry's hash value == 0 */
3208ac27a0ecSDave Kleikamp 			hash = 0;
3209ac27a0ecSDave Kleikamp 			break;
3210ac27a0ecSDave Kleikamp 		}
3211ac27a0ecSDave Kleikamp 		hash = (hash << BLOCK_HASH_SHIFT) ^
3212ac27a0ecSDave Kleikamp 		       (hash >> (8*sizeof(hash) - BLOCK_HASH_SHIFT)) ^
3213ac27a0ecSDave Kleikamp 		       le32_to_cpu(here->e_hash);
3214617ba13bSMingming Cao 		here = EXT4_XATTR_NEXT(here);
3215ac27a0ecSDave Kleikamp 	}
3216ac27a0ecSDave Kleikamp 	header->h_hash = cpu_to_le32(hash);
3217ac27a0ecSDave Kleikamp }
3218ac27a0ecSDave Kleikamp 
3219ac27a0ecSDave Kleikamp #undef BLOCK_HASH_SHIFT
3220ac27a0ecSDave Kleikamp 
32219c191f70ST Makphaibulchoke #define	HASH_BUCKET_BITS	10
32229c191f70ST Makphaibulchoke 
32237a2508e1SJan Kara struct mb_cache *
322482939d79SJan Kara ext4_xattr_create_cache(void)
3225ac27a0ecSDave Kleikamp {
32267a2508e1SJan Kara 	return mb_cache_create(HASH_BUCKET_BITS);
3227ac27a0ecSDave Kleikamp }
3228ac27a0ecSDave Kleikamp 
/*
 * ext4_xattr_destroy_cache()
 *
 * Destroy @cache with mb_cache_destroy().  A NULL @cache is ignored.
 */
void ext4_xattr_destroy_cache(struct mb_cache *cache)
{
	if (!cache)
		return;

	mb_cache_destroy(cache);
}
32349c191f70ST Makphaibulchoke 
3235