1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0
21da177e4SLinus Torvalds /*
31da177e4SLinus Torvalds * linux/fs/ext2/inode.c
41da177e4SLinus Torvalds *
51da177e4SLinus Torvalds * Copyright (C) 1992, 1993, 1994, 1995
61da177e4SLinus Torvalds * Remy Card (card@masi.ibp.fr)
71da177e4SLinus Torvalds * Laboratoire MASI - Institut Blaise Pascal
81da177e4SLinus Torvalds * Universite Pierre et Marie Curie (Paris VI)
91da177e4SLinus Torvalds *
101da177e4SLinus Torvalds * from
111da177e4SLinus Torvalds *
121da177e4SLinus Torvalds * linux/fs/minix/inode.c
131da177e4SLinus Torvalds *
141da177e4SLinus Torvalds * Copyright (C) 1991, 1992 Linus Torvalds
151da177e4SLinus Torvalds *
161da177e4SLinus Torvalds * Goal-directed block allocation by Stephen Tweedie
171da177e4SLinus Torvalds * (sct@dcs.ed.ac.uk), 1993, 1998
181da177e4SLinus Torvalds * Big-endian to little-endian byte-swapping/bitmaps by
191da177e4SLinus Torvalds * David S. Miller (davem@caip.rutgers.edu), 1995
201da177e4SLinus Torvalds * 64-bit file support on 64-bit platforms by Jakub Jelinek
211da177e4SLinus Torvalds * (jj@sunsite.ms.mff.cuni.cz)
221da177e4SLinus Torvalds *
231da177e4SLinus Torvalds * Assorted race fixes, rewrite of ext2_get_block() by Al Viro, 2000
241da177e4SLinus Torvalds */
251da177e4SLinus Torvalds
261da177e4SLinus Torvalds #include <linux/time.h>
271da177e4SLinus Torvalds #include <linux/highuid.h>
281da177e4SLinus Torvalds #include <linux/pagemap.h>
29c94c2acfSMatthew Wilcox #include <linux/dax.h>
303dc29161SMatthew Wilcox #include <linux/blkdev.h>
311da177e4SLinus Torvalds #include <linux/quotaops.h>
321da177e4SLinus Torvalds #include <linux/writeback.h>
331da177e4SLinus Torvalds #include <linux/buffer_head.h>
341da177e4SLinus Torvalds #include <linux/mpage.h>
3568c9d702SJosef Bacik #include <linux/fiemap.h>
3625f4e702SChristoph Hellwig #include <linux/iomap.h>
378d6d0c4dSDuane Griffin #include <linux/namei.h>
38e2e40f2cSChristoph Hellwig #include <linux/uio.h>
391da177e4SLinus Torvalds #include "ext2.h"
401da177e4SLinus Torvalds #include "acl.h"
41c288d296SJan Kara #include "xattr.h"
421da177e4SLinus Torvalds
43a9185b41SChristoph Hellwig static int __ext2_write_inode(struct inode *inode, int do_sync);
44a9185b41SChristoph Hellwig
451da177e4SLinus Torvalds /*
461da177e4SLinus Torvalds * Test whether an inode is a fast symlink.
471da177e4SLinus Torvalds */
ext2_inode_is_fast_symlink(struct inode * inode)481da177e4SLinus Torvalds static inline int ext2_inode_is_fast_symlink(struct inode *inode)
491da177e4SLinus Torvalds {
501da177e4SLinus Torvalds int ea_blocks = EXT2_I(inode)->i_file_acl ?
511da177e4SLinus Torvalds (inode->i_sb->s_blocksize >> 9) : 0;
521da177e4SLinus Torvalds
531da177e4SLinus Torvalds return (S_ISLNK(inode->i_mode) &&
541da177e4SLinus Torvalds inode->i_blocks - ea_blocks == 0);
551da177e4SLinus Torvalds }
561da177e4SLinus Torvalds
57737f2e93Snpiggin@suse.de static void ext2_truncate_blocks(struct inode *inode, loff_t offset);
58737f2e93Snpiggin@suse.de
/*
 * ext2_write_failed - trim an inode back to i_size
 * @mapping: address space whose host inode is trimmed
 * @to: end offset compared against the inode size
 *
 * If @to lies beyond the current i_size, both the page cache and the
 * on-disk blocks past i_size are truncated away.  Otherwise nothing is done.
 */
void ext2_write_failed(struct address_space *mapping, loff_t to)
{
	struct inode *inode = mapping->host;

	if (to <= inode->i_size)
		return;

	truncate_pagecache(inode, inode->i_size);
	ext2_truncate_blocks(inode, inode->i_size);
}
68737f2e93Snpiggin@suse.de
691da177e4SLinus Torvalds /*
701da177e4SLinus Torvalds * Called at the last iput() if i_nlink is zero.
711da177e4SLinus Torvalds */
ext2_evict_inode(struct inode * inode)7272edc4d0SAl Viro void ext2_evict_inode(struct inode * inode)
731da177e4SLinus Torvalds {
7472edc4d0SAl Viro struct ext2_block_alloc_info *rsv;
7572edc4d0SAl Viro int want_delete = 0;
7672edc4d0SAl Viro
7772edc4d0SAl Viro if (!inode->i_nlink && !is_bad_inode(inode)) {
7872edc4d0SAl Viro want_delete = 1;
79871a2931SChristoph Hellwig dquot_initialize(inode);
8072edc4d0SAl Viro } else {
8172edc4d0SAl Viro dquot_drop(inode);
8272edc4d0SAl Viro }
8372edc4d0SAl Viro
8491b0abe3SJohannes Weiner truncate_inode_pages_final(&inode->i_data);
85fef26658SMark Fasheh
8672edc4d0SAl Viro if (want_delete) {
871e8b212fSJan Kara sb_start_intwrite(inode->i_sb);
8872edc4d0SAl Viro /* set dtime */
89fe2c3254SArnd Bergmann EXT2_I(inode)->i_dtime = ktime_get_real_seconds();
901da177e4SLinus Torvalds mark_inode_dirty(inode);
91a9185b41SChristoph Hellwig __ext2_write_inode(inode, inode_needs_sync(inode));
9272edc4d0SAl Viro /* truncate to 0 */
931da177e4SLinus Torvalds inode->i_size = 0;
941da177e4SLinus Torvalds if (inode->i_blocks)
95737f2e93Snpiggin@suse.de ext2_truncate_blocks(inode, 0);
96c288d296SJan Kara ext2_xattr_delete_inode(inode);
9772edc4d0SAl Viro }
981da177e4SLinus Torvalds
9972edc4d0SAl Viro invalidate_inode_buffers(inode);
100dbd5768fSJan Kara clear_inode(inode);
10172edc4d0SAl Viro
10272edc4d0SAl Viro ext2_discard_reservation(inode);
10372edc4d0SAl Viro rsv = EXT2_I(inode)->i_block_alloc_info;
10472edc4d0SAl Viro EXT2_I(inode)->i_block_alloc_info = NULL;
10572edc4d0SAl Viro if (unlikely(rsv))
10672edc4d0SAl Viro kfree(rsv);
10772edc4d0SAl Viro
1081e8b212fSJan Kara if (want_delete) {
10972edc4d0SAl Viro ext2_free_inode(inode);
1101e8b212fSJan Kara sb_end_intwrite(inode->i_sb);
1111e8b212fSJan Kara }
1121da177e4SLinus Torvalds }
1131da177e4SLinus Torvalds
1141da177e4SLinus Torvalds typedef struct {
1151da177e4SLinus Torvalds __le32 *p;
1161da177e4SLinus Torvalds __le32 key;
1171da177e4SLinus Torvalds struct buffer_head *bh;
1181da177e4SLinus Torvalds } Indirect;
1191da177e4SLinus Torvalds
/*
 * Fill in one chain link: remember where the block number lives (@v),
 * snapshot the value currently stored there, and record the hosting buffer.
 */
static inline void add_chain(Indirect *p, struct buffer_head *bh, __le32 *v)
{
	p->p = v;
	p->key = *v;
	p->bh = bh;
}
1251da177e4SLinus Torvalds
/*
 * Check that every link in [@from, @to] still holds the value that was
 * snapshotted in ->key.  Returns 1 if the whole range is unchanged (or the
 * range is empty), 0 as soon as a mismatch is found.
 */
static inline int verify_chain(Indirect *from, Indirect *to)
{
	Indirect *link;

	for (link = from; link <= to; link++) {
		if (link->key != *link->p)
			return 0;
	}
	return 1;
}
1321da177e4SLinus Torvalds
1331da177e4SLinus Torvalds /**
1341da177e4SLinus Torvalds * ext2_block_to_path - parse the block number into array of offsets
1351da177e4SLinus Torvalds * @inode: inode in question (we are only interested in its superblock)
1361da177e4SLinus Torvalds * @i_block: block number to be parsed
1371da177e4SLinus Torvalds * @offsets: array to store the offsets in
1381da177e4SLinus Torvalds * @boundary: set this non-zero if the referred-to block is likely to be
1391da177e4SLinus Torvalds * followed (on disk) by an indirect block.
1401da177e4SLinus Torvalds * To store the locations of file's data ext2 uses a data structure common
1411da177e4SLinus Torvalds * for UNIX filesystems - tree of pointers anchored in the inode, with
1421da177e4SLinus Torvalds * data blocks at leaves and indirect blocks in intermediate nodes.
1431da177e4SLinus Torvalds * This function translates the block number into path in that tree -
1441da177e4SLinus Torvalds * return value is the path length and @offsets[n] is the offset of
1451da177e4SLinus Torvalds * pointer to (n+1)th node in the nth one. If @block is out of range
1461da177e4SLinus Torvalds * (negative or too large) warning is printed and zero returned.
1471da177e4SLinus Torvalds *
1481da177e4SLinus Torvalds * Note: function doesn't find node addresses, so no IO is needed. All
1491da177e4SLinus Torvalds * we need to know is the capacity of indirect blocks (taken from the
1501da177e4SLinus Torvalds * inode->i_sb).
1511da177e4SLinus Torvalds */
1521da177e4SLinus Torvalds
1531da177e4SLinus Torvalds /*
1541da177e4SLinus Torvalds * Portability note: the last comparison (check that we fit into triple
1551da177e4SLinus Torvalds * indirect block) is spelled differently, because otherwise on an
1561da177e4SLinus Torvalds * architecture with 32-bit longs and 8Kb pages we might get into trouble
1571da177e4SLinus Torvalds * if our filesystem had 8Kb blocks. We might use long long, but that would
1581da177e4SLinus Torvalds * kill us on x86. Oh, well, at least the sign propagation does not matter -
1591da177e4SLinus Torvalds * i_block would have to be negative in the very beginning, so we would not
1601da177e4SLinus Torvalds * get there at all.
1611da177e4SLinus Torvalds */
1621da177e4SLinus Torvalds
ext2_block_to_path(struct inode * inode,long i_block,int offsets[4],int * boundary)1631da177e4SLinus Torvalds static int ext2_block_to_path(struct inode *inode,
1641da177e4SLinus Torvalds long i_block, int offsets[4], int *boundary)
1651da177e4SLinus Torvalds {
1661da177e4SLinus Torvalds int ptrs = EXT2_ADDR_PER_BLOCK(inode->i_sb);
1671da177e4SLinus Torvalds int ptrs_bits = EXT2_ADDR_PER_BLOCK_BITS(inode->i_sb);
1681da177e4SLinus Torvalds const long direct_blocks = EXT2_NDIR_BLOCKS,
1691da177e4SLinus Torvalds indirect_blocks = ptrs,
1701da177e4SLinus Torvalds double_blocks = (1 << (ptrs_bits * 2));
1711da177e4SLinus Torvalds int n = 0;
1721da177e4SLinus Torvalds int final = 0;
1731da177e4SLinus Torvalds
1741da177e4SLinus Torvalds if (i_block < 0) {
1752314b07cSAlexey Fisher ext2_msg(inode->i_sb, KERN_WARNING,
1762314b07cSAlexey Fisher "warning: %s: block < 0", __func__);
1771da177e4SLinus Torvalds } else if (i_block < direct_blocks) {
1781da177e4SLinus Torvalds offsets[n++] = i_block;
1791da177e4SLinus Torvalds final = direct_blocks;
1801da177e4SLinus Torvalds } else if ( (i_block -= direct_blocks) < indirect_blocks) {
1811da177e4SLinus Torvalds offsets[n++] = EXT2_IND_BLOCK;
1821da177e4SLinus Torvalds offsets[n++] = i_block;
1831da177e4SLinus Torvalds final = ptrs;
1841da177e4SLinus Torvalds } else if ((i_block -= indirect_blocks) < double_blocks) {
1851da177e4SLinus Torvalds offsets[n++] = EXT2_DIND_BLOCK;
1861da177e4SLinus Torvalds offsets[n++] = i_block >> ptrs_bits;
1871da177e4SLinus Torvalds offsets[n++] = i_block & (ptrs - 1);
1881da177e4SLinus Torvalds final = ptrs;
1891da177e4SLinus Torvalds } else if (((i_block -= double_blocks) >> (ptrs_bits * 2)) < ptrs) {
1901da177e4SLinus Torvalds offsets[n++] = EXT2_TIND_BLOCK;
1911da177e4SLinus Torvalds offsets[n++] = i_block >> (ptrs_bits * 2);
1921da177e4SLinus Torvalds offsets[n++] = (i_block >> ptrs_bits) & (ptrs - 1);
1931da177e4SLinus Torvalds offsets[n++] = i_block & (ptrs - 1);
1941da177e4SLinus Torvalds final = ptrs;
1951da177e4SLinus Torvalds } else {
1962314b07cSAlexey Fisher ext2_msg(inode->i_sb, KERN_WARNING,
1972314b07cSAlexey Fisher "warning: %s: block is too big", __func__);
1981da177e4SLinus Torvalds }
1991da177e4SLinus Torvalds if (boundary)
200a686cd89SMartin J. Bligh *boundary = final - 1 - (i_block & (ptrs - 1));
201a686cd89SMartin J. Bligh
2021da177e4SLinus Torvalds return n;
2031da177e4SLinus Torvalds }
2041da177e4SLinus Torvalds
2051da177e4SLinus Torvalds /**
2061da177e4SLinus Torvalds * ext2_get_branch - read the chain of indirect blocks leading to data
2071da177e4SLinus Torvalds * @inode: inode in question
2081da177e4SLinus Torvalds * @depth: depth of the chain (1 - direct pointer, etc.)
2091da177e4SLinus Torvalds * @offsets: offsets of pointers in inode/indirect blocks
2101da177e4SLinus Torvalds * @chain: place to store the result
2111da177e4SLinus Torvalds * @err: here we store the error value
2121da177e4SLinus Torvalds *
2131da177e4SLinus Torvalds * Function fills the array of triples <key, p, bh> and returns %NULL
2141da177e4SLinus Torvalds * if everything went OK or the pointer to the last filled triple
2151da177e4SLinus Torvalds * (incomplete one) otherwise. Upon the return chain[i].key contains
2161da177e4SLinus Torvalds * the number of (i+1)-th block in the chain (as it is stored in memory,
2171da177e4SLinus Torvalds * i.e. little-endian 32-bit), chain[i].p contains the address of that
2181da177e4SLinus Torvalds * number (it points into struct inode for i==0 and into the bh->b_data
2191da177e4SLinus Torvalds * for i>0) and chain[i].bh points to the buffer_head of i-th indirect
2201da177e4SLinus Torvalds * block for i>0 and NULL for i==0. In other words, it holds the block
2211da177e4SLinus Torvalds * numbers of the chain, addresses they were taken from (and where we can
2221da177e4SLinus Torvalds * verify that chain did not change) and buffer_heads hosting these
2231da177e4SLinus Torvalds * numbers.
2241da177e4SLinus Torvalds *
2251da177e4SLinus Torvalds * Function stops when it stumbles upon zero pointer (absent block)
2261da177e4SLinus Torvalds * (pointer to last triple returned, *@err == 0)
2271da177e4SLinus Torvalds * or when it gets an IO error reading an indirect block
2281da177e4SLinus Torvalds * (ditto, *@err == -EIO)
2291da177e4SLinus Torvalds * or when it notices that chain had been changed while it was reading
2301da177e4SLinus Torvalds * (ditto, *@err == -EAGAIN)
2311da177e4SLinus Torvalds * or when it reads all @depth-1 indirect blocks successfully and finds
2321da177e4SLinus Torvalds * the whole chain, all way to the data (returns %NULL, *err == 0).
2331da177e4SLinus Torvalds */
ext2_get_branch(struct inode * inode,int depth,int * offsets,Indirect chain[4],int * err)2341da177e4SLinus Torvalds static Indirect *ext2_get_branch(struct inode *inode,
2351da177e4SLinus Torvalds int depth,
2361da177e4SLinus Torvalds int *offsets,
2371da177e4SLinus Torvalds Indirect chain[4],
2381da177e4SLinus Torvalds int *err)
2391da177e4SLinus Torvalds {
2401da177e4SLinus Torvalds struct super_block *sb = inode->i_sb;
2411da177e4SLinus Torvalds Indirect *p = chain;
2421da177e4SLinus Torvalds struct buffer_head *bh;
2431da177e4SLinus Torvalds
2441da177e4SLinus Torvalds *err = 0;
2451da177e4SLinus Torvalds /* i_data is not going away, no lock needed */
2461da177e4SLinus Torvalds add_chain (chain, NULL, EXT2_I(inode)->i_data + *offsets);
2471da177e4SLinus Torvalds if (!p->key)
2481da177e4SLinus Torvalds goto no_block;
2491da177e4SLinus Torvalds while (--depth) {
2501da177e4SLinus Torvalds bh = sb_bread(sb, le32_to_cpu(p->key));
2511da177e4SLinus Torvalds if (!bh)
2521da177e4SLinus Torvalds goto failure;
2531da177e4SLinus Torvalds read_lock(&EXT2_I(inode)->i_meta_lock);
2541da177e4SLinus Torvalds if (!verify_chain(chain, p))
2551da177e4SLinus Torvalds goto changed;
2561da177e4SLinus Torvalds add_chain(++p, bh, (__le32*)bh->b_data + *++offsets);
2571da177e4SLinus Torvalds read_unlock(&EXT2_I(inode)->i_meta_lock);
2581da177e4SLinus Torvalds if (!p->key)
2591da177e4SLinus Torvalds goto no_block;
2601da177e4SLinus Torvalds }
2611da177e4SLinus Torvalds return NULL;
2621da177e4SLinus Torvalds
2631da177e4SLinus Torvalds changed:
2641da177e4SLinus Torvalds read_unlock(&EXT2_I(inode)->i_meta_lock);
2651da177e4SLinus Torvalds brelse(bh);
2661da177e4SLinus Torvalds *err = -EAGAIN;
2671da177e4SLinus Torvalds goto no_block;
2681da177e4SLinus Torvalds failure:
2691da177e4SLinus Torvalds *err = -EIO;
2701da177e4SLinus Torvalds no_block:
2711da177e4SLinus Torvalds return p;
2721da177e4SLinus Torvalds }
2731da177e4SLinus Torvalds
2741da177e4SLinus Torvalds /**
2751da177e4SLinus Torvalds * ext2_find_near - find a place for allocation with sufficient locality
2761da177e4SLinus Torvalds * @inode: owner
2771da177e4SLinus Torvalds * @ind: descriptor of indirect block.
2781da177e4SLinus Torvalds *
2791cc8dcf5SBenoit Boissinot * This function returns the preferred place for block allocation.
2801da177e4SLinus Torvalds * It is used when heuristic for sequential allocation fails.
2811da177e4SLinus Torvalds * Rules are:
2821da177e4SLinus Torvalds * + if there is a block to the left of our position - allocate near it.
2831da177e4SLinus Torvalds * + if pointer will live in indirect block - allocate near that block.
2841da177e4SLinus Torvalds * + if pointer will live in inode - allocate in the same cylinder group.
2851da177e4SLinus Torvalds *
2861da177e4SLinus Torvalds * In the latter case we colour the starting block by the callers PID to
2871da177e4SLinus Torvalds * prevent it from clashing with concurrent allocations for a different inode
2881da177e4SLinus Torvalds * in the same block group. The PID is used here so that functionally related
2891da177e4SLinus Torvalds * files will be close-by on-disk.
2901da177e4SLinus Torvalds *
2911da177e4SLinus Torvalds * Caller must make sure that @ind is valid and will stay that way.
2921da177e4SLinus Torvalds */
2931da177e4SLinus Torvalds
ext2_find_near(struct inode * inode,Indirect * ind)2944c8b3125SAkinobu Mita static ext2_fsblk_t ext2_find_near(struct inode *inode, Indirect *ind)
2951da177e4SLinus Torvalds {
2961da177e4SLinus Torvalds struct ext2_inode_info *ei = EXT2_I(inode);
2971da177e4SLinus Torvalds __le32 *start = ind->bh ? (__le32 *) ind->bh->b_data : ei->i_data;
2981da177e4SLinus Torvalds __le32 *p;
2994c8b3125SAkinobu Mita ext2_fsblk_t bg_start;
3004c8b3125SAkinobu Mita ext2_fsblk_t colour;
3011da177e4SLinus Torvalds
3021da177e4SLinus Torvalds /* Try to find previous block */
3031da177e4SLinus Torvalds for (p = ind->p - 1; p >= start; p--)
3041da177e4SLinus Torvalds if (*p)
3051da177e4SLinus Torvalds return le32_to_cpu(*p);
3061da177e4SLinus Torvalds
3071da177e4SLinus Torvalds /* No such thing, so let's try location of indirect block */
3081da177e4SLinus Torvalds if (ind->bh)
3091da177e4SLinus Torvalds return ind->bh->b_blocknr;
3101da177e4SLinus Torvalds
3111da177e4SLinus Torvalds /*
31225985edcSLucas De Marchi * It is going to be referred from inode itself? OK, just put it into
3131da177e4SLinus Torvalds * the same cylinder group then.
3141da177e4SLinus Torvalds */
31524097d12SAkinobu Mita bg_start = ext2_group_first_block_no(inode->i_sb, ei->i_block_group);
3161da177e4SLinus Torvalds colour = (current->pid % 16) *
3171da177e4SLinus Torvalds (EXT2_BLOCKS_PER_GROUP(inode->i_sb) / 16);
3181da177e4SLinus Torvalds return bg_start + colour;
3191da177e4SLinus Torvalds }
3201da177e4SLinus Torvalds
3211da177e4SLinus Torvalds /**
3221cc8dcf5SBenoit Boissinot * ext2_find_goal - find a preferred place for allocation.
3231da177e4SLinus Torvalds * @inode: owner
3241da177e4SLinus Torvalds * @block: block we want
3251da177e4SLinus Torvalds * @partial: pointer to the last triple within a chain
3261da177e4SLinus Torvalds *
327a686cd89SMartin J. Bligh * Returns preferred place for a block (the goal).
3281da177e4SLinus Torvalds */
3291da177e4SLinus Torvalds
ext2_find_goal(struct inode * inode,long block,Indirect * partial)3304c8b3125SAkinobu Mita static inline ext2_fsblk_t ext2_find_goal(struct inode *inode, long block,
331a686cd89SMartin J. Bligh Indirect *partial)
3321da177e4SLinus Torvalds {
333a686cd89SMartin J. Bligh struct ext2_block_alloc_info *block_i;
334a686cd89SMartin J. Bligh
335a686cd89SMartin J. Bligh block_i = EXT2_I(inode)->i_block_alloc_info;
336a686cd89SMartin J. Bligh
3371da177e4SLinus Torvalds /*
3381da177e4SLinus Torvalds * try the heuristic for sequential allocation,
3391da177e4SLinus Torvalds * failing that at least try to get decent locality.
3401da177e4SLinus Torvalds */
341a686cd89SMartin J. Bligh if (block_i && (block == block_i->last_alloc_logical_block + 1)
342a686cd89SMartin J. Bligh && (block_i->last_alloc_physical_block != 0)) {
343a686cd89SMartin J. Bligh return block_i->last_alloc_physical_block + 1;
3441da177e4SLinus Torvalds }
345a686cd89SMartin J. Bligh
346a686cd89SMartin J. Bligh return ext2_find_near(inode, partial);
347a686cd89SMartin J. Bligh }
348a686cd89SMartin J. Bligh
349a686cd89SMartin J. Bligh /**
350a686cd89SMartin J. Bligh * ext2_blks_to_allocate: Look up the block map and count the number
351a686cd89SMartin J. Bligh * of direct blocks need to be allocated for the given branch.
352a686cd89SMartin J. Bligh *
353a686cd89SMartin J. Bligh * @branch: chain of indirect blocks
354a686cd89SMartin J. Bligh * @k: number of blocks need for indirect blocks
355a686cd89SMartin J. Bligh * @blks: number of data blocks to be mapped.
356a686cd89SMartin J. Bligh * @blocks_to_boundary: the offset in the indirect block
357a686cd89SMartin J. Bligh *
358cf1013f4SChengguang Xu * return the number of direct blocks to allocate.
359a686cd89SMartin J. Bligh */
360a686cd89SMartin J. Bligh static int
ext2_blks_to_allocate(Indirect * branch,int k,unsigned long blks,int blocks_to_boundary)361a686cd89SMartin J. Bligh ext2_blks_to_allocate(Indirect * branch, int k, unsigned long blks,
362a686cd89SMartin J. Bligh int blocks_to_boundary)
363a686cd89SMartin J. Bligh {
364a686cd89SMartin J. Bligh unsigned long count = 0;
365a686cd89SMartin J. Bligh
366a686cd89SMartin J. Bligh /*
367a686cd89SMartin J. Bligh * Simple case, [t,d]Indirect block(s) has not allocated yet
368a686cd89SMartin J. Bligh * then it's clear blocks on that path have not allocated
369a686cd89SMartin J. Bligh */
370a686cd89SMartin J. Bligh if (k > 0) {
371a686cd89SMartin J. Bligh /* right now don't hanel cross boundary allocation */
372a686cd89SMartin J. Bligh if (blks < blocks_to_boundary + 1)
373a686cd89SMartin J. Bligh count += blks;
374a686cd89SMartin J. Bligh else
375a686cd89SMartin J. Bligh count += blocks_to_boundary + 1;
376a686cd89SMartin J. Bligh return count;
377a686cd89SMartin J. Bligh }
378a686cd89SMartin J. Bligh
379a686cd89SMartin J. Bligh count++;
380a686cd89SMartin J. Bligh while (count < blks && count <= blocks_to_boundary
381a686cd89SMartin J. Bligh && le32_to_cpu(*(branch[0].p + count)) == 0) {
382a686cd89SMartin J. Bligh count++;
383a686cd89SMartin J. Bligh }
384a686cd89SMartin J. Bligh return count;
385a686cd89SMartin J. Bligh }
386a686cd89SMartin J. Bligh
387a686cd89SMartin J. Bligh /**
388*df1ae36aSMatthew Wilcox (Oracle) * ext2_alloc_blocks: Allocate multiple blocks needed for a branch.
389*df1ae36aSMatthew Wilcox (Oracle) * @inode: Owner.
390*df1ae36aSMatthew Wilcox (Oracle) * @goal: Preferred place for allocation.
391*df1ae36aSMatthew Wilcox (Oracle) * @indirect_blks: The number of blocks needed to allocate for indirect blocks.
392*df1ae36aSMatthew Wilcox (Oracle) * @blks: The number of blocks need to allocate for direct blocks.
393*df1ae36aSMatthew Wilcox (Oracle) * @new_blocks: On return it will store the new block numbers for
394*df1ae36aSMatthew Wilcox (Oracle) * the indirect blocks(if needed) and the first direct block.
395*df1ae36aSMatthew Wilcox (Oracle) * @err: Error pointer.
396*df1ae36aSMatthew Wilcox (Oracle) *
397*df1ae36aSMatthew Wilcox (Oracle) * Return: Number of blocks allocated.
398a686cd89SMartin J. Bligh */
ext2_alloc_blocks(struct inode * inode,ext2_fsblk_t goal,int indirect_blks,int blks,ext2_fsblk_t new_blocks[4],int * err)399a686cd89SMartin J. Bligh static int ext2_alloc_blocks(struct inode *inode,
400a686cd89SMartin J. Bligh ext2_fsblk_t goal, int indirect_blks, int blks,
401a686cd89SMartin J. Bligh ext2_fsblk_t new_blocks[4], int *err)
402a686cd89SMartin J. Bligh {
403a686cd89SMartin J. Bligh int target, i;
404a686cd89SMartin J. Bligh unsigned long count = 0;
405a686cd89SMartin J. Bligh int index = 0;
406a686cd89SMartin J. Bligh ext2_fsblk_t current_block = 0;
407a686cd89SMartin J. Bligh int ret = 0;
408a686cd89SMartin J. Bligh
409a686cd89SMartin J. Bligh /*
410a686cd89SMartin J. Bligh * Here we try to allocate the requested multiple blocks at once,
411a686cd89SMartin J. Bligh * on a best-effort basis.
412a686cd89SMartin J. Bligh * To build a branch, we should allocate blocks for
413a686cd89SMartin J. Bligh * the indirect blocks(if not allocated yet), and at least
414a686cd89SMartin J. Bligh * the first direct block of this branch. That's the
415a686cd89SMartin J. Bligh * minimum number of blocks need to allocate(required)
416a686cd89SMartin J. Bligh */
417a686cd89SMartin J. Bligh target = blks + indirect_blks;
418a686cd89SMartin J. Bligh
419a686cd89SMartin J. Bligh while (1) {
420a686cd89SMartin J. Bligh count = target;
421a686cd89SMartin J. Bligh /* allocating blocks for indirect blocks and direct blocks */
422b450159dSYe Bin current_block = ext2_new_blocks(inode, goal, &count, err, 0);
423a686cd89SMartin J. Bligh if (*err)
424a686cd89SMartin J. Bligh goto failed_out;
425a686cd89SMartin J. Bligh
426a686cd89SMartin J. Bligh target -= count;
427a686cd89SMartin J. Bligh /* allocate blocks for indirect blocks */
428a686cd89SMartin J. Bligh while (index < indirect_blks && count) {
429a686cd89SMartin J. Bligh new_blocks[index++] = current_block++;
430a686cd89SMartin J. Bligh count--;
431a686cd89SMartin J. Bligh }
432a686cd89SMartin J. Bligh
433a686cd89SMartin J. Bligh if (count > 0)
434a686cd89SMartin J. Bligh break;
435a686cd89SMartin J. Bligh }
436a686cd89SMartin J. Bligh
437a686cd89SMartin J. Bligh /* save the new block number for the first direct block */
438a686cd89SMartin J. Bligh new_blocks[index] = current_block;
439a686cd89SMartin J. Bligh
440a686cd89SMartin J. Bligh /* total number of blocks allocated for direct blocks */
441a686cd89SMartin J. Bligh ret = count;
442a686cd89SMartin J. Bligh *err = 0;
443a686cd89SMartin J. Bligh return ret;
444a686cd89SMartin J. Bligh failed_out:
445a686cd89SMartin J. Bligh for (i = 0; i <index; i++)
446a686cd89SMartin J. Bligh ext2_free_blocks(inode, new_blocks[i], 1);
447addacc7dSAl Viro if (index)
448addacc7dSAl Viro mark_inode_dirty(inode);
449a686cd89SMartin J. Bligh return ret;
4501da177e4SLinus Torvalds }
4511da177e4SLinus Torvalds
4521da177e4SLinus Torvalds /**
4531da177e4SLinus Torvalds * ext2_alloc_branch - allocate and set up a chain of blocks.
4541da177e4SLinus Torvalds * @inode: owner
4551206d028SShuning Zhang * @indirect_blks: depth of the chain (number of blocks to allocate)
4561206d028SShuning Zhang * @blks: number of allocated direct blocks
4571206d028SShuning Zhang * @goal: preferred place for allocation
4581da177e4SLinus Torvalds * @offsets: offsets (in the blocks) to store the pointers to next.
4591da177e4SLinus Torvalds * @branch: place to store the chain in.
4601da177e4SLinus Torvalds *
4611da177e4SLinus Torvalds * This function allocates @num blocks, zeroes out all but the last one,
4621da177e4SLinus Torvalds * links them into chain and (if we are synchronous) writes them to disk.
4631da177e4SLinus Torvalds * In other words, it prepares a branch that can be spliced onto the
4641da177e4SLinus Torvalds * inode. It stores the information about that chain in the branch[], in
4651da177e4SLinus Torvalds * the same format as ext2_get_branch() would do. We are calling it after
4661da177e4SLinus Torvalds * we had read the existing part of chain and partial points to the last
4671da177e4SLinus Torvalds * triple of that (one with zero ->key). Upon the exit we have the same
46872b43570SNamhyung Kim * picture as after the successful ext2_get_block(), except that in one
4691da177e4SLinus Torvalds * place chain is disconnected - *branch->p is still zero (we did not
4701da177e4SLinus Torvalds * set the last link), but branch->key contains the number that should
4711da177e4SLinus Torvalds * be placed into *branch->p to fill that gap.
4721da177e4SLinus Torvalds *
4731da177e4SLinus Torvalds * If allocation fails we free all blocks we've allocated (and forget
4741da177e4SLinus Torvalds * their buffer_heads) and return the error value the from failed
4751da177e4SLinus Torvalds * ext2_alloc_block() (normally -ENOSPC). Otherwise we set the chain
4761da177e4SLinus Torvalds * as described above and return 0.
4771da177e4SLinus Torvalds */
4781da177e4SLinus Torvalds
ext2_alloc_branch(struct inode * inode,int indirect_blks,int * blks,ext2_fsblk_t goal,int * offsets,Indirect * branch)4791da177e4SLinus Torvalds static int ext2_alloc_branch(struct inode *inode,
480a686cd89SMartin J. Bligh int indirect_blks, int *blks, ext2_fsblk_t goal,
481a686cd89SMartin J. Bligh int *offsets, Indirect *branch)
4821da177e4SLinus Torvalds {
4831da177e4SLinus Torvalds int blocksize = inode->i_sb->s_blocksize;
484a686cd89SMartin J. Bligh int i, n = 0;
485a686cd89SMartin J. Bligh int err = 0;
4861da177e4SLinus Torvalds struct buffer_head *bh;
487a686cd89SMartin J. Bligh int num;
488a686cd89SMartin J. Bligh ext2_fsblk_t new_blocks[4];
489a686cd89SMartin J. Bligh ext2_fsblk_t current_block;
490a686cd89SMartin J. Bligh
491a686cd89SMartin J. Bligh num = ext2_alloc_blocks(inode, goal, indirect_blks,
492a686cd89SMartin J. Bligh *blks, new_blocks, &err);
493a686cd89SMartin J. Bligh if (err)
494a686cd89SMartin J. Bligh return err;
495a686cd89SMartin J. Bligh
496a686cd89SMartin J. Bligh branch[0].key = cpu_to_le32(new_blocks[0]);
4971da177e4SLinus Torvalds /*
498a686cd89SMartin J. Bligh * metadata blocks and data blocks are allocated.
4991da177e4SLinus Torvalds */
500a686cd89SMartin J. Bligh for (n = 1; n <= indirect_blks; n++) {
501a686cd89SMartin J. Bligh /*
502a686cd89SMartin J. Bligh * Get buffer_head for parent block, zero it out
503a686cd89SMartin J. Bligh * and set the pointer to new one, then send
504a686cd89SMartin J. Bligh * parent to disk.
505a686cd89SMartin J. Bligh */
506a686cd89SMartin J. Bligh bh = sb_getblk(inode->i_sb, new_blocks[n-1]);
5078d8759ebSWang Shilong if (unlikely(!bh)) {
5088d8759ebSWang Shilong err = -ENOMEM;
5098d8759ebSWang Shilong goto failed;
5108d8759ebSWang Shilong }
511a686cd89SMartin J. Bligh branch[n].bh = bh;
5121da177e4SLinus Torvalds lock_buffer(bh);
5131da177e4SLinus Torvalds memset(bh->b_data, 0, blocksize);
5141da177e4SLinus Torvalds branch[n].p = (__le32 *) bh->b_data + offsets[n];
515a686cd89SMartin J. Bligh branch[n].key = cpu_to_le32(new_blocks[n]);
5161da177e4SLinus Torvalds *branch[n].p = branch[n].key;
517a686cd89SMartin J. Bligh if ( n == indirect_blks) {
518a686cd89SMartin J. Bligh current_block = new_blocks[n];
519a686cd89SMartin J. Bligh /*
520a686cd89SMartin J. Bligh * End of chain, update the last new metablock of
521a686cd89SMartin J. Bligh * the chain to point to the new allocated
522a686cd89SMartin J. Bligh * data blocks numbers
523a686cd89SMartin J. Bligh */
524a686cd89SMartin J. Bligh for (i=1; i < num; i++)
525a686cd89SMartin J. Bligh *(branch[n].p + i) = cpu_to_le32(++current_block);
526a686cd89SMartin J. Bligh }
5271da177e4SLinus Torvalds set_buffer_uptodate(bh);
5281da177e4SLinus Torvalds unlock_buffer(bh);
5291da177e4SLinus Torvalds mark_buffer_dirty_inode(bh, inode);
5301da177e4SLinus Torvalds /* We used to sync bh here if IS_SYNC(inode).
531a2a735adSJan Kara * But we now rely upon generic_write_sync()
5321da177e4SLinus Torvalds * and b_inode_buffers. But not for directories.
5331da177e4SLinus Torvalds */
5341da177e4SLinus Torvalds if (S_ISDIR(inode->i_mode) && IS_DIRSYNC(inode))
5351da177e4SLinus Torvalds sync_dirty_buffer(bh);
5361da177e4SLinus Torvalds }
537a686cd89SMartin J. Bligh *blks = num;
5381da177e4SLinus Torvalds return err;
5398d8759ebSWang Shilong
5408d8759ebSWang Shilong failed:
5418d8759ebSWang Shilong for (i = 1; i < n; i++)
5428d8759ebSWang Shilong bforget(branch[i].bh);
5438d8759ebSWang Shilong for (i = 0; i < indirect_blks; i++)
5448d8759ebSWang Shilong ext2_free_blocks(inode, new_blocks[i], 1);
5458d8759ebSWang Shilong ext2_free_blocks(inode, new_blocks[i], num);
5468d8759ebSWang Shilong return err;
5471da177e4SLinus Torvalds }
5481da177e4SLinus Torvalds
5491da177e4SLinus Torvalds /**
5501da177e4SLinus Torvalds * ext2_splice_branch - splice the allocated branch onto inode.
5511da177e4SLinus Torvalds * @inode: owner
5521da177e4SLinus Torvalds * @block: (logical) number of block we are adding
5531da177e4SLinus Torvalds * @where: location of missing link
554a686cd89SMartin J. Bligh * @num: number of indirect blocks we are adding
555a686cd89SMartin J. Bligh * @blks: number of direct blocks we are adding
5561da177e4SLinus Torvalds *
 * This function fills the missing link and does all housekeeping needed in
 * inode (->i_blocks, etc.). When it is done we end up with the full chain
 * to the new block; nothing is returned.
5601da177e4SLinus Torvalds */
static void ext2_splice_branch(struct inode *inode,
			long block, Indirect *where, int num, int blks)
{
	struct ext2_block_alloc_info *alloc_info;
	ext2_fsblk_t first_blk;
	int idx;

	alloc_info = EXT2_I(inode)->i_block_alloc_info;

	/* XXX LOCKING probably should have i_meta_lock ? */

	/* Fill in the missing link: from here on the branch is attached. */
	where->p[0] = where->key;

	/*
	 * When the new branch contains no indirect blocks (num == 0), the
	 * additional direct blocks are recorded in the slots that follow
	 * where->p, numbered consecutively after where->key.
	 */
	if (num == 0 && blks > 1) {
		first_blk = le32_to_cpu(where->key);
		for (idx = 1; idx < blks; idx++)
			where->p[idx] = cpu_to_le32(first_blk + idx);
	}

	/*
	 * Remember the last logical and physical block just allocated in
	 * i_block_alloc_info (when present) so that the next allocation can
	 * pick a good goal block.
	 */
	if (alloc_info) {
		alloc_info->last_alloc_logical_block = block + blks - 1;
		alloc_info->last_alloc_physical_block =
				le32_to_cpu(where[num].key) + blks - 1;
	}

	/* The atomic part is over; the rest is housekeeping. */

	/* Spliced onto an indirect block? Then that buffer is now dirty. */
	if (where->bh)
		mark_buffer_dirty_inode(where->bh, inode);

	inode_set_ctime_current(inode);
	mark_inode_dirty(inode);
}
6051da177e4SLinus Torvalds
6061da177e4SLinus Torvalds /*
6071da177e4SLinus Torvalds * Allocation strategy is simple: if we have to allocate something, we will
6081da177e4SLinus Torvalds * have to go the whole way to leaf. So let's do it before attaching anything
6091da177e4SLinus Torvalds * to tree, set linkage between the newborn blocks, write them if sync is
6101da177e4SLinus Torvalds * required, recheck the path, free and repeat if check fails, otherwise
6111da177e4SLinus Torvalds * set the last missing link (that will protect us from any truncate-generated
6121da177e4SLinus Torvalds * removals - all blocks on the path are immune now) and possibly force the
6131da177e4SLinus Torvalds * write on the parent block.
6141da177e4SLinus Torvalds * That has a nice additional property: no special recovery from the failed
6151da177e4SLinus Torvalds * allocations is needed - we simply release blocks and do not touch anything
6161da177e4SLinus Torvalds * reachable from inode.
617a686cd89SMartin J. Bligh *
 * Note: this function takes no `handle' argument; the old remark that
 * `handle' can be NULL if create == 0 does not apply to this signature.
619a686cd89SMartin J. Bligh *
620a686cd89SMartin J. Bligh * return > 0, # of blocks mapped or allocated.
621a686cd89SMartin J. Bligh * return = 0, if plain lookup failed.
622a686cd89SMartin J. Bligh * return < 0, error case.
6231da177e4SLinus Torvalds */
static int ext2_get_blocks(struct inode *inode,
			   sector_t iblock, unsigned long maxblocks,
			   u32 *bno, bool *new, bool *boundary,
			   int create)
{
	struct ext2_inode_info *ei = EXT2_I(inode);
	Indirect chain[4];
	Indirect *partial;
	int offsets[4];
	int blocks_to_boundary = 0;
	int indirect_blks;
	int depth;
	int count = 0;
	int err;
	ext2_fsblk_t first_block = 0;
	ext2_fsblk_t goal;

	BUG_ON(maxblocks == 0);

	depth = ext2_block_to_path(inode, iblock, offsets, &blocks_to_boundary);
	if (depth == 0)
		return -EIO;

	partial = ext2_get_branch(inode, depth, offsets, chain, &err);
	if (!partial) {
		/*
		 * Simplest case - block found, no allocation needed.  Try to
		 * extend the mapping over physically contiguous neighbours.
		 */
		first_block = le32_to_cpu(chain[depth - 1].key);
		for (count = 1;
		     count < maxblocks && count <= blocks_to_boundary;
		     count++) {
			ext2_fsblk_t blk;

			if (!verify_chain(chain, chain + depth - 1)) {
				/*
				 * Indirect block might be removed by
				 * truncate while we were reading it.
				 * Handling of that case: forget what we've
				 * got now, go to reread.
				 */
				err = -EAGAIN;
				count = 0;
				partial = chain + depth - 1;
				break;
			}
			blk = le32_to_cpu(chain[depth - 1].p[count]);
			if (blk != first_block + count)
				break;
		}
		if (err != -EAGAIN)
			goto got_it;
	}

	/* Next simple case - plain lookup or failed read of indirect block */
	if (!create || err == -EIO)
		goto cleanup;

	mutex_lock(&ei->truncate_mutex);
	/*
	 * If the indirect block is missing while we are reading
	 * the chain (ext2_get_branch() returns -EAGAIN err), or
	 * if the chain has been changed after we grab the semaphore,
	 * (either because another process truncated this branch, or
	 * another get_block allocated this branch) re-grab the chain to see if
	 * the request block has been allocated or not.
	 *
	 * Since we already block the truncate/other get_block
	 * at this point, we will have the current copy of the chain when we
	 * splice the branch into the tree.
	 */
	if (err == -EAGAIN || !verify_chain(chain, partial)) {
		/* Drop the buffers of the stale chain before re-reading. */
		for (; partial > chain; partial--)
			brelse(partial->bh);

		partial = ext2_get_branch(inode, depth, offsets, chain, &err);
		if (!partial) {
			/* Somebody else mapped the block in the meantime. */
			count++;
			mutex_unlock(&ei->truncate_mutex);
			goto got_it;
		}

		if (err) {
			mutex_unlock(&ei->truncate_mutex);
			goto cleanup;
		}
	}

	/*
	 * Okay, we need to do block allocation.  Lazily initialize the block
	 * allocation info here if necessary.
	 */
	if (S_ISREG(inode->i_mode) && !ei->i_block_alloc_info)
		ext2_init_block_alloc_info(inode);

	goal = ext2_find_goal(inode, iblock, partial);

	/* the number of blocks need to allocate for [d,t]indirect blocks */
	indirect_blks = (chain + depth) - partial - 1;

	/*
	 * Next look up the indirect map to count the total number of
	 * direct blocks to allocate for this branch.
	 */
	count = ext2_blks_to_allocate(partial, indirect_blks,
				      maxblocks, blocks_to_boundary);

	/*
	 * XXX ???? Block out ext2_truncate while we alter the tree
	 */
	err = ext2_alloc_branch(inode, indirect_blks, &count, goal,
				offsets + (partial - chain), partial);
	if (err) {
		mutex_unlock(&ei->truncate_mutex);
		goto cleanup;
	}

	if (IS_DAX(inode)) {
		ext2_fsblk_t new_first = le32_to_cpu(chain[depth - 1].key);

		/*
		 * We must unmap blocks before zeroing so that writeback cannot
		 * overwrite zeros with stale data from block device page cache.
		 */
		clean_bdev_aliases(inode->i_sb->s_bdev, new_first, count);

		/*
		 * block must be initialised before we put it in the tree
		 * so that it's not found by another thread before it's
		 * initialised
		 */
		err = sb_issue_zeroout(inode->i_sb, new_first, count,
				       GFP_NOFS);
		if (err) {
			mutex_unlock(&ei->truncate_mutex);
			goto cleanup;
		}
	}
	*new = true;

	ext2_splice_branch(inode, iblock, partial, indirect_blks, count);
	mutex_unlock(&ei->truncate_mutex);

got_it:
	if (count > blocks_to_boundary)
		*boundary = true;
	err = count;
	/* Clean up and exit: release the whole chain. */
	partial = chain + depth - 1;

cleanup:
	for (; partial > chain; partial--)
		brelse(partial->bh);

	/* Only a positive result carries a valid physical block number. */
	if (err > 0)
		*bno = le32_to_cpu(chain[depth - 1].key);
	return err;
}
7821da177e4SLinus Torvalds
/*
 * get_block-style wrapper around ext2_get_blocks().
 *
 * The number of blocks requested is derived from bh_result->b_size.  On a
 * positive result the buffer head is mapped to the first physical block,
 * b_size is set to the length actually mapped, and the new/boundary buffer
 * flags are set as reported by ext2_get_blocks().  Returns 0 in that case;
 * otherwise the zero or negative value from ext2_get_blocks() is returned
 * unchanged and bh_result is left untouched.
 */
int ext2_get_block(struct inode *inode, sector_t iblock,
		struct buffer_head *bh_result, int create)
{
	unsigned max_blocks = bh_result->b_size >> inode->i_blkbits;
	bool is_new = false;
	bool at_boundary = false;
	u32 phys;
	int nr_mapped;

	nr_mapped = ext2_get_blocks(inode, iblock, max_blocks, &phys,
				    &is_new, &at_boundary, create);
	if (nr_mapped > 0) {
		map_bh(bh_result, inode->i_sb, phys);
		bh_result->b_size = (nr_mapped << inode->i_blkbits);
		if (is_new)
			set_buffer_new(bh_result);
		if (at_boundary)
			set_buffer_boundary(bh_result);
		return 0;
	}

	return nr_mapped;
}
805a686cd89SMartin J. Bligh
/*
 * iomap_begin callback: map (and, for permitted writes, allocate) the blocks
 * backing the range starting at @offset and describe them in @iomap.
 *
 * @inode:  inode being mapped
 * @offset: byte offset of the start of the range
 * @length: length of the range in bytes
 * @flags:  IOMAP_* request flags (IOMAP_WRITE, IOMAP_DIRECT, IOMAP_DAX are
 *          examined here)
 * @iomap:  mapping to fill in
 * @srcmap: unused by this function
 *
 * Returns 0 on success, a negative error from ext2_get_blocks(), or
 * -ENOTBLK when a direct-I/O write hits a hole that must not be filled.
 */
static int ext2_iomap_begin(struct inode *inode, loff_t offset, loff_t length,
		unsigned flags, struct iomap *iomap, struct iomap *srcmap)
{
	unsigned int blkbits = inode->i_blkbits;
	unsigned long first_block = offset >> blkbits;
	unsigned long max_blocks = (length + (1 << blkbits) - 1) >> blkbits;
	struct ext2_sb_info *sbi = EXT2_SB(inode->i_sb);
	bool new = false, boundary = false;
	u32 bno;
	int ret;
	bool create = flags & IOMAP_WRITE;

	/*
	 * For writes that could fill holes inside i_size on a
	 * DIO_SKIP_HOLES filesystem we forbid block creations: only
	 * overwrites are permitted.
	 *
	 * The shift is done in 64 bits (as for iomap->offset below) so the
	 * byte position cannot wrap where unsigned long is 32 bits wide.
	 */
	if ((flags & IOMAP_DIRECT) &&
	    ((u64)first_block << blkbits) < i_size_read(inode))
		create = false;

	/*
	 * Start from a clean flag word *before* any flag is set.  Resetting
	 * it after the IOMAP_F_DIRTY check would silently discard that flag.
	 */
	iomap->flags = 0;

	/*
	 * Writes that span EOF might trigger an IO size update on completion,
	 * so consider them to be dirty for the purposes of O_DSYNC even if
	 * there is no other metadata changes pending or have been made here.
	 */
	if ((flags & IOMAP_WRITE) && offset + length > i_size_read(inode))
		iomap->flags |= IOMAP_F_DIRTY;

	ret = ext2_get_blocks(inode, first_block, max_blocks,
			&bno, &new, &boundary, create);
	if (ret < 0)
		return ret;

	iomap->offset = (u64)first_block << blkbits;
	if (flags & IOMAP_DAX)
		iomap->dax_dev = sbi->s_daxdev;
	else
		iomap->bdev = inode->i_sb->s_bdev;

	if (ret == 0) {
		/*
		 * Switch to buffered-io for writing to holes in a non-extent
		 * based filesystem to avoid stale data exposure problem.
		 */
		if (!create && (flags & IOMAP_WRITE) && (flags & IOMAP_DIRECT))
			return -ENOTBLK;
		/* Nothing mapped: report a single-block hole. */
		iomap->type = IOMAP_HOLE;
		iomap->addr = IOMAP_NULL_ADDR;
		iomap->length = 1 << blkbits;
	} else {
		/* ret blocks starting at physical block bno are mapped. */
		iomap->type = IOMAP_MAPPED;
		iomap->addr = (u64)bno << blkbits;
		if (flags & IOMAP_DAX)
			iomap->addr += sbi->s_dax_part_off;
		iomap->length = (u64)ret << blkbits;
		iomap->flags |= IOMAP_F_MERGED;
	}

	if (new)
		iomap->flags |= IOMAP_F_NEW;
	return 0;
}
87025f4e702SChristoph Hellwig
87125f4e702SChristoph Hellwig static int
ext2_iomap_end(struct inode * inode,loff_t offset,loff_t length,ssize_t written,unsigned flags,struct iomap * iomap)87225f4e702SChristoph Hellwig ext2_iomap_end(struct inode *inode, loff_t offset, loff_t length,
87325f4e702SChristoph Hellwig ssize_t written, unsigned flags, struct iomap *iomap)
87425f4e702SChristoph Hellwig {
875fb5de435SRitesh Harjani (IBM) /*
876fb5de435SRitesh Harjani (IBM) * Switch to buffered-io in case of any error.
877fb5de435SRitesh Harjani (IBM) * Blocks allocated can be used by the buffered-io path.
878fb5de435SRitesh Harjani (IBM) */
879fb5de435SRitesh Harjani (IBM) if ((flags & IOMAP_DIRECT) && (flags & IOMAP_WRITE) && written == 0)
880fb5de435SRitesh Harjani (IBM) return -ENOTBLK;
881fb5de435SRitesh Harjani (IBM)
88225f4e702SChristoph Hellwig if (iomap->type == IOMAP_MAPPED &&
88325f4e702SChristoph Hellwig written < length &&
88425f4e702SChristoph Hellwig (flags & IOMAP_WRITE))
88525f4e702SChristoph Hellwig ext2_write_failed(inode->i_mapping, offset + length);
88625f4e702SChristoph Hellwig return 0;
88725f4e702SChristoph Hellwig }
88825f4e702SChristoph Hellwig
8898ff6daa1SChristoph Hellwig const struct iomap_ops ext2_iomap_ops = {
89025f4e702SChristoph Hellwig .iomap_begin = ext2_iomap_begin,
89125f4e702SChristoph Hellwig .iomap_end = ext2_iomap_end,
89225f4e702SChristoph Hellwig };
89325f4e702SChristoph Hellwig
/*
 * fiemap implementation built on iomap_fiemap() and ext2_iomap_ops.
 *
 * The requested length is clamped to the current i_size and the whole
 * operation runs under the inode lock.  Returns whatever iomap_fiemap()
 * returns.
 */
int ext2_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo,
		u64 start, u64 len)
{
	u64 isize;
	int ret;

	inode_lock(inode);

	isize = i_size_read(inode);
	if (isize < len)
		len = isize;

	ret = iomap_fiemap(inode, fieinfo, start, len, &ext2_iomap_ops);

	inode_unlock(inode);
	return ret;
}
90668c9d702SJosef Bacik
ext2_read_folio(struct file * file,struct folio * folio)907f132ab7dSMatthew Wilcox (Oracle) static int ext2_read_folio(struct file *file, struct folio *folio)
9081da177e4SLinus Torvalds {
909f132ab7dSMatthew Wilcox (Oracle) return mpage_read_folio(folio, ext2_get_block);
9101da177e4SLinus Torvalds }
9111da177e4SLinus Torvalds
ext2_readahead(struct readahead_control * rac)912d4388340SMatthew Wilcox (Oracle) static void ext2_readahead(struct readahead_control *rac)
9131da177e4SLinus Torvalds {
914d4388340SMatthew Wilcox (Oracle) mpage_readahead(rac, ext2_get_block);
9151da177e4SLinus Torvalds }
9161da177e4SLinus Torvalds
9171da177e4SLinus Torvalds static int
ext2_write_begin(struct file * file,struct address_space * mapping,loff_t pos,unsigned len,struct page ** pagep,void ** fsdata)918f34fb6ecSNick Piggin ext2_write_begin(struct file *file, struct address_space *mapping,
9199d6b0cd7SMatthew Wilcox (Oracle) loff_t pos, unsigned len, struct page **pagep, void **fsdata)
9201da177e4SLinus Torvalds {
921737f2e93Snpiggin@suse.de int ret;
922737f2e93Snpiggin@suse.de
923b3992d1eSMatthew Wilcox (Oracle) ret = block_write_begin(mapping, pos, len, pagep, ext2_get_block);
924737f2e93Snpiggin@suse.de if (ret < 0)
925737f2e93Snpiggin@suse.de ext2_write_failed(mapping, pos + len);
926737f2e93Snpiggin@suse.de return ret;
927737f2e93Snpiggin@suse.de }
928737f2e93Snpiggin@suse.de
/*
 * write_end callback: finish the write through generic_write_end() and call
 * ext2_write_failed() when its result compares below @len.  Returns the
 * value produced by generic_write_end().
 */
static int ext2_write_end(struct file *file, struct address_space *mapping,
			loff_t pos, unsigned len, unsigned copied,
			struct page *page, void *fsdata)
{
	int done = generic_write_end(file, mapping, pos, len, copied, page,
				     fsdata);

	/* NOTE: len is unsigned, so this comparison is done unsigned. */
	if (done < len)
		ext2_write_failed(mapping, pos + len);

	return done;
}
9401da177e4SLinus Torvalds
/* bmap callback: delegate to generic_block_bmap() with ext2_get_block. */
static sector_t ext2_bmap(struct address_space *mapping, sector_t block)
{
	sector_t mapped = generic_block_bmap(mapping, block, ext2_get_block);

	return mapped;
}
9451da177e4SLinus Torvalds
9461da177e4SLinus Torvalds static int
ext2_writepages(struct address_space * mapping,struct writeback_control * wbc)9471da177e4SLinus Torvalds ext2_writepages(struct address_space *mapping, struct writeback_control *wbc)
9481da177e4SLinus Torvalds {
9491da177e4SLinus Torvalds return mpage_writepages(mapping, wbc, ext2_get_block);
9501da177e4SLinus Torvalds }
9511da177e4SLinus Torvalds
952fb094c90SDan Williams static int
ext2_dax_writepages(struct address_space * mapping,struct writeback_control * wbc)953fb094c90SDan Williams ext2_dax_writepages(struct address_space *mapping, struct writeback_control *wbc)
954fb094c90SDan Williams {
9553f666c56SVivek Goyal struct ext2_sb_info *sbi = EXT2_SB(mapping->host->i_sb);
9563f666c56SVivek Goyal
9573f666c56SVivek Goyal return dax_writeback_mapping_range(mapping, sbi->s_daxdev, wbc);
958fb094c90SDan Williams }
959fb094c90SDan Williams
960f5e54d6eSChristoph Hellwig const struct address_space_operations ext2_aops = {
961e621900aSMatthew Wilcox (Oracle) .dirty_folio = block_dirty_folio,
9627ba13abbSMatthew Wilcox (Oracle) .invalidate_folio = block_invalidate_folio,
963f132ab7dSMatthew Wilcox (Oracle) .read_folio = ext2_read_folio,
964d4388340SMatthew Wilcox (Oracle) .readahead = ext2_readahead,
965f34fb6ecSNick Piggin .write_begin = ext2_write_begin,
966737f2e93Snpiggin@suse.de .write_end = ext2_write_end,
9671da177e4SLinus Torvalds .bmap = ext2_bmap,
968fb5de435SRitesh Harjani (IBM) .direct_IO = noop_direct_IO,
9691da177e4SLinus Torvalds .writepages = ext2_writepages,
97067235182SMatthew Wilcox (Oracle) .migrate_folio = buffer_migrate_folio,
9718ab22b9aSHisashi Hifumi .is_partially_uptodate = block_is_partially_uptodate,
972aa261f54SAndi Kleen .error_remove_page = generic_error_remove_page,
9731da177e4SLinus Torvalds };
9741da177e4SLinus Torvalds
975fb094c90SDan Williams static const struct address_space_operations ext2_dax_aops = {
976fb094c90SDan Williams .writepages = ext2_dax_writepages,
977fb094c90SDan Williams .direct_IO = noop_direct_IO,
97846de8b97SMatthew Wilcox (Oracle) .dirty_folio = noop_dirty_folio,
979fb094c90SDan Williams };
980fb094c90SDan Williams
9811da177e4SLinus Torvalds /*
9821da177e4SLinus Torvalds * Probably it should be a library function... search for first non-zero word
9831da177e4SLinus Torvalds * or memcmp with zero_page, whatever is better for particular architecture.
9841da177e4SLinus Torvalds * Linus?
9851da177e4SLinus Torvalds */
static inline int all_zeroes(__le32 *p, __le32 *q)
{
	/* Scan [p, q); an empty range counts as all zeroes. */
	for (; p < q; p++) {
		if (*p != 0)
			return 0;
	}
	return 1;
}
9931da177e4SLinus Torvalds
9941da177e4SLinus Torvalds /**
9951da177e4SLinus Torvalds * ext2_find_shared - find the indirect blocks for partial truncation.
9961da177e4SLinus Torvalds * @inode: inode in question
9971da177e4SLinus Torvalds * @depth: depth of the affected branch
9981da177e4SLinus Torvalds * @offsets: offsets of pointers in that branch (see ext2_block_to_path)
9991da177e4SLinus Torvalds * @chain: place to store the pointers to partial indirect blocks
 * @top: place to store the (detached) top of branch
10011da177e4SLinus Torvalds *
10021da177e4SLinus Torvalds * This is a helper function used by ext2_truncate().
10031da177e4SLinus Torvalds *
10041da177e4SLinus Torvalds * When we do truncate() we may have to clean the ends of several indirect
10051da177e4SLinus Torvalds * blocks but leave the blocks themselves alive. Block is partially
100625985edcSLucas De Marchi * truncated if some data below the new i_size is referred from it (and
10071da177e4SLinus Torvalds * it is on the path to the first completely truncated data block, indeed).
10081da177e4SLinus Torvalds * We have to free the top of that path along with everything to the right
10091da177e4SLinus Torvalds * of the path. Since no allocation past the truncation point is possible
10101da177e4SLinus Torvalds * until ext2_truncate() finishes, we may safely do the latter, but top
10111da177e4SLinus Torvalds * of branch may require special attention - pageout below the truncation
10121da177e4SLinus Torvalds * point might try to populate it.
10131da177e4SLinus Torvalds *
10141da177e4SLinus Torvalds * We atomically detach the top of branch from the tree, store the block
10151da177e4SLinus Torvalds * number of its root in *@top, pointers to buffer_heads of partially
10161da177e4SLinus Torvalds * truncated blocks - in @chain[].bh and pointers to their last elements
10171da177e4SLinus Torvalds * that should not be removed - in @chain[].p. Return value is the pointer
10181da177e4SLinus Torvalds * to last filled element of @chain.
10191da177e4SLinus Torvalds *
10201da177e4SLinus Torvalds * The work left to caller to do the actual freeing of subtrees:
10211da177e4SLinus Torvalds * a) free the subtree starting from *@top
10221da177e4SLinus Torvalds * b) free the subtrees whose roots are stored in
10231da177e4SLinus Torvalds * (@chain[i].p+1 .. end of @chain[i].bh->b_data)
10241da177e4SLinus Torvalds * c) free the subtrees growing from the inode past the @chain[0].p
10251da177e4SLinus Torvalds * (no partially truncated stuff there).
10261da177e4SLinus Torvalds */
10271da177e4SLinus Torvalds
static Indirect *ext2_find_shared(struct inode *inode,
				int depth,
				int offsets[4],
				Indirect chain[4],
				__le32 *top)
{
	struct ext2_inode_info *ei = EXT2_I(inode);
	Indirect *partial, *p;
	int k = depth;
	int err;

	*top = 0;

	/* Strip trailing zero offsets from the path, keeping at least one. */
	while (k > 1 && !offsets[k - 1])
		k--;

	partial = ext2_get_branch(inode, k, offsets, chain, &err);
	if (!partial)
		partial = chain + k - 1;

	/*
	 * If the branch acquired continuation since we've looked at it -
	 * fine, it should all survive and (new) top doesn't belong to us.
	 */
	write_lock(&ei->i_meta_lock);
	if (!partial->key && *partial->p) {
		write_unlock(&ei->i_meta_lock);
		return partial;
	}

	/* Walk up while everything before our slot in the block is zero. */
	p = partial;
	while (p > chain && all_zeroes((__le32 *)p->bh->b_data, p->p))
		p--;

	/*
	 * OK, we've found the last block that must survive. The rest of our
	 * branch should be detached before unlocking. However, if that rest
	 * of branch is all ours and does not grow immediately from the inode
	 * it's easier to cheat and just decrement partial->p.
	 */
	if (p == chain + k - 1 && p > chain) {
		p->p--;
	} else {
		*top = *p->p;
		*p->p = 0;
	}
	write_unlock(&ei->i_meta_lock);

	/* Release the buffers below the surviving block. */
	for (; partial > p; partial--)
		brelse(partial->bh);

	return partial;
}
10761da177e4SLinus Torvalds
10771da177e4SLinus Torvalds /**
10781da177e4SLinus Torvalds * ext2_free_data - free a list of data blocks
10791da177e4SLinus Torvalds * @inode: inode we are dealing with
10801da177e4SLinus Torvalds * @p: array of block numbers
10811da177e4SLinus Torvalds * @q: points immediately past the end of array
10821da177e4SLinus Torvalds *
108325985edcSLucas De Marchi * We are freeing all blocks referred from that array (numbers are
10841da177e4SLinus Torvalds * stored as little-endian 32-bit) and updating @inode->i_blocks
10851da177e4SLinus Torvalds * appropriately.
10861da177e4SLinus Torvalds */
static inline void ext2_free_data(struct inode *inode, __le32 *p, __le32 *q)
{
	ext2_fsblk_t run_start = 0;	/* first block of the pending run */
	ext2_fsblk_t run_len = 0;	/* blocks in the pending run */
	ext2_fsblk_t nr;

	for ( ; p < q; p++) {
		nr = le32_to_cpu(*p);
		if (!nr)
			continue;

		*p = 0;

		/* Extend the pending run while blocks stay contiguous. */
		if (run_len != 0 && run_start == nr - run_len) {
			run_len++;
			continue;
		}

		/* Not contiguous: flush the pending run, if there is one. */
		if (run_len != 0) {
			ext2_free_blocks(inode, run_start, run_len);
			mark_inode_dirty(inode);
		}

		/* Start a new run at this block. */
		run_start = nr;
		run_len = 1;
	}

	/* Flush whatever run is still pending. */
	if (run_len > 0) {
		ext2_free_blocks(inode, run_start, run_len);
		mark_inode_dirty(inode);
	}
}
11151da177e4SLinus Torvalds
11161da177e4SLinus Torvalds /**
11171da177e4SLinus Torvalds * ext2_free_branches - free an array of branches
11181da177e4SLinus Torvalds * @inode: inode we are dealing with
11191da177e4SLinus Torvalds * @p: array of block numbers
11201da177e4SLinus Torvalds * @q: pointer immediately past the end of array
11211da177e4SLinus Torvalds * @depth: depth of the branches to free
11221da177e4SLinus Torvalds *
112325985edcSLucas De Marchi * We are freeing all blocks referred from these branches (numbers are
11241da177e4SLinus Torvalds * stored as little-endian 32-bit) and updating @inode->i_blocks
11251da177e4SLinus Torvalds * appropriately.
11261da177e4SLinus Torvalds */
ext2_free_branches(struct inode * inode,__le32 * p,__le32 * q,int depth)11271da177e4SLinus Torvalds static void ext2_free_branches(struct inode *inode, __le32 *p, __le32 *q, int depth)
11281da177e4SLinus Torvalds {
11291da177e4SLinus Torvalds struct buffer_head * bh;
11302ebc736cSGeorg Ottinger ext2_fsblk_t nr;
11311da177e4SLinus Torvalds
11321da177e4SLinus Torvalds if (depth--) {
11331da177e4SLinus Torvalds int addr_per_block = EXT2_ADDR_PER_BLOCK(inode->i_sb);
11341da177e4SLinus Torvalds for ( ; p < q ; p++) {
11351da177e4SLinus Torvalds nr = le32_to_cpu(*p);
11361da177e4SLinus Torvalds if (!nr)
11371da177e4SLinus Torvalds continue;
11381da177e4SLinus Torvalds *p = 0;
11391da177e4SLinus Torvalds bh = sb_bread(inode->i_sb, nr);
11401da177e4SLinus Torvalds /*
11411da177e4SLinus Torvalds * A read failure? Report error and clear slot
11421da177e4SLinus Torvalds * (should be rare).
11431da177e4SLinus Torvalds */
11441da177e4SLinus Torvalds if (!bh) {
11451da177e4SLinus Torvalds ext2_error(inode->i_sb, "ext2_free_branches",
11461da177e4SLinus Torvalds "Read failure, inode=%ld, block=%ld",
11471da177e4SLinus Torvalds inode->i_ino, nr);
11481da177e4SLinus Torvalds continue;
11491da177e4SLinus Torvalds }
11501da177e4SLinus Torvalds ext2_free_branches(inode,
11511da177e4SLinus Torvalds (__le32*)bh->b_data,
11521da177e4SLinus Torvalds (__le32*)bh->b_data + addr_per_block,
11531da177e4SLinus Torvalds depth);
11541da177e4SLinus Torvalds bforget(bh);
11551da177e4SLinus Torvalds ext2_free_blocks(inode, nr, 1);
11561da177e4SLinus Torvalds mark_inode_dirty(inode);
11571da177e4SLinus Torvalds }
11581da177e4SLinus Torvalds } else
11591da177e4SLinus Torvalds ext2_free_data(inode, p, q);
11601da177e4SLinus Torvalds }
11611da177e4SLinus Torvalds
116270f3bad8SJan Kara /* mapping->invalidate_lock must be held when calling this function */
__ext2_truncate_blocks(struct inode * inode,loff_t offset)1163737f2e93Snpiggin@suse.de static void __ext2_truncate_blocks(struct inode *inode, loff_t offset)
11641da177e4SLinus Torvalds {
11651da177e4SLinus Torvalds __le32 *i_data = EXT2_I(inode)->i_data;
1166a686cd89SMartin J. Bligh struct ext2_inode_info *ei = EXT2_I(inode);
11671da177e4SLinus Torvalds int addr_per_block = EXT2_ADDR_PER_BLOCK(inode->i_sb);
11681da177e4SLinus Torvalds int offsets[4];
11691da177e4SLinus Torvalds Indirect chain[4];
11701da177e4SLinus Torvalds Indirect *partial;
11711da177e4SLinus Torvalds __le32 nr = 0;
11721da177e4SLinus Torvalds int n;
11731da177e4SLinus Torvalds long iblock;
11741da177e4SLinus Torvalds unsigned blocksize;
11751da177e4SLinus Torvalds blocksize = inode->i_sb->s_blocksize;
1176737f2e93Snpiggin@suse.de iblock = (offset + blocksize-1) >> EXT2_BLOCK_SIZE_BITS(inode->i_sb);
11771da177e4SLinus Torvalds
11785726b27bSRoss Zwisler #ifdef CONFIG_FS_DAX
117970f3bad8SJan Kara WARN_ON(!rwsem_is_locked(&inode->i_mapping->invalidate_lock));
11805726b27bSRoss Zwisler #endif
11815726b27bSRoss Zwisler
11821da177e4SLinus Torvalds n = ext2_block_to_path(inode, iblock, offsets, NULL);
11831da177e4SLinus Torvalds if (n == 0)
11841da177e4SLinus Torvalds return;
11851da177e4SLinus Torvalds
1186a686cd89SMartin J. Bligh /*
1187a686cd89SMartin J. Bligh * From here we block out all ext2_get_block() callers who want to
1188a686cd89SMartin J. Bligh * modify the block allocation tree.
1189a686cd89SMartin J. Bligh */
1190a686cd89SMartin J. Bligh mutex_lock(&ei->truncate_mutex);
1191a686cd89SMartin J. Bligh
11921da177e4SLinus Torvalds if (n == 1) {
11931da177e4SLinus Torvalds ext2_free_data(inode, i_data+offsets[0],
11941da177e4SLinus Torvalds i_data + EXT2_NDIR_BLOCKS);
11951da177e4SLinus Torvalds goto do_indirects;
11961da177e4SLinus Torvalds }
11971da177e4SLinus Torvalds
11981da177e4SLinus Torvalds partial = ext2_find_shared(inode, n, offsets, chain, &nr);
11991da177e4SLinus Torvalds /* Kill the top of shared branch (already detached) */
12001da177e4SLinus Torvalds if (nr) {
12011da177e4SLinus Torvalds if (partial == chain)
12021da177e4SLinus Torvalds mark_inode_dirty(inode);
12031da177e4SLinus Torvalds else
12041da177e4SLinus Torvalds mark_buffer_dirty_inode(partial->bh, inode);
12051da177e4SLinus Torvalds ext2_free_branches(inode, &nr, &nr+1, (chain+n-1) - partial);
12061da177e4SLinus Torvalds }
12071da177e4SLinus Torvalds /* Clear the ends of indirect blocks on the shared branch */
12081da177e4SLinus Torvalds while (partial > chain) {
12091da177e4SLinus Torvalds ext2_free_branches(inode,
12101da177e4SLinus Torvalds partial->p + 1,
12111da177e4SLinus Torvalds (__le32*)partial->bh->b_data+addr_per_block,
12121da177e4SLinus Torvalds (chain+n-1) - partial);
12131da177e4SLinus Torvalds mark_buffer_dirty_inode(partial->bh, inode);
12141da177e4SLinus Torvalds brelse (partial->bh);
12151da177e4SLinus Torvalds partial--;
12161da177e4SLinus Torvalds }
12171da177e4SLinus Torvalds do_indirects:
12181da177e4SLinus Torvalds /* Kill the remaining (whole) subtrees */
12191da177e4SLinus Torvalds switch (offsets[0]) {
12201da177e4SLinus Torvalds default:
12211da177e4SLinus Torvalds nr = i_data[EXT2_IND_BLOCK];
12221da177e4SLinus Torvalds if (nr) {
12231da177e4SLinus Torvalds i_data[EXT2_IND_BLOCK] = 0;
12241da177e4SLinus Torvalds mark_inode_dirty(inode);
12251da177e4SLinus Torvalds ext2_free_branches(inode, &nr, &nr+1, 1);
12261da177e4SLinus Torvalds }
1227df561f66SGustavo A. R. Silva fallthrough;
12281da177e4SLinus Torvalds case EXT2_IND_BLOCK:
12291da177e4SLinus Torvalds nr = i_data[EXT2_DIND_BLOCK];
12301da177e4SLinus Torvalds if (nr) {
12311da177e4SLinus Torvalds i_data[EXT2_DIND_BLOCK] = 0;
12321da177e4SLinus Torvalds mark_inode_dirty(inode);
12331da177e4SLinus Torvalds ext2_free_branches(inode, &nr, &nr+1, 2);
12341da177e4SLinus Torvalds }
1235df561f66SGustavo A. R. Silva fallthrough;
12361da177e4SLinus Torvalds case EXT2_DIND_BLOCK:
12371da177e4SLinus Torvalds nr = i_data[EXT2_TIND_BLOCK];
12381da177e4SLinus Torvalds if (nr) {
12391da177e4SLinus Torvalds i_data[EXT2_TIND_BLOCK] = 0;
12401da177e4SLinus Torvalds mark_inode_dirty(inode);
12411da177e4SLinus Torvalds ext2_free_branches(inode, &nr, &nr+1, 3);
12421da177e4SLinus Torvalds }
12438fca3c8aSGustavo A. R. Silva break;
12441da177e4SLinus Torvalds case EXT2_TIND_BLOCK:
12451da177e4SLinus Torvalds ;
12461da177e4SLinus Torvalds }
1247a686cd89SMartin J. Bligh
1248a686cd89SMartin J. Bligh ext2_discard_reservation(inode);
1249a686cd89SMartin J. Bligh
1250a686cd89SMartin J. Bligh mutex_unlock(&ei->truncate_mutex);
1251737f2e93Snpiggin@suse.de }
1252737f2e93Snpiggin@suse.de
/*
 * Free the blocks of @inode past @offset, taking the mapping's invalidate
 * lock around __ext2_truncate_blocks().  Does nothing for inodes that are
 * not regular files, directories or symlinks, nor for fast symlinks.
 */
static void ext2_truncate_blocks(struct inode *inode, loff_t offset)
{
	if (!S_ISREG(inode->i_mode) && !S_ISDIR(inode->i_mode) &&
	    !S_ISLNK(inode->i_mode))
		return;
	if (ext2_inode_is_fast_symlink(inode))
		return;

	filemap_invalidate_lock(inode->i_mapping);
	__ext2_truncate_blocks(inode, offset);
	filemap_invalidate_unlock(inode->i_mapping);
}
1265737f2e93Snpiggin@suse.de
/*
 * Change the size of @inode to @newsize.
 *
 * Returns -EINVAL for inodes that are not regular files, directories or
 * symlinks and for fast symlinks, -EPERM for append-only or immutable
 * inodes, the error of the partial-page truncation helper if that fails,
 * and 0 on success.
 */
static int ext2_setsize(struct inode *inode, loff_t newsize)
{
	int error;

	if (!S_ISREG(inode->i_mode) && !S_ISDIR(inode->i_mode) &&
	    !S_ISLNK(inode->i_mode))
		return -EINVAL;
	if (ext2_inode_is_fast_symlink(inode))
		return -EINVAL;
	if (IS_APPEND(inode) || IS_IMMUTABLE(inode))
		return -EPERM;

	inode_dio_wait(inode);

	/* Deal with the partial page at the new end of file first. */
	error = IS_DAX(inode) ?
		dax_truncate_page(inode, newsize, NULL, &ext2_iomap_ops) :
		block_truncate_page(inode->i_mapping, newsize, ext2_get_block);
	if (error)
		return error;

	/* Size update and block release happen under the invalidate lock. */
	filemap_invalidate_lock(inode->i_mapping);
	truncate_setsize(inode, newsize);
	__ext2_truncate_blocks(inode, newsize);
	filemap_invalidate_unlock(inode->i_mapping);

	inode->i_mtime = inode_set_ctime_current(inode);
	if (!inode_needs_sync(inode)) {
		mark_inode_dirty(inode);
		return 0;
	}

	sync_mapping_buffers(inode->i_mapping);
	sync_inode_metadata(inode, 1);
	return 0;
}
13041da177e4SLinus Torvalds
/*
 * Locate the on-disk copy of inode @ino on @sb.
 *
 * On success the buffer holding the inode is stored in *@p and a pointer
 * into that buffer's data is returned.  On failure *@p is NULL and the
 * result is ERR_PTR(-EINVAL) for an out-of-range inode number, or
 * ERR_PTR(-EIO) when the group descriptor or the inode block is unavailable.
 */
static struct ext2_inode *ext2_get_inode(struct super_block *sb, ino_t ino,
					struct buffer_head **p)
{
	struct ext2_group_desc *gdp;
	struct buffer_head *bh;
	unsigned long block_group;
	unsigned long block;
	unsigned long offset;

	*p = NULL;

	/*
	 * Accept the root inode and anything from the first regular inode
	 * number up to the inode count recorded in the superblock.
	 */
	if ((ino != EXT2_ROOT_INO && ino < EXT2_FIRST_INO(sb)) ||
	    ino > le32_to_cpu(EXT2_SB(sb)->s_es->s_inodes_count)) {
		ext2_error(sb, "ext2_get_inode", "bad inode number: %lu",
			   (unsigned long) ino);
		return ERR_PTR(-EINVAL);
	}

	block_group = (ino - 1) / EXT2_INODES_PER_GROUP(sb);
	gdp = ext2_get_group_desc(sb, block_group, NULL);
	if (!gdp)
		return ERR_PTR(-EIO);

	/*
	 * Figure out the offset within the block group inode table
	 */
	offset = ((ino - 1) % EXT2_INODES_PER_GROUP(sb)) * EXT2_INODE_SIZE(sb);
	block = le32_to_cpu(gdp->bg_inode_table) +
		(offset >> EXT2_BLOCK_SIZE_BITS(sb));

	bh = sb_bread(sb, block);
	if (!bh) {
		ext2_error(sb, "ext2_get_inode",
			   "unable to read inode block - inode=%lu, block=%lu",
			   (unsigned long) ino, block);
		return ERR_PTR(-EIO);
	}

	*p = bh;
	/* Reduce the table offset to an offset inside the block just read. */
	offset &= (EXT2_BLOCK_SIZE(sb) - 1);
	return (struct ext2_inode *) (bh->b_data + offset);
}
13471da177e4SLinus Torvalds
ext2_set_inode_flags(struct inode * inode)13481da177e4SLinus Torvalds void ext2_set_inode_flags(struct inode *inode)
13491da177e4SLinus Torvalds {
13501da177e4SLinus Torvalds unsigned int flags = EXT2_I(inode)->i_flags;
13511da177e4SLinus Torvalds
1352fbbbad4bSMatthew Wilcox inode->i_flags &= ~(S_SYNC | S_APPEND | S_IMMUTABLE | S_NOATIME |
1353fbbbad4bSMatthew Wilcox S_DIRSYNC | S_DAX);
13541da177e4SLinus Torvalds if (flags & EXT2_SYNC_FL)
13551da177e4SLinus Torvalds inode->i_flags |= S_SYNC;
13561da177e4SLinus Torvalds if (flags & EXT2_APPEND_FL)
13571da177e4SLinus Torvalds inode->i_flags |= S_APPEND;
13581da177e4SLinus Torvalds if (flags & EXT2_IMMUTABLE_FL)
13591da177e4SLinus Torvalds inode->i_flags |= S_IMMUTABLE;
13601da177e4SLinus Torvalds if (flags & EXT2_NOATIME_FL)
13611da177e4SLinus Torvalds inode->i_flags |= S_NOATIME;
13621da177e4SLinus Torvalds if (flags & EXT2_DIRSYNC_FL)
13631da177e4SLinus Torvalds inode->i_flags |= S_DIRSYNC;
13640a6cf913SRoss Zwisler if (test_opt(inode->i_sb, DAX) && S_ISREG(inode->i_mode))
1365fbbbad4bSMatthew Wilcox inode->i_flags |= S_DAX;
13661da177e4SLinus Torvalds }
13671da177e4SLinus Torvalds
ext2_set_file_ops(struct inode * inode)1368fb094c90SDan Williams void ext2_set_file_ops(struct inode *inode)
1369fb094c90SDan Williams {
1370fb094c90SDan Williams inode->i_op = &ext2_file_inode_operations;
1371fb094c90SDan Williams inode->i_fop = &ext2_file_operations;
1372fb094c90SDan Williams if (IS_DAX(inode))
1373fb094c90SDan Williams inode->i_mapping->a_ops = &ext2_dax_aops;
1374fb094c90SDan Williams else
1375fb094c90SDan Williams inode->i_mapping->a_ops = &ext2_aops;
1376fb094c90SDan Williams }
1377fb094c90SDan Williams
ext2_iget(struct super_block * sb,unsigned long ino)137852fcf703SDavid Howells struct inode *ext2_iget (struct super_block *sb, unsigned long ino)
13791da177e4SLinus Torvalds {
138052fcf703SDavid Howells struct ext2_inode_info *ei;
1381936bbf3aSJan Kara struct buffer_head * bh = NULL;
138252fcf703SDavid Howells struct ext2_inode *raw_inode;
138352fcf703SDavid Howells struct inode *inode;
138452fcf703SDavid Howells long ret = -EIO;
13851da177e4SLinus Torvalds int n;
1386b8a9f9e1SEric W. Biederman uid_t i_uid;
1387b8a9f9e1SEric W. Biederman gid_t i_gid;
13881da177e4SLinus Torvalds
138952fcf703SDavid Howells inode = iget_locked(sb, ino);
139052fcf703SDavid Howells if (!inode)
139152fcf703SDavid Howells return ERR_PTR(-ENOMEM);
139252fcf703SDavid Howells if (!(inode->i_state & I_NEW))
139352fcf703SDavid Howells return inode;
139452fcf703SDavid Howells
139552fcf703SDavid Howells ei = EXT2_I(inode);
1396a686cd89SMartin J. Bligh ei->i_block_alloc_info = NULL;
1397a686cd89SMartin J. Bligh
139852fcf703SDavid Howells raw_inode = ext2_get_inode(inode->i_sb, ino, &bh);
139952fcf703SDavid Howells if (IS_ERR(raw_inode)) {
140052fcf703SDavid Howells ret = PTR_ERR(raw_inode);
14011da177e4SLinus Torvalds goto bad_inode;
140252fcf703SDavid Howells }
14031da177e4SLinus Torvalds
14041da177e4SLinus Torvalds inode->i_mode = le16_to_cpu(raw_inode->i_mode);
1405b8a9f9e1SEric W. Biederman i_uid = (uid_t)le16_to_cpu(raw_inode->i_uid_low);
1406b8a9f9e1SEric W. Biederman i_gid = (gid_t)le16_to_cpu(raw_inode->i_gid_low);
14071da177e4SLinus Torvalds if (!(test_opt (inode->i_sb, NO_UID32))) {
1408b8a9f9e1SEric W. Biederman i_uid |= le16_to_cpu(raw_inode->i_uid_high) << 16;
1409b8a9f9e1SEric W. Biederman i_gid |= le16_to_cpu(raw_inode->i_gid_high) << 16;
14101da177e4SLinus Torvalds }
1411b8a9f9e1SEric W. Biederman i_uid_write(inode, i_uid);
1412b8a9f9e1SEric W. Biederman i_gid_write(inode, i_gid);
1413bfe86848SMiklos Szeredi set_nlink(inode, le16_to_cpu(raw_inode->i_links_count));
14141da177e4SLinus Torvalds inode->i_size = le32_to_cpu(raw_inode->i_size);
14154d7bf11dSMarkus Rechberger inode->i_atime.tv_sec = (signed)le32_to_cpu(raw_inode->i_atime);
1416fc4eed64SJeff Layton inode_set_ctime(inode, (signed)le32_to_cpu(raw_inode->i_ctime), 0);
14174d7bf11dSMarkus Rechberger inode->i_mtime.tv_sec = (signed)le32_to_cpu(raw_inode->i_mtime);
1418fc4eed64SJeff Layton inode->i_atime.tv_nsec = inode->i_mtime.tv_nsec = 0;
14191da177e4SLinus Torvalds ei->i_dtime = le32_to_cpu(raw_inode->i_dtime);
14201da177e4SLinus Torvalds /* We now have enough fields to check if the inode was active or not.
14211da177e4SLinus Torvalds * This is needed because nfsd might try to access dead inodes
14221da177e4SLinus Torvalds * the test is that same one that e2fsck uses
14231da177e4SLinus Torvalds * NeilBrown 1999oct15
14241da177e4SLinus Torvalds */
14251da177e4SLinus Torvalds if (inode->i_nlink == 0 && (inode->i_mode == 0 || ei->i_dtime)) {
14261da177e4SLinus Torvalds /* this inode is deleted */
142752fcf703SDavid Howells ret = -ESTALE;
14281da177e4SLinus Torvalds goto bad_inode;
14291da177e4SLinus Torvalds }
14301da177e4SLinus Torvalds inode->i_blocks = le32_to_cpu(raw_inode->i_blocks);
14311da177e4SLinus Torvalds ei->i_flags = le32_to_cpu(raw_inode->i_flags);
14329e796c9dSToshi Kani ext2_set_inode_flags(inode);
14331da177e4SLinus Torvalds ei->i_faddr = le32_to_cpu(raw_inode->i_faddr);
14341da177e4SLinus Torvalds ei->i_frag_no = raw_inode->i_frag;
14351da177e4SLinus Torvalds ei->i_frag_size = raw_inode->i_fsize;
14361da177e4SLinus Torvalds ei->i_file_acl = le32_to_cpu(raw_inode->i_file_acl);
14371da177e4SLinus Torvalds ei->i_dir_acl = 0;
1438ff0031d8SCarlos Maiolino
1439ff0031d8SCarlos Maiolino if (ei->i_file_acl &&
1440ff0031d8SCarlos Maiolino !ext2_data_block_valid(EXT2_SB(sb), ei->i_file_acl, 1)) {
1441ff0031d8SCarlos Maiolino ext2_error(sb, "ext2_iget", "bad extended attribute block %u",
1442ff0031d8SCarlos Maiolino ei->i_file_acl);
1443ff0031d8SCarlos Maiolino ret = -EFSCORRUPTED;
1444ff0031d8SCarlos Maiolino goto bad_inode;
1445ff0031d8SCarlos Maiolino }
1446ff0031d8SCarlos Maiolino
14471da177e4SLinus Torvalds if (S_ISREG(inode->i_mode))
14481da177e4SLinus Torvalds inode->i_size |= ((__u64)le32_to_cpu(raw_inode->i_size_high)) << 32;
14491da177e4SLinus Torvalds else
14501da177e4SLinus Torvalds ei->i_dir_acl = le32_to_cpu(raw_inode->i_dir_acl);
1451b46dc033SDarrick J. Wong if (i_size_read(inode) < 0) {
1452b46dc033SDarrick J. Wong ret = -EFSCORRUPTED;
1453b46dc033SDarrick J. Wong goto bad_inode;
1454b46dc033SDarrick J. Wong }
14551da177e4SLinus Torvalds ei->i_dtime = 0;
14561da177e4SLinus Torvalds inode->i_generation = le32_to_cpu(raw_inode->i_generation);
14571da177e4SLinus Torvalds ei->i_state = 0;
14581da177e4SLinus Torvalds ei->i_block_group = (ino - 1) / EXT2_INODES_PER_GROUP(inode->i_sb);
14591da177e4SLinus Torvalds ei->i_dir_start_lookup = 0;
14601da177e4SLinus Torvalds
14611da177e4SLinus Torvalds /*
14621da177e4SLinus Torvalds * NOTE! The in-memory inode i_data array is in little-endian order
14631da177e4SLinus Torvalds * even on big-endian machines: we do NOT byteswap the block numbers!
14641da177e4SLinus Torvalds */
14651da177e4SLinus Torvalds for (n = 0; n < EXT2_N_BLOCKS; n++)
14661da177e4SLinus Torvalds ei->i_data[n] = raw_inode->i_block[n];
14671da177e4SLinus Torvalds
14681da177e4SLinus Torvalds if (S_ISREG(inode->i_mode)) {
1469fb094c90SDan Williams ext2_set_file_ops(inode);
14701da177e4SLinus Torvalds } else if (S_ISDIR(inode->i_mode)) {
14711da177e4SLinus Torvalds inode->i_op = &ext2_dir_inode_operations;
14721da177e4SLinus Torvalds inode->i_fop = &ext2_dir_operations;
14731da177e4SLinus Torvalds inode->i_mapping->a_ops = &ext2_aops;
14741da177e4SLinus Torvalds } else if (S_ISLNK(inode->i_mode)) {
14758d6d0c4dSDuane Griffin if (ext2_inode_is_fast_symlink(inode)) {
1476cbe0fa38SAl Viro inode->i_link = (char *)ei->i_data;
14771da177e4SLinus Torvalds inode->i_op = &ext2_fast_symlink_inode_operations;
14788d6d0c4dSDuane Griffin nd_terminate_link(ei->i_data, inode->i_size,
14798d6d0c4dSDuane Griffin sizeof(ei->i_data) - 1);
14808d6d0c4dSDuane Griffin } else {
14811da177e4SLinus Torvalds inode->i_op = &ext2_symlink_inode_operations;
148221fc61c7SAl Viro inode_nohighmem(inode);
14831da177e4SLinus Torvalds inode->i_mapping->a_ops = &ext2_aops;
14841da177e4SLinus Torvalds }
14851da177e4SLinus Torvalds } else {
14861da177e4SLinus Torvalds inode->i_op = &ext2_special_inode_operations;
14871da177e4SLinus Torvalds if (raw_inode->i_block[0])
14881da177e4SLinus Torvalds init_special_inode(inode, inode->i_mode,
14891da177e4SLinus Torvalds old_decode_dev(le32_to_cpu(raw_inode->i_block[0])));
14901da177e4SLinus Torvalds else
14911da177e4SLinus Torvalds init_special_inode(inode, inode->i_mode,
14921da177e4SLinus Torvalds new_decode_dev(le32_to_cpu(raw_inode->i_block[1])));
14931da177e4SLinus Torvalds }
14941da177e4SLinus Torvalds brelse (bh);
149552fcf703SDavid Howells unlock_new_inode(inode);
149652fcf703SDavid Howells return inode;
14971da177e4SLinus Torvalds
14981da177e4SLinus Torvalds bad_inode:
1499936bbf3aSJan Kara brelse(bh);
150052fcf703SDavid Howells iget_failed(inode);
150152fcf703SDavid Howells return ERR_PTR(ret);
15021da177e4SLinus Torvalds }
15031da177e4SLinus Torvalds
__ext2_write_inode(struct inode * inode,int do_sync)1504a9185b41SChristoph Hellwig static int __ext2_write_inode(struct inode *inode, int do_sync)
15051da177e4SLinus Torvalds {
15061da177e4SLinus Torvalds struct ext2_inode_info *ei = EXT2_I(inode);
15071da177e4SLinus Torvalds struct super_block *sb = inode->i_sb;
15081da177e4SLinus Torvalds ino_t ino = inode->i_ino;
1509b8a9f9e1SEric W. Biederman uid_t uid = i_uid_read(inode);
1510b8a9f9e1SEric W. Biederman gid_t gid = i_gid_read(inode);
15111da177e4SLinus Torvalds struct buffer_head * bh;
15121da177e4SLinus Torvalds struct ext2_inode * raw_inode = ext2_get_inode(sb, ino, &bh);
15131da177e4SLinus Torvalds int n;
15141da177e4SLinus Torvalds int err = 0;
15151da177e4SLinus Torvalds
15161da177e4SLinus Torvalds if (IS_ERR(raw_inode))
15171da177e4SLinus Torvalds return -EIO;
15181da177e4SLinus Torvalds
15192aab03b8SXiang wangx /* For fields not tracking in the in-memory inode,
15201da177e4SLinus Torvalds * initialise them to zero for new inodes. */
15211da177e4SLinus Torvalds if (ei->i_state & EXT2_STATE_NEW)
15221da177e4SLinus Torvalds memset(raw_inode, 0, EXT2_SB(sb)->s_inode_size);
15231da177e4SLinus Torvalds
15241da177e4SLinus Torvalds raw_inode->i_mode = cpu_to_le16(inode->i_mode);
15251da177e4SLinus Torvalds if (!(test_opt(sb, NO_UID32))) {
15261da177e4SLinus Torvalds raw_inode->i_uid_low = cpu_to_le16(low_16_bits(uid));
15271da177e4SLinus Torvalds raw_inode->i_gid_low = cpu_to_le16(low_16_bits(gid));
15281da177e4SLinus Torvalds /*
15291da177e4SLinus Torvalds * Fix up interoperability with old kernels. Otherwise, old inodes get
15301da177e4SLinus Torvalds * re-used with the upper 16 bits of the uid/gid intact
15311da177e4SLinus Torvalds */
15321da177e4SLinus Torvalds if (!ei->i_dtime) {
15331da177e4SLinus Torvalds raw_inode->i_uid_high = cpu_to_le16(high_16_bits(uid));
15341da177e4SLinus Torvalds raw_inode->i_gid_high = cpu_to_le16(high_16_bits(gid));
15351da177e4SLinus Torvalds } else {
15361da177e4SLinus Torvalds raw_inode->i_uid_high = 0;
15371da177e4SLinus Torvalds raw_inode->i_gid_high = 0;
15381da177e4SLinus Torvalds }
15391da177e4SLinus Torvalds } else {
15401da177e4SLinus Torvalds raw_inode->i_uid_low = cpu_to_le16(fs_high2lowuid(uid));
15411da177e4SLinus Torvalds raw_inode->i_gid_low = cpu_to_le16(fs_high2lowgid(gid));
15421da177e4SLinus Torvalds raw_inode->i_uid_high = 0;
15431da177e4SLinus Torvalds raw_inode->i_gid_high = 0;
15441da177e4SLinus Torvalds }
15451da177e4SLinus Torvalds raw_inode->i_links_count = cpu_to_le16(inode->i_nlink);
15461da177e4SLinus Torvalds raw_inode->i_size = cpu_to_le32(inode->i_size);
15471da177e4SLinus Torvalds raw_inode->i_atime = cpu_to_le32(inode->i_atime.tv_sec);
1548fc4eed64SJeff Layton raw_inode->i_ctime = cpu_to_le32(inode_get_ctime(inode).tv_sec);
15491da177e4SLinus Torvalds raw_inode->i_mtime = cpu_to_le32(inode->i_mtime.tv_sec);
15501da177e4SLinus Torvalds
15511da177e4SLinus Torvalds raw_inode->i_blocks = cpu_to_le32(inode->i_blocks);
15521da177e4SLinus Torvalds raw_inode->i_dtime = cpu_to_le32(ei->i_dtime);
15531da177e4SLinus Torvalds raw_inode->i_flags = cpu_to_le32(ei->i_flags);
15541da177e4SLinus Torvalds raw_inode->i_faddr = cpu_to_le32(ei->i_faddr);
15551da177e4SLinus Torvalds raw_inode->i_frag = ei->i_frag_no;
15561da177e4SLinus Torvalds raw_inode->i_fsize = ei->i_frag_size;
15571da177e4SLinus Torvalds raw_inode->i_file_acl = cpu_to_le32(ei->i_file_acl);
15581da177e4SLinus Torvalds if (!S_ISREG(inode->i_mode))
15591da177e4SLinus Torvalds raw_inode->i_dir_acl = cpu_to_le32(ei->i_dir_acl);
15601da177e4SLinus Torvalds else {
15611da177e4SLinus Torvalds raw_inode->i_size_high = cpu_to_le32(inode->i_size >> 32);
15621da177e4SLinus Torvalds if (inode->i_size > 0x7fffffffULL) {
15631da177e4SLinus Torvalds if (!EXT2_HAS_RO_COMPAT_FEATURE(sb,
15641da177e4SLinus Torvalds EXT2_FEATURE_RO_COMPAT_LARGE_FILE) ||
15651da177e4SLinus Torvalds EXT2_SB(sb)->s_es->s_rev_level ==
15661da177e4SLinus Torvalds cpu_to_le32(EXT2_GOOD_OLD_REV)) {
15671da177e4SLinus Torvalds /* If this is the first large file
15681da177e4SLinus Torvalds * created, add a flag to the superblock.
15691da177e4SLinus Torvalds */
1570c15271f4SJan Blunck spin_lock(&EXT2_SB(sb)->s_lock);
15711da177e4SLinus Torvalds ext2_update_dynamic_rev(sb);
15721da177e4SLinus Torvalds EXT2_SET_RO_COMPAT_FEATURE(sb,
15731da177e4SLinus Torvalds EXT2_FEATURE_RO_COMPAT_LARGE_FILE);
1574c15271f4SJan Blunck spin_unlock(&EXT2_SB(sb)->s_lock);
157565547661SJan Kara ext2_sync_super(sb, EXT2_SB(sb)->s_es, 1);
15761da177e4SLinus Torvalds }
15771da177e4SLinus Torvalds }
15781da177e4SLinus Torvalds }
15791da177e4SLinus Torvalds
15801da177e4SLinus Torvalds raw_inode->i_generation = cpu_to_le32(inode->i_generation);
15811da177e4SLinus Torvalds if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode)) {
15821da177e4SLinus Torvalds if (old_valid_dev(inode->i_rdev)) {
15831da177e4SLinus Torvalds raw_inode->i_block[0] =
15841da177e4SLinus Torvalds cpu_to_le32(old_encode_dev(inode->i_rdev));
15851da177e4SLinus Torvalds raw_inode->i_block[1] = 0;
15861da177e4SLinus Torvalds } else {
15871da177e4SLinus Torvalds raw_inode->i_block[0] = 0;
15881da177e4SLinus Torvalds raw_inode->i_block[1] =
15891da177e4SLinus Torvalds cpu_to_le32(new_encode_dev(inode->i_rdev));
15901da177e4SLinus Torvalds raw_inode->i_block[2] = 0;
15911da177e4SLinus Torvalds }
15921da177e4SLinus Torvalds } else for (n = 0; n < EXT2_N_BLOCKS; n++)
15931da177e4SLinus Torvalds raw_inode->i_block[n] = ei->i_data[n];
15941da177e4SLinus Torvalds mark_buffer_dirty(bh);
15951da177e4SLinus Torvalds if (do_sync) {
15961da177e4SLinus Torvalds sync_dirty_buffer(bh);
15971da177e4SLinus Torvalds if (buffer_req(bh) && !buffer_uptodate(bh)) {
15981da177e4SLinus Torvalds printk ("IO error syncing ext2 inode [%s:%08lx]\n",
15991da177e4SLinus Torvalds sb->s_id, (unsigned long) ino);
16001da177e4SLinus Torvalds err = -EIO;
16011da177e4SLinus Torvalds }
16021da177e4SLinus Torvalds }
16031da177e4SLinus Torvalds ei->i_state &= ~EXT2_STATE_NEW;
16041da177e4SLinus Torvalds brelse (bh);
16051da177e4SLinus Torvalds return err;
16061da177e4SLinus Torvalds }
16071da177e4SLinus Torvalds
ext2_write_inode(struct inode * inode,struct writeback_control * wbc)1608a9185b41SChristoph Hellwig int ext2_write_inode(struct inode *inode, struct writeback_control *wbc)
1609a9185b41SChristoph Hellwig {
1610a9185b41SChristoph Hellwig return __ext2_write_inode(inode, wbc->sync_mode == WB_SYNC_ALL);
1611a9185b41SChristoph Hellwig }
1612a9185b41SChristoph Hellwig
/*
 * Fill @stat for the inode behind @path: the user-visible ext2 flags are
 * reported as statx attributes and the rest comes from generic_fillattr().
 * Always returns 0.
 */
int ext2_getattr(struct mnt_idmap *idmap, const struct path *path,
		 struct kstat *stat, u32 request_mask, unsigned int query_flags)
{
	struct inode *inode = d_inode(path->dentry);
	unsigned int flags = EXT2_I(inode)->i_flags & EXT2_FL_USER_VISIBLE;
	u64 attrs = 0;

	/* Translate each user-visible ext2 flag into its statx attribute. */
	if (flags & EXT2_APPEND_FL)
		attrs |= STATX_ATTR_APPEND;
	if (flags & EXT2_COMPR_FL)
		attrs |= STATX_ATTR_COMPRESSED;
	if (flags & EXT2_IMMUTABLE_FL)
		attrs |= STATX_ATTR_IMMUTABLE;
	if (flags & EXT2_NODUMP_FL)
		attrs |= STATX_ATTR_NODUMP;
	stat->attributes |= attrs;

	/* Attributes advertised through the mask. */
	stat->attributes_mask |= (STATX_ATTR_APPEND |
				  STATX_ATTR_COMPRESSED |
				  STATX_ATTR_ENCRYPTED |
				  STATX_ATTR_IMMUTABLE |
				  STATX_ATTR_NODUMP);

	generic_fillattr(&nop_mnt_idmap, request_mask, inode, stat);
	return 0;
}
163893bc420eSyangerkun
ext2_setattr(struct mnt_idmap * idmap,struct dentry * dentry,struct iattr * iattr)1639c1632a0fSChristian Brauner int ext2_setattr(struct mnt_idmap *idmap, struct dentry *dentry,
1640549c7297SChristian Brauner struct iattr *iattr)
16411da177e4SLinus Torvalds {
16422b0143b5SDavid Howells struct inode *inode = d_inode(dentry);
16431da177e4SLinus Torvalds int error;
16441da177e4SLinus Torvalds
1645c1632a0fSChristian Brauner error = setattr_prepare(&nop_mnt_idmap, dentry, iattr);
16461da177e4SLinus Torvalds if (error)
16471da177e4SLinus Torvalds return error;
1648907f4554SChristoph Hellwig
1649f861646aSChristian Brauner if (is_quota_modification(&nop_mnt_idmap, inode, iattr)) {
1650c2edb305SJan Kara error = dquot_initialize(inode);
1651c2edb305SJan Kara if (error)
1652c2edb305SJan Kara return error;
1653c2edb305SJan Kara }
1654f861646aSChristian Brauner if (i_uid_needs_update(&nop_mnt_idmap, iattr, inode) ||
1655f861646aSChristian Brauner i_gid_needs_update(&nop_mnt_idmap, iattr, inode)) {
1656f861646aSChristian Brauner error = dquot_transfer(&nop_mnt_idmap, inode, iattr);
16571da177e4SLinus Torvalds if (error)
16581da177e4SLinus Torvalds return error;
16591da177e4SLinus Torvalds }
1660af5a30d8SNick Piggin if (iattr->ia_valid & ATTR_SIZE && iattr->ia_size != inode->i_size) {
1661737f2e93Snpiggin@suse.de error = ext2_setsize(inode, iattr->ia_size);
1662737f2e93Snpiggin@suse.de if (error)
1663737f2e93Snpiggin@suse.de return error;
1664737f2e93Snpiggin@suse.de }
1665c1632a0fSChristian Brauner setattr_copy(&nop_mnt_idmap, inode, iattr);
1666737f2e93Snpiggin@suse.de if (iattr->ia_valid & ATTR_MODE)
166713e83a49SChristian Brauner error = posix_acl_chmod(&nop_mnt_idmap, dentry, inode->i_mode);
1668737f2e93Snpiggin@suse.de mark_inode_dirty(inode);
1669737f2e93Snpiggin@suse.de
16701da177e4SLinus Torvalds return error;
16711da177e4SLinus Torvalds }
1672