1b3b94faaSDavid Teigland /* 2b3b94faaSDavid Teigland * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved. 3da6dd40dSBob Peterson * Copyright (C) 2004-2007 Red Hat, Inc. All rights reserved. 4b3b94faaSDavid Teigland * 5b3b94faaSDavid Teigland * This copyrighted material is made available to anyone wishing to use, 6b3b94faaSDavid Teigland * modify, copy, or redistribute it subject to the terms and conditions 7e9fc2aa0SSteven Whitehouse * of the GNU General Public License version 2. 8b3b94faaSDavid Teigland */ 9b3b94faaSDavid Teigland 10b3b94faaSDavid Teigland #include <linux/sched.h> 11b3b94faaSDavid Teigland #include <linux/slab.h> 12b3b94faaSDavid Teigland #include <linux/spinlock.h> 13b3b94faaSDavid Teigland #include <linux/completion.h> 14b3b94faaSDavid Teigland #include <linux/buffer_head.h> 155c676f6dSSteven Whitehouse #include <linux/gfs2_ondisk.h> 1671b86f56SSteven Whitehouse #include <linux/crc32.h> 17a25311c8SSteven Whitehouse #include <linux/delay.h> 18ec69b188SSteven Whitehouse #include <linux/kthread.h> 19ec69b188SSteven Whitehouse #include <linux/freezer.h> 20254db57fSSteven Whitehouse #include <linux/bio.h> 21885bcecaSSteven Whitehouse #include <linux/blkdev.h> 224667a0ecSSteven Whitehouse #include <linux/writeback.h> 234a36d08dSBob Peterson #include <linux/list_sort.h> 24b3b94faaSDavid Teigland 25b3b94faaSDavid Teigland #include "gfs2.h" 265c676f6dSSteven Whitehouse #include "incore.h" 27b3b94faaSDavid Teigland #include "bmap.h" 28b3b94faaSDavid Teigland #include "glock.h" 29b3b94faaSDavid Teigland #include "log.h" 30b3b94faaSDavid Teigland #include "lops.h" 31b3b94faaSDavid Teigland #include "meta_io.h" 325c676f6dSSteven Whitehouse #include "util.h" 3371b86f56SSteven Whitehouse #include "dir.h" 3463997775SSteven Whitehouse #include "trace_gfs2.h" 35b3b94faaSDavid Teigland 36b3b94faaSDavid Teigland /** 37b3b94faaSDavid Teigland * gfs2_struct2blk - compute stuff 38b3b94faaSDavid Teigland * @sdp: the filesystem 39b3b94faaSDavid Teigland * @nstruct: the number of structures 40b3b94faaSDavid Teigland * @ssize: the size of the structures 41b3b94faaSDavid Teigland * 42b3b94faaSDavid Teigland * Compute the number of log descriptor blocks needed to hold a certain number 43b3b94faaSDavid Teigland * of structures of a certain size. 44b3b94faaSDavid Teigland * 45b3b94faaSDavid Teigland * Returns: the number of blocks needed (minimum is always 1) 46b3b94faaSDavid Teigland */ 47b3b94faaSDavid Teigland 48b3b94faaSDavid Teigland unsigned int gfs2_struct2blk(struct gfs2_sbd *sdp, unsigned int nstruct, 49b3b94faaSDavid Teigland unsigned int ssize) 50b3b94faaSDavid Teigland { 51b3b94faaSDavid Teigland unsigned int blks; 52b3b94faaSDavid Teigland unsigned int first, second; 53b3b94faaSDavid Teigland 54b3b94faaSDavid Teigland blks = 1; 55faa31ce8SSteven Whitehouse first = (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_log_descriptor)) / ssize; 56b3b94faaSDavid Teigland 57b3b94faaSDavid Teigland if (nstruct > first) { 58568f4c96SSteven Whitehouse second = (sdp->sd_sb.sb_bsize - 59568f4c96SSteven Whitehouse sizeof(struct gfs2_meta_header)) / ssize; 605c676f6dSSteven Whitehouse blks += DIV_ROUND_UP(nstruct - first, second); 61b3b94faaSDavid Teigland } 62b3b94faaSDavid Teigland 63b3b94faaSDavid Teigland return blks; 64b3b94faaSDavid Teigland } 65b3b94faaSDavid Teigland 66ddacfaf7SSteven Whitehouse /** 671e1a3d03SSteven Whitehouse * gfs2_remove_from_ail - Remove an entry from the ail lists, updating counters 681e1a3d03SSteven Whitehouse * @mapping: The associated mapping (maybe NULL) 691e1a3d03SSteven Whitehouse * @bd: The gfs2_bufdata to remove 701e1a3d03SSteven Whitehouse * 71c618e87aSSteven Whitehouse * The ail lock _must_ be held when calling this function 721e1a3d03SSteven Whitehouse * 731e1a3d03SSteven Whitehouse */ 741e1a3d03SSteven Whitehouse 75f91a0d3eSSteven Whitehouse void gfs2_remove_from_ail(struct gfs2_bufdata *bd) 761e1a3d03SSteven Whitehouse { 7716ca9412SBenjamin Marzinski bd->bd_tr = NULL; 781ad38c43SSteven Whitehouse list_del_init(&bd->bd_ail_st_list); 791ad38c43SSteven Whitehouse list_del_init(&bd->bd_ail_gl_list); 801e1a3d03SSteven Whitehouse atomic_dec(&bd->bd_gl->gl_ail_count); 811e1a3d03SSteven Whitehouse brelse(bd->bd_bh); 821e1a3d03SSteven Whitehouse } 831e1a3d03SSteven Whitehouse 841e1a3d03SSteven Whitehouse /** 85ddacfaf7SSteven Whitehouse * gfs2_ail1_start_one - Start I/O on a part of the AIL 86ddacfaf7SSteven Whitehouse * @sdp: the filesystem 874667a0ecSSteven Whitehouse * @wbc: The writeback control structure 884667a0ecSSteven Whitehouse * @ai: The ail structure 89ddacfaf7SSteven Whitehouse * 90ddacfaf7SSteven Whitehouse */ 91ddacfaf7SSteven Whitehouse 924f1de018SSteven Whitehouse static int gfs2_ail1_start_one(struct gfs2_sbd *sdp, 934667a0ecSSteven Whitehouse struct writeback_control *wbc, 9416ca9412SBenjamin Marzinski struct gfs2_trans *tr) 95d6a079e8SDave Chinner __releases(&sdp->sd_ail_lock) 96d6a079e8SDave Chinner __acquires(&sdp->sd_ail_lock) 97ddacfaf7SSteven Whitehouse { 985ac048bbSSteven Whitehouse struct gfs2_glock *gl = NULL; 994667a0ecSSteven Whitehouse struct address_space *mapping; 100ddacfaf7SSteven Whitehouse struct gfs2_bufdata *bd, *s; 101ddacfaf7SSteven Whitehouse struct buffer_head *bh; 102ddacfaf7SSteven Whitehouse 10316ca9412SBenjamin Marzinski list_for_each_entry_safe_reverse(bd, s, &tr->tr_ail1_list, bd_ail_st_list) { 104ddacfaf7SSteven Whitehouse bh = bd->bd_bh; 105ddacfaf7SSteven Whitehouse 10616ca9412SBenjamin Marzinski gfs2_assert(sdp, bd->bd_tr == tr); 107ddacfaf7SSteven Whitehouse 108ddacfaf7SSteven Whitehouse if (!buffer_busy(bh)) { 10916615be1SSteven Whitehouse if (!buffer_uptodate(bh)) 110ddacfaf7SSteven Whitehouse gfs2_io_error_bh(sdp, bh); 11116ca9412SBenjamin Marzinski list_move(&bd->bd_ail_st_list, &tr->tr_ail2_list); 112ddacfaf7SSteven Whitehouse continue; 113ddacfaf7SSteven Whitehouse } 114ddacfaf7SSteven Whitehouse 115ddacfaf7SSteven Whitehouse if (!buffer_dirty(bh)) 116ddacfaf7SSteven Whitehouse continue; 1175ac048bbSSteven Whitehouse if (gl == bd->bd_gl) 1185ac048bbSSteven Whitehouse continue; 1195ac048bbSSteven Whitehouse gl = bd->bd_gl; 12016ca9412SBenjamin Marzinski list_move(&bd->bd_ail_st_list, &tr->tr_ail1_list); 1214667a0ecSSteven Whitehouse mapping = bh->b_page->mapping; 1224f1de018SSteven Whitehouse if (!mapping) 1234f1de018SSteven Whitehouse continue; 124d6a079e8SDave Chinner spin_unlock(&sdp->sd_ail_lock); 1254667a0ecSSteven Whitehouse generic_writepages(mapping, wbc); 126d6a079e8SDave Chinner spin_lock(&sdp->sd_ail_lock); 1274667a0ecSSteven Whitehouse if (wbc->nr_to_write <= 0) 128ddacfaf7SSteven Whitehouse break; 1294f1de018SSteven Whitehouse return 1; 130ddacfaf7SSteven Whitehouse } 1314f1de018SSteven Whitehouse 1324f1de018SSteven Whitehouse return 0; 1334667a0ecSSteven Whitehouse } 1344667a0ecSSteven Whitehouse 1354667a0ecSSteven Whitehouse 1364667a0ecSSteven Whitehouse /** 1374667a0ecSSteven Whitehouse * gfs2_ail1_flush - start writeback of some ail1 entries 1384667a0ecSSteven Whitehouse * @sdp: The super block 1394667a0ecSSteven Whitehouse * @wbc: The writeback control structure 1404667a0ecSSteven Whitehouse * 1414667a0ecSSteven Whitehouse * Writes back some ail1 entries, according to the limits in the 1424667a0ecSSteven Whitehouse * writeback control structure 1434667a0ecSSteven Whitehouse */ 1444667a0ecSSteven Whitehouse 1454667a0ecSSteven Whitehouse void gfs2_ail1_flush(struct gfs2_sbd *sdp, struct writeback_control *wbc) 1464667a0ecSSteven Whitehouse { 1474667a0ecSSteven Whitehouse struct list_head *head = &sdp->sd_ail1_list; 14816ca9412SBenjamin Marzinski struct gfs2_trans *tr; 149885bcecaSSteven Whitehouse struct blk_plug plug; 1504667a0ecSSteven Whitehouse 151c83ae9caSSteven Whitehouse trace_gfs2_ail_flush(sdp, wbc, 1); 152885bcecaSSteven Whitehouse blk_start_plug(&plug); 1534667a0ecSSteven Whitehouse spin_lock(&sdp->sd_ail_lock); 1544f1de018SSteven Whitehouse restart: 15516ca9412SBenjamin Marzinski list_for_each_entry_reverse(tr, head, tr_list) { 1564667a0ecSSteven Whitehouse if (wbc->nr_to_write <= 0) 1574667a0ecSSteven Whitehouse break; 15816ca9412SBenjamin Marzinski if (gfs2_ail1_start_one(sdp, wbc, tr)) 1594f1de018SSteven Whitehouse goto restart; 1604667a0ecSSteven Whitehouse } 1614667a0ecSSteven Whitehouse spin_unlock(&sdp->sd_ail_lock); 162885bcecaSSteven Whitehouse blk_finish_plug(&plug); 163c83ae9caSSteven Whitehouse trace_gfs2_ail_flush(sdp, wbc, 0); 1644667a0ecSSteven Whitehouse } 1654667a0ecSSteven Whitehouse 1664667a0ecSSteven Whitehouse /** 1674667a0ecSSteven Whitehouse * gfs2_ail1_start - start writeback of all ail1 entries 1684667a0ecSSteven Whitehouse * @sdp: The superblock 1694667a0ecSSteven Whitehouse */ 1704667a0ecSSteven Whitehouse 1714667a0ecSSteven Whitehouse static void gfs2_ail1_start(struct gfs2_sbd *sdp) 1724667a0ecSSteven Whitehouse { 1734667a0ecSSteven Whitehouse struct writeback_control wbc = { 1744667a0ecSSteven Whitehouse .sync_mode = WB_SYNC_NONE, 1754667a0ecSSteven Whitehouse .nr_to_write = LONG_MAX, 1764667a0ecSSteven Whitehouse .range_start = 0, 1774667a0ecSSteven Whitehouse .range_end = LLONG_MAX, 1784667a0ecSSteven Whitehouse }; 1794667a0ecSSteven Whitehouse 1804667a0ecSSteven Whitehouse return gfs2_ail1_flush(sdp, &wbc); 181ddacfaf7SSteven Whitehouse } 182ddacfaf7SSteven Whitehouse 183ddacfaf7SSteven Whitehouse /** 184ddacfaf7SSteven Whitehouse * gfs2_ail1_empty_one - Check whether or not a trans in the AIL has been synced 185ddacfaf7SSteven Whitehouse * @sdp: the filesystem 186ddacfaf7SSteven Whitehouse * @ai: the AIL entry 187ddacfaf7SSteven Whitehouse * 188ddacfaf7SSteven Whitehouse */ 189ddacfaf7SSteven Whitehouse 19016ca9412SBenjamin Marzinski static void gfs2_ail1_empty_one(struct gfs2_sbd *sdp, struct gfs2_trans *tr) 191ddacfaf7SSteven Whitehouse { 192ddacfaf7SSteven Whitehouse struct gfs2_bufdata *bd, *s; 193ddacfaf7SSteven Whitehouse struct buffer_head *bh; 194ddacfaf7SSteven Whitehouse 19516ca9412SBenjamin Marzinski list_for_each_entry_safe_reverse(bd, s, &tr->tr_ail1_list, 196ddacfaf7SSteven Whitehouse bd_ail_st_list) { 197ddacfaf7SSteven Whitehouse bh = bd->bd_bh; 19816ca9412SBenjamin Marzinski gfs2_assert(sdp, bd->bd_tr == tr); 1994667a0ecSSteven Whitehouse if (buffer_busy(bh)) 200ddacfaf7SSteven Whitehouse continue; 201ddacfaf7SSteven Whitehouse if (!buffer_uptodate(bh)) 202ddacfaf7SSteven Whitehouse gfs2_io_error_bh(sdp, bh); 20316ca9412SBenjamin Marzinski list_move(&bd->bd_ail_st_list, &tr->tr_ail2_list); 204ddacfaf7SSteven Whitehouse } 205ddacfaf7SSteven Whitehouse 206ddacfaf7SSteven Whitehouse } 207ddacfaf7SSteven Whitehouse 2084667a0ecSSteven Whitehouse /** 2094667a0ecSSteven Whitehouse * gfs2_ail1_empty - Try to empty the ail1 lists 2104667a0ecSSteven Whitehouse * @sdp: The superblock 2114667a0ecSSteven Whitehouse * 2124667a0ecSSteven Whitehouse * Tries to empty the ail1 lists, starting with the oldest first 2134667a0ecSSteven Whitehouse */ 214b3b94faaSDavid Teigland 2154667a0ecSSteven Whitehouse static int gfs2_ail1_empty(struct gfs2_sbd *sdp) 216b3b94faaSDavid Teigland { 21716ca9412SBenjamin Marzinski struct gfs2_trans *tr, *s; 2185d054964SBenjamin Marzinski int oldest_tr = 1; 219b3b94faaSDavid Teigland int ret; 220b3b94faaSDavid Teigland 221d6a079e8SDave Chinner spin_lock(&sdp->sd_ail_lock); 22216ca9412SBenjamin Marzinski list_for_each_entry_safe_reverse(tr, s, &sdp->sd_ail1_list, tr_list) { 22316ca9412SBenjamin Marzinski gfs2_ail1_empty_one(sdp, tr); 2245d054964SBenjamin Marzinski if (list_empty(&tr->tr_ail1_list) && oldest_tr) 22516ca9412SBenjamin Marzinski list_move(&tr->tr_list, &sdp->sd_ail2_list); 2264667a0ecSSteven Whitehouse else 2275d054964SBenjamin Marzinski oldest_tr = 0; 228b3b94faaSDavid Teigland } 229b3b94faaSDavid Teigland ret = list_empty(&sdp->sd_ail1_list); 230d6a079e8SDave Chinner spin_unlock(&sdp->sd_ail_lock); 231b3b94faaSDavid Teigland 232b3b94faaSDavid Teigland return ret; 233b3b94faaSDavid Teigland } 234b3b94faaSDavid Teigland 23526b06a69SSteven Whitehouse static void gfs2_ail1_wait(struct gfs2_sbd *sdp) 23626b06a69SSteven Whitehouse { 23716ca9412SBenjamin Marzinski struct gfs2_trans *tr; 23826b06a69SSteven Whitehouse struct gfs2_bufdata *bd; 23926b06a69SSteven Whitehouse struct buffer_head *bh; 24026b06a69SSteven Whitehouse 24126b06a69SSteven Whitehouse spin_lock(&sdp->sd_ail_lock); 24216ca9412SBenjamin Marzinski list_for_each_entry_reverse(tr, &sdp->sd_ail1_list, tr_list) { 24316ca9412SBenjamin Marzinski list_for_each_entry(bd, &tr->tr_ail1_list, bd_ail_st_list) { 24426b06a69SSteven Whitehouse bh = bd->bd_bh; 24526b06a69SSteven Whitehouse if (!buffer_locked(bh)) 24626b06a69SSteven Whitehouse continue; 24726b06a69SSteven Whitehouse get_bh(bh); 24826b06a69SSteven Whitehouse spin_unlock(&sdp->sd_ail_lock); 24926b06a69SSteven Whitehouse wait_on_buffer(bh); 25026b06a69SSteven Whitehouse brelse(bh); 25126b06a69SSteven Whitehouse return; 25226b06a69SSteven Whitehouse } 25326b06a69SSteven Whitehouse } 25426b06a69SSteven Whitehouse spin_unlock(&sdp->sd_ail_lock); 25526b06a69SSteven Whitehouse } 256ddacfaf7SSteven Whitehouse 257ddacfaf7SSteven Whitehouse /** 258ddacfaf7SSteven Whitehouse * gfs2_ail2_empty_one - Check whether or not a trans in the AIL has been synced 259ddacfaf7SSteven Whitehouse * @sdp: the filesystem 260ddacfaf7SSteven Whitehouse * @ai: the AIL entry 261ddacfaf7SSteven Whitehouse * 262ddacfaf7SSteven Whitehouse */ 263ddacfaf7SSteven Whitehouse 26416ca9412SBenjamin Marzinski static void gfs2_ail2_empty_one(struct gfs2_sbd *sdp, struct gfs2_trans *tr) 265ddacfaf7SSteven Whitehouse { 26616ca9412SBenjamin Marzinski struct list_head *head = &tr->tr_ail2_list; 267ddacfaf7SSteven Whitehouse struct gfs2_bufdata *bd; 268ddacfaf7SSteven Whitehouse 269ddacfaf7SSteven Whitehouse while (!list_empty(head)) { 270ddacfaf7SSteven Whitehouse bd = list_entry(head->prev, struct gfs2_bufdata, 271ddacfaf7SSteven Whitehouse bd_ail_st_list); 27216ca9412SBenjamin Marzinski gfs2_assert(sdp, bd->bd_tr == tr); 273f91a0d3eSSteven Whitehouse gfs2_remove_from_ail(bd); 274ddacfaf7SSteven Whitehouse } 275ddacfaf7SSteven Whitehouse } 276ddacfaf7SSteven Whitehouse 277b3b94faaSDavid Teigland static void ail2_empty(struct gfs2_sbd *sdp, unsigned int new_tail) 278b3b94faaSDavid Teigland { 27916ca9412SBenjamin Marzinski struct gfs2_trans *tr, *safe; 280b3b94faaSDavid Teigland unsigned int old_tail = sdp->sd_log_tail; 281b3b94faaSDavid Teigland int wrap = (new_tail < old_tail); 282b3b94faaSDavid Teigland int a, b, rm; 283b3b94faaSDavid Teigland 284d6a079e8SDave Chinner spin_lock(&sdp->sd_ail_lock); 285b3b94faaSDavid Teigland 28616ca9412SBenjamin Marzinski list_for_each_entry_safe(tr, safe, &sdp->sd_ail2_list, tr_list) { 28716ca9412SBenjamin Marzinski a = (old_tail <= tr->tr_first); 28816ca9412SBenjamin Marzinski b = (tr->tr_first < new_tail); 289b3b94faaSDavid Teigland rm = (wrap) ? (a || b) : (a && b); 290b3b94faaSDavid Teigland if (!rm) 291b3b94faaSDavid Teigland continue; 292b3b94faaSDavid Teigland 29316ca9412SBenjamin Marzinski gfs2_ail2_empty_one(sdp, tr); 29416ca9412SBenjamin Marzinski list_del(&tr->tr_list); 29516ca9412SBenjamin Marzinski gfs2_assert_warn(sdp, list_empty(&tr->tr_ail1_list)); 29616ca9412SBenjamin Marzinski gfs2_assert_warn(sdp, list_empty(&tr->tr_ail2_list)); 29716ca9412SBenjamin Marzinski kfree(tr); 298b3b94faaSDavid Teigland } 299b3b94faaSDavid Teigland 300d6a079e8SDave Chinner spin_unlock(&sdp->sd_ail_lock); 301b3b94faaSDavid Teigland } 302b3b94faaSDavid Teigland 303b3b94faaSDavid Teigland /** 30424972557SBenjamin Marzinski * gfs2_log_release - Release a given number of log blocks 30524972557SBenjamin Marzinski * @sdp: The GFS2 superblock 30624972557SBenjamin Marzinski * @blks: The number of blocks 30724972557SBenjamin Marzinski * 30824972557SBenjamin Marzinski */ 30924972557SBenjamin Marzinski 31024972557SBenjamin Marzinski void gfs2_log_release(struct gfs2_sbd *sdp, unsigned int blks) 31124972557SBenjamin Marzinski { 31224972557SBenjamin Marzinski 31324972557SBenjamin Marzinski atomic_add(blks, &sdp->sd_log_blks_free); 31424972557SBenjamin Marzinski trace_gfs2_log_blocks(sdp, blks); 31524972557SBenjamin Marzinski gfs2_assert_withdraw(sdp, atomic_read(&sdp->sd_log_blks_free) <= 31624972557SBenjamin Marzinski sdp->sd_jdesc->jd_blocks); 31724972557SBenjamin Marzinski up_read(&sdp->sd_log_flush_lock); 31824972557SBenjamin Marzinski } 31924972557SBenjamin Marzinski 32024972557SBenjamin Marzinski /** 321b3b94faaSDavid Teigland * gfs2_log_reserve - Make a log reservation 322b3b94faaSDavid Teigland * @sdp: The GFS2 superblock 323b3b94faaSDavid Teigland * @blks: The number of blocks to reserve 324b3b94faaSDavid Teigland * 32589918647SSteven Whitehouse * Note that we never give out the last few blocks of the journal. Thats 3262332c443SRobert Peterson * due to the fact that there is a small number of header blocks 327b004157aSSteven Whitehouse * associated with each log flush. The exact number can't be known until 328b004157aSSteven Whitehouse * flush time, so we ensure that we have just enough free blocks at all 329b004157aSSteven Whitehouse * times to avoid running out during a log flush. 330b004157aSSteven Whitehouse * 3315e687eacSBenjamin Marzinski * We no longer flush the log here, instead we wake up logd to do that 3325e687eacSBenjamin Marzinski * for us. To avoid the thundering herd and to ensure that we deal fairly 3335e687eacSBenjamin Marzinski * with queued waiters, we use an exclusive wait. This means that when we 3345e687eacSBenjamin Marzinski * get woken with enough journal space to get our reservation, we need to 3355e687eacSBenjamin Marzinski * wake the next waiter on the list. 3365e687eacSBenjamin Marzinski * 337b3b94faaSDavid Teigland * Returns: errno 338b3b94faaSDavid Teigland */ 339b3b94faaSDavid Teigland 340b3b94faaSDavid Teigland int gfs2_log_reserve(struct gfs2_sbd *sdp, unsigned int blks) 341b3b94faaSDavid Teigland { 3422e60d768SBenjamin Marzinski int ret = 0; 3435d054964SBenjamin Marzinski unsigned reserved_blks = 7 * (4096 / sdp->sd_vfs->s_blocksize); 3445e687eacSBenjamin Marzinski unsigned wanted = blks + reserved_blks; 3455e687eacSBenjamin Marzinski DEFINE_WAIT(wait); 3465e687eacSBenjamin Marzinski int did_wait = 0; 3475e687eacSBenjamin Marzinski unsigned int free_blocks; 348b3b94faaSDavid Teigland 349b3b94faaSDavid Teigland if (gfs2_assert_warn(sdp, blks) || 350b3b94faaSDavid Teigland gfs2_assert_warn(sdp, blks <= sdp->sd_jdesc->jd_blocks)) 351b3b94faaSDavid Teigland return -EINVAL; 3525e687eacSBenjamin Marzinski retry: 3535e687eacSBenjamin Marzinski free_blocks = atomic_read(&sdp->sd_log_blks_free); 3545e687eacSBenjamin Marzinski if (unlikely(free_blocks <= wanted)) { 3555e687eacSBenjamin Marzinski do { 3565e687eacSBenjamin Marzinski prepare_to_wait_exclusive(&sdp->sd_log_waitq, &wait, 3575e687eacSBenjamin Marzinski TASK_UNINTERRUPTIBLE); 3585e687eacSBenjamin Marzinski wake_up(&sdp->sd_logd_waitq); 3595e687eacSBenjamin Marzinski did_wait = 1; 3605e687eacSBenjamin Marzinski if (atomic_read(&sdp->sd_log_blks_free) <= wanted) 3615e687eacSBenjamin Marzinski io_schedule(); 3625e687eacSBenjamin Marzinski free_blocks = atomic_read(&sdp->sd_log_blks_free); 3635e687eacSBenjamin Marzinski } while(free_blocks <= wanted); 3645e687eacSBenjamin Marzinski finish_wait(&sdp->sd_log_waitq, &wait); 365b3b94faaSDavid Teigland } 3662e60d768SBenjamin Marzinski atomic_inc(&sdp->sd_reserving_log); 3675e687eacSBenjamin Marzinski if (atomic_cmpxchg(&sdp->sd_log_blks_free, free_blocks, 3682e60d768SBenjamin Marzinski free_blocks - blks) != free_blocks) { 3692e60d768SBenjamin Marzinski if (atomic_dec_and_test(&sdp->sd_reserving_log)) 3702e60d768SBenjamin Marzinski wake_up(&sdp->sd_reserving_log_wait); 3715e687eacSBenjamin Marzinski goto retry; 3722e60d768SBenjamin Marzinski } 37363997775SSteven Whitehouse trace_gfs2_log_blocks(sdp, -blks); 3745e687eacSBenjamin Marzinski 3755e687eacSBenjamin Marzinski /* 3765e687eacSBenjamin Marzinski * If we waited, then so might others, wake them up _after_ we get 3775e687eacSBenjamin Marzinski * our share of the log. 3785e687eacSBenjamin Marzinski */ 3795e687eacSBenjamin Marzinski if (unlikely(did_wait)) 3805e687eacSBenjamin Marzinski wake_up(&sdp->sd_log_waitq); 381484adff8SSteven Whitehouse 382484adff8SSteven Whitehouse down_read(&sdp->sd_log_flush_lock); 38324972557SBenjamin Marzinski if (unlikely(!test_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags))) { 38424972557SBenjamin Marzinski gfs2_log_release(sdp, blks); 3852e60d768SBenjamin Marzinski ret = -EROFS; 38624972557SBenjamin Marzinski } 3872e60d768SBenjamin Marzinski if (atomic_dec_and_test(&sdp->sd_reserving_log)) 3882e60d768SBenjamin Marzinski wake_up(&sdp->sd_reserving_log_wait); 3892e60d768SBenjamin Marzinski return ret; 390b3b94faaSDavid Teigland } 391b3b94faaSDavid Teigland 392b3b94faaSDavid Teigland /** 393b3b94faaSDavid Teigland * log_distance - Compute distance between two journal blocks 394b3b94faaSDavid Teigland * @sdp: The GFS2 superblock 395b3b94faaSDavid Teigland * @newer: The most recent journal block of the pair 396b3b94faaSDavid Teigland * @older: The older journal block of the pair 397b3b94faaSDavid Teigland * 398b3b94faaSDavid Teigland * Compute the distance (in the journal direction) between two 399b3b94faaSDavid Teigland * blocks in the journal 400b3b94faaSDavid Teigland * 401b3b94faaSDavid Teigland * Returns: the distance in blocks 402b3b94faaSDavid Teigland */ 403b3b94faaSDavid Teigland 404faa31ce8SSteven Whitehouse static inline unsigned int log_distance(struct gfs2_sbd *sdp, unsigned int newer, 405b3b94faaSDavid Teigland unsigned int older) 406b3b94faaSDavid Teigland { 407b3b94faaSDavid Teigland int dist; 408b3b94faaSDavid Teigland 409b3b94faaSDavid Teigland dist = newer - older; 410b3b94faaSDavid Teigland if (dist < 0) 411b3b94faaSDavid Teigland dist += sdp->sd_jdesc->jd_blocks; 412b3b94faaSDavid Teigland 413b3b94faaSDavid Teigland return dist; 414b3b94faaSDavid Teigland } 415b3b94faaSDavid Teigland 4162332c443SRobert Peterson /** 4172332c443SRobert Peterson * calc_reserved - Calculate the number of blocks to reserve when 4182332c443SRobert Peterson * refunding a transaction's unused buffers. 4192332c443SRobert Peterson * @sdp: The GFS2 superblock 4202332c443SRobert Peterson * 4212332c443SRobert Peterson * This is complex. We need to reserve room for all our currently used 4222332c443SRobert Peterson * metadata buffers (e.g. normal file I/O rewriting file time stamps) and 4232332c443SRobert Peterson * all our journaled data buffers for journaled files (e.g. files in the 4242332c443SRobert Peterson * meta_fs like rindex, or files for which chattr +j was done.) 4252332c443SRobert Peterson * If we don't reserve enough space, gfs2_log_refund and gfs2_log_flush 4262332c443SRobert Peterson * will count it as free space (sd_log_blks_free) and corruption will follow. 4272332c443SRobert Peterson * 4282332c443SRobert Peterson * We can have metadata bufs and jdata bufs in the same journal. So each 4292332c443SRobert Peterson * type gets its own log header, for which we need to reserve a block. 4302332c443SRobert Peterson * In fact, each type has the potential for needing more than one header 4312332c443SRobert Peterson * in cases where we have more buffers than will fit on a journal page. 4322332c443SRobert Peterson * Metadata journal entries take up half the space of journaled buffer entries. 4332332c443SRobert Peterson * Thus, metadata entries have buf_limit (502) and journaled buffers have 4342332c443SRobert Peterson * databuf_limit (251) before they cause a wrap around. 4352332c443SRobert Peterson * 4362332c443SRobert Peterson * Also, we need to reserve blocks for revoke journal entries and one for an 4372332c443SRobert Peterson * overall header for the lot. 4382332c443SRobert Peterson * 4392332c443SRobert Peterson * Returns: the number of blocks reserved 4402332c443SRobert Peterson */ 4412332c443SRobert Peterson static unsigned int calc_reserved(struct gfs2_sbd *sdp) 4422332c443SRobert Peterson { 4432332c443SRobert Peterson unsigned int reserved = 0; 444022ef4feSSteven Whitehouse unsigned int mbuf; 445022ef4feSSteven Whitehouse unsigned int dbuf; 446022ef4feSSteven Whitehouse struct gfs2_trans *tr = sdp->sd_log_tr; 4472332c443SRobert Peterson 448022ef4feSSteven Whitehouse if (tr) { 449022ef4feSSteven Whitehouse mbuf = tr->tr_num_buf_new - tr->tr_num_buf_rm; 450022ef4feSSteven Whitehouse dbuf = tr->tr_num_databuf_new - tr->tr_num_databuf_rm; 451022ef4feSSteven Whitehouse reserved = mbuf + dbuf; 452022ef4feSSteven Whitehouse /* Account for header blocks */ 453022ef4feSSteven Whitehouse reserved += DIV_ROUND_UP(mbuf, buf_limit(sdp)); 454022ef4feSSteven Whitehouse reserved += DIV_ROUND_UP(dbuf, databuf_limit(sdp)); 455022ef4feSSteven Whitehouse } 4562332c443SRobert Peterson 4572e95e3f6SBenjamin Marzinski if (sdp->sd_log_commited_revoke > 0) 458022ef4feSSteven Whitehouse reserved += gfs2_struct2blk(sdp, sdp->sd_log_commited_revoke, 4592332c443SRobert Peterson sizeof(u64)); 4602332c443SRobert Peterson /* One for the overall header */ 4612332c443SRobert Peterson if (reserved) 4622332c443SRobert Peterson reserved++; 4632332c443SRobert Peterson return reserved; 4642332c443SRobert Peterson } 4652332c443SRobert Peterson 466b3b94faaSDavid Teigland static unsigned int current_tail(struct gfs2_sbd *sdp) 467b3b94faaSDavid Teigland { 46816ca9412SBenjamin Marzinski struct gfs2_trans *tr; 469b3b94faaSDavid Teigland unsigned int tail; 470b3b94faaSDavid Teigland 471d6a079e8SDave Chinner spin_lock(&sdp->sd_ail_lock); 472b3b94faaSDavid Teigland 473faa31ce8SSteven Whitehouse if (list_empty(&sdp->sd_ail1_list)) { 474b3b94faaSDavid Teigland tail = sdp->sd_log_head; 475faa31ce8SSteven Whitehouse } else { 47616ca9412SBenjamin Marzinski tr = list_entry(sdp->sd_ail1_list.prev, struct gfs2_trans, 47716ca9412SBenjamin Marzinski tr_list); 47816ca9412SBenjamin Marzinski tail = tr->tr_first; 479b3b94faaSDavid Teigland } 480b3b94faaSDavid Teigland 481d6a079e8SDave Chinner spin_unlock(&sdp->sd_ail_lock); 482b3b94faaSDavid Teigland 483b3b94faaSDavid Teigland return tail; 484b3b94faaSDavid Teigland } 485b3b94faaSDavid Teigland 4862332c443SRobert Peterson static void log_pull_tail(struct gfs2_sbd *sdp, unsigned int new_tail) 487b3b94faaSDavid Teigland { 488b3b94faaSDavid Teigland unsigned int dist = log_distance(sdp, new_tail, sdp->sd_log_tail); 489b3b94faaSDavid Teigland 490b3b94faaSDavid Teigland ail2_empty(sdp, new_tail); 491b3b94faaSDavid Teigland 492fd041f0bSSteven Whitehouse atomic_add(dist, &sdp->sd_log_blks_free); 49363997775SSteven Whitehouse trace_gfs2_log_blocks(sdp, dist); 4945e687eacSBenjamin Marzinski gfs2_assert_withdraw(sdp, atomic_read(&sdp->sd_log_blks_free) <= 4955e687eacSBenjamin Marzinski sdp->sd_jdesc->jd_blocks); 496b3b94faaSDavid Teigland 497b3b94faaSDavid Teigland sdp->sd_log_tail = new_tail; 498b3b94faaSDavid Teigland } 499b3b94faaSDavid Teigland 500b3b94faaSDavid Teigland 50134cc1781SSteven Whitehouse static void log_flush_wait(struct gfs2_sbd *sdp) 502b3b94faaSDavid Teigland { 50316615be1SSteven Whitehouse DEFINE_WAIT(wait); 504b3b94faaSDavid Teigland 50516615be1SSteven Whitehouse if (atomic_read(&sdp->sd_log_in_flight)) { 50616615be1SSteven Whitehouse do { 50716615be1SSteven Whitehouse prepare_to_wait(&sdp->sd_log_flush_wait, &wait, 50816615be1SSteven Whitehouse TASK_UNINTERRUPTIBLE); 50916615be1SSteven Whitehouse if (atomic_read(&sdp->sd_log_in_flight)) 51016615be1SSteven Whitehouse io_schedule(); 51116615be1SSteven Whitehouse } while(atomic_read(&sdp->sd_log_in_flight)); 51216615be1SSteven Whitehouse finish_wait(&sdp->sd_log_flush_wait, &wait); 513b3b94faaSDavid Teigland } 514b3b94faaSDavid Teigland } 515b3b94faaSDavid Teigland 51645138990SSteven Whitehouse static int ip_cmp(void *priv, struct list_head *a, struct list_head *b) 5174a36d08dSBob Peterson { 51845138990SSteven Whitehouse struct gfs2_inode *ipa, *ipb; 5194a36d08dSBob Peterson 52045138990SSteven Whitehouse ipa = list_entry(a, struct gfs2_inode, i_ordered); 52145138990SSteven Whitehouse ipb = list_entry(b, struct gfs2_inode, i_ordered); 5224a36d08dSBob Peterson 52345138990SSteven Whitehouse if (ipa->i_no_addr < ipb->i_no_addr) 5244a36d08dSBob Peterson return -1; 52545138990SSteven Whitehouse if (ipa->i_no_addr > ipb->i_no_addr) 5264a36d08dSBob Peterson return 1; 5274a36d08dSBob Peterson return 0; 5284a36d08dSBob Peterson } 5294a36d08dSBob Peterson 530d7b616e2SSteven Whitehouse static void gfs2_ordered_write(struct gfs2_sbd *sdp) 531d7b616e2SSteven Whitehouse { 53245138990SSteven Whitehouse struct gfs2_inode *ip; 533d7b616e2SSteven Whitehouse LIST_HEAD(written); 534d7b616e2SSteven Whitehouse 53545138990SSteven Whitehouse spin_lock(&sdp->sd_ordered_lock); 53645138990SSteven Whitehouse list_sort(NULL, &sdp->sd_log_le_ordered, &ip_cmp); 537d7b616e2SSteven Whitehouse while (!list_empty(&sdp->sd_log_le_ordered)) { 53845138990SSteven Whitehouse ip = list_entry(sdp->sd_log_le_ordered.next, struct gfs2_inode, i_ordered); 53945138990SSteven Whitehouse list_move(&ip->i_ordered, &written); 54045138990SSteven Whitehouse if (ip->i_inode.i_mapping->nrpages == 0) 541d7b616e2SSteven Whitehouse continue; 54245138990SSteven Whitehouse spin_unlock(&sdp->sd_ordered_lock); 54345138990SSteven Whitehouse filemap_fdatawrite(ip->i_inode.i_mapping); 54445138990SSteven Whitehouse spin_lock(&sdp->sd_ordered_lock); 545d7b616e2SSteven Whitehouse } 546d7b616e2SSteven Whitehouse list_splice(&written, &sdp->sd_log_le_ordered); 54745138990SSteven Whitehouse spin_unlock(&sdp->sd_ordered_lock); 548d7b616e2SSteven Whitehouse } 549d7b616e2SSteven Whitehouse 550d7b616e2SSteven Whitehouse static void gfs2_ordered_wait(struct gfs2_sbd *sdp) 551d7b616e2SSteven Whitehouse { 55245138990SSteven Whitehouse struct gfs2_inode *ip; 553d7b616e2SSteven Whitehouse 55445138990SSteven Whitehouse spin_lock(&sdp->sd_ordered_lock); 555d7b616e2SSteven Whitehouse while (!list_empty(&sdp->sd_log_le_ordered)) { 55645138990SSteven Whitehouse ip = list_entry(sdp->sd_log_le_ordered.next, struct gfs2_inode, i_ordered); 55745138990SSteven Whitehouse list_del(&ip->i_ordered); 55845138990SSteven Whitehouse WARN_ON(!test_and_clear_bit(GIF_ORDERED, &ip->i_flags)); 55945138990SSteven Whitehouse if (ip->i_inode.i_mapping->nrpages == 0) 560d7b616e2SSteven Whitehouse continue; 56145138990SSteven Whitehouse spin_unlock(&sdp->sd_ordered_lock); 56245138990SSteven Whitehouse filemap_fdatawait(ip->i_inode.i_mapping); 56345138990SSteven Whitehouse spin_lock(&sdp->sd_ordered_lock); 564d7b616e2SSteven Whitehouse } 56545138990SSteven Whitehouse spin_unlock(&sdp->sd_ordered_lock); 566d7b616e2SSteven Whitehouse } 56745138990SSteven Whitehouse 56845138990SSteven Whitehouse void gfs2_ordered_del_inode(struct gfs2_inode *ip) 56945138990SSteven Whitehouse { 57045138990SSteven Whitehouse struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode); 57145138990SSteven Whitehouse 57245138990SSteven Whitehouse spin_lock(&sdp->sd_ordered_lock); 57345138990SSteven Whitehouse if (test_and_clear_bit(GIF_ORDERED, &ip->i_flags)) 57445138990SSteven Whitehouse list_del(&ip->i_ordered); 57545138990SSteven Whitehouse spin_unlock(&sdp->sd_ordered_lock); 576d7b616e2SSteven Whitehouse } 577d7b616e2SSteven Whitehouse 5785d054964SBenjamin Marzinski void gfs2_add_revoke(struct gfs2_sbd *sdp, struct gfs2_bufdata *bd) 5795d054964SBenjamin Marzinski { 5805d054964SBenjamin Marzinski struct buffer_head *bh = bd->bd_bh; 5815d054964SBenjamin Marzinski struct gfs2_glock *gl = bd->bd_gl; 5825d054964SBenjamin Marzinski 5835d054964SBenjamin Marzinski bh->b_private = NULL; 5845d054964SBenjamin Marzinski bd->bd_blkno = bh->b_blocknr; 5859290a9a7SBob Peterson gfs2_remove_from_ail(bd); /* drops ref on bh */ 5869290a9a7SBob Peterson bd->bd_bh = NULL; 5875d054964SBenjamin Marzinski bd->bd_ops = &gfs2_revoke_lops; 5885d054964SBenjamin Marzinski sdp->sd_log_num_revoke++; 5895d054964SBenjamin Marzinski atomic_inc(&gl->gl_revokes); 5905d054964SBenjamin Marzinski set_bit(GLF_LFLUSH, &gl->gl_flags); 5915d054964SBenjamin Marzinski list_add(&bd->bd_list, &sdp->sd_log_le_revoke); 5925d054964SBenjamin Marzinski } 5935d054964SBenjamin Marzinski 5945d054964SBenjamin Marzinski void gfs2_write_revokes(struct gfs2_sbd *sdp) 5955d054964SBenjamin Marzinski { 5965d054964SBenjamin Marzinski struct gfs2_trans *tr; 5975d054964SBenjamin Marzinski struct gfs2_bufdata *bd, *tmp; 5985d054964SBenjamin Marzinski int have_revokes = 0; 5995d054964SBenjamin Marzinski int max_revokes = (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_log_descriptor)) / sizeof(u64); 6005d054964SBenjamin Marzinski 6015d054964SBenjamin Marzinski gfs2_ail1_empty(sdp); 6025d054964SBenjamin Marzinski spin_lock(&sdp->sd_ail_lock); 6035d054964SBenjamin Marzinski list_for_each_entry(tr, &sdp->sd_ail1_list, tr_list) { 6045d054964SBenjamin Marzinski list_for_each_entry(bd, &tr->tr_ail2_list, bd_ail_st_list) { 6055d054964SBenjamin Marzinski if (list_empty(&bd->bd_list)) { 6065d054964SBenjamin Marzinski have_revokes = 1; 6075d054964SBenjamin Marzinski goto done; 6085d054964SBenjamin Marzinski } 6095d054964SBenjamin Marzinski } 6105d054964SBenjamin Marzinski } 6115d054964SBenjamin Marzinski done: 6125d054964SBenjamin Marzinski spin_unlock(&sdp->sd_ail_lock); 6135d054964SBenjamin Marzinski if (have_revokes == 0) 6145d054964SBenjamin Marzinski return; 6155d054964SBenjamin Marzinski while (sdp->sd_log_num_revoke > max_revokes) 6165d054964SBenjamin Marzinski max_revokes += (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_meta_header)) / sizeof(u64); 6175d054964SBenjamin Marzinski max_revokes -= sdp->sd_log_num_revoke; 6185d054964SBenjamin Marzinski if (!sdp->sd_log_num_revoke) { 6195d054964SBenjamin Marzinski atomic_dec(&sdp->sd_log_blks_free); 6205d054964SBenjamin Marzinski /* If no blocks have been reserved, we need to also 6215d054964SBenjamin Marzinski * reserve a block for the header */ 6225d054964SBenjamin Marzinski if (!sdp->sd_log_blks_reserved) 6235d054964SBenjamin Marzinski atomic_dec(&sdp->sd_log_blks_free); 6245d054964SBenjamin Marzinski } 6255d054964SBenjamin Marzinski gfs2_log_lock(sdp); 6265d054964SBenjamin Marzinski spin_lock(&sdp->sd_ail_lock); 6275d054964SBenjamin Marzinski list_for_each_entry(tr, &sdp->sd_ail1_list, tr_list) { 6285d054964SBenjamin Marzinski list_for_each_entry_safe(bd, tmp, &tr->tr_ail2_list, bd_ail_st_list) { 6295d054964SBenjamin Marzinski if (max_revokes == 0) 6305d054964SBenjamin Marzinski goto out_of_blocks; 6315d054964SBenjamin Marzinski if (!list_empty(&bd->bd_list)) 6325d054964SBenjamin Marzinski continue; 6335d054964SBenjamin Marzinski gfs2_add_revoke(sdp, bd); 6345d054964SBenjamin Marzinski max_revokes--; 6355d054964SBenjamin Marzinski } 6365d054964SBenjamin Marzinski } 6375d054964SBenjamin Marzinski out_of_blocks: 6385d054964SBenjamin Marzinski spin_unlock(&sdp->sd_ail_lock); 6395d054964SBenjamin Marzinski gfs2_log_unlock(sdp); 6405d054964SBenjamin Marzinski 6415d054964SBenjamin Marzinski if (!sdp->sd_log_num_revoke) { 6425d054964SBenjamin Marzinski atomic_inc(&sdp->sd_log_blks_free); 6435d054964SBenjamin Marzinski if (!sdp->sd_log_blks_reserved) 6445d054964SBenjamin Marzinski atomic_inc(&sdp->sd_log_blks_free); 6455d054964SBenjamin Marzinski } 6465d054964SBenjamin Marzinski } 6475d054964SBenjamin Marzinski 648b3b94faaSDavid Teigland /** 64934cc1781SSteven Whitehouse * log_write_header - Get and initialize a journal header buffer 65034cc1781SSteven Whitehouse * @sdp: The GFS2 superblock 65134cc1781SSteven Whitehouse * 65234cc1781SSteven Whitehouse * Returns: the initialized log buffer descriptor 65334cc1781SSteven Whitehouse */ 65434cc1781SSteven Whitehouse 655fdb76a42SSteven Whitehouse static void log_write_header(struct gfs2_sbd *sdp, u32 flags) 65634cc1781SSteven Whitehouse { 65734cc1781SSteven Whitehouse struct gfs2_log_header *lh; 65834cc1781SSteven Whitehouse unsigned int tail; 65934cc1781SSteven Whitehouse u32 hash; 660*70fd7614SChristoph Hellwig int op_flags = REQ_PREFLUSH | REQ_FUA | REQ_META; 661e8c92ed7SSteven Whitehouse struct page *page = mempool_alloc(gfs2_page_pool, GFP_NOIO); 6622e60d768SBenjamin Marzinski enum gfs2_freeze_state state = atomic_read(&sdp->sd_freeze_state); 663e8c92ed7SSteven Whitehouse lh = page_address(page); 664e8c92ed7SSteven Whitehouse clear_page(lh); 66534cc1781SSteven Whitehouse 6662e60d768SBenjamin Marzinski gfs2_assert_withdraw(sdp, (state != SFS_FROZEN)); 6672e60d768SBenjamin Marzinski 66834cc1781SSteven Whitehouse tail = current_tail(sdp); 66934cc1781SSteven Whitehouse 67034cc1781SSteven Whitehouse lh->lh_header.mh_magic = cpu_to_be32(GFS2_MAGIC); 67134cc1781SSteven Whitehouse lh->lh_header.mh_type = cpu_to_be32(GFS2_METATYPE_LH); 67234cc1781SSteven Whitehouse lh->lh_header.__pad0 = cpu_to_be64(0); 67334cc1781SSteven Whitehouse lh->lh_header.mh_format = cpu_to_be32(GFS2_FORMAT_LH); 67434cc1781SSteven Whitehouse lh->lh_header.mh_jid = cpu_to_be32(sdp->sd_jdesc->jd_jid); 67534cc1781SSteven Whitehouse lh->lh_sequence = cpu_to_be64(sdp->sd_log_sequence++); 67634cc1781SSteven Whitehouse lh->lh_flags = cpu_to_be32(flags); 67734cc1781SSteven Whitehouse lh->lh_tail = cpu_to_be32(tail); 67834cc1781SSteven Whitehouse lh->lh_blkno = cpu_to_be32(sdp->sd_log_flush_head); 679e8c92ed7SSteven Whitehouse hash = gfs2_disk_hash(page_address(page), sizeof(struct gfs2_log_header)); 68034cc1781SSteven Whitehouse lh->lh_hash = cpu_to_be32(hash); 68134cc1781SSteven Whitehouse 68234cc1781SSteven Whitehouse if (test_bit(SDF_NOBARRIERS, &sdp->sd_flags)) { 68334cc1781SSteven Whitehouse gfs2_ordered_wait(sdp); 68434cc1781SSteven Whitehouse log_flush_wait(sdp); 685*70fd7614SChristoph Hellwig op_flags = REQ_SYNC | REQ_META | REQ_PRIO; 68634cc1781SSteven Whitehouse } 68734cc1781SSteven Whitehouse 688e8c92ed7SSteven Whitehouse sdp->sd_log_idle = (tail == sdp->sd_log_flush_head); 689e8c92ed7SSteven Whitehouse gfs2_log_write_page(sdp, page); 690e1b1afa6SMike Christie gfs2_log_flush_bio(sdp, REQ_OP_WRITE, op_flags); 691e8c92ed7SSteven Whitehouse log_flush_wait(sdp); 69234cc1781SSteven Whitehouse 69334cc1781SSteven Whitehouse if (sdp->sd_log_tail != tail) 69434cc1781SSteven Whitehouse log_pull_tail(sdp, tail); 69534cc1781SSteven Whitehouse } 69634cc1781SSteven Whitehouse 69734cc1781SSteven Whitehouse /** 698b09e593dSSteven Whitehouse * gfs2_log_flush - flush incore transaction(s) 699b3b94faaSDavid Teigland * @sdp: the filesystem 700b3b94faaSDavid Teigland * @gl: The glock structure to flush. If NULL, flush the whole incore log 701b3b94faaSDavid Teigland * 702b3b94faaSDavid Teigland */ 703b3b94faaSDavid Teigland 70424972557SBenjamin Marzinski void gfs2_log_flush(struct gfs2_sbd *sdp, struct gfs2_glock *gl, 70524972557SBenjamin Marzinski enum gfs2_flush_type type) 706b3b94faaSDavid Teigland { 70716ca9412SBenjamin Marzinski struct gfs2_trans *tr; 7082e60d768SBenjamin Marzinski enum gfs2_freeze_state state = atomic_read(&sdp->sd_freeze_state); 709b3b94faaSDavid Teigland 710484adff8SSteven Whitehouse down_write(&sdp->sd_log_flush_lock); 711f55ab26aSSteven Whitehouse 7122bcd610dSSteven Whitehouse /* Log might have been flushed while we waited for the flush lock */ 7132bcd610dSSteven Whitehouse if (gl && !test_bit(GLF_LFLUSH, &gl->gl_flags)) { 714484adff8SSteven Whitehouse up_write(&sdp->sd_log_flush_lock); 715f55ab26aSSteven Whitehouse return; 716f55ab26aSSteven Whitehouse } 71763997775SSteven Whitehouse trace_gfs2_log_flush(sdp, 1); 718f55ab26aSSteven Whitehouse 719400ac52eSBenjamin Marzinski if (type == SHUTDOWN_FLUSH) 720400ac52eSBenjamin Marzinski clear_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags); 721400ac52eSBenjamin Marzinski 722b1ab1e44SSteven Whitehouse sdp->sd_log_flush_head = sdp->sd_log_head; 723b1ab1e44SSteven Whitehouse sdp->sd_log_flush_wrapped = 0; 72416ca9412SBenjamin Marzinski tr = sdp->sd_log_tr; 72516ca9412SBenjamin Marzinski if (tr) { 72616ca9412SBenjamin Marzinski sdp->sd_log_tr = NULL; 72716ca9412SBenjamin Marzinski INIT_LIST_HEAD(&tr->tr_ail1_list); 72816ca9412SBenjamin Marzinski INIT_LIST_HEAD(&tr->tr_ail2_list); 729b1ab1e44SSteven Whitehouse tr->tr_first = sdp->sd_log_flush_head; 7302e60d768SBenjamin Marzinski if (unlikely (state == SFS_FROZEN)) 7312e60d768SBenjamin Marzinski gfs2_assert_withdraw(sdp, !tr->tr_num_buf_new && !tr->tr_num_databuf_new); 73216ca9412SBenjamin Marzinski } 733b3b94faaSDavid Teigland 7342e60d768SBenjamin Marzinski if (unlikely(state == SFS_FROZEN)) 7352e60d768SBenjamin Marzinski gfs2_assert_withdraw(sdp, !sdp->sd_log_num_revoke); 736b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, 737b3b94faaSDavid Teigland sdp->sd_log_num_revoke == sdp->sd_log_commited_revoke); 738b3b94faaSDavid Teigland 739d7b616e2SSteven Whitehouse gfs2_ordered_write(sdp); 740d69a3c65SSteven Whitehouse lops_before_commit(sdp, tr); 741e1b1afa6SMike Christie gfs2_log_flush_bio(sdp, REQ_OP_WRITE, 0); 742d7b616e2SSteven Whitehouse 74334cc1781SSteven Whitehouse if (sdp->sd_log_head != sdp->sd_log_flush_head) { 744428fd95dSBob Peterson log_flush_wait(sdp); 745fdb76a42SSteven Whitehouse log_write_header(sdp, 0); 74634cc1781SSteven Whitehouse } else if (sdp->sd_log_tail != current_tail(sdp) && !sdp->sd_log_idle){ 747fd041f0bSSteven Whitehouse atomic_dec(&sdp->sd_log_blks_free); /* Adjust for unreserved buffer */ 74863997775SSteven Whitehouse trace_gfs2_log_blocks(sdp, -1); 749fdb76a42SSteven Whitehouse log_write_header(sdp, 0); 7502332c443SRobert Peterson } 75116ca9412SBenjamin Marzinski lops_after_commit(sdp, tr); 752fe1a698fSSteven Whitehouse 753fe1a698fSSteven Whitehouse gfs2_log_lock(sdp); 754b3b94faaSDavid Teigland sdp->sd_log_head = sdp->sd_log_flush_head; 755faa31ce8SSteven Whitehouse sdp->sd_log_blks_reserved = 0; 756b3b94faaSDavid Teigland sdp->sd_log_commited_revoke = 0; 757b3b94faaSDavid Teigland 758d6a079e8SDave Chinner spin_lock(&sdp->sd_ail_lock); 75916ca9412SBenjamin Marzinski if (tr && !list_empty(&tr->tr_ail1_list)) { 76016ca9412SBenjamin Marzinski list_add(&tr->tr_list, &sdp->sd_ail1_list); 76116ca9412SBenjamin Marzinski tr = NULL; 762b3b94faaSDavid Teigland } 763d6a079e8SDave Chinner spin_unlock(&sdp->sd_ail_lock); 764b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 76524972557SBenjamin Marzinski 76624972557SBenjamin Marzinski if (type != NORMAL_FLUSH) { 76724972557SBenjamin Marzinski if (!sdp->sd_log_idle) { 76824972557SBenjamin Marzinski for (;;) { 76924972557SBenjamin Marzinski gfs2_ail1_start(sdp); 77024972557SBenjamin Marzinski gfs2_ail1_wait(sdp); 77124972557SBenjamin Marzinski if (gfs2_ail1_empty(sdp)) 77224972557SBenjamin Marzinski break; 77324972557SBenjamin Marzinski } 77424972557SBenjamin Marzinski atomic_dec(&sdp->sd_log_blks_free); /* Adjust for unreserved buffer */ 77524972557SBenjamin Marzinski trace_gfs2_log_blocks(sdp, -1); 77624972557SBenjamin Marzinski sdp->sd_log_flush_wrapped = 0; 77724972557SBenjamin Marzinski log_write_header(sdp, 0); 77824972557SBenjamin Marzinski sdp->sd_log_head = sdp->sd_log_flush_head; 77924972557SBenjamin Marzinski } 78024972557SBenjamin Marzinski if (type == SHUTDOWN_FLUSH || type == FREEZE_FLUSH) 78124972557SBenjamin Marzinski gfs2_log_shutdown(sdp); 7822e60d768SBenjamin Marzinski if (type == FREEZE_FLUSH) 7832e60d768SBenjamin Marzinski atomic_set(&sdp->sd_freeze_state, SFS_FROZEN); 78424972557SBenjamin Marzinski } 78524972557SBenjamin Marzinski 78663997775SSteven Whitehouse trace_gfs2_log_flush(sdp, 0); 787484adff8SSteven Whitehouse up_write(&sdp->sd_log_flush_lock); 788b3b94faaSDavid Teigland 78916ca9412SBenjamin Marzinski kfree(tr); 790b3b94faaSDavid Teigland } 791b3b94faaSDavid Teigland 792d69a3c65SSteven Whitehouse /** 793d69a3c65SSteven Whitehouse * gfs2_merge_trans - Merge a new transaction into a cached transaction 794d69a3c65SSteven Whitehouse * @old: Original transaction to be expanded 795d69a3c65SSteven Whitehouse * @new: New transaction to be merged 796d69a3c65SSteven Whitehouse */ 797d69a3c65SSteven Whitehouse 798d69a3c65SSteven Whitehouse static void gfs2_merge_trans(struct gfs2_trans *old, struct gfs2_trans *new) 799d69a3c65SSteven Whitehouse { 800d69a3c65SSteven Whitehouse WARN_ON_ONCE(old->tr_attached != 1); 801d69a3c65SSteven Whitehouse 802d69a3c65SSteven Whitehouse old->tr_num_buf_new += new->tr_num_buf_new; 803d69a3c65SSteven Whitehouse old->tr_num_databuf_new += new->tr_num_databuf_new; 804d69a3c65SSteven Whitehouse old->tr_num_buf_rm += new->tr_num_buf_rm; 805d69a3c65SSteven Whitehouse old->tr_num_databuf_rm += new->tr_num_databuf_rm; 806d69a3c65SSteven Whitehouse old->tr_num_revoke += new->tr_num_revoke; 807d69a3c65SSteven Whitehouse old->tr_num_revoke_rm += new->tr_num_revoke_rm; 808d69a3c65SSteven Whitehouse 809d69a3c65SSteven Whitehouse list_splice_tail_init(&new->tr_databuf, &old->tr_databuf); 810d69a3c65SSteven Whitehouse list_splice_tail_init(&new->tr_buf, &old->tr_buf); 811d69a3c65SSteven Whitehouse } 812d69a3c65SSteven Whitehouse 813b3b94faaSDavid Teigland static void log_refund(struct gfs2_sbd *sdp, struct gfs2_trans *tr) 814b3b94faaSDavid Teigland { 8152332c443SRobert Peterson unsigned int reserved; 816ac39aaddSSteven Whitehouse unsigned int unused; 817022ef4feSSteven Whitehouse unsigned int maxres; 818b3b94faaSDavid Teigland 819b3b94faaSDavid Teigland gfs2_log_lock(sdp); 820b3b94faaSDavid Teigland 821d69a3c65SSteven Whitehouse if (sdp->sd_log_tr) { 822d69a3c65SSteven Whitehouse gfs2_merge_trans(sdp->sd_log_tr, tr); 823d69a3c65SSteven Whitehouse } else if (tr->tr_num_buf_new || tr->tr_num_databuf_new) { 82424972557SBenjamin Marzinski gfs2_assert_withdraw(sdp, tr->tr_alloced); 82516ca9412SBenjamin Marzinski sdp->sd_log_tr = tr; 82616ca9412SBenjamin Marzinski tr->tr_attached = 1; 82716ca9412SBenjamin Marzinski } 828022ef4feSSteven Whitehouse 829022ef4feSSteven Whitehouse sdp->sd_log_commited_revoke += tr->tr_num_revoke - tr->tr_num_revoke_rm; 830022ef4feSSteven Whitehouse reserved = calc_reserved(sdp); 831022ef4feSSteven Whitehouse maxres = sdp->sd_log_blks_reserved + tr->tr_reserved; 832022ef4feSSteven Whitehouse gfs2_assert_withdraw(sdp, maxres >= reserved); 833022ef4feSSteven Whitehouse unused = maxres - reserved; 834022ef4feSSteven Whitehouse atomic_add(unused, &sdp->sd_log_blks_free); 835022ef4feSSteven Whitehouse trace_gfs2_log_blocks(sdp, unused); 836022ef4feSSteven Whitehouse gfs2_assert_withdraw(sdp, atomic_read(&sdp->sd_log_blks_free) <= 837022ef4feSSteven Whitehouse sdp->sd_jdesc->jd_blocks); 838022ef4feSSteven Whitehouse sdp->sd_log_blks_reserved = reserved; 839022ef4feSSteven Whitehouse 840b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 841b3b94faaSDavid Teigland } 842b3b94faaSDavid Teigland 843b3b94faaSDavid Teigland /** 844b3b94faaSDavid Teigland * gfs2_log_commit - Commit a transaction to the log 845b3b94faaSDavid Teigland * @sdp: the filesystem 846b3b94faaSDavid Teigland * @tr: the transaction 847b3b94faaSDavid Teigland * 8485e687eacSBenjamin Marzinski * We wake up gfs2_logd if the number of pinned blocks exceed thresh1 8495e687eacSBenjamin Marzinski * or the total number of used blocks (pinned blocks plus AIL blocks) 8505e687eacSBenjamin Marzinski * is greater than thresh2. 8515e687eacSBenjamin Marzinski * 8525e687eacSBenjamin Marzinski * At mount time thresh1 is 1/3rd of journal size, thresh2 is 2/3rd of 8535e687eacSBenjamin Marzinski * journal size. 8545e687eacSBenjamin Marzinski * 855b3b94faaSDavid Teigland * Returns: errno 856b3b94faaSDavid Teigland */ 857b3b94faaSDavid Teigland 858b3b94faaSDavid Teigland void gfs2_log_commit(struct gfs2_sbd *sdp, struct gfs2_trans *tr) 859b3b94faaSDavid Teigland { 860b3b94faaSDavid Teigland log_refund(sdp, tr); 861b3b94faaSDavid Teigland 8625e687eacSBenjamin Marzinski if (atomic_read(&sdp->sd_log_pinned) > atomic_read(&sdp->sd_log_thresh1) || 8635e687eacSBenjamin Marzinski ((sdp->sd_jdesc->jd_blocks - atomic_read(&sdp->sd_log_blks_free)) > 8645e687eacSBenjamin Marzinski atomic_read(&sdp->sd_log_thresh2))) 8655e687eacSBenjamin Marzinski wake_up(&sdp->sd_logd_waitq); 866faa31ce8SSteven Whitehouse } 867b3b94faaSDavid Teigland 868b3b94faaSDavid Teigland /** 869b3b94faaSDavid Teigland * gfs2_log_shutdown - write a shutdown header into a journal 870b3b94faaSDavid Teigland * @sdp: the filesystem 871b3b94faaSDavid Teigland * 872b3b94faaSDavid Teigland */ 873b3b94faaSDavid Teigland 874b3b94faaSDavid Teigland void gfs2_log_shutdown(struct gfs2_sbd *sdp) 875b3b94faaSDavid Teigland { 876b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, !sdp->sd_log_blks_reserved); 877b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, !sdp->sd_log_num_revoke); 878b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, list_empty(&sdp->sd_ail1_list)); 879b3b94faaSDavid Teigland 880b3b94faaSDavid Teigland sdp->sd_log_flush_head = sdp->sd_log_head; 881b3b94faaSDavid Teigland sdp->sd_log_flush_wrapped = 0; 882b3b94faaSDavid Teigland 883fdb76a42SSteven Whitehouse log_write_header(sdp, GFS2_LOG_HEAD_UNMOUNT); 884b3b94faaSDavid Teigland 885a74604beSSteven Whitehouse gfs2_assert_warn(sdp, sdp->sd_log_head == sdp->sd_log_tail); 886a74604beSSteven Whitehouse gfs2_assert_warn(sdp, list_empty(&sdp->sd_ail2_list)); 887b3b94faaSDavid Teigland 888b3b94faaSDavid Teigland sdp->sd_log_head = sdp->sd_log_flush_head; 889b3b94faaSDavid Teigland sdp->sd_log_tail = sdp->sd_log_head; 890a25311c8SSteven Whitehouse } 891a25311c8SSteven Whitehouse 8925e687eacSBenjamin Marzinski static inline int gfs2_jrnl_flush_reqd(struct gfs2_sbd *sdp) 8935e687eacSBenjamin Marzinski { 8942e60d768SBenjamin Marzinski return (atomic_read(&sdp->sd_log_pinned) >= atomic_read(&sdp->sd_log_thresh1)); 8955e687eacSBenjamin Marzinski } 8965e687eacSBenjamin Marzinski 8975e687eacSBenjamin Marzinski static inline int gfs2_ail_flush_reqd(struct gfs2_sbd *sdp) 8985e687eacSBenjamin Marzinski { 8995e687eacSBenjamin Marzinski unsigned int used_blocks = sdp->sd_jdesc->jd_blocks - atomic_read(&sdp->sd_log_blks_free); 9005e687eacSBenjamin Marzinski return used_blocks >= atomic_read(&sdp->sd_log_thresh2); 9015e687eacSBenjamin Marzinski } 902ec69b188SSteven Whitehouse 903ec69b188SSteven Whitehouse /** 904ec69b188SSteven Whitehouse * gfs2_logd - Update log tail as Active Items get flushed to in-place blocks 905ec69b188SSteven Whitehouse * @sdp: Pointer to GFS2 superblock 906ec69b188SSteven Whitehouse * 907ec69b188SSteven Whitehouse * Also, periodically check to make sure that we're using the most recent 908ec69b188SSteven Whitehouse * journal index. 909ec69b188SSteven Whitehouse */ 910ec69b188SSteven Whitehouse 911ec69b188SSteven Whitehouse int gfs2_logd(void *data) 912ec69b188SSteven Whitehouse { 913ec69b188SSteven Whitehouse struct gfs2_sbd *sdp = data; 9145e687eacSBenjamin Marzinski unsigned long t = 1; 9155e687eacSBenjamin Marzinski DEFINE_WAIT(wait); 916ec69b188SSteven Whitehouse 917ec69b188SSteven Whitehouse while (!kthread_should_stop()) { 918ec69b188SSteven Whitehouse 9195e687eacSBenjamin Marzinski if (gfs2_jrnl_flush_reqd(sdp) || t == 0) { 9204667a0ecSSteven Whitehouse gfs2_ail1_empty(sdp); 92124972557SBenjamin Marzinski gfs2_log_flush(sdp, NULL, NORMAL_FLUSH); 922ec69b188SSteven Whitehouse } 923ec69b188SSteven Whitehouse 9245e687eacSBenjamin Marzinski if (gfs2_ail_flush_reqd(sdp)) { 9255e687eacSBenjamin Marzinski gfs2_ail1_start(sdp); 92626b06a69SSteven Whitehouse gfs2_ail1_wait(sdp); 9274667a0ecSSteven Whitehouse gfs2_ail1_empty(sdp); 92824972557SBenjamin Marzinski gfs2_log_flush(sdp, NULL, NORMAL_FLUSH); 9295e687eacSBenjamin Marzinski } 9305e687eacSBenjamin Marzinski 93126b06a69SSteven Whitehouse if (!gfs2_ail_flush_reqd(sdp)) 9325e687eacSBenjamin Marzinski wake_up(&sdp->sd_log_waitq); 93326b06a69SSteven Whitehouse 934ec69b188SSteven Whitehouse t = gfs2_tune_get(sdp, gt_logd_secs) * HZ; 935a0acae0eSTejun Heo 936a0acae0eSTejun Heo try_to_freeze(); 9375e687eacSBenjamin Marzinski 9385e687eacSBenjamin Marzinski do { 9395e687eacSBenjamin Marzinski prepare_to_wait(&sdp->sd_logd_waitq, &wait, 9405f487490SSteven Whitehouse TASK_INTERRUPTIBLE); 9415e687eacSBenjamin Marzinski if (!gfs2_ail_flush_reqd(sdp) && 9425e687eacSBenjamin Marzinski !gfs2_jrnl_flush_reqd(sdp) && 9435e687eacSBenjamin Marzinski !kthread_should_stop()) 9445e687eacSBenjamin Marzinski t = schedule_timeout(t); 9455e687eacSBenjamin Marzinski } while(t && !gfs2_ail_flush_reqd(sdp) && 9465e687eacSBenjamin Marzinski !gfs2_jrnl_flush_reqd(sdp) && 9475e687eacSBenjamin Marzinski !kthread_should_stop()); 9485e687eacSBenjamin Marzinski finish_wait(&sdp->sd_logd_waitq, &wait); 949ec69b188SSteven Whitehouse } 950ec69b188SSteven Whitehouse 951ec69b188SSteven Whitehouse return 0; 952ec69b188SSteven Whitehouse } 953ec69b188SSteven Whitehouse 954