1b3b94faaSDavid Teigland /* 2b3b94faaSDavid Teigland * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved. 3da6dd40dSBob Peterson * Copyright (C) 2004-2007 Red Hat, Inc. All rights reserved. 4b3b94faaSDavid Teigland * 5b3b94faaSDavid Teigland * This copyrighted material is made available to anyone wishing to use, 6b3b94faaSDavid Teigland * modify, copy, or redistribute it subject to the terms and conditions 7e9fc2aa0SSteven Whitehouse * of the GNU General Public License version 2. 8b3b94faaSDavid Teigland */ 9b3b94faaSDavid Teigland 10b3b94faaSDavid Teigland #include <linux/sched.h> 11b3b94faaSDavid Teigland #include <linux/slab.h> 12b3b94faaSDavid Teigland #include <linux/spinlock.h> 13b3b94faaSDavid Teigland #include <linux/completion.h> 14b3b94faaSDavid Teigland #include <linux/buffer_head.h> 155c676f6dSSteven Whitehouse #include <linux/gfs2_ondisk.h> 1671b86f56SSteven Whitehouse #include <linux/crc32.h> 17a25311c8SSteven Whitehouse #include <linux/delay.h> 18ec69b188SSteven Whitehouse #include <linux/kthread.h> 19ec69b188SSteven Whitehouse #include <linux/freezer.h> 20254db57fSSteven Whitehouse #include <linux/bio.h> 21b3b94faaSDavid Teigland 22b3b94faaSDavid Teigland #include "gfs2.h" 235c676f6dSSteven Whitehouse #include "incore.h" 24b3b94faaSDavid Teigland #include "bmap.h" 25b3b94faaSDavid Teigland #include "glock.h" 26b3b94faaSDavid Teigland #include "log.h" 27b3b94faaSDavid Teigland #include "lops.h" 28b3b94faaSDavid Teigland #include "meta_io.h" 295c676f6dSSteven Whitehouse #include "util.h" 3071b86f56SSteven Whitehouse #include "dir.h" 3163997775SSteven Whitehouse #include "trace_gfs2.h" 32b3b94faaSDavid Teigland 33b3b94faaSDavid Teigland #define PULL 1 34b3b94faaSDavid Teigland 35b3b94faaSDavid Teigland /** 36b3b94faaSDavid Teigland * gfs2_struct2blk - compute stuff 37b3b94faaSDavid Teigland * @sdp: the filesystem 38b3b94faaSDavid Teigland * @nstruct: the number of structures 39b3b94faaSDavid Teigland * @ssize: the size of the structures 40b3b94faaSDavid Teigland * 41b3b94faaSDavid Teigland * Compute the number of log descriptor blocks needed to hold a certain number 42b3b94faaSDavid Teigland * of structures of a certain size. 43b3b94faaSDavid Teigland * 44b3b94faaSDavid Teigland * Returns: the number of blocks needed (minimum is always 1) 45b3b94faaSDavid Teigland */ 46b3b94faaSDavid Teigland 47b3b94faaSDavid Teigland unsigned int gfs2_struct2blk(struct gfs2_sbd *sdp, unsigned int nstruct, 48b3b94faaSDavid Teigland unsigned int ssize) 49b3b94faaSDavid Teigland { 50b3b94faaSDavid Teigland unsigned int blks; 51b3b94faaSDavid Teigland unsigned int first, second; 52b3b94faaSDavid Teigland 53b3b94faaSDavid Teigland blks = 1; 54faa31ce8SSteven Whitehouse first = (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_log_descriptor)) / ssize; 55b3b94faaSDavid Teigland 56b3b94faaSDavid Teigland if (nstruct > first) { 57568f4c96SSteven Whitehouse second = (sdp->sd_sb.sb_bsize - 58568f4c96SSteven Whitehouse sizeof(struct gfs2_meta_header)) / ssize; 595c676f6dSSteven Whitehouse blks += DIV_ROUND_UP(nstruct - first, second); 60b3b94faaSDavid Teigland } 61b3b94faaSDavid Teigland 62b3b94faaSDavid Teigland return blks; 63b3b94faaSDavid Teigland } 64b3b94faaSDavid Teigland 65ddacfaf7SSteven Whitehouse /** 661e1a3d03SSteven Whitehouse * gfs2_remove_from_ail - Remove an entry from the ail lists, updating counters 671e1a3d03SSteven Whitehouse * @mapping: The associated mapping (maybe NULL) 681e1a3d03SSteven Whitehouse * @bd: The gfs2_bufdata to remove 691e1a3d03SSteven Whitehouse * 701e1a3d03SSteven Whitehouse * The log lock _must_ be held when calling this function 711e1a3d03SSteven Whitehouse * 721e1a3d03SSteven Whitehouse */ 731e1a3d03SSteven Whitehouse 74f91a0d3eSSteven Whitehouse void gfs2_remove_from_ail(struct gfs2_bufdata *bd) 751e1a3d03SSteven Whitehouse { 761e1a3d03SSteven Whitehouse bd->bd_ail = NULL; 771ad38c43SSteven Whitehouse list_del_init(&bd->bd_ail_st_list); 781ad38c43SSteven Whitehouse list_del_init(&bd->bd_ail_gl_list); 791e1a3d03SSteven Whitehouse atomic_dec(&bd->bd_gl->gl_ail_count); 801e1a3d03SSteven Whitehouse brelse(bd->bd_bh); 811e1a3d03SSteven Whitehouse } 821e1a3d03SSteven Whitehouse 831e1a3d03SSteven Whitehouse /** 84ddacfaf7SSteven Whitehouse * gfs2_ail1_start_one - Start I/O on a part of the AIL 85ddacfaf7SSteven Whitehouse * @sdp: the filesystem 86ddacfaf7SSteven Whitehouse * @tr: the part of the AIL 87ddacfaf7SSteven Whitehouse * 88ddacfaf7SSteven Whitehouse */ 89ddacfaf7SSteven Whitehouse 90ddacfaf7SSteven Whitehouse static void gfs2_ail1_start_one(struct gfs2_sbd *sdp, struct gfs2_ail *ai) 912d81afb8SHarvey Harrison __releases(&sdp->sd_log_lock) 922d81afb8SHarvey Harrison __acquires(&sdp->sd_log_lock) 93ddacfaf7SSteven Whitehouse { 94ddacfaf7SSteven Whitehouse struct gfs2_bufdata *bd, *s; 95ddacfaf7SSteven Whitehouse struct buffer_head *bh; 96ddacfaf7SSteven Whitehouse int retry; 97ddacfaf7SSteven Whitehouse 98ddacfaf7SSteven Whitehouse do { 99ddacfaf7SSteven Whitehouse retry = 0; 100ddacfaf7SSteven Whitehouse 101ddacfaf7SSteven Whitehouse list_for_each_entry_safe_reverse(bd, s, &ai->ai_ail1_list, 102ddacfaf7SSteven Whitehouse bd_ail_st_list) { 103ddacfaf7SSteven Whitehouse bh = bd->bd_bh; 104ddacfaf7SSteven Whitehouse 105ddacfaf7SSteven Whitehouse gfs2_assert(sdp, bd->bd_ail == ai); 106ddacfaf7SSteven Whitehouse 107ddacfaf7SSteven Whitehouse if (!buffer_busy(bh)) { 10816615be1SSteven Whitehouse if (!buffer_uptodate(bh)) 109ddacfaf7SSteven Whitehouse gfs2_io_error_bh(sdp, bh); 110ddacfaf7SSteven Whitehouse list_move(&bd->bd_ail_st_list, &ai->ai_ail2_list); 111ddacfaf7SSteven Whitehouse continue; 112ddacfaf7SSteven Whitehouse } 113ddacfaf7SSteven Whitehouse 114ddacfaf7SSteven Whitehouse if (!buffer_dirty(bh)) 115ddacfaf7SSteven Whitehouse continue; 116ddacfaf7SSteven Whitehouse 117ddacfaf7SSteven Whitehouse list_move(&bd->bd_ail_st_list, &ai->ai_ail1_list); 118ddacfaf7SSteven Whitehouse 11916615be1SSteven Whitehouse get_bh(bh); 120ddacfaf7SSteven Whitehouse gfs2_log_unlock(sdp); 12116615be1SSteven Whitehouse lock_buffer(bh); 12216615be1SSteven Whitehouse if (test_clear_buffer_dirty(bh)) { 12316615be1SSteven Whitehouse bh->b_end_io = end_buffer_write_sync; 124c969f58cSSteven Whitehouse submit_bh(WRITE_SYNC_PLUG, bh); 12516615be1SSteven Whitehouse } else { 12616615be1SSteven Whitehouse unlock_buffer(bh); 12716615be1SSteven Whitehouse brelse(bh); 12816615be1SSteven Whitehouse } 129ddacfaf7SSteven Whitehouse gfs2_log_lock(sdp); 130ddacfaf7SSteven Whitehouse 131ddacfaf7SSteven Whitehouse retry = 1; 132ddacfaf7SSteven Whitehouse break; 133ddacfaf7SSteven Whitehouse } 134ddacfaf7SSteven Whitehouse } while (retry); 135ddacfaf7SSteven Whitehouse } 136ddacfaf7SSteven Whitehouse 137ddacfaf7SSteven Whitehouse /** 138ddacfaf7SSteven Whitehouse * gfs2_ail1_empty_one - Check whether or not a trans in the AIL has been synced 139ddacfaf7SSteven Whitehouse * @sdp: the filesystem 140ddacfaf7SSteven Whitehouse * @ai: the AIL entry 141ddacfaf7SSteven Whitehouse * 142ddacfaf7SSteven Whitehouse */ 143ddacfaf7SSteven Whitehouse 144ddacfaf7SSteven Whitehouse static int gfs2_ail1_empty_one(struct gfs2_sbd *sdp, struct gfs2_ail *ai, int flags) 145ddacfaf7SSteven Whitehouse { 146ddacfaf7SSteven Whitehouse struct gfs2_bufdata *bd, *s; 147ddacfaf7SSteven Whitehouse struct buffer_head *bh; 148ddacfaf7SSteven Whitehouse 149ddacfaf7SSteven Whitehouse list_for_each_entry_safe_reverse(bd, s, &ai->ai_ail1_list, 150ddacfaf7SSteven Whitehouse bd_ail_st_list) { 151ddacfaf7SSteven Whitehouse bh = bd->bd_bh; 152ddacfaf7SSteven Whitehouse 153ddacfaf7SSteven Whitehouse gfs2_assert(sdp, bd->bd_ail == ai); 154ddacfaf7SSteven Whitehouse 155ddacfaf7SSteven Whitehouse if (buffer_busy(bh)) { 156ddacfaf7SSteven Whitehouse if (flags & DIO_ALL) 157ddacfaf7SSteven Whitehouse continue; 158ddacfaf7SSteven Whitehouse else 159ddacfaf7SSteven Whitehouse break; 160ddacfaf7SSteven Whitehouse } 161ddacfaf7SSteven Whitehouse 162ddacfaf7SSteven Whitehouse if (!buffer_uptodate(bh)) 163ddacfaf7SSteven Whitehouse gfs2_io_error_bh(sdp, bh); 164ddacfaf7SSteven Whitehouse 165ddacfaf7SSteven Whitehouse list_move(&bd->bd_ail_st_list, &ai->ai_ail2_list); 166ddacfaf7SSteven Whitehouse } 167ddacfaf7SSteven Whitehouse 168ddacfaf7SSteven Whitehouse return list_empty(&ai->ai_ail1_list); 169ddacfaf7SSteven Whitehouse } 170ddacfaf7SSteven Whitehouse 1715e687eacSBenjamin Marzinski static void gfs2_ail1_start(struct gfs2_sbd *sdp) 172b3b94faaSDavid Teigland { 173693ddeabSBob Peterson struct list_head *head; 174cd915493SSteven Whitehouse u64 sync_gen; 1755e687eacSBenjamin Marzinski struct gfs2_ail *ai; 17674669416SSteven Whitehouse int done = 0; 177b3b94faaSDavid Teigland 178b3b94faaSDavid Teigland gfs2_log_lock(sdp); 179693ddeabSBob Peterson head = &sdp->sd_ail1_list; 180b3b94faaSDavid Teigland if (list_empty(head)) { 181b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 182b3b94faaSDavid Teigland return; 183b3b94faaSDavid Teigland } 184b3b94faaSDavid Teigland sync_gen = sdp->sd_ail_sync_gen++; 185b3b94faaSDavid Teigland 18674669416SSteven Whitehouse while(!done) { 18774669416SSteven Whitehouse done = 1; 1885e687eacSBenjamin Marzinski list_for_each_entry_reverse(ai, head, ai_list) { 189b3b94faaSDavid Teigland if (ai->ai_sync_gen >= sync_gen) 190b3b94faaSDavid Teigland continue; 191b3b94faaSDavid Teigland ai->ai_sync_gen = sync_gen; 19274669416SSteven Whitehouse gfs2_ail1_start_one(sdp, ai); /* This may drop log lock */ 19374669416SSteven Whitehouse done = 0; 194b3b94faaSDavid Teigland break; 195b3b94faaSDavid Teigland } 196b3b94faaSDavid Teigland } 197b3b94faaSDavid Teigland 198b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 199b3b94faaSDavid Teigland } 200b3b94faaSDavid Teigland 201ec69b188SSteven Whitehouse static int gfs2_ail1_empty(struct gfs2_sbd *sdp, int flags) 202b3b94faaSDavid Teigland { 203b3b94faaSDavid Teigland struct gfs2_ail *ai, *s; 204b3b94faaSDavid Teigland int ret; 205b3b94faaSDavid Teigland 206b3b94faaSDavid Teigland gfs2_log_lock(sdp); 207b3b94faaSDavid Teigland 208b3b94faaSDavid Teigland list_for_each_entry_safe_reverse(ai, s, &sdp->sd_ail1_list, ai_list) { 209b3b94faaSDavid Teigland if (gfs2_ail1_empty_one(sdp, ai, flags)) 210b3b94faaSDavid Teigland list_move(&ai->ai_list, &sdp->sd_ail2_list); 211b3b94faaSDavid Teigland else if (!(flags & DIO_ALL)) 212b3b94faaSDavid Teigland break; 213b3b94faaSDavid Teigland } 214b3b94faaSDavid Teigland 215b3b94faaSDavid Teigland ret = list_empty(&sdp->sd_ail1_list); 216b3b94faaSDavid Teigland 217b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 218b3b94faaSDavid Teigland 219b3b94faaSDavid Teigland return ret; 220b3b94faaSDavid Teigland } 221b3b94faaSDavid Teigland 222ddacfaf7SSteven Whitehouse 223ddacfaf7SSteven Whitehouse /** 224ddacfaf7SSteven Whitehouse * gfs2_ail2_empty_one - Check whether or not a trans in the AIL has been synced 225ddacfaf7SSteven Whitehouse * @sdp: the filesystem 226ddacfaf7SSteven Whitehouse * @ai: the AIL entry 227ddacfaf7SSteven Whitehouse * 228ddacfaf7SSteven Whitehouse */ 229ddacfaf7SSteven Whitehouse 230ddacfaf7SSteven Whitehouse static void gfs2_ail2_empty_one(struct gfs2_sbd *sdp, struct gfs2_ail *ai) 231ddacfaf7SSteven Whitehouse { 232ddacfaf7SSteven Whitehouse struct list_head *head = &ai->ai_ail2_list; 233ddacfaf7SSteven Whitehouse struct gfs2_bufdata *bd; 234ddacfaf7SSteven Whitehouse 235ddacfaf7SSteven Whitehouse while (!list_empty(head)) { 236ddacfaf7SSteven Whitehouse bd = list_entry(head->prev, struct gfs2_bufdata, 237ddacfaf7SSteven Whitehouse bd_ail_st_list); 238ddacfaf7SSteven Whitehouse gfs2_assert(sdp, bd->bd_ail == ai); 239f91a0d3eSSteven Whitehouse gfs2_remove_from_ail(bd); 240ddacfaf7SSteven Whitehouse } 241ddacfaf7SSteven Whitehouse } 242ddacfaf7SSteven Whitehouse 243b3b94faaSDavid Teigland static void ail2_empty(struct gfs2_sbd *sdp, unsigned int new_tail) 244b3b94faaSDavid Teigland { 245b3b94faaSDavid Teigland struct gfs2_ail *ai, *safe; 246b3b94faaSDavid Teigland unsigned int old_tail = sdp->sd_log_tail; 247b3b94faaSDavid Teigland int wrap = (new_tail < old_tail); 248b3b94faaSDavid Teigland int a, b, rm; 249b3b94faaSDavid Teigland 250b3b94faaSDavid Teigland gfs2_log_lock(sdp); 251b3b94faaSDavid Teigland 252b3b94faaSDavid Teigland list_for_each_entry_safe(ai, safe, &sdp->sd_ail2_list, ai_list) { 253b3b94faaSDavid Teigland a = (old_tail <= ai->ai_first); 254b3b94faaSDavid Teigland b = (ai->ai_first < new_tail); 255b3b94faaSDavid Teigland rm = (wrap) ? (a || b) : (a && b); 256b3b94faaSDavid Teigland if (!rm) 257b3b94faaSDavid Teigland continue; 258b3b94faaSDavid Teigland 259b3b94faaSDavid Teigland gfs2_ail2_empty_one(sdp, ai); 260b3b94faaSDavid Teigland list_del(&ai->ai_list); 261b3b94faaSDavid Teigland gfs2_assert_warn(sdp, list_empty(&ai->ai_ail1_list)); 262b3b94faaSDavid Teigland gfs2_assert_warn(sdp, list_empty(&ai->ai_ail2_list)); 263b3b94faaSDavid Teigland kfree(ai); 264b3b94faaSDavid Teigland } 265b3b94faaSDavid Teigland 266b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 267b3b94faaSDavid Teigland } 268b3b94faaSDavid Teigland 269b3b94faaSDavid Teigland /** 270b3b94faaSDavid Teigland * gfs2_log_reserve - Make a log reservation 271b3b94faaSDavid Teigland * @sdp: The GFS2 superblock 272b3b94faaSDavid Teigland * @blks: The number of blocks to reserve 273b3b94faaSDavid Teigland * 27489918647SSteven Whitehouse * Note that we never give out the last few blocks of the journal. Thats 2752332c443SRobert Peterson * due to the fact that there is a small number of header blocks 276b004157aSSteven Whitehouse * associated with each log flush. The exact number can't be known until 277b004157aSSteven Whitehouse * flush time, so we ensure that we have just enough free blocks at all 278b004157aSSteven Whitehouse * times to avoid running out during a log flush. 279b004157aSSteven Whitehouse * 2805e687eacSBenjamin Marzinski * We no longer flush the log here, instead we wake up logd to do that 2815e687eacSBenjamin Marzinski * for us. To avoid the thundering herd and to ensure that we deal fairly 2825e687eacSBenjamin Marzinski * with queued waiters, we use an exclusive wait. This means that when we 2835e687eacSBenjamin Marzinski * get woken with enough journal space to get our reservation, we need to 2845e687eacSBenjamin Marzinski * wake the next waiter on the list. 2855e687eacSBenjamin Marzinski * 286b3b94faaSDavid Teigland * Returns: errno 287b3b94faaSDavid Teigland */ 288b3b94faaSDavid Teigland 289b3b94faaSDavid Teigland int gfs2_log_reserve(struct gfs2_sbd *sdp, unsigned int blks) 290b3b94faaSDavid Teigland { 29189918647SSteven Whitehouse unsigned reserved_blks = 6 * (4096 / sdp->sd_vfs->s_blocksize); 2925e687eacSBenjamin Marzinski unsigned wanted = blks + reserved_blks; 2935e687eacSBenjamin Marzinski DEFINE_WAIT(wait); 2945e687eacSBenjamin Marzinski int did_wait = 0; 2955e687eacSBenjamin Marzinski unsigned int free_blocks; 296b3b94faaSDavid Teigland 297b3b94faaSDavid Teigland if (gfs2_assert_warn(sdp, blks) || 298b3b94faaSDavid Teigland gfs2_assert_warn(sdp, blks <= sdp->sd_jdesc->jd_blocks)) 299b3b94faaSDavid Teigland return -EINVAL; 3005e687eacSBenjamin Marzinski retry: 3015e687eacSBenjamin Marzinski free_blocks = atomic_read(&sdp->sd_log_blks_free); 3025e687eacSBenjamin Marzinski if (unlikely(free_blocks <= wanted)) { 3035e687eacSBenjamin Marzinski do { 3045e687eacSBenjamin Marzinski prepare_to_wait_exclusive(&sdp->sd_log_waitq, &wait, 3055e687eacSBenjamin Marzinski TASK_UNINTERRUPTIBLE); 3065e687eacSBenjamin Marzinski wake_up(&sdp->sd_logd_waitq); 3075e687eacSBenjamin Marzinski did_wait = 1; 3085e687eacSBenjamin Marzinski if (atomic_read(&sdp->sd_log_blks_free) <= wanted) 3095e687eacSBenjamin Marzinski io_schedule(); 3105e687eacSBenjamin Marzinski free_blocks = atomic_read(&sdp->sd_log_blks_free); 3115e687eacSBenjamin Marzinski } while(free_blocks <= wanted); 3125e687eacSBenjamin Marzinski finish_wait(&sdp->sd_log_waitq, &wait); 313b3b94faaSDavid Teigland } 3145e687eacSBenjamin Marzinski if (atomic_cmpxchg(&sdp->sd_log_blks_free, free_blocks, 3155e687eacSBenjamin Marzinski free_blocks - blks) != free_blocks) 3165e687eacSBenjamin Marzinski goto retry; 31763997775SSteven Whitehouse trace_gfs2_log_blocks(sdp, -blks); 3185e687eacSBenjamin Marzinski 3195e687eacSBenjamin Marzinski /* 3205e687eacSBenjamin Marzinski * If we waited, then so might others, wake them up _after_ we get 3215e687eacSBenjamin Marzinski * our share of the log. 3225e687eacSBenjamin Marzinski */ 3235e687eacSBenjamin Marzinski if (unlikely(did_wait)) 3245e687eacSBenjamin Marzinski wake_up(&sdp->sd_log_waitq); 325484adff8SSteven Whitehouse 326484adff8SSteven Whitehouse down_read(&sdp->sd_log_flush_lock); 327b3b94faaSDavid Teigland 328b3b94faaSDavid Teigland return 0; 329b3b94faaSDavid Teigland } 330b3b94faaSDavid Teigland 331cd915493SSteven Whitehouse static u64 log_bmap(struct gfs2_sbd *sdp, unsigned int lbn) 332b3b94faaSDavid Teigland { 333da6dd40dSBob Peterson struct gfs2_journal_extent *je; 334b3b94faaSDavid Teigland 335da6dd40dSBob Peterson list_for_each_entry(je, &sdp->sd_jdesc->extent_list, extent_list) { 336da6dd40dSBob Peterson if (lbn >= je->lblock && lbn < je->lblock + je->blocks) 337ff91cc9bSSteven Whitehouse return je->dblock + lbn - je->lblock; 338da6dd40dSBob Peterson } 339b3b94faaSDavid Teigland 340da6dd40dSBob Peterson return -1; 341b3b94faaSDavid Teigland } 342b3b94faaSDavid Teigland 343b3b94faaSDavid Teigland /** 344b3b94faaSDavid Teigland * log_distance - Compute distance between two journal blocks 345b3b94faaSDavid Teigland * @sdp: The GFS2 superblock 346b3b94faaSDavid Teigland * @newer: The most recent journal block of the pair 347b3b94faaSDavid Teigland * @older: The older journal block of the pair 348b3b94faaSDavid Teigland * 349b3b94faaSDavid Teigland * Compute the distance (in the journal direction) between two 350b3b94faaSDavid Teigland * blocks in the journal 351b3b94faaSDavid Teigland * 352b3b94faaSDavid Teigland * Returns: the distance in blocks 353b3b94faaSDavid Teigland */ 354b3b94faaSDavid Teigland 355faa31ce8SSteven Whitehouse static inline unsigned int log_distance(struct gfs2_sbd *sdp, unsigned int newer, 356b3b94faaSDavid Teigland unsigned int older) 357b3b94faaSDavid Teigland { 358b3b94faaSDavid Teigland int dist; 359b3b94faaSDavid Teigland 360b3b94faaSDavid Teigland dist = newer - older; 361b3b94faaSDavid Teigland if (dist < 0) 362b3b94faaSDavid Teigland dist += sdp->sd_jdesc->jd_blocks; 363b3b94faaSDavid Teigland 364b3b94faaSDavid Teigland return dist; 365b3b94faaSDavid Teigland } 366b3b94faaSDavid Teigland 3672332c443SRobert Peterson /** 3682332c443SRobert Peterson * calc_reserved - Calculate the number of blocks to reserve when 3692332c443SRobert Peterson * refunding a transaction's unused buffers. 3702332c443SRobert Peterson * @sdp: The GFS2 superblock 3712332c443SRobert Peterson * 3722332c443SRobert Peterson * This is complex. We need to reserve room for all our currently used 3732332c443SRobert Peterson * metadata buffers (e.g. normal file I/O rewriting file time stamps) and 3742332c443SRobert Peterson * all our journaled data buffers for journaled files (e.g. files in the 3752332c443SRobert Peterson * meta_fs like rindex, or files for which chattr +j was done.) 3762332c443SRobert Peterson * If we don't reserve enough space, gfs2_log_refund and gfs2_log_flush 3772332c443SRobert Peterson * will count it as free space (sd_log_blks_free) and corruption will follow. 3782332c443SRobert Peterson * 3792332c443SRobert Peterson * We can have metadata bufs and jdata bufs in the same journal. So each 3802332c443SRobert Peterson * type gets its own log header, for which we need to reserve a block. 3812332c443SRobert Peterson * In fact, each type has the potential for needing more than one header 3822332c443SRobert Peterson * in cases where we have more buffers than will fit on a journal page. 3832332c443SRobert Peterson * Metadata journal entries take up half the space of journaled buffer entries. 3842332c443SRobert Peterson * Thus, metadata entries have buf_limit (502) and journaled buffers have 3852332c443SRobert Peterson * databuf_limit (251) before they cause a wrap around. 3862332c443SRobert Peterson * 3872332c443SRobert Peterson * Also, we need to reserve blocks for revoke journal entries and one for an 3882332c443SRobert Peterson * overall header for the lot. 3892332c443SRobert Peterson * 3902332c443SRobert Peterson * Returns: the number of blocks reserved 3912332c443SRobert Peterson */ 3922332c443SRobert Peterson static unsigned int calc_reserved(struct gfs2_sbd *sdp) 3932332c443SRobert Peterson { 3942332c443SRobert Peterson unsigned int reserved = 0; 3952332c443SRobert Peterson unsigned int mbuf_limit, metabufhdrs_needed; 3962332c443SRobert Peterson unsigned int dbuf_limit, databufhdrs_needed; 3972332c443SRobert Peterson unsigned int revokes = 0; 3982332c443SRobert Peterson 3992332c443SRobert Peterson mbuf_limit = buf_limit(sdp); 4002332c443SRobert Peterson metabufhdrs_needed = (sdp->sd_log_commited_buf + 4012332c443SRobert Peterson (mbuf_limit - 1)) / mbuf_limit; 4022332c443SRobert Peterson dbuf_limit = databuf_limit(sdp); 4032332c443SRobert Peterson databufhdrs_needed = (sdp->sd_log_commited_databuf + 4042332c443SRobert Peterson (dbuf_limit - 1)) / dbuf_limit; 4052332c443SRobert Peterson 4062e95e3f6SBenjamin Marzinski if (sdp->sd_log_commited_revoke > 0) 4072332c443SRobert Peterson revokes = gfs2_struct2blk(sdp, sdp->sd_log_commited_revoke, 4082332c443SRobert Peterson sizeof(u64)); 4092332c443SRobert Peterson 4102332c443SRobert Peterson reserved = sdp->sd_log_commited_buf + metabufhdrs_needed + 4112332c443SRobert Peterson sdp->sd_log_commited_databuf + databufhdrs_needed + 4122332c443SRobert Peterson revokes; 4132332c443SRobert Peterson /* One for the overall header */ 4142332c443SRobert Peterson if (reserved) 4152332c443SRobert Peterson reserved++; 4162332c443SRobert Peterson return reserved; 4172332c443SRobert Peterson } 4182332c443SRobert Peterson 419b3b94faaSDavid Teigland static unsigned int current_tail(struct gfs2_sbd *sdp) 420b3b94faaSDavid Teigland { 421b3b94faaSDavid Teigland struct gfs2_ail *ai; 422b3b94faaSDavid Teigland unsigned int tail; 423b3b94faaSDavid Teigland 424b3b94faaSDavid Teigland gfs2_log_lock(sdp); 425b3b94faaSDavid Teigland 426faa31ce8SSteven Whitehouse if (list_empty(&sdp->sd_ail1_list)) { 427b3b94faaSDavid Teigland tail = sdp->sd_log_head; 428faa31ce8SSteven Whitehouse } else { 429faa31ce8SSteven Whitehouse ai = list_entry(sdp->sd_ail1_list.prev, struct gfs2_ail, ai_list); 430b3b94faaSDavid Teigland tail = ai->ai_first; 431b3b94faaSDavid Teigland } 432b3b94faaSDavid Teigland 433b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 434b3b94faaSDavid Teigland 435b3b94faaSDavid Teigland return tail; 436b3b94faaSDavid Teigland } 437b3b94faaSDavid Teigland 43816615be1SSteven Whitehouse void gfs2_log_incr_head(struct gfs2_sbd *sdp) 439b3b94faaSDavid Teigland { 440b3b94faaSDavid Teigland if (sdp->sd_log_flush_head == sdp->sd_log_tail) 44116615be1SSteven Whitehouse BUG_ON(sdp->sd_log_flush_head != sdp->sd_log_head); 442b3b94faaSDavid Teigland 443b3b94faaSDavid Teigland if (++sdp->sd_log_flush_head == sdp->sd_jdesc->jd_blocks) { 444b3b94faaSDavid Teigland sdp->sd_log_flush_head = 0; 445b3b94faaSDavid Teigland sdp->sd_log_flush_wrapped = 1; 446b3b94faaSDavid Teigland } 447b3b94faaSDavid Teigland } 448b3b94faaSDavid Teigland 449b3b94faaSDavid Teigland /** 45016615be1SSteven Whitehouse * gfs2_log_write_endio - End of I/O for a log buffer 45116615be1SSteven Whitehouse * @bh: The buffer head 45216615be1SSteven Whitehouse * @uptodate: I/O Status 45316615be1SSteven Whitehouse * 45416615be1SSteven Whitehouse */ 45516615be1SSteven Whitehouse 45616615be1SSteven Whitehouse static void gfs2_log_write_endio(struct buffer_head *bh, int uptodate) 45716615be1SSteven Whitehouse { 45816615be1SSteven Whitehouse struct gfs2_sbd *sdp = bh->b_private; 45916615be1SSteven Whitehouse bh->b_private = NULL; 46016615be1SSteven Whitehouse 46116615be1SSteven Whitehouse end_buffer_write_sync(bh, uptodate); 46216615be1SSteven Whitehouse if (atomic_dec_and_test(&sdp->sd_log_in_flight)) 46316615be1SSteven Whitehouse wake_up(&sdp->sd_log_flush_wait); 46416615be1SSteven Whitehouse } 46516615be1SSteven Whitehouse 46616615be1SSteven Whitehouse /** 467b3b94faaSDavid Teigland * gfs2_log_get_buf - Get and initialize a buffer to use for log control data 468b3b94faaSDavid Teigland * @sdp: The GFS2 superblock 469b3b94faaSDavid Teigland * 470b3b94faaSDavid Teigland * Returns: the buffer_head 471b3b94faaSDavid Teigland */ 472b3b94faaSDavid Teigland 473b3b94faaSDavid Teigland struct buffer_head *gfs2_log_get_buf(struct gfs2_sbd *sdp) 474b3b94faaSDavid Teigland { 475cd915493SSteven Whitehouse u64 blkno = log_bmap(sdp, sdp->sd_log_flush_head); 476b3b94faaSDavid Teigland struct buffer_head *bh; 477b3b94faaSDavid Teigland 47816615be1SSteven Whitehouse bh = sb_getblk(sdp->sd_vfs, blkno); 479b3b94faaSDavid Teigland lock_buffer(bh); 480b3b94faaSDavid Teigland memset(bh->b_data, 0, bh->b_size); 481b3b94faaSDavid Teigland set_buffer_uptodate(bh); 482b3b94faaSDavid Teigland clear_buffer_dirty(bh); 48316615be1SSteven Whitehouse gfs2_log_incr_head(sdp); 48416615be1SSteven Whitehouse atomic_inc(&sdp->sd_log_in_flight); 48516615be1SSteven Whitehouse bh->b_private = sdp; 48616615be1SSteven Whitehouse bh->b_end_io = gfs2_log_write_endio; 487b3b94faaSDavid Teigland 488b3b94faaSDavid Teigland return bh; 489b3b94faaSDavid Teigland } 490b3b94faaSDavid Teigland 491b3b94faaSDavid Teigland /** 49216615be1SSteven Whitehouse * gfs2_fake_write_endio - 49316615be1SSteven Whitehouse * @bh: The buffer head 49416615be1SSteven Whitehouse * @uptodate: The I/O Status 49516615be1SSteven Whitehouse * 49616615be1SSteven Whitehouse */ 49716615be1SSteven Whitehouse 49816615be1SSteven Whitehouse static void gfs2_fake_write_endio(struct buffer_head *bh, int uptodate) 49916615be1SSteven Whitehouse { 50016615be1SSteven Whitehouse struct buffer_head *real_bh = bh->b_private; 5015a60c532SSteven Whitehouse struct gfs2_bufdata *bd = real_bh->b_private; 5025a60c532SSteven Whitehouse struct gfs2_sbd *sdp = bd->bd_gl->gl_sbd; 50316615be1SSteven Whitehouse 50416615be1SSteven Whitehouse end_buffer_write_sync(bh, uptodate); 50516615be1SSteven Whitehouse free_buffer_head(bh); 50616615be1SSteven Whitehouse unlock_buffer(real_bh); 50716615be1SSteven Whitehouse brelse(real_bh); 50816615be1SSteven Whitehouse if (atomic_dec_and_test(&sdp->sd_log_in_flight)) 50916615be1SSteven Whitehouse wake_up(&sdp->sd_log_flush_wait); 51016615be1SSteven Whitehouse } 51116615be1SSteven Whitehouse 51216615be1SSteven Whitehouse /** 513b3b94faaSDavid Teigland * gfs2_log_fake_buf - Build a fake buffer head to write metadata buffer to log 514b3b94faaSDavid Teigland * @sdp: the filesystem 515b3b94faaSDavid Teigland * @data: the data the buffer_head should point to 516b3b94faaSDavid Teigland * 517b3b94faaSDavid Teigland * Returns: the log buffer descriptor 518b3b94faaSDavid Teigland */ 519b3b94faaSDavid Teigland 520b3b94faaSDavid Teigland struct buffer_head *gfs2_log_fake_buf(struct gfs2_sbd *sdp, 521b3b94faaSDavid Teigland struct buffer_head *real) 522b3b94faaSDavid Teigland { 523cd915493SSteven Whitehouse u64 blkno = log_bmap(sdp, sdp->sd_log_flush_head); 524b3b94faaSDavid Teigland struct buffer_head *bh; 525b3b94faaSDavid Teigland 52616615be1SSteven Whitehouse bh = alloc_buffer_head(GFP_NOFS | __GFP_NOFAIL); 527b3b94faaSDavid Teigland atomic_set(&bh->b_count, 1); 52816615be1SSteven Whitehouse bh->b_state = (1 << BH_Mapped) | (1 << BH_Uptodate) | (1 << BH_Lock); 52918ec7d5cSSteven Whitehouse set_bh_page(bh, real->b_page, bh_offset(real)); 530b3b94faaSDavid Teigland bh->b_blocknr = blkno; 531b3b94faaSDavid Teigland bh->b_size = sdp->sd_sb.sb_bsize; 532b3b94faaSDavid Teigland bh->b_bdev = sdp->sd_vfs->s_bdev; 53316615be1SSteven Whitehouse bh->b_private = real; 53416615be1SSteven Whitehouse bh->b_end_io = gfs2_fake_write_endio; 535b3b94faaSDavid Teigland 53616615be1SSteven Whitehouse gfs2_log_incr_head(sdp); 53716615be1SSteven Whitehouse atomic_inc(&sdp->sd_log_in_flight); 538b3b94faaSDavid Teigland 539b3b94faaSDavid Teigland return bh; 540b3b94faaSDavid Teigland } 541b3b94faaSDavid Teigland 5422332c443SRobert Peterson static void log_pull_tail(struct gfs2_sbd *sdp, unsigned int new_tail) 543b3b94faaSDavid Teigland { 544b3b94faaSDavid Teigland unsigned int dist = log_distance(sdp, new_tail, sdp->sd_log_tail); 545b3b94faaSDavid Teigland 546b3b94faaSDavid Teigland ail2_empty(sdp, new_tail); 547b3b94faaSDavid Teigland 548fd041f0bSSteven Whitehouse atomic_add(dist, &sdp->sd_log_blks_free); 54963997775SSteven Whitehouse trace_gfs2_log_blocks(sdp, dist); 5505e687eacSBenjamin Marzinski gfs2_assert_withdraw(sdp, atomic_read(&sdp->sd_log_blks_free) <= 5515e687eacSBenjamin Marzinski sdp->sd_jdesc->jd_blocks); 552b3b94faaSDavid Teigland 553b3b94faaSDavid Teigland sdp->sd_log_tail = new_tail; 554b3b94faaSDavid Teigland } 555b3b94faaSDavid Teigland 556b3b94faaSDavid Teigland /** 557b3b94faaSDavid Teigland * log_write_header - Get and initialize a journal header buffer 558b3b94faaSDavid Teigland * @sdp: The GFS2 superblock 559b3b94faaSDavid Teigland * 560b3b94faaSDavid Teigland * Returns: the initialized log buffer descriptor 561b3b94faaSDavid Teigland */ 562b3b94faaSDavid Teigland 563cd915493SSteven Whitehouse static void log_write_header(struct gfs2_sbd *sdp, u32 flags, int pull) 564b3b94faaSDavid Teigland { 565cd915493SSteven Whitehouse u64 blkno = log_bmap(sdp, sdp->sd_log_flush_head); 566b3b94faaSDavid Teigland struct buffer_head *bh; 567b3b94faaSDavid Teigland struct gfs2_log_header *lh; 568b3b94faaSDavid Teigland unsigned int tail; 569cd915493SSteven Whitehouse u32 hash; 570b3b94faaSDavid Teigland 571b3b94faaSDavid Teigland bh = sb_getblk(sdp->sd_vfs, blkno); 572b3b94faaSDavid Teigland lock_buffer(bh); 573b3b94faaSDavid Teigland memset(bh->b_data, 0, bh->b_size); 574b3b94faaSDavid Teigland set_buffer_uptodate(bh); 575b3b94faaSDavid Teigland clear_buffer_dirty(bh); 576b3b94faaSDavid Teigland 577b3b94faaSDavid Teigland gfs2_ail1_empty(sdp, 0); 578b3b94faaSDavid Teigland tail = current_tail(sdp); 579b3b94faaSDavid Teigland 580b3b94faaSDavid Teigland lh = (struct gfs2_log_header *)bh->b_data; 581b3b94faaSDavid Teigland memset(lh, 0, sizeof(struct gfs2_log_header)); 582b3b94faaSDavid Teigland lh->lh_header.mh_magic = cpu_to_be32(GFS2_MAGIC); 583e3167dedSSteven Whitehouse lh->lh_header.mh_type = cpu_to_be32(GFS2_METATYPE_LH); 5840ab7d13fSSteven Whitehouse lh->lh_header.__pad0 = cpu_to_be64(0); 585e3167dedSSteven Whitehouse lh->lh_header.mh_format = cpu_to_be32(GFS2_FORMAT_LH); 5860ab7d13fSSteven Whitehouse lh->lh_header.mh_jid = cpu_to_be32(sdp->sd_jdesc->jd_jid); 587e0f2bf78SSteven Whitehouse lh->lh_sequence = cpu_to_be64(sdp->sd_log_sequence++); 588e0f2bf78SSteven Whitehouse lh->lh_flags = cpu_to_be32(flags); 589e0f2bf78SSteven Whitehouse lh->lh_tail = cpu_to_be32(tail); 590e0f2bf78SSteven Whitehouse lh->lh_blkno = cpu_to_be32(sdp->sd_log_flush_head); 591b3b94faaSDavid Teigland hash = gfs2_disk_hash(bh->b_data, sizeof(struct gfs2_log_header)); 592b3b94faaSDavid Teigland lh->lh_hash = cpu_to_be32(hash); 593b3b94faaSDavid Teigland 594254db57fSSteven Whitehouse bh->b_end_io = end_buffer_write_sync; 595254db57fSSteven Whitehouse if (test_bit(SDF_NOBARRIERS, &sdp->sd_flags)) 596254db57fSSteven Whitehouse goto skip_barrier; 597254db57fSSteven Whitehouse get_bh(bh); 598c969f58cSSteven Whitehouse submit_bh(WRITE_SYNC | (1 << BIO_RW_BARRIER) | (1 << BIO_RW_META), bh); 599254db57fSSteven Whitehouse wait_on_buffer(bh); 600254db57fSSteven Whitehouse if (buffer_eopnotsupp(bh)) { 601254db57fSSteven Whitehouse clear_buffer_eopnotsupp(bh); 602254db57fSSteven Whitehouse set_buffer_uptodate(bh); 603913a71d2SSteven Whitehouse fs_info(sdp, "barrier sync failed - disabling barriers\n"); 604254db57fSSteven Whitehouse set_bit(SDF_NOBARRIERS, &sdp->sd_flags); 605254db57fSSteven Whitehouse lock_buffer(bh); 606254db57fSSteven Whitehouse skip_barrier: 607254db57fSSteven Whitehouse get_bh(bh); 608254db57fSSteven Whitehouse submit_bh(WRITE_SYNC | (1 << BIO_RW_META), bh); 609254db57fSSteven Whitehouse wait_on_buffer(bh); 610254db57fSSteven Whitehouse } 611254db57fSSteven Whitehouse if (!buffer_uptodate(bh)) 612b3b94faaSDavid Teigland gfs2_io_error_bh(sdp, bh); 613b3b94faaSDavid Teigland brelse(bh); 614b3b94faaSDavid Teigland 615b3b94faaSDavid Teigland if (sdp->sd_log_tail != tail) 6162332c443SRobert Peterson log_pull_tail(sdp, tail); 617b3b94faaSDavid Teigland else 618b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, !pull); 619b3b94faaSDavid Teigland 620b3b94faaSDavid Teigland sdp->sd_log_idle = (tail == sdp->sd_log_flush_head); 62116615be1SSteven Whitehouse gfs2_log_incr_head(sdp); 622b3b94faaSDavid Teigland } 623b3b94faaSDavid Teigland 624b3b94faaSDavid Teigland static void log_flush_commit(struct gfs2_sbd *sdp) 625b3b94faaSDavid Teigland { 62616615be1SSteven Whitehouse DEFINE_WAIT(wait); 627b3b94faaSDavid Teigland 62816615be1SSteven Whitehouse if (atomic_read(&sdp->sd_log_in_flight)) { 62916615be1SSteven Whitehouse do { 63016615be1SSteven Whitehouse prepare_to_wait(&sdp->sd_log_flush_wait, &wait, 63116615be1SSteven Whitehouse TASK_UNINTERRUPTIBLE); 63216615be1SSteven Whitehouse if (atomic_read(&sdp->sd_log_in_flight)) 63316615be1SSteven Whitehouse io_schedule(); 63416615be1SSteven Whitehouse } while(atomic_read(&sdp->sd_log_in_flight)); 63516615be1SSteven Whitehouse finish_wait(&sdp->sd_log_flush_wait, &wait); 636b3b94faaSDavid Teigland } 637b3b94faaSDavid Teigland 638b3b94faaSDavid Teigland log_write_header(sdp, 0, 0); 639b3b94faaSDavid Teigland } 640b3b94faaSDavid Teigland 641d7b616e2SSteven Whitehouse static void gfs2_ordered_write(struct gfs2_sbd *sdp) 642d7b616e2SSteven Whitehouse { 643d7b616e2SSteven Whitehouse struct gfs2_bufdata *bd; 644d7b616e2SSteven Whitehouse struct buffer_head *bh; 645d7b616e2SSteven Whitehouse LIST_HEAD(written); 646d7b616e2SSteven Whitehouse 647d7b616e2SSteven Whitehouse gfs2_log_lock(sdp); 648d7b616e2SSteven Whitehouse while (!list_empty(&sdp->sd_log_le_ordered)) { 649d7b616e2SSteven Whitehouse bd = list_entry(sdp->sd_log_le_ordered.next, struct gfs2_bufdata, bd_le.le_list); 650d7b616e2SSteven Whitehouse list_move(&bd->bd_le.le_list, &written); 651d7b616e2SSteven Whitehouse bh = bd->bd_bh; 652d7b616e2SSteven Whitehouse if (!buffer_dirty(bh)) 653d7b616e2SSteven Whitehouse continue; 654d7b616e2SSteven Whitehouse get_bh(bh); 655d7b616e2SSteven Whitehouse gfs2_log_unlock(sdp); 656d7b616e2SSteven Whitehouse lock_buffer(bh); 657b8e7cbb6SSteven Whitehouse if (buffer_mapped(bh) && test_clear_buffer_dirty(bh)) { 658d7b616e2SSteven Whitehouse bh->b_end_io = end_buffer_write_sync; 659c969f58cSSteven Whitehouse submit_bh(WRITE_SYNC_PLUG, bh); 660d7b616e2SSteven Whitehouse } else { 661d7b616e2SSteven Whitehouse unlock_buffer(bh); 662d7b616e2SSteven Whitehouse brelse(bh); 663d7b616e2SSteven Whitehouse } 664d7b616e2SSteven Whitehouse gfs2_log_lock(sdp); 665d7b616e2SSteven Whitehouse } 666d7b616e2SSteven Whitehouse list_splice(&written, &sdp->sd_log_le_ordered); 667d7b616e2SSteven Whitehouse gfs2_log_unlock(sdp); 668d7b616e2SSteven Whitehouse } 669d7b616e2SSteven Whitehouse 670d7b616e2SSteven Whitehouse static void gfs2_ordered_wait(struct gfs2_sbd *sdp) 671d7b616e2SSteven Whitehouse { 672d7b616e2SSteven Whitehouse struct gfs2_bufdata *bd; 673d7b616e2SSteven Whitehouse struct buffer_head *bh; 674d7b616e2SSteven Whitehouse 675d7b616e2SSteven Whitehouse gfs2_log_lock(sdp); 676d7b616e2SSteven Whitehouse while (!list_empty(&sdp->sd_log_le_ordered)) { 677d7b616e2SSteven Whitehouse bd = list_entry(sdp->sd_log_le_ordered.prev, struct gfs2_bufdata, bd_le.le_list); 678d7b616e2SSteven Whitehouse bh = bd->bd_bh; 679d7b616e2SSteven Whitehouse if (buffer_locked(bh)) { 680d7b616e2SSteven Whitehouse get_bh(bh); 681d7b616e2SSteven Whitehouse gfs2_log_unlock(sdp); 682d7b616e2SSteven Whitehouse wait_on_buffer(bh); 683d7b616e2SSteven Whitehouse brelse(bh); 684d7b616e2SSteven Whitehouse gfs2_log_lock(sdp); 685d7b616e2SSteven Whitehouse continue; 686d7b616e2SSteven Whitehouse } 687d7b616e2SSteven Whitehouse list_del_init(&bd->bd_le.le_list); 688d7b616e2SSteven Whitehouse } 689d7b616e2SSteven Whitehouse gfs2_log_unlock(sdp); 690d7b616e2SSteven Whitehouse } 691d7b616e2SSteven Whitehouse 692b3b94faaSDavid Teigland /** 693b09e593dSSteven Whitehouse * gfs2_log_flush - flush incore transaction(s) 694b3b94faaSDavid Teigland * @sdp: the filesystem 695b3b94faaSDavid Teigland * @gl: The glock structure to flush. If NULL, flush the whole incore log 696b3b94faaSDavid Teigland * 697b3b94faaSDavid Teigland */ 698b3b94faaSDavid Teigland 699*ed4878e8SBob Peterson void gfs2_log_flush(struct gfs2_sbd *sdp, struct gfs2_glock *gl) 700b3b94faaSDavid Teigland { 701b3b94faaSDavid Teigland struct gfs2_ail *ai; 702b3b94faaSDavid Teigland 703484adff8SSteven Whitehouse down_write(&sdp->sd_log_flush_lock); 704f55ab26aSSteven Whitehouse 7052bcd610dSSteven Whitehouse /* Log might have been flushed while we waited for the flush lock */ 7062bcd610dSSteven Whitehouse if (gl && !test_bit(GLF_LFLUSH, &gl->gl_flags)) { 707484adff8SSteven Whitehouse up_write(&sdp->sd_log_flush_lock); 708f55ab26aSSteven Whitehouse return; 709f55ab26aSSteven Whitehouse } 71063997775SSteven Whitehouse trace_gfs2_log_flush(sdp, 1); 711f55ab26aSSteven Whitehouse 712b09e593dSSteven Whitehouse ai = kzalloc(sizeof(struct gfs2_ail), GFP_NOFS | __GFP_NOFAIL); 713b09e593dSSteven Whitehouse INIT_LIST_HEAD(&ai->ai_ail1_list); 714b09e593dSSteven Whitehouse INIT_LIST_HEAD(&ai->ai_ail2_list); 715b3b94faaSDavid Teigland 71616615be1SSteven Whitehouse if (sdp->sd_log_num_buf != sdp->sd_log_commited_buf) { 71716615be1SSteven Whitehouse printk(KERN_INFO "GFS2: log buf %u %u\n", sdp->sd_log_num_buf, 71816615be1SSteven Whitehouse sdp->sd_log_commited_buf); 71916615be1SSteven Whitehouse gfs2_assert_withdraw(sdp, 0); 72016615be1SSteven Whitehouse } 72116615be1SSteven Whitehouse if (sdp->sd_log_num_databuf != sdp->sd_log_commited_databuf) { 72216615be1SSteven Whitehouse printk(KERN_INFO "GFS2: log databuf %u %u\n", 72316615be1SSteven Whitehouse sdp->sd_log_num_databuf, sdp->sd_log_commited_databuf); 72416615be1SSteven Whitehouse gfs2_assert_withdraw(sdp, 0); 72516615be1SSteven Whitehouse } 726b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, 727b3b94faaSDavid Teigland sdp->sd_log_num_revoke == sdp->sd_log_commited_revoke); 728b3b94faaSDavid Teigland 729b3b94faaSDavid Teigland sdp->sd_log_flush_head = sdp->sd_log_head; 730b3b94faaSDavid Teigland sdp->sd_log_flush_wrapped = 0; 731b3b94faaSDavid Teigland ai->ai_first = sdp->sd_log_flush_head; 732b3b94faaSDavid Teigland 733d7b616e2SSteven Whitehouse gfs2_ordered_write(sdp); 734b3b94faaSDavid Teigland lops_before_commit(sdp); 735d7b616e2SSteven Whitehouse gfs2_ordered_wait(sdp); 736d7b616e2SSteven Whitehouse 73716615be1SSteven Whitehouse if (sdp->sd_log_head != sdp->sd_log_flush_head) 738b3b94faaSDavid Teigland log_flush_commit(sdp); 7392332c443SRobert Peterson else if (sdp->sd_log_tail != current_tail(sdp) && !sdp->sd_log_idle){ 7402332c443SRobert Peterson gfs2_log_lock(sdp); 741fd041f0bSSteven Whitehouse atomic_dec(&sdp->sd_log_blks_free); /* Adjust for unreserved buffer */ 74263997775SSteven Whitehouse trace_gfs2_log_blocks(sdp, -1); 7432332c443SRobert Peterson gfs2_log_unlock(sdp); 744b3b94faaSDavid Teigland log_write_header(sdp, 0, PULL); 7452332c443SRobert Peterson } 746b3b94faaSDavid Teigland lops_after_commit(sdp, ai); 747fe1a698fSSteven Whitehouse 748fe1a698fSSteven Whitehouse gfs2_log_lock(sdp); 749b3b94faaSDavid Teigland sdp->sd_log_head = sdp->sd_log_flush_head; 750faa31ce8SSteven Whitehouse sdp->sd_log_blks_reserved = 0; 751faa31ce8SSteven Whitehouse sdp->sd_log_commited_buf = 0; 7522332c443SRobert Peterson sdp->sd_log_commited_databuf = 0; 753b3b94faaSDavid Teigland sdp->sd_log_commited_revoke = 0; 754b3b94faaSDavid Teigland 755b3b94faaSDavid Teigland if (!list_empty(&ai->ai_ail1_list)) { 756b3b94faaSDavid Teigland list_add(&ai->ai_list, &sdp->sd_ail1_list); 757b3b94faaSDavid Teigland ai = NULL; 758b3b94faaSDavid Teigland } 759b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 76063997775SSteven Whitehouse trace_gfs2_log_flush(sdp, 0); 761484adff8SSteven Whitehouse up_write(&sdp->sd_log_flush_lock); 762b3b94faaSDavid Teigland 763b3b94faaSDavid Teigland kfree(ai); 764b3b94faaSDavid Teigland } 765b3b94faaSDavid Teigland 766b3b94faaSDavid Teigland static void log_refund(struct gfs2_sbd *sdp, struct gfs2_trans *tr) 767b3b94faaSDavid Teigland { 7682332c443SRobert Peterson unsigned int reserved; 769ac39aaddSSteven Whitehouse unsigned int unused; 770b3b94faaSDavid Teigland 771b3b94faaSDavid Teigland gfs2_log_lock(sdp); 772b3b94faaSDavid Teigland 773b3b94faaSDavid Teigland sdp->sd_log_commited_buf += tr->tr_num_buf_new - tr->tr_num_buf_rm; 7742332c443SRobert Peterson sdp->sd_log_commited_databuf += tr->tr_num_databuf_new - 7752332c443SRobert Peterson tr->tr_num_databuf_rm; 7762332c443SRobert Peterson gfs2_assert_withdraw(sdp, (((int)sdp->sd_log_commited_buf) >= 0) || 7772332c443SRobert Peterson (((int)sdp->sd_log_commited_databuf) >= 0)); 778b3b94faaSDavid Teigland sdp->sd_log_commited_revoke += tr->tr_num_revoke - tr->tr_num_revoke_rm; 7792332c443SRobert Peterson reserved = calc_reserved(sdp); 78062be1f71SRoel Kluin gfs2_assert_withdraw(sdp, sdp->sd_log_blks_reserved + tr->tr_reserved >= reserved); 781ac39aaddSSteven Whitehouse unused = sdp->sd_log_blks_reserved - reserved + tr->tr_reserved; 782ac39aaddSSteven Whitehouse atomic_add(unused, &sdp->sd_log_blks_free); 78363997775SSteven Whitehouse trace_gfs2_log_blocks(sdp, unused); 784fd041f0bSSteven Whitehouse gfs2_assert_withdraw(sdp, atomic_read(&sdp->sd_log_blks_free) <= 7852332c443SRobert Peterson sdp->sd_jdesc->jd_blocks); 786b3b94faaSDavid Teigland sdp->sd_log_blks_reserved = reserved; 787b3b94faaSDavid Teigland 788b3b94faaSDavid Teigland gfs2_log_unlock(sdp); 789b3b94faaSDavid Teigland } 790b3b94faaSDavid Teigland 791d0109bfaSBob Peterson static void buf_lo_incore_commit(struct gfs2_sbd *sdp, struct gfs2_trans *tr) 792d0109bfaSBob Peterson { 793d0109bfaSBob Peterson struct list_head *head = &tr->tr_list_buf; 794d0109bfaSBob Peterson struct gfs2_bufdata *bd; 795d0109bfaSBob Peterson 796d0109bfaSBob Peterson gfs2_log_lock(sdp); 797d0109bfaSBob Peterson while (!list_empty(head)) { 798d0109bfaSBob Peterson bd = list_entry(head->next, struct gfs2_bufdata, bd_list_tr); 799d0109bfaSBob Peterson list_del_init(&bd->bd_list_tr); 800d0109bfaSBob Peterson tr->tr_num_buf--; 801d0109bfaSBob Peterson } 802d0109bfaSBob Peterson gfs2_log_unlock(sdp); 803d0109bfaSBob Peterson gfs2_assert_warn(sdp, !tr->tr_num_buf); 804d0109bfaSBob Peterson } 805d0109bfaSBob Peterson 806b3b94faaSDavid Teigland /** 807b3b94faaSDavid Teigland * gfs2_log_commit - Commit a transaction to the log 808b3b94faaSDavid Teigland * @sdp: the filesystem 809b3b94faaSDavid Teigland * @tr: the transaction 810b3b94faaSDavid Teigland * 8115e687eacSBenjamin Marzinski * We wake up gfs2_logd if the number of pinned blocks exceed thresh1 8125e687eacSBenjamin Marzinski * or the total number of used blocks (pinned blocks plus AIL blocks) 8135e687eacSBenjamin Marzinski * is greater than thresh2. 8145e687eacSBenjamin Marzinski * 8155e687eacSBenjamin Marzinski * At mount time thresh1 is 1/3rd of journal size, thresh2 is 2/3rd of 8165e687eacSBenjamin Marzinski * journal size. 8175e687eacSBenjamin Marzinski * 818b3b94faaSDavid Teigland * Returns: errno 819b3b94faaSDavid Teigland */ 820b3b94faaSDavid Teigland 821b3b94faaSDavid Teigland void gfs2_log_commit(struct gfs2_sbd *sdp, struct gfs2_trans *tr) 822b3b94faaSDavid Teigland { 823b3b94faaSDavid Teigland log_refund(sdp, tr); 824d0109bfaSBob Peterson buf_lo_incore_commit(sdp, tr); 825b3b94faaSDavid Teigland 826484adff8SSteven Whitehouse up_read(&sdp->sd_log_flush_lock); 827b3b94faaSDavid Teigland 8285e687eacSBenjamin Marzinski if (atomic_read(&sdp->sd_log_pinned) > atomic_read(&sdp->sd_log_thresh1) || 8295e687eacSBenjamin Marzinski ((sdp->sd_jdesc->jd_blocks - atomic_read(&sdp->sd_log_blks_free)) > 8305e687eacSBenjamin Marzinski atomic_read(&sdp->sd_log_thresh2))) 8315e687eacSBenjamin Marzinski wake_up(&sdp->sd_logd_waitq); 832faa31ce8SSteven Whitehouse } 833b3b94faaSDavid Teigland 834b3b94faaSDavid Teigland /** 835b3b94faaSDavid Teigland * gfs2_log_shutdown - write a shutdown header into a journal 836b3b94faaSDavid Teigland * @sdp: the filesystem 837b3b94faaSDavid Teigland * 838b3b94faaSDavid Teigland */ 839b3b94faaSDavid Teigland 840b3b94faaSDavid Teigland void gfs2_log_shutdown(struct gfs2_sbd *sdp) 841b3b94faaSDavid Teigland { 842484adff8SSteven Whitehouse down_write(&sdp->sd_log_flush_lock); 843b3b94faaSDavid Teigland 844b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, !sdp->sd_log_blks_reserved); 845b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, !sdp->sd_log_num_buf); 846b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, !sdp->sd_log_num_revoke); 847b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, !sdp->sd_log_num_rg); 848b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, !sdp->sd_log_num_databuf); 849b3b94faaSDavid Teigland gfs2_assert_withdraw(sdp, list_empty(&sdp->sd_ail1_list)); 850b3b94faaSDavid Teigland 851b3b94faaSDavid Teigland sdp->sd_log_flush_head = sdp->sd_log_head; 852b3b94faaSDavid Teigland sdp->sd_log_flush_wrapped = 0; 853b3b94faaSDavid Teigland 8542332c443SRobert Peterson log_write_header(sdp, GFS2_LOG_HEAD_UNMOUNT, 8552332c443SRobert Peterson (sdp->sd_log_tail == current_tail(sdp)) ? 0 : PULL); 856b3b94faaSDavid Teigland 857fd041f0bSSteven Whitehouse gfs2_assert_warn(sdp, atomic_read(&sdp->sd_log_blks_free) == sdp->sd_jdesc->jd_blocks); 858a74604beSSteven Whitehouse gfs2_assert_warn(sdp, sdp->sd_log_head == sdp->sd_log_tail); 859a74604beSSteven Whitehouse gfs2_assert_warn(sdp, list_empty(&sdp->sd_ail2_list)); 860b3b94faaSDavid Teigland 861b3b94faaSDavid Teigland sdp->sd_log_head = sdp->sd_log_flush_head; 862b3b94faaSDavid Teigland sdp->sd_log_tail = sdp->sd_log_head; 863b3b94faaSDavid Teigland 864484adff8SSteven Whitehouse up_write(&sdp->sd_log_flush_lock); 865b3b94faaSDavid Teigland } 866b3b94faaSDavid Teigland 867a25311c8SSteven Whitehouse 868a25311c8SSteven Whitehouse /** 869a25311c8SSteven Whitehouse * gfs2_meta_syncfs - sync all the buffers in a filesystem 870a25311c8SSteven Whitehouse * @sdp: the filesystem 871a25311c8SSteven Whitehouse * 872a25311c8SSteven Whitehouse */ 873a25311c8SSteven Whitehouse 874a25311c8SSteven Whitehouse void gfs2_meta_syncfs(struct gfs2_sbd *sdp) 875a25311c8SSteven Whitehouse { 876a25311c8SSteven Whitehouse gfs2_log_flush(sdp, NULL); 877a25311c8SSteven Whitehouse for (;;) { 8785e687eacSBenjamin Marzinski gfs2_ail1_start(sdp); 879a25311c8SSteven Whitehouse if (gfs2_ail1_empty(sdp, DIO_ALL)) 880a25311c8SSteven Whitehouse break; 881a25311c8SSteven Whitehouse msleep(10); 882a25311c8SSteven Whitehouse } 883a25311c8SSteven Whitehouse } 884a25311c8SSteven Whitehouse 8855e687eacSBenjamin Marzinski static inline int gfs2_jrnl_flush_reqd(struct gfs2_sbd *sdp) 8865e687eacSBenjamin Marzinski { 8875e687eacSBenjamin Marzinski return (atomic_read(&sdp->sd_log_pinned) >= atomic_read(&sdp->sd_log_thresh1)); 8885e687eacSBenjamin Marzinski } 8895e687eacSBenjamin Marzinski 8905e687eacSBenjamin Marzinski static inline int gfs2_ail_flush_reqd(struct gfs2_sbd *sdp) 8915e687eacSBenjamin Marzinski { 8925e687eacSBenjamin Marzinski unsigned int used_blocks = sdp->sd_jdesc->jd_blocks - atomic_read(&sdp->sd_log_blks_free); 8935e687eacSBenjamin Marzinski return used_blocks >= atomic_read(&sdp->sd_log_thresh2); 8945e687eacSBenjamin Marzinski } 895ec69b188SSteven Whitehouse 896ec69b188SSteven Whitehouse /** 897ec69b188SSteven Whitehouse * gfs2_logd - Update log tail as Active Items get flushed to in-place blocks 898ec69b188SSteven Whitehouse * @sdp: Pointer to GFS2 superblock 899ec69b188SSteven Whitehouse * 900ec69b188SSteven Whitehouse * Also, periodically check to make sure that we're using the most recent 901ec69b188SSteven Whitehouse * journal index. 902ec69b188SSteven Whitehouse */ 903ec69b188SSteven Whitehouse 904ec69b188SSteven Whitehouse int gfs2_logd(void *data) 905ec69b188SSteven Whitehouse { 906ec69b188SSteven Whitehouse struct gfs2_sbd *sdp = data; 9075e687eacSBenjamin Marzinski unsigned long t = 1; 9085e687eacSBenjamin Marzinski DEFINE_WAIT(wait); 9095e687eacSBenjamin Marzinski unsigned preflush; 910ec69b188SSteven Whitehouse 911ec69b188SSteven Whitehouse while (!kthread_should_stop()) { 912ec69b188SSteven Whitehouse 9135e687eacSBenjamin Marzinski preflush = atomic_read(&sdp->sd_log_pinned); 9145e687eacSBenjamin Marzinski if (gfs2_jrnl_flush_reqd(sdp) || t == 0) { 915ec69b188SSteven Whitehouse gfs2_ail1_empty(sdp, DIO_ALL); 916ec69b188SSteven Whitehouse gfs2_log_flush(sdp, NULL); 9175e687eacSBenjamin Marzinski gfs2_ail1_empty(sdp, DIO_ALL); 918ec69b188SSteven Whitehouse } 919ec69b188SSteven Whitehouse 9205e687eacSBenjamin Marzinski if (gfs2_ail_flush_reqd(sdp)) { 9215e687eacSBenjamin Marzinski gfs2_ail1_start(sdp); 9225e687eacSBenjamin Marzinski io_schedule(); 9235e687eacSBenjamin Marzinski gfs2_ail1_empty(sdp, 0); 9245e687eacSBenjamin Marzinski gfs2_log_flush(sdp, NULL); 9255e687eacSBenjamin Marzinski gfs2_ail1_empty(sdp, DIO_ALL); 9265e687eacSBenjamin Marzinski } 9275e687eacSBenjamin Marzinski 9285e687eacSBenjamin Marzinski wake_up(&sdp->sd_log_waitq); 929ec69b188SSteven Whitehouse t = gfs2_tune_get(sdp, gt_logd_secs) * HZ; 930ec69b188SSteven Whitehouse if (freezing(current)) 931ec69b188SSteven Whitehouse refrigerator(); 9325e687eacSBenjamin Marzinski 9335e687eacSBenjamin Marzinski do { 9345e687eacSBenjamin Marzinski prepare_to_wait(&sdp->sd_logd_waitq, &wait, 9355e687eacSBenjamin Marzinski TASK_UNINTERRUPTIBLE); 9365e687eacSBenjamin Marzinski if (!gfs2_ail_flush_reqd(sdp) && 9375e687eacSBenjamin Marzinski !gfs2_jrnl_flush_reqd(sdp) && 9385e687eacSBenjamin Marzinski !kthread_should_stop()) 9395e687eacSBenjamin Marzinski t = schedule_timeout(t); 9405e687eacSBenjamin Marzinski } while(t && !gfs2_ail_flush_reqd(sdp) && 9415e687eacSBenjamin Marzinski !gfs2_jrnl_flush_reqd(sdp) && 9425e687eacSBenjamin Marzinski !kthread_should_stop()); 9435e687eacSBenjamin Marzinski finish_wait(&sdp->sd_logd_waitq, &wait); 944ec69b188SSteven Whitehouse } 945ec69b188SSteven Whitehouse 946ec69b188SSteven Whitehouse return 0; 947ec69b188SSteven Whitehouse } 948ec69b188SSteven Whitehouse 949