xref: /openbmc/linux/fs/gfs2/lops.c (revision dad30e90)
1b3b94faaSDavid Teigland /*
2b3b94faaSDavid Teigland  * Copyright (C) Sistina Software, Inc.  1997-2003 All rights reserved.
33a8a9a10SSteven Whitehouse  * Copyright (C) 2004-2006 Red Hat, Inc.  All rights reserved.
4b3b94faaSDavid Teigland  *
5b3b94faaSDavid Teigland  * This copyrighted material is made available to anyone wishing to use,
6b3b94faaSDavid Teigland  * modify, copy, or redistribute it subject to the terms and conditions
7e9fc2aa0SSteven Whitehouse  * of the GNU General Public License version 2.
8b3b94faaSDavid Teigland  */
9b3b94faaSDavid Teigland 
10b3b94faaSDavid Teigland #include <linux/sched.h>
11b3b94faaSDavid Teigland #include <linux/slab.h>
12b3b94faaSDavid Teigland #include <linux/spinlock.h>
13b3b94faaSDavid Teigland #include <linux/completion.h>
14b3b94faaSDavid Teigland #include <linux/buffer_head.h>
1575ca61c1SSteven Whitehouse #include <linux/mempool.h>
165c676f6dSSteven Whitehouse #include <linux/gfs2_ondisk.h>
17c969f58cSSteven Whitehouse #include <linux/bio.h>
18c969f58cSSteven Whitehouse #include <linux/fs.h>
19b3b94faaSDavid Teigland 
20b3b94faaSDavid Teigland #include "gfs2.h"
215c676f6dSSteven Whitehouse #include "incore.h"
222332c443SRobert Peterson #include "inode.h"
23b3b94faaSDavid Teigland #include "glock.h"
24b3b94faaSDavid Teigland #include "log.h"
25b3b94faaSDavid Teigland #include "lops.h"
26b3b94faaSDavid Teigland #include "meta_io.h"
27b3b94faaSDavid Teigland #include "recovery.h"
28b3b94faaSDavid Teigland #include "rgrp.h"
29b3b94faaSDavid Teigland #include "trans.h"
305c676f6dSSteven Whitehouse #include "util.h"
3163997775SSteven Whitehouse #include "trace_gfs2.h"
32b3b94faaSDavid Teigland 
339b9107a5SSteven Whitehouse /**
349b9107a5SSteven Whitehouse  * gfs2_pin - Pin a buffer in memory
359b9107a5SSteven Whitehouse  * @sdp: The superblock
369b9107a5SSteven Whitehouse  * @bh: The buffer to be pinned
379b9107a5SSteven Whitehouse  *
389b9107a5SSteven Whitehouse  * The log lock must be held when calling this function
399b9107a5SSteven Whitehouse  */
409b9107a5SSteven Whitehouse static void gfs2_pin(struct gfs2_sbd *sdp, struct buffer_head *bh)
419b9107a5SSteven Whitehouse {
429b9107a5SSteven Whitehouse 	struct gfs2_bufdata *bd;
439b9107a5SSteven Whitehouse 
4429687a2aSSteven Whitehouse 	BUG_ON(!current->journal_info);
459b9107a5SSteven Whitehouse 
469b9107a5SSteven Whitehouse 	clear_buffer_dirty(bh);
479b9107a5SSteven Whitehouse 	if (test_set_buffer_pinned(bh))
489b9107a5SSteven Whitehouse 		gfs2_assert_withdraw(sdp, 0);
499b9107a5SSteven Whitehouse 	if (!buffer_uptodate(bh))
509b9107a5SSteven Whitehouse 		gfs2_io_error_bh(sdp, bh);
519b9107a5SSteven Whitehouse 	bd = bh->b_private;
529b9107a5SSteven Whitehouse 	/* If this buffer is in the AIL and it has already been written
539b9107a5SSteven Whitehouse 	 * to in-place disk block, remove it from the AIL.
549b9107a5SSteven Whitehouse 	 */
55c618e87aSSteven Whitehouse 	spin_lock(&sdp->sd_ail_lock);
569b9107a5SSteven Whitehouse 	if (bd->bd_ail)
579b9107a5SSteven Whitehouse 		list_move(&bd->bd_ail_st_list, &bd->bd_ail->ai_ail2_list);
58c618e87aSSteven Whitehouse 	spin_unlock(&sdp->sd_ail_lock);
599b9107a5SSteven Whitehouse 	get_bh(bh);
605e687eacSBenjamin Marzinski 	atomic_inc(&sdp->sd_log_pinned);
6163997775SSteven Whitehouse 	trace_gfs2_pin(bd, 1);
629b9107a5SSteven Whitehouse }
639b9107a5SSteven Whitehouse 
647c9ca621SBob Peterson static bool buffer_is_rgrp(const struct gfs2_bufdata *bd)
657c9ca621SBob Peterson {
667c9ca621SBob Peterson 	return bd->bd_gl->gl_name.ln_type == LM_TYPE_RGRP;
677c9ca621SBob Peterson }
687c9ca621SBob Peterson 
697c9ca621SBob Peterson static void maybe_release_space(struct gfs2_bufdata *bd)
707c9ca621SBob Peterson {
717c9ca621SBob Peterson 	struct gfs2_glock *gl = bd->bd_gl;
727c9ca621SBob Peterson 	struct gfs2_sbd *sdp = gl->gl_sbd;
737c9ca621SBob Peterson 	struct gfs2_rgrpd *rgd = gl->gl_object;
747c9ca621SBob Peterson 	unsigned int index = bd->bd_bh->b_blocknr - gl->gl_name.ln_number;
757c9ca621SBob Peterson 	struct gfs2_bitmap *bi = rgd->rd_bits + index;
767c9ca621SBob Peterson 
777c9ca621SBob Peterson 	if (bi->bi_clone == 0)
787c9ca621SBob Peterson 		return;
797c9ca621SBob Peterson 	if (sdp->sd_args.ar_discard)
8066fc061bSSteven Whitehouse 		gfs2_rgrp_send_discards(sdp, rgd->rd_data0, bd->bd_bh, bi, 1, NULL);
817c9ca621SBob Peterson 	memcpy(bi->bi_clone + bi->bi_offset,
827c9ca621SBob Peterson 	       bd->bd_bh->b_data + bi->bi_offset, bi->bi_len);
837c9ca621SBob Peterson 	clear_bit(GBF_FULL, &bi->bi_flags);
847c9ca621SBob Peterson 	rgd->rd_free_clone = rgd->rd_free;
857c9ca621SBob Peterson }
867c9ca621SBob Peterson 
879b9107a5SSteven Whitehouse /**
889b9107a5SSteven Whitehouse  * gfs2_unpin - Unpin a buffer
899b9107a5SSteven Whitehouse  * @sdp: the filesystem the buffer belongs to
909b9107a5SSteven Whitehouse  * @bh: The buffer to unpin
919b9107a5SSteven Whitehouse  * @ai:
9229687a2aSSteven Whitehouse  * @flags: The inode dirty flags
939b9107a5SSteven Whitehouse  *
949b9107a5SSteven Whitehouse  */
959b9107a5SSteven Whitehouse 
969b9107a5SSteven Whitehouse static void gfs2_unpin(struct gfs2_sbd *sdp, struct buffer_head *bh,
979b9107a5SSteven Whitehouse 		       struct gfs2_ail *ai)
989b9107a5SSteven Whitehouse {
999b9107a5SSteven Whitehouse 	struct gfs2_bufdata *bd = bh->b_private;
1009b9107a5SSteven Whitehouse 
10129687a2aSSteven Whitehouse 	BUG_ON(!buffer_uptodate(bh));
10229687a2aSSteven Whitehouse 	BUG_ON(!buffer_pinned(bh));
1039b9107a5SSteven Whitehouse 
1049b9107a5SSteven Whitehouse 	lock_buffer(bh);
1059b9107a5SSteven Whitehouse 	mark_buffer_dirty(bh);
1069b9107a5SSteven Whitehouse 	clear_buffer_pinned(bh);
1079b9107a5SSteven Whitehouse 
1087c9ca621SBob Peterson 	if (buffer_is_rgrp(bd))
1097c9ca621SBob Peterson 		maybe_release_space(bd);
1107c9ca621SBob Peterson 
111d6a079e8SDave Chinner 	spin_lock(&sdp->sd_ail_lock);
1129b9107a5SSteven Whitehouse 	if (bd->bd_ail) {
1139b9107a5SSteven Whitehouse 		list_del(&bd->bd_ail_st_list);
1149b9107a5SSteven Whitehouse 		brelse(bh);
1159b9107a5SSteven Whitehouse 	} else {
1169b9107a5SSteven Whitehouse 		struct gfs2_glock *gl = bd->bd_gl;
1179b9107a5SSteven Whitehouse 		list_add(&bd->bd_ail_gl_list, &gl->gl_ail_list);
1189b9107a5SSteven Whitehouse 		atomic_inc(&gl->gl_ail_count);
1199b9107a5SSteven Whitehouse 	}
1209b9107a5SSteven Whitehouse 	bd->bd_ail = ai;
1219b9107a5SSteven Whitehouse 	list_add(&bd->bd_ail_st_list, &ai->ai_ail1_list);
122d6a079e8SDave Chinner 	spin_unlock(&sdp->sd_ail_lock);
123d6a079e8SDave Chinner 
12429687a2aSSteven Whitehouse 	clear_bit(GLF_LFLUSH, &bd->bd_gl->gl_flags);
12563997775SSteven Whitehouse 	trace_gfs2_pin(bd, 0);
1269b9107a5SSteven Whitehouse 	unlock_buffer(bh);
1275e687eacSBenjamin Marzinski 	atomic_dec(&sdp->sd_log_pinned);
1289b9107a5SSteven Whitehouse }
1299b9107a5SSteven Whitehouse 
130e8c92ed7SSteven Whitehouse static void gfs2_log_incr_head(struct gfs2_sbd *sdp)
13116615be1SSteven Whitehouse {
132e8c92ed7SSteven Whitehouse 	BUG_ON((sdp->sd_log_flush_head == sdp->sd_log_tail) &&
133e8c92ed7SSteven Whitehouse 	       (sdp->sd_log_flush_head != sdp->sd_log_head));
134e8c92ed7SSteven Whitehouse 
135e8c92ed7SSteven Whitehouse 	if (++sdp->sd_log_flush_head == sdp->sd_jdesc->jd_blocks) {
136e8c92ed7SSteven Whitehouse 		sdp->sd_log_flush_head = 0;
137e8c92ed7SSteven Whitehouse 		sdp->sd_log_flush_wrapped = 1;
138e8c92ed7SSteven Whitehouse 	}
13916615be1SSteven Whitehouse }
14016615be1SSteven Whitehouse 
141e8c92ed7SSteven Whitehouse static u64 gfs2_log_bmap(struct gfs2_sbd *sdp)
14216615be1SSteven Whitehouse {
143e8c92ed7SSteven Whitehouse 	unsigned int lbn = sdp->sd_log_flush_head;
144e8c92ed7SSteven Whitehouse 	struct gfs2_journal_extent *je;
145e8c92ed7SSteven Whitehouse 	u64 block;
14616615be1SSteven Whitehouse 
147e8c92ed7SSteven Whitehouse 	list_for_each_entry(je, &sdp->sd_jdesc->extent_list, extent_list) {
148e8c92ed7SSteven Whitehouse 		if (lbn >= je->lblock && lbn < je->lblock + je->blocks) {
149e8c92ed7SSteven Whitehouse 			block = je->dblock + lbn - je->lblock;
15047ac5537SSteven Whitehouse 			gfs2_log_incr_head(sdp);
151e8c92ed7SSteven Whitehouse 			return block;
152e8c92ed7SSteven Whitehouse 		}
153e8c92ed7SSteven Whitehouse 	}
15447ac5537SSteven Whitehouse 
155e8c92ed7SSteven Whitehouse 	return -1;
15647ac5537SSteven Whitehouse }
15747ac5537SSteven Whitehouse 
15847ac5537SSteven Whitehouse /**
159e8c92ed7SSteven Whitehouse  * gfs2_end_log_write_bh - end log write of pagecache data with buffers
160e8c92ed7SSteven Whitehouse  * @sdp: The superblock
161e8c92ed7SSteven Whitehouse  * @bvec: The bio_vec
162e8c92ed7SSteven Whitehouse  * @error: The i/o status
163e8c92ed7SSteven Whitehouse  *
164e8c92ed7SSteven Whitehouse  * This finds the relavent buffers and unlocks then and sets the
165e8c92ed7SSteven Whitehouse  * error flag according to the status of the i/o request. This is
166e8c92ed7SSteven Whitehouse  * used when the log is writing data which has an in-place version
167e8c92ed7SSteven Whitehouse  * that is pinned in the pagecache.
168e8c92ed7SSteven Whitehouse  */
169e8c92ed7SSteven Whitehouse 
170e8c92ed7SSteven Whitehouse static void gfs2_end_log_write_bh(struct gfs2_sbd *sdp, struct bio_vec *bvec,
171e8c92ed7SSteven Whitehouse 				  int error)
172e8c92ed7SSteven Whitehouse {
173e8c92ed7SSteven Whitehouse 	struct buffer_head *bh, *next;
174e8c92ed7SSteven Whitehouse 	struct page *page = bvec->bv_page;
175e8c92ed7SSteven Whitehouse 	unsigned size;
176e8c92ed7SSteven Whitehouse 
177e8c92ed7SSteven Whitehouse 	bh = page_buffers(page);
178e8c92ed7SSteven Whitehouse 	size = bvec->bv_len;
179e8c92ed7SSteven Whitehouse 	while (bh_offset(bh) < bvec->bv_offset)
180e8c92ed7SSteven Whitehouse 		bh = bh->b_this_page;
181e8c92ed7SSteven Whitehouse 	do {
182e8c92ed7SSteven Whitehouse 		if (error)
183e8c92ed7SSteven Whitehouse 			set_buffer_write_io_error(bh);
184e8c92ed7SSteven Whitehouse 		unlock_buffer(bh);
185e8c92ed7SSteven Whitehouse 		next = bh->b_this_page;
186e8c92ed7SSteven Whitehouse 		size -= bh->b_size;
187e8c92ed7SSteven Whitehouse 		brelse(bh);
188e8c92ed7SSteven Whitehouse 		bh = next;
189e8c92ed7SSteven Whitehouse 	} while(bh && size);
190e8c92ed7SSteven Whitehouse }
191e8c92ed7SSteven Whitehouse 
192e8c92ed7SSteven Whitehouse /**
193e8c92ed7SSteven Whitehouse  * gfs2_end_log_write - end of i/o to the log
194e8c92ed7SSteven Whitehouse  * @bio: The bio
195e8c92ed7SSteven Whitehouse  * @error: Status of i/o request
196e8c92ed7SSteven Whitehouse  *
197e8c92ed7SSteven Whitehouse  * Each bio_vec contains either data from the pagecache or data
198e8c92ed7SSteven Whitehouse  * relating to the log itself. Here we iterate over the bio_vec
199e8c92ed7SSteven Whitehouse  * array, processing both kinds of data.
20047ac5537SSteven Whitehouse  *
20147ac5537SSteven Whitehouse  */
20247ac5537SSteven Whitehouse 
203e8c92ed7SSteven Whitehouse static void gfs2_end_log_write(struct bio *bio, int error)
20447ac5537SSteven Whitehouse {
205e8c92ed7SSteven Whitehouse 	struct gfs2_sbd *sdp = bio->bi_private;
206e8c92ed7SSteven Whitehouse 	struct bio_vec *bvec;
207e8c92ed7SSteven Whitehouse 	struct page *page;
208e8c92ed7SSteven Whitehouse 	int i;
20947ac5537SSteven Whitehouse 
210e8c92ed7SSteven Whitehouse 	if (error) {
211e8c92ed7SSteven Whitehouse 		sdp->sd_log_error = error;
212e8c92ed7SSteven Whitehouse 		fs_err(sdp, "Error %d writing to log\n", error);
213e8c92ed7SSteven Whitehouse 	}
214e8c92ed7SSteven Whitehouse 
215e8c92ed7SSteven Whitehouse 	bio_for_each_segment(bvec, bio, i) {
216e8c92ed7SSteven Whitehouse 		page = bvec->bv_page;
217e8c92ed7SSteven Whitehouse 		if (page_has_buffers(page))
218e8c92ed7SSteven Whitehouse 			gfs2_end_log_write_bh(sdp, bvec, error);
219e8c92ed7SSteven Whitehouse 		else
220e8c92ed7SSteven Whitehouse 			mempool_free(page, gfs2_page_pool);
221e8c92ed7SSteven Whitehouse 	}
222e8c92ed7SSteven Whitehouse 
223e8c92ed7SSteven Whitehouse 	bio_put(bio);
22447ac5537SSteven Whitehouse 	if (atomic_dec_and_test(&sdp->sd_log_in_flight))
22547ac5537SSteven Whitehouse 		wake_up(&sdp->sd_log_flush_wait);
22647ac5537SSteven Whitehouse }
22747ac5537SSteven Whitehouse 
22847ac5537SSteven Whitehouse /**
229e8c92ed7SSteven Whitehouse  * gfs2_log_flush_bio - Submit any pending log bio
230e8c92ed7SSteven Whitehouse  * @sdp: The superblock
231e8c92ed7SSteven Whitehouse  * @rw: The rw flags
232e8c92ed7SSteven Whitehouse  *
233e8c92ed7SSteven Whitehouse  * Submit any pending part-built or full bio to the block device. If
234e8c92ed7SSteven Whitehouse  * there is no pending bio, then this is a no-op.
235e8c92ed7SSteven Whitehouse  */
236e8c92ed7SSteven Whitehouse 
237e8c92ed7SSteven Whitehouse void gfs2_log_flush_bio(struct gfs2_sbd *sdp, int rw)
238e8c92ed7SSteven Whitehouse {
239e8c92ed7SSteven Whitehouse 	if (sdp->sd_log_bio) {
240e8c92ed7SSteven Whitehouse 		atomic_inc(&sdp->sd_log_in_flight);
241e8c92ed7SSteven Whitehouse 		submit_bio(rw, sdp->sd_log_bio);
242e8c92ed7SSteven Whitehouse 		sdp->sd_log_bio = NULL;
243e8c92ed7SSteven Whitehouse 	}
244e8c92ed7SSteven Whitehouse }
245e8c92ed7SSteven Whitehouse 
246e8c92ed7SSteven Whitehouse /**
247e8c92ed7SSteven Whitehouse  * gfs2_log_alloc_bio - Allocate a new bio for log writing
248e8c92ed7SSteven Whitehouse  * @sdp: The superblock
249e8c92ed7SSteven Whitehouse  * @blkno: The next device block number we want to write to
250e8c92ed7SSteven Whitehouse  *
251e8c92ed7SSteven Whitehouse  * This should never be called when there is a cached bio in the
252e8c92ed7SSteven Whitehouse  * super block. When it returns, there will be a cached bio in the
253e8c92ed7SSteven Whitehouse  * super block which will have as many bio_vecs as the device is
254e8c92ed7SSteven Whitehouse  * happy to handle.
255e8c92ed7SSteven Whitehouse  *
256e8c92ed7SSteven Whitehouse  * Returns: Newly allocated bio
257e8c92ed7SSteven Whitehouse  */
258e8c92ed7SSteven Whitehouse 
259e8c92ed7SSteven Whitehouse static struct bio *gfs2_log_alloc_bio(struct gfs2_sbd *sdp, u64 blkno)
260e8c92ed7SSteven Whitehouse {
261e8c92ed7SSteven Whitehouse 	struct super_block *sb = sdp->sd_vfs;
262e8c92ed7SSteven Whitehouse 	unsigned nrvecs = bio_get_nr_vecs(sb->s_bdev);
263e8c92ed7SSteven Whitehouse 	struct bio *bio;
264e8c92ed7SSteven Whitehouse 
265e8c92ed7SSteven Whitehouse 	BUG_ON(sdp->sd_log_bio);
266e8c92ed7SSteven Whitehouse 
267e8c92ed7SSteven Whitehouse 	while (1) {
268e8c92ed7SSteven Whitehouse 		bio = bio_alloc(GFP_NOIO, nrvecs);
269e8c92ed7SSteven Whitehouse 		if (likely(bio))
270e8c92ed7SSteven Whitehouse 			break;
271e8c92ed7SSteven Whitehouse 		nrvecs = max(nrvecs/2, 1U);
272e8c92ed7SSteven Whitehouse 	}
273e8c92ed7SSteven Whitehouse 
274e8c92ed7SSteven Whitehouse 	bio->bi_sector = blkno * (sb->s_blocksize >> 9);
275e8c92ed7SSteven Whitehouse 	bio->bi_bdev = sb->s_bdev;
276e8c92ed7SSteven Whitehouse 	bio->bi_end_io = gfs2_end_log_write;
277e8c92ed7SSteven Whitehouse 	bio->bi_private = sdp;
278e8c92ed7SSteven Whitehouse 
279e8c92ed7SSteven Whitehouse 	sdp->sd_log_bio = bio;
280e8c92ed7SSteven Whitehouse 
281e8c92ed7SSteven Whitehouse 	return bio;
282e8c92ed7SSteven Whitehouse }
283e8c92ed7SSteven Whitehouse 
284e8c92ed7SSteven Whitehouse /**
285e8c92ed7SSteven Whitehouse  * gfs2_log_get_bio - Get cached log bio, or allocate a new one
286e8c92ed7SSteven Whitehouse  * @sdp: The superblock
287e8c92ed7SSteven Whitehouse  * @blkno: The device block number we want to write to
288e8c92ed7SSteven Whitehouse  *
289e8c92ed7SSteven Whitehouse  * If there is a cached bio, then if the next block number is sequential
290e8c92ed7SSteven Whitehouse  * with the previous one, return it, otherwise flush the bio to the
291e8c92ed7SSteven Whitehouse  * device. If there is not a cached bio, or we just flushed it, then
292e8c92ed7SSteven Whitehouse  * allocate a new one.
293e8c92ed7SSteven Whitehouse  *
294e8c92ed7SSteven Whitehouse  * Returns: The bio to use for log writes
295e8c92ed7SSteven Whitehouse  */
296e8c92ed7SSteven Whitehouse 
297e8c92ed7SSteven Whitehouse static struct bio *gfs2_log_get_bio(struct gfs2_sbd *sdp, u64 blkno)
298e8c92ed7SSteven Whitehouse {
299e8c92ed7SSteven Whitehouse 	struct bio *bio = sdp->sd_log_bio;
300e8c92ed7SSteven Whitehouse 	u64 nblk;
301e8c92ed7SSteven Whitehouse 
302e8c92ed7SSteven Whitehouse 	if (bio) {
303e8c92ed7SSteven Whitehouse 		nblk = bio->bi_sector + bio_sectors(bio);
304e8c92ed7SSteven Whitehouse 		nblk >>= sdp->sd_fsb2bb_shift;
305e8c92ed7SSteven Whitehouse 		if (blkno == nblk)
306e8c92ed7SSteven Whitehouse 			return bio;
307e8c92ed7SSteven Whitehouse 		gfs2_log_flush_bio(sdp, WRITE);
308e8c92ed7SSteven Whitehouse 	}
309e8c92ed7SSteven Whitehouse 
310e8c92ed7SSteven Whitehouse 	return gfs2_log_alloc_bio(sdp, blkno);
311e8c92ed7SSteven Whitehouse }
312e8c92ed7SSteven Whitehouse 
313e8c92ed7SSteven Whitehouse 
314e8c92ed7SSteven Whitehouse /**
315e8c92ed7SSteven Whitehouse  * gfs2_log_write - write to log
31647ac5537SSteven Whitehouse  * @sdp: the filesystem
317e8c92ed7SSteven Whitehouse  * @page: the page to write
318e8c92ed7SSteven Whitehouse  * @size: the size of the data to write
319e8c92ed7SSteven Whitehouse  * @offset: the offset within the page
32047ac5537SSteven Whitehouse  *
321e8c92ed7SSteven Whitehouse  * Try and add the page segment to the current bio. If that fails,
322e8c92ed7SSteven Whitehouse  * submit the current bio to the device and create a new one, and
323e8c92ed7SSteven Whitehouse  * then add the page segment to that.
32447ac5537SSteven Whitehouse  */
32547ac5537SSteven Whitehouse 
326e8c92ed7SSteven Whitehouse static void gfs2_log_write(struct gfs2_sbd *sdp, struct page *page,
327e8c92ed7SSteven Whitehouse 			   unsigned size, unsigned offset)
32847ac5537SSteven Whitehouse {
329e8c92ed7SSteven Whitehouse 	u64 blkno = gfs2_log_bmap(sdp);
330e8c92ed7SSteven Whitehouse 	struct bio *bio;
331e8c92ed7SSteven Whitehouse 	int ret;
33247ac5537SSteven Whitehouse 
333e8c92ed7SSteven Whitehouse 	bio = gfs2_log_get_bio(sdp, blkno);
334e8c92ed7SSteven Whitehouse 	ret = bio_add_page(bio, page, size, offset);
335e8c92ed7SSteven Whitehouse 	if (ret == 0) {
336e8c92ed7SSteven Whitehouse 		gfs2_log_flush_bio(sdp, WRITE);
337e8c92ed7SSteven Whitehouse 		bio = gfs2_log_alloc_bio(sdp, blkno);
338e8c92ed7SSteven Whitehouse 		ret = bio_add_page(bio, page, size, offset);
339e8c92ed7SSteven Whitehouse 		WARN_ON(ret == 0);
340e8c92ed7SSteven Whitehouse 	}
34147ac5537SSteven Whitehouse }
34216615be1SSteven Whitehouse 
343e8c92ed7SSteven Whitehouse /**
344e8c92ed7SSteven Whitehouse  * gfs2_log_write_bh - write a buffer's content to the log
345e8c92ed7SSteven Whitehouse  * @sdp: The super block
346e8c92ed7SSteven Whitehouse  * @bh: The buffer pointing to the in-place location
347e8c92ed7SSteven Whitehouse  *
348e8c92ed7SSteven Whitehouse  * This writes the content of the buffer to the next available location
349e8c92ed7SSteven Whitehouse  * in the log. The buffer will be unlocked once the i/o to the log has
350e8c92ed7SSteven Whitehouse  * completed.
351e8c92ed7SSteven Whitehouse  */
352e8c92ed7SSteven Whitehouse 
353e8c92ed7SSteven Whitehouse static void gfs2_log_write_bh(struct gfs2_sbd *sdp, struct buffer_head *bh)
35416615be1SSteven Whitehouse {
355e8c92ed7SSteven Whitehouse 	gfs2_log_write(sdp, bh->b_page, bh->b_size, bh_offset(bh));
356e8c92ed7SSteven Whitehouse }
357e8c92ed7SSteven Whitehouse 
358e8c92ed7SSteven Whitehouse /**
359e8c92ed7SSteven Whitehouse  * gfs2_log_write_page - write one block stored in a page, into the log
360e8c92ed7SSteven Whitehouse  * @sdp: The superblock
361e8c92ed7SSteven Whitehouse  * @page: The struct page
362e8c92ed7SSteven Whitehouse  *
363e8c92ed7SSteven Whitehouse  * This writes the first block-sized part of the page into the log. Note
364e8c92ed7SSteven Whitehouse  * that the page must have been allocated from the gfs2_page_pool mempool
365e8c92ed7SSteven Whitehouse  * and that after this has been called, ownership has been transferred and
366e8c92ed7SSteven Whitehouse  * the page may be freed at any time.
367e8c92ed7SSteven Whitehouse  */
368e8c92ed7SSteven Whitehouse 
369e8c92ed7SSteven Whitehouse void gfs2_log_write_page(struct gfs2_sbd *sdp, struct page *page)
370e8c92ed7SSteven Whitehouse {
371e8c92ed7SSteven Whitehouse 	struct super_block *sb = sdp->sd_vfs;
372e8c92ed7SSteven Whitehouse 	gfs2_log_write(sdp, page, sb->s_blocksize, 0);
373e8c92ed7SSteven Whitehouse }
374e8c92ed7SSteven Whitehouse 
375dad30e90SSteven Whitehouse static struct page *gfs2_get_log_desc(struct gfs2_sbd *sdp, u32 ld_type,
376dad30e90SSteven Whitehouse 				      u32 ld_length, u32 ld_data1)
377e8c92ed7SSteven Whitehouse {
378e8c92ed7SSteven Whitehouse 	void *page = mempool_alloc(gfs2_page_pool, GFP_NOIO);
379e8c92ed7SSteven Whitehouse 	struct gfs2_log_descriptor *ld = page_address(page);
380e8c92ed7SSteven Whitehouse 	clear_page(ld);
38116615be1SSteven Whitehouse 	ld->ld_header.mh_magic = cpu_to_be32(GFS2_MAGIC);
38216615be1SSteven Whitehouse 	ld->ld_header.mh_type = cpu_to_be32(GFS2_METATYPE_LD);
38316615be1SSteven Whitehouse 	ld->ld_header.mh_format = cpu_to_be32(GFS2_FORMAT_LD);
38416615be1SSteven Whitehouse 	ld->ld_type = cpu_to_be32(ld_type);
385dad30e90SSteven Whitehouse 	ld->ld_length = cpu_to_be32(ld_length);
386dad30e90SSteven Whitehouse 	ld->ld_data1 = cpu_to_be32(ld_data1);
38716615be1SSteven Whitehouse 	ld->ld_data2 = 0;
388e8c92ed7SSteven Whitehouse 	return page;
38916615be1SSteven Whitehouse }
39016615be1SSteven Whitehouse 
391b3b94faaSDavid Teigland static void buf_lo_add(struct gfs2_sbd *sdp, struct gfs2_log_element *le)
392b3b94faaSDavid Teigland {
393b3b94faaSDavid Teigland 	struct gfs2_bufdata *bd = container_of(le, struct gfs2_bufdata, bd_le);
3940ab7d13fSSteven Whitehouse 	struct gfs2_meta_header *mh;
395b3b94faaSDavid Teigland 	struct gfs2_trans *tr;
396b3b94faaSDavid Teigland 
3979b9107a5SSteven Whitehouse 	lock_buffer(bd->bd_bh);
3988bd95727SSteven Whitehouse 	gfs2_log_lock(sdp);
3999b9107a5SSteven Whitehouse 	if (!list_empty(&bd->bd_list_tr))
4009b9107a5SSteven Whitehouse 		goto out;
4015c676f6dSSteven Whitehouse 	tr = current->journal_info;
402b3b94faaSDavid Teigland 	tr->tr_touched = 1;
403b3b94faaSDavid Teigland 	tr->tr_num_buf++;
404b3b94faaSDavid Teigland 	list_add(&bd->bd_list_tr, &tr->tr_list_buf);
405b3b94faaSDavid Teigland 	if (!list_empty(&le->le_list))
4069b9107a5SSteven Whitehouse 		goto out;
4072bcd610dSSteven Whitehouse 	set_bit(GLF_LFLUSH, &bd->bd_gl->gl_flags);
4082bcd610dSSteven Whitehouse 	set_bit(GLF_DIRTY, &bd->bd_gl->gl_flags);
409b3b94faaSDavid Teigland 	gfs2_meta_check(sdp, bd->bd_bh);
410a98ab220SSteven Whitehouse 	gfs2_pin(sdp, bd->bd_bh);
4110ab7d13fSSteven Whitehouse 	mh = (struct gfs2_meta_header *)bd->bd_bh->b_data;
4120ab7d13fSSteven Whitehouse 	mh->__pad0 = cpu_to_be64(0);
4130ab7d13fSSteven Whitehouse 	mh->mh_jid = cpu_to_be32(sdp->sd_jdesc->jd_jid);
414b3b94faaSDavid Teigland 	sdp->sd_log_num_buf++;
415b3b94faaSDavid Teigland 	list_add(&le->le_list, &sdp->sd_log_le_buf);
416b3b94faaSDavid Teigland 	tr->tr_num_buf_new++;
4179b9107a5SSteven Whitehouse out:
4189b9107a5SSteven Whitehouse 	gfs2_log_unlock(sdp);
4199b9107a5SSteven Whitehouse 	unlock_buffer(bd->bd_bh);
420b3b94faaSDavid Teigland }
421b3b94faaSDavid Teigland 
422dad30e90SSteven Whitehouse static void gfs2_check_magic(struct buffer_head *bh)
423dad30e90SSteven Whitehouse {
424dad30e90SSteven Whitehouse 	void *kaddr;
425dad30e90SSteven Whitehouse 	__be32 *ptr;
426dad30e90SSteven Whitehouse 
427dad30e90SSteven Whitehouse 	clear_buffer_escaped(bh);
428dad30e90SSteven Whitehouse 	kaddr = kmap_atomic(bh->b_page);
429dad30e90SSteven Whitehouse 	ptr = kaddr + bh_offset(bh);
430dad30e90SSteven Whitehouse 	if (*ptr == cpu_to_be32(GFS2_MAGIC))
431dad30e90SSteven Whitehouse 		set_buffer_escaped(bh);
432dad30e90SSteven Whitehouse 	kunmap_atomic(kaddr);
433dad30e90SSteven Whitehouse }
434dad30e90SSteven Whitehouse 
435dad30e90SSteven Whitehouse static void gfs2_before_commit(struct gfs2_sbd *sdp, unsigned int limit,
436dad30e90SSteven Whitehouse 				unsigned int total, struct list_head *blist,
437dad30e90SSteven Whitehouse 				bool is_databuf)
438b3b94faaSDavid Teigland {
439b3b94faaSDavid Teigland 	struct gfs2_log_descriptor *ld;
440b3b94faaSDavid Teigland 	struct gfs2_bufdata *bd1 = NULL, *bd2;
441e8c92ed7SSteven Whitehouse 	struct page *page;
442b3b94faaSDavid Teigland 	unsigned int num;
443b3b94faaSDavid Teigland 	unsigned n;
444b3b94faaSDavid Teigland 	__be64 *ptr;
445b3b94faaSDavid Teigland 
446905d2aefSBob Peterson 	gfs2_log_lock(sdp);
447dad30e90SSteven Whitehouse 	bd1 = bd2 = list_prepare_entry(bd1, blist, bd_le.le_list);
448b3b94faaSDavid Teigland 	while(total) {
449b3b94faaSDavid Teigland 		num = total;
450b3b94faaSDavid Teigland 		if (total > limit)
451b3b94faaSDavid Teigland 			num = limit;
452905d2aefSBob Peterson 		gfs2_log_unlock(sdp);
453dad30e90SSteven Whitehouse 		page = gfs2_get_log_desc(sdp, GFS2_LOG_DESC_METADATA, num + 1, num);
454e8c92ed7SSteven Whitehouse 		ld = page_address(page);
455905d2aefSBob Peterson 		gfs2_log_lock(sdp);
456e8c92ed7SSteven Whitehouse 		ptr = (__be64 *)(ld + 1);
457b3b94faaSDavid Teigland 
458b3b94faaSDavid Teigland 		n = 0;
459dad30e90SSteven Whitehouse 		list_for_each_entry_continue(bd1, blist, bd_le.le_list) {
460b3b94faaSDavid Teigland 			*ptr++ = cpu_to_be64(bd1->bd_bh->b_blocknr);
461dad30e90SSteven Whitehouse 			if (is_databuf) {
462dad30e90SSteven Whitehouse 				gfs2_check_magic(bd1->bd_bh);
463dad30e90SSteven Whitehouse 				*ptr++ = cpu_to_be64(buffer_escaped(bd1->bd_bh) ? 1 : 0);
464dad30e90SSteven Whitehouse 			}
465b3b94faaSDavid Teigland 			if (++n >= num)
466b3b94faaSDavid Teigland 				break;
467b3b94faaSDavid Teigland 		}
468b3b94faaSDavid Teigland 
469905d2aefSBob Peterson 		gfs2_log_unlock(sdp);
470e8c92ed7SSteven Whitehouse 		gfs2_log_write_page(sdp, page);
471905d2aefSBob Peterson 		gfs2_log_lock(sdp);
472b3b94faaSDavid Teigland 
473b3b94faaSDavid Teigland 		n = 0;
474dad30e90SSteven Whitehouse 		list_for_each_entry_continue(bd2, blist, bd_le.le_list) {
47516615be1SSteven Whitehouse 			get_bh(bd2->bd_bh);
476905d2aefSBob Peterson 			gfs2_log_unlock(sdp);
47716615be1SSteven Whitehouse 			lock_buffer(bd2->bd_bh);
478dad30e90SSteven Whitehouse 
479dad30e90SSteven Whitehouse 			if (buffer_escaped(bd2->bd_bh)) {
480dad30e90SSteven Whitehouse 				void *kaddr;
481dad30e90SSteven Whitehouse 				page = mempool_alloc(gfs2_page_pool, GFP_NOIO);
482dad30e90SSteven Whitehouse 				ptr = page_address(page);
483dad30e90SSteven Whitehouse 				kaddr = kmap_atomic(bd2->bd_bh->b_page);
484dad30e90SSteven Whitehouse 				memcpy(ptr, kaddr + bh_offset(bd2->bd_bh),
485dad30e90SSteven Whitehouse 				       bd2->bd_bh->b_size);
486dad30e90SSteven Whitehouse 				kunmap_atomic(kaddr);
487dad30e90SSteven Whitehouse 				*(__be32 *)ptr = 0;
488dad30e90SSteven Whitehouse 				clear_buffer_escaped(bd2->bd_bh);
489dad30e90SSteven Whitehouse 				unlock_buffer(bd2->bd_bh);
490dad30e90SSteven Whitehouse 				brelse(bd2->bd_bh);
491dad30e90SSteven Whitehouse 				gfs2_log_write_page(sdp, page);
492dad30e90SSteven Whitehouse 			} else {
493e8c92ed7SSteven Whitehouse 				gfs2_log_write_bh(sdp, bd2->bd_bh);
494dad30e90SSteven Whitehouse 			}
495905d2aefSBob Peterson 			gfs2_log_lock(sdp);
496b3b94faaSDavid Teigland 			if (++n >= num)
497b3b94faaSDavid Teigland 				break;
498b3b94faaSDavid Teigland 		}
499b3b94faaSDavid Teigland 
500905d2aefSBob Peterson 		BUG_ON(total < num);
501b3b94faaSDavid Teigland 		total -= num;
502b3b94faaSDavid Teigland 	}
503905d2aefSBob Peterson 	gfs2_log_unlock(sdp);
504b3b94faaSDavid Teigland }
505b3b94faaSDavid Teigland 
506dad30e90SSteven Whitehouse static void buf_lo_before_commit(struct gfs2_sbd *sdp)
507dad30e90SSteven Whitehouse {
508dad30e90SSteven Whitehouse 	unsigned int limit = buf_limit(sdp); /* 503 for 4k blocks */
509dad30e90SSteven Whitehouse 
510dad30e90SSteven Whitehouse 	gfs2_before_commit(sdp, limit, sdp->sd_log_num_buf,
511dad30e90SSteven Whitehouse 			   &sdp->sd_log_le_buf, 0);
512dad30e90SSteven Whitehouse }
513dad30e90SSteven Whitehouse 
514b3b94faaSDavid Teigland static void buf_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
515b3b94faaSDavid Teigland {
516b3b94faaSDavid Teigland 	struct list_head *head = &sdp->sd_log_le_buf;
517b3b94faaSDavid Teigland 	struct gfs2_bufdata *bd;
518b3b94faaSDavid Teigland 
519b3b94faaSDavid Teigland 	while (!list_empty(head)) {
520b3b94faaSDavid Teigland 		bd = list_entry(head->next, struct gfs2_bufdata, bd_le.le_list);
521b3b94faaSDavid Teigland 		list_del_init(&bd->bd_le.le_list);
522b3b94faaSDavid Teigland 		sdp->sd_log_num_buf--;
523b3b94faaSDavid Teigland 
524a98ab220SSteven Whitehouse 		gfs2_unpin(sdp, bd->bd_bh, ai);
525b3b94faaSDavid Teigland 	}
526b3b94faaSDavid Teigland 	gfs2_assert_warn(sdp, !sdp->sd_log_num_buf);
527b3b94faaSDavid Teigland }
528b3b94faaSDavid Teigland 
529b3b94faaSDavid Teigland static void buf_lo_before_scan(struct gfs2_jdesc *jd,
53055167622SAl Viro 			       struct gfs2_log_header_host *head, int pass)
531b3b94faaSDavid Teigland {
532feaa7bbaSSteven Whitehouse 	struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
533b3b94faaSDavid Teigland 
534b3b94faaSDavid Teigland 	if (pass != 0)
535b3b94faaSDavid Teigland 		return;
536b3b94faaSDavid Teigland 
537b3b94faaSDavid Teigland 	sdp->sd_found_blocks = 0;
538b3b94faaSDavid Teigland 	sdp->sd_replayed_blocks = 0;
539b3b94faaSDavid Teigland }
540b3b94faaSDavid Teigland 
541b3b94faaSDavid Teigland static int buf_lo_scan_elements(struct gfs2_jdesc *jd, unsigned int start,
542b3b94faaSDavid Teigland 				struct gfs2_log_descriptor *ld, __be64 *ptr,
543b3b94faaSDavid Teigland 				int pass)
544b3b94faaSDavid Teigland {
545feaa7bbaSSteven Whitehouse 	struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
546feaa7bbaSSteven Whitehouse 	struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
5475c676f6dSSteven Whitehouse 	struct gfs2_glock *gl = ip->i_gl;
548b3b94faaSDavid Teigland 	unsigned int blks = be32_to_cpu(ld->ld_data1);
549b3b94faaSDavid Teigland 	struct buffer_head *bh_log, *bh_ip;
550cd915493SSteven Whitehouse 	u64 blkno;
551b3b94faaSDavid Teigland 	int error = 0;
552b3b94faaSDavid Teigland 
553b3b94faaSDavid Teigland 	if (pass != 1 || be32_to_cpu(ld->ld_type) != GFS2_LOG_DESC_METADATA)
554b3b94faaSDavid Teigland 		return 0;
555b3b94faaSDavid Teigland 
556b3b94faaSDavid Teigland 	gfs2_replay_incr_blk(sdp, &start);
557b3b94faaSDavid Teigland 
558b3b94faaSDavid Teigland 	for (; blks; gfs2_replay_incr_blk(sdp, &start), blks--) {
559b3b94faaSDavid Teigland 		blkno = be64_to_cpu(*ptr++);
560b3b94faaSDavid Teigland 
561b3b94faaSDavid Teigland 		sdp->sd_found_blocks++;
562b3b94faaSDavid Teigland 
563b3b94faaSDavid Teigland 		if (gfs2_revoke_check(sdp, blkno, start))
564b3b94faaSDavid Teigland 			continue;
565b3b94faaSDavid Teigland 
566b3b94faaSDavid Teigland 		error = gfs2_replay_read_block(jd, start, &bh_log);
567b3b94faaSDavid Teigland 		if (error)
568b3b94faaSDavid Teigland 			return error;
569b3b94faaSDavid Teigland 
570b3b94faaSDavid Teigland 		bh_ip = gfs2_meta_new(gl, blkno);
571b3b94faaSDavid Teigland 		memcpy(bh_ip->b_data, bh_log->b_data, bh_log->b_size);
572b3b94faaSDavid Teigland 
573b3b94faaSDavid Teigland 		if (gfs2_meta_check(sdp, bh_ip))
574b3b94faaSDavid Teigland 			error = -EIO;
575b3b94faaSDavid Teigland 		else
576b3b94faaSDavid Teigland 			mark_buffer_dirty(bh_ip);
577b3b94faaSDavid Teigland 
578b3b94faaSDavid Teigland 		brelse(bh_log);
579b3b94faaSDavid Teigland 		brelse(bh_ip);
580b3b94faaSDavid Teigland 
581b3b94faaSDavid Teigland 		if (error)
582b3b94faaSDavid Teigland 			break;
583b3b94faaSDavid Teigland 
584b3b94faaSDavid Teigland 		sdp->sd_replayed_blocks++;
585b3b94faaSDavid Teigland 	}
586b3b94faaSDavid Teigland 
587b3b94faaSDavid Teigland 	return error;
588b3b94faaSDavid Teigland }
589b3b94faaSDavid Teigland 
590b3b94faaSDavid Teigland static void buf_lo_after_scan(struct gfs2_jdesc *jd, int error, int pass)
591b3b94faaSDavid Teigland {
592feaa7bbaSSteven Whitehouse 	struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
593feaa7bbaSSteven Whitehouse 	struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
594b3b94faaSDavid Teigland 
595b3b94faaSDavid Teigland 	if (error) {
5967276b3b0SSteven Whitehouse 		gfs2_meta_sync(ip->i_gl);
597b3b94faaSDavid Teigland 		return;
598b3b94faaSDavid Teigland 	}
599b3b94faaSDavid Teigland 	if (pass != 1)
600b3b94faaSDavid Teigland 		return;
601b3b94faaSDavid Teigland 
6027276b3b0SSteven Whitehouse 	gfs2_meta_sync(ip->i_gl);
603b3b94faaSDavid Teigland 
604b3b94faaSDavid Teigland 	fs_info(sdp, "jid=%u: Replayed %u of %u blocks\n",
605b3b94faaSDavid Teigland 	        jd->jd_jid, sdp->sd_replayed_blocks, sdp->sd_found_blocks);
606b3b94faaSDavid Teigland }
607b3b94faaSDavid Teigland 
608b3b94faaSDavid Teigland static void revoke_lo_add(struct gfs2_sbd *sdp, struct gfs2_log_element *le)
609b3b94faaSDavid Teigland {
610f42ab085SSteven Whitehouse 	struct gfs2_bufdata *bd = container_of(le, struct gfs2_bufdata, bd_le);
611f42ab085SSteven Whitehouse 	struct gfs2_glock *gl = bd->bd_gl;
612b3b94faaSDavid Teigland 	struct gfs2_trans *tr;
613b3b94faaSDavid Teigland 
6145c676f6dSSteven Whitehouse 	tr = current->journal_info;
615b3b94faaSDavid Teigland 	tr->tr_touched = 1;
616b3b94faaSDavid Teigland 	tr->tr_num_revoke++;
617b3b94faaSDavid Teigland 	sdp->sd_log_num_revoke++;
618f42ab085SSteven Whitehouse 	atomic_inc(&gl->gl_revokes);
619f42ab085SSteven Whitehouse 	set_bit(GLF_LFLUSH, &gl->gl_flags);
620b3b94faaSDavid Teigland 	list_add(&le->le_list, &sdp->sd_log_le_revoke);
621b3b94faaSDavid Teigland }
622b3b94faaSDavid Teigland 
623b3b94faaSDavid Teigland static void revoke_lo_before_commit(struct gfs2_sbd *sdp)
624b3b94faaSDavid Teigland {
625b3b94faaSDavid Teigland 	struct gfs2_log_descriptor *ld;
626b3b94faaSDavid Teigland 	struct gfs2_meta_header *mh;
627b3b94faaSDavid Teigland 	unsigned int offset;
628b3b94faaSDavid Teigland 	struct list_head *head = &sdp->sd_log_le_revoke;
62982e86087SSteven Whitehouse 	struct gfs2_bufdata *bd;
630e8c92ed7SSteven Whitehouse 	struct page *page;
631dad30e90SSteven Whitehouse 	unsigned int length;
632b3b94faaSDavid Teigland 
633b3b94faaSDavid Teigland 	if (!sdp->sd_log_num_revoke)
634b3b94faaSDavid Teigland 		return;
635b3b94faaSDavid Teigland 
636dad30e90SSteven Whitehouse 	length = gfs2_struct2blk(sdp, sdp->sd_log_num_revoke, sizeof(u64));
637dad30e90SSteven Whitehouse 	page = gfs2_get_log_desc(sdp, GFS2_LOG_DESC_REVOKE, length, sdp->sd_log_num_revoke);
638e8c92ed7SSteven Whitehouse 	ld = page_address(page);
639b3b94faaSDavid Teigland 	offset = sizeof(struct gfs2_log_descriptor);
640b3b94faaSDavid Teigland 
641f42ab085SSteven Whitehouse 	list_for_each_entry(bd, head, bd_le.le_list) {
642b3b94faaSDavid Teigland 		sdp->sd_log_num_revoke--;
643b3b94faaSDavid Teigland 
644cd915493SSteven Whitehouse 		if (offset + sizeof(u64) > sdp->sd_sb.sb_bsize) {
645b3b94faaSDavid Teigland 
646e8c92ed7SSteven Whitehouse 			gfs2_log_write_page(sdp, page);
647e8c92ed7SSteven Whitehouse 			page = mempool_alloc(gfs2_page_pool, GFP_NOIO);
648e8c92ed7SSteven Whitehouse 			mh = page_address(page);
649e8c92ed7SSteven Whitehouse 			clear_page(mh);
650b3b94faaSDavid Teigland 			mh->mh_magic = cpu_to_be32(GFS2_MAGIC);
651e3167dedSSteven Whitehouse 			mh->mh_type = cpu_to_be32(GFS2_METATYPE_LB);
652e3167dedSSteven Whitehouse 			mh->mh_format = cpu_to_be32(GFS2_FORMAT_LB);
653b3b94faaSDavid Teigland 			offset = sizeof(struct gfs2_meta_header);
654b3b94faaSDavid Teigland 		}
655b3b94faaSDavid Teigland 
656e8c92ed7SSteven Whitehouse 		*(__be64 *)(page_address(page) + offset) = cpu_to_be64(bd->bd_blkno);
657cd915493SSteven Whitehouse 		offset += sizeof(u64);
658b3b94faaSDavid Teigland 	}
659b3b94faaSDavid Teigland 	gfs2_assert_withdraw(sdp, !sdp->sd_log_num_revoke);
660b3b94faaSDavid Teigland 
661e8c92ed7SSteven Whitehouse 	gfs2_log_write_page(sdp, page);
662b3b94faaSDavid Teigland }
663b3b94faaSDavid Teigland 
664f42ab085SSteven Whitehouse static void revoke_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
665f42ab085SSteven Whitehouse {
666f42ab085SSteven Whitehouse 	struct list_head *head = &sdp->sd_log_le_revoke;
667f42ab085SSteven Whitehouse 	struct gfs2_bufdata *bd;
668f42ab085SSteven Whitehouse 	struct gfs2_glock *gl;
669f42ab085SSteven Whitehouse 
670f42ab085SSteven Whitehouse 	while (!list_empty(head)) {
671f42ab085SSteven Whitehouse 		bd = list_entry(head->next, struct gfs2_bufdata, bd_le.le_list);
672f42ab085SSteven Whitehouse 		list_del_init(&bd->bd_le.le_list);
673f42ab085SSteven Whitehouse 		gl = bd->bd_gl;
674f42ab085SSteven Whitehouse 		atomic_dec(&gl->gl_revokes);
675f42ab085SSteven Whitehouse 		clear_bit(GLF_LFLUSH, &gl->gl_flags);
676f42ab085SSteven Whitehouse 		kmem_cache_free(gfs2_bufdata_cachep, bd);
677f42ab085SSteven Whitehouse 	}
678f42ab085SSteven Whitehouse }
679f42ab085SSteven Whitehouse 
680b3b94faaSDavid Teigland static void revoke_lo_before_scan(struct gfs2_jdesc *jd,
68155167622SAl Viro 				  struct gfs2_log_header_host *head, int pass)
682b3b94faaSDavid Teigland {
683feaa7bbaSSteven Whitehouse 	struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
684b3b94faaSDavid Teigland 
685b3b94faaSDavid Teigland 	if (pass != 0)
686b3b94faaSDavid Teigland 		return;
687b3b94faaSDavid Teigland 
688b3b94faaSDavid Teigland 	sdp->sd_found_revokes = 0;
689b3b94faaSDavid Teigland 	sdp->sd_replay_tail = head->lh_tail;
690b3b94faaSDavid Teigland }
691b3b94faaSDavid Teigland 
692b3b94faaSDavid Teigland static int revoke_lo_scan_elements(struct gfs2_jdesc *jd, unsigned int start,
693b3b94faaSDavid Teigland 				   struct gfs2_log_descriptor *ld, __be64 *ptr,
694b3b94faaSDavid Teigland 				   int pass)
695b3b94faaSDavid Teigland {
696feaa7bbaSSteven Whitehouse 	struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
697b3b94faaSDavid Teigland 	unsigned int blks = be32_to_cpu(ld->ld_length);
698b3b94faaSDavid Teigland 	unsigned int revokes = be32_to_cpu(ld->ld_data1);
699b3b94faaSDavid Teigland 	struct buffer_head *bh;
700b3b94faaSDavid Teigland 	unsigned int offset;
701cd915493SSteven Whitehouse 	u64 blkno;
702b3b94faaSDavid Teigland 	int first = 1;
703b3b94faaSDavid Teigland 	int error;
704b3b94faaSDavid Teigland 
705b3b94faaSDavid Teigland 	if (pass != 0 || be32_to_cpu(ld->ld_type) != GFS2_LOG_DESC_REVOKE)
706b3b94faaSDavid Teigland 		return 0;
707b3b94faaSDavid Teigland 
708b3b94faaSDavid Teigland 	offset = sizeof(struct gfs2_log_descriptor);
709b3b94faaSDavid Teigland 
710b3b94faaSDavid Teigland 	for (; blks; gfs2_replay_incr_blk(sdp, &start), blks--) {
711b3b94faaSDavid Teigland 		error = gfs2_replay_read_block(jd, start, &bh);
712b3b94faaSDavid Teigland 		if (error)
713b3b94faaSDavid Teigland 			return error;
714b3b94faaSDavid Teigland 
715b3b94faaSDavid Teigland 		if (!first)
716b3b94faaSDavid Teigland 			gfs2_metatype_check(sdp, bh, GFS2_METATYPE_LB);
717b3b94faaSDavid Teigland 
718cd915493SSteven Whitehouse 		while (offset + sizeof(u64) <= sdp->sd_sb.sb_bsize) {
719b3b94faaSDavid Teigland 			blkno = be64_to_cpu(*(__be64 *)(bh->b_data + offset));
720b3b94faaSDavid Teigland 
721b3b94faaSDavid Teigland 			error = gfs2_revoke_add(sdp, blkno, start);
7223ad62e87SBob Peterson 			if (error < 0) {
7233ad62e87SBob Peterson 				brelse(bh);
724b3b94faaSDavid Teigland 				return error;
7253ad62e87SBob Peterson 			}
726b3b94faaSDavid Teigland 			else if (error)
727b3b94faaSDavid Teigland 				sdp->sd_found_revokes++;
728b3b94faaSDavid Teigland 
729b3b94faaSDavid Teigland 			if (!--revokes)
730b3b94faaSDavid Teigland 				break;
731cd915493SSteven Whitehouse 			offset += sizeof(u64);
732b3b94faaSDavid Teigland 		}
733b3b94faaSDavid Teigland 
734b3b94faaSDavid Teigland 		brelse(bh);
735b3b94faaSDavid Teigland 		offset = sizeof(struct gfs2_meta_header);
736b3b94faaSDavid Teigland 		first = 0;
737b3b94faaSDavid Teigland 	}
738b3b94faaSDavid Teigland 
739b3b94faaSDavid Teigland 	return 0;
740b3b94faaSDavid Teigland }
741b3b94faaSDavid Teigland 
742b3b94faaSDavid Teigland static void revoke_lo_after_scan(struct gfs2_jdesc *jd, int error, int pass)
743b3b94faaSDavid Teigland {
744feaa7bbaSSteven Whitehouse 	struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
745b3b94faaSDavid Teigland 
746b3b94faaSDavid Teigland 	if (error) {
747b3b94faaSDavid Teigland 		gfs2_revoke_clean(sdp);
748b3b94faaSDavid Teigland 		return;
749b3b94faaSDavid Teigland 	}
750b3b94faaSDavid Teigland 	if (pass != 1)
751b3b94faaSDavid Teigland 		return;
752b3b94faaSDavid Teigland 
753b3b94faaSDavid Teigland 	fs_info(sdp, "jid=%u: Found %u revoke tags\n",
754b3b94faaSDavid Teigland 	        jd->jd_jid, sdp->sd_found_revokes);
755b3b94faaSDavid Teigland 
756b3b94faaSDavid Teigland 	gfs2_revoke_clean(sdp);
757b3b94faaSDavid Teigland }
758b3b94faaSDavid Teigland 
75918ec7d5cSSteven Whitehouse /**
76018ec7d5cSSteven Whitehouse  * databuf_lo_add - Add a databuf to the transaction.
76118ec7d5cSSteven Whitehouse  *
76218ec7d5cSSteven Whitehouse  * This is used in two distinct cases:
76318ec7d5cSSteven Whitehouse  * i) In ordered write mode
76418ec7d5cSSteven Whitehouse  *    We put the data buffer on a list so that we can ensure that its
76518ec7d5cSSteven Whitehouse  *    synced to disk at the right time
76618ec7d5cSSteven Whitehouse  * ii) In journaled data mode
76718ec7d5cSSteven Whitehouse  *    We need to journal the data block in the same way as metadata in
76818ec7d5cSSteven Whitehouse  *    the functions above. The difference is that here we have a tag
76918ec7d5cSSteven Whitehouse  *    which is two __be64's being the block number (as per meta data)
77018ec7d5cSSteven Whitehouse  *    and a flag which says whether the data block needs escaping or
77118ec7d5cSSteven Whitehouse  *    not. This means we need a new log entry for each 251 or so data
77218ec7d5cSSteven Whitehouse  *    blocks, which isn't an enormous overhead but twice as much as
77318ec7d5cSSteven Whitehouse  *    for normal metadata blocks.
77418ec7d5cSSteven Whitehouse  */
775b3b94faaSDavid Teigland static void databuf_lo_add(struct gfs2_sbd *sdp, struct gfs2_log_element *le)
776b3b94faaSDavid Teigland {
77718ec7d5cSSteven Whitehouse 	struct gfs2_bufdata *bd = container_of(le, struct gfs2_bufdata, bd_le);
7785c676f6dSSteven Whitehouse 	struct gfs2_trans *tr = current->journal_info;
77918ec7d5cSSteven Whitehouse 	struct address_space *mapping = bd->bd_bh->b_page->mapping;
780feaa7bbaSSteven Whitehouse 	struct gfs2_inode *ip = GFS2_I(mapping->host);
781b3b94faaSDavid Teigland 
7829b9107a5SSteven Whitehouse 	lock_buffer(bd->bd_bh);
7838bd95727SSteven Whitehouse 	gfs2_log_lock(sdp);
7849ff8ec32SSteven Whitehouse 	if (tr) {
7859b9107a5SSteven Whitehouse 		if (!list_empty(&bd->bd_list_tr))
7869b9107a5SSteven Whitehouse 			goto out;
78718ec7d5cSSteven Whitehouse 		tr->tr_touched = 1;
788773ed1a0SRobert Peterson 		if (gfs2_is_jdata(ip)) {
78918ec7d5cSSteven Whitehouse 			tr->tr_num_buf++;
79018ec7d5cSSteven Whitehouse 			list_add(&bd->bd_list_tr, &tr->tr_list_buf);
791773ed1a0SRobert Peterson 		}
7929ff8ec32SSteven Whitehouse 	}
793ddf4b426SBenjamin Marzinski 	if (!list_empty(&le->le_list))
7949b9107a5SSteven Whitehouse 		goto out;
7952332c443SRobert Peterson 
7962bcd610dSSteven Whitehouse 	set_bit(GLF_LFLUSH, &bd->bd_gl->gl_flags);
7972bcd610dSSteven Whitehouse 	set_bit(GLF_DIRTY, &bd->bd_gl->gl_flags);
7982332c443SRobert Peterson 	if (gfs2_is_jdata(ip)) {
7992332c443SRobert Peterson 		gfs2_pin(sdp, bd->bd_bh);
8002332c443SRobert Peterson 		tr->tr_num_databuf_new++;
801bdcb8856SBob Peterson 		sdp->sd_log_num_databuf++;
802e5884636SDave Chinner 		list_add_tail(&le->le_list, &sdp->sd_log_le_databuf);
803d7b616e2SSteven Whitehouse 	} else {
804e5884636SDave Chinner 		list_add_tail(&le->le_list, &sdp->sd_log_le_ordered);
805d7b616e2SSteven Whitehouse 	}
8069b9107a5SSteven Whitehouse out:
807b3b94faaSDavid Teigland 	gfs2_log_unlock(sdp);
8089b9107a5SSteven Whitehouse 	unlock_buffer(bd->bd_bh);
809b3b94faaSDavid Teigland }
810b3b94faaSDavid Teigland 
81118ec7d5cSSteven Whitehouse /**
81218ec7d5cSSteven Whitehouse  * databuf_lo_before_commit - Scan the data buffers, writing as we go
81318ec7d5cSSteven Whitehouse  *
81418ec7d5cSSteven Whitehouse  */
815d7b616e2SSteven Whitehouse 
816b3b94faaSDavid Teigland static void databuf_lo_before_commit(struct gfs2_sbd *sdp)
817b3b94faaSDavid Teigland {
818dad30e90SSteven Whitehouse 	unsigned int limit = buf_limit(sdp) / 2;
819b3b94faaSDavid Teigland 
820dad30e90SSteven Whitehouse 	gfs2_before_commit(sdp, limit, sdp->sd_log_num_databuf,
821dad30e90SSteven Whitehouse 			   &sdp->sd_log_le_databuf, 1);
822b3b94faaSDavid Teigland }
823b3b94faaSDavid Teigland 
82418ec7d5cSSteven Whitehouse static int databuf_lo_scan_elements(struct gfs2_jdesc *jd, unsigned int start,
82518ec7d5cSSteven Whitehouse 				    struct gfs2_log_descriptor *ld,
82618ec7d5cSSteven Whitehouse 				    __be64 *ptr, int pass)
82718ec7d5cSSteven Whitehouse {
828feaa7bbaSSteven Whitehouse 	struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
829feaa7bbaSSteven Whitehouse 	struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
8305c676f6dSSteven Whitehouse 	struct gfs2_glock *gl = ip->i_gl;
83118ec7d5cSSteven Whitehouse 	unsigned int blks = be32_to_cpu(ld->ld_data1);
83218ec7d5cSSteven Whitehouse 	struct buffer_head *bh_log, *bh_ip;
833cd915493SSteven Whitehouse 	u64 blkno;
834cd915493SSteven Whitehouse 	u64 esc;
83518ec7d5cSSteven Whitehouse 	int error = 0;
83618ec7d5cSSteven Whitehouse 
83718ec7d5cSSteven Whitehouse 	if (pass != 1 || be32_to_cpu(ld->ld_type) != GFS2_LOG_DESC_JDATA)
83818ec7d5cSSteven Whitehouse 		return 0;
83918ec7d5cSSteven Whitehouse 
84018ec7d5cSSteven Whitehouse 	gfs2_replay_incr_blk(sdp, &start);
84118ec7d5cSSteven Whitehouse 	for (; blks; gfs2_replay_incr_blk(sdp, &start), blks--) {
84218ec7d5cSSteven Whitehouse 		blkno = be64_to_cpu(*ptr++);
84318ec7d5cSSteven Whitehouse 		esc = be64_to_cpu(*ptr++);
84418ec7d5cSSteven Whitehouse 
84518ec7d5cSSteven Whitehouse 		sdp->sd_found_blocks++;
84618ec7d5cSSteven Whitehouse 
84718ec7d5cSSteven Whitehouse 		if (gfs2_revoke_check(sdp, blkno, start))
84818ec7d5cSSteven Whitehouse 			continue;
84918ec7d5cSSteven Whitehouse 
85018ec7d5cSSteven Whitehouse 		error = gfs2_replay_read_block(jd, start, &bh_log);
85118ec7d5cSSteven Whitehouse 		if (error)
85218ec7d5cSSteven Whitehouse 			return error;
85318ec7d5cSSteven Whitehouse 
85418ec7d5cSSteven Whitehouse 		bh_ip = gfs2_meta_new(gl, blkno);
85518ec7d5cSSteven Whitehouse 		memcpy(bh_ip->b_data, bh_log->b_data, bh_log->b_size);
85618ec7d5cSSteven Whitehouse 
85718ec7d5cSSteven Whitehouse 		/* Unescape */
85818ec7d5cSSteven Whitehouse 		if (esc) {
85918ec7d5cSSteven Whitehouse 			__be32 *eptr = (__be32 *)bh_ip->b_data;
86018ec7d5cSSteven Whitehouse 			*eptr = cpu_to_be32(GFS2_MAGIC);
86118ec7d5cSSteven Whitehouse 		}
86218ec7d5cSSteven Whitehouse 		mark_buffer_dirty(bh_ip);
86318ec7d5cSSteven Whitehouse 
86418ec7d5cSSteven Whitehouse 		brelse(bh_log);
86518ec7d5cSSteven Whitehouse 		brelse(bh_ip);
86618ec7d5cSSteven Whitehouse 
86718ec7d5cSSteven Whitehouse 		sdp->sd_replayed_blocks++;
86818ec7d5cSSteven Whitehouse 	}
86918ec7d5cSSteven Whitehouse 
87018ec7d5cSSteven Whitehouse 	return error;
87118ec7d5cSSteven Whitehouse }
87218ec7d5cSSteven Whitehouse 
87318ec7d5cSSteven Whitehouse /* FIXME: sort out accounting for log blocks etc. */
87418ec7d5cSSteven Whitehouse 
87518ec7d5cSSteven Whitehouse static void databuf_lo_after_scan(struct gfs2_jdesc *jd, int error, int pass)
87618ec7d5cSSteven Whitehouse {
877feaa7bbaSSteven Whitehouse 	struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
878feaa7bbaSSteven Whitehouse 	struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
87918ec7d5cSSteven Whitehouse 
88018ec7d5cSSteven Whitehouse 	if (error) {
8817276b3b0SSteven Whitehouse 		gfs2_meta_sync(ip->i_gl);
88218ec7d5cSSteven Whitehouse 		return;
88318ec7d5cSSteven Whitehouse 	}
88418ec7d5cSSteven Whitehouse 	if (pass != 1)
88518ec7d5cSSteven Whitehouse 		return;
88618ec7d5cSSteven Whitehouse 
88718ec7d5cSSteven Whitehouse 	/* data sync? */
8887276b3b0SSteven Whitehouse 	gfs2_meta_sync(ip->i_gl);
88918ec7d5cSSteven Whitehouse 
89018ec7d5cSSteven Whitehouse 	fs_info(sdp, "jid=%u: Replayed %u of %u data blocks\n",
89118ec7d5cSSteven Whitehouse 		jd->jd_jid, sdp->sd_replayed_blocks, sdp->sd_found_blocks);
89218ec7d5cSSteven Whitehouse }
89318ec7d5cSSteven Whitehouse 
89418ec7d5cSSteven Whitehouse static void databuf_lo_after_commit(struct gfs2_sbd *sdp, struct gfs2_ail *ai)
89518ec7d5cSSteven Whitehouse {
89618ec7d5cSSteven Whitehouse 	struct list_head *head = &sdp->sd_log_le_databuf;
89718ec7d5cSSteven Whitehouse 	struct gfs2_bufdata *bd;
89818ec7d5cSSteven Whitehouse 
89918ec7d5cSSteven Whitehouse 	while (!list_empty(head)) {
90018ec7d5cSSteven Whitehouse 		bd = list_entry(head->next, struct gfs2_bufdata, bd_le.le_list);
901b8e1aabfSSteven Whitehouse 		list_del_init(&bd->bd_le.le_list);
90218ec7d5cSSteven Whitehouse 		sdp->sd_log_num_databuf--;
90318ec7d5cSSteven Whitehouse 		gfs2_unpin(sdp, bd->bd_bh, ai);
90418ec7d5cSSteven Whitehouse 	}
90518ec7d5cSSteven Whitehouse 	gfs2_assert_warn(sdp, !sdp->sd_log_num_databuf);
90618ec7d5cSSteven Whitehouse }
90718ec7d5cSSteven Whitehouse 
90818ec7d5cSSteven Whitehouse 
909b09e593dSSteven Whitehouse const struct gfs2_log_operations gfs2_buf_lops = {
910b3b94faaSDavid Teigland 	.lo_add = buf_lo_add,
911b3b94faaSDavid Teigland 	.lo_before_commit = buf_lo_before_commit,
912b3b94faaSDavid Teigland 	.lo_after_commit = buf_lo_after_commit,
913b3b94faaSDavid Teigland 	.lo_before_scan = buf_lo_before_scan,
914b3b94faaSDavid Teigland 	.lo_scan_elements = buf_lo_scan_elements,
915b3b94faaSDavid Teigland 	.lo_after_scan = buf_lo_after_scan,
916ea67eedbSSteven Whitehouse 	.lo_name = "buf",
917b3b94faaSDavid Teigland };
918b3b94faaSDavid Teigland 
919b09e593dSSteven Whitehouse const struct gfs2_log_operations gfs2_revoke_lops = {
920b3b94faaSDavid Teigland 	.lo_add = revoke_lo_add,
921b3b94faaSDavid Teigland 	.lo_before_commit = revoke_lo_before_commit,
922f42ab085SSteven Whitehouse 	.lo_after_commit = revoke_lo_after_commit,
923b3b94faaSDavid Teigland 	.lo_before_scan = revoke_lo_before_scan,
924b3b94faaSDavid Teigland 	.lo_scan_elements = revoke_lo_scan_elements,
925b3b94faaSDavid Teigland 	.lo_after_scan = revoke_lo_after_scan,
926ea67eedbSSteven Whitehouse 	.lo_name = "revoke",
927b3b94faaSDavid Teigland };
928b3b94faaSDavid Teigland 
929b09e593dSSteven Whitehouse const struct gfs2_log_operations gfs2_rg_lops = {
930ea67eedbSSteven Whitehouse 	.lo_name = "rg",
931b3b94faaSDavid Teigland };
932b3b94faaSDavid Teigland 
933b09e593dSSteven Whitehouse const struct gfs2_log_operations gfs2_databuf_lops = {
934b3b94faaSDavid Teigland 	.lo_add = databuf_lo_add,
935b3b94faaSDavid Teigland 	.lo_before_commit = databuf_lo_before_commit,
93618ec7d5cSSteven Whitehouse 	.lo_after_commit = databuf_lo_after_commit,
93718ec7d5cSSteven Whitehouse 	.lo_scan_elements = databuf_lo_scan_elements,
93818ec7d5cSSteven Whitehouse 	.lo_after_scan = databuf_lo_after_scan,
939ea67eedbSSteven Whitehouse 	.lo_name = "databuf",
940b3b94faaSDavid Teigland };
941b3b94faaSDavid Teigland 
942b09e593dSSteven Whitehouse const struct gfs2_log_operations *gfs2_log_ops[] = {
943b3b94faaSDavid Teigland 	&gfs2_databuf_lops,
94416615be1SSteven Whitehouse 	&gfs2_buf_lops,
94516615be1SSteven Whitehouse 	&gfs2_rg_lops,
94616615be1SSteven Whitehouse 	&gfs2_revoke_lops,
947ea67eedbSSteven Whitehouse 	NULL,
948b3b94faaSDavid Teigland };
949b3b94faaSDavid Teigland 
950