/*
   drbd_worker.c

   This file is part of DRBD by Philipp Reisner and Lars Ellenberg.

   Copyright (C) 2001-2008, LINBIT Information Technologies GmbH.
   Copyright (C) 1999-2008, Philipp Reisner <philipp.reisner@linbit.com>.
   Copyright (C) 2002-2008, Lars Ellenberg <lars.ellenberg@linbit.com>.

   drbd is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   drbd is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with drbd; see the file COPYING.  If not, write to
   the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.

 */

#include <linux/module.h>
#include <linux/drbd.h>
#include <linux/sched.h>
#include <linux/smp_lock.h>
#include <linux/wait.h>
#include <linux/mm.h>
#include <linux/memcontrol.h>
#include <linux/mm_inline.h>
#include <linux/slab.h>
#include <linux/random.h>
#include <linux/string.h>
#include <linux/scatterlist.h>

#include "drbd_int.h"
#include "drbd_req.h"

#define SLEEP_TIME (HZ/10)

static int w_make_ov_request(struct drbd_conf *mdev, struct drbd_work *w, int cancel);



/* defined here:
   drbd_md_io_complete
   drbd_endio_sec
   drbd_endio_pri

 * more endio handlers:
   atodb_endio in drbd_actlog.c
   drbd_bm_async_io_complete in drbd_bitmap.c

 * For all these callbacks, note the following:
 * The callbacks will be called in irq context by the IDE drivers,
 * and in Softirqs/Tasklets/BH context by the SCSI drivers.
 * Try to get the locking right :)
 *
 */
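/* Concretely, the handlers below therefore take mdev->req_lock with
 * spin_lock_irqsave()/spin_unlock_irqrestore(), which is correct from both
 * hard-irq and softirq completion context. */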


/* About the global_state_lock
   Each state transition on a device holds a read lock. In case we have
   to evaluate the sync-after dependencies, we grab a write lock, because
   we need stable states on all devices for that.  */
rwlock_t global_state_lock;
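/* Usage sketch (illustrative only, not the literal call sites):
 *
 *	read_lock(&global_state_lock);	changing the state of one device
 *	write_lock(&global_state_lock);	evaluating sync-after dependencies,
 *					which needs all device states stable
 */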

/* used for synchronous meta data and bitmap IO
 * submitted by drbd_md_sync_page_io()
 */
void drbd_md_io_complete(struct bio *bio, int error)
{
	struct drbd_md_io *md_io;

	md_io = (struct drbd_md_io *)bio->bi_private;
	md_io->error = error;

	complete(&md_io->event);
}
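/* The submitting side pairs with this roughly as follows (sketch only,
 * cf. drbd_md_sync_page_io()):
 *
 *	struct drbd_md_io md_io;
 *	init_completion(&md_io.event);
 *	bio->bi_private = &md_io;
 *	bio->bi_end_io = drbd_md_io_complete;
 *	submit_bio(rw, bio);
 *	wait_for_completion(&md_io.event);
 *	... the result is then found in md_io.error
 */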

/* reads on behalf of the partner,
 * "submitted" by the receiver
 */
void drbd_endio_read_sec_final(struct drbd_epoch_entry *e) __releases(local)
{
	unsigned long flags = 0;
	struct drbd_conf *mdev = e->mdev;

	D_ASSERT(e->block_id != ID_VACANT);

	spin_lock_irqsave(&mdev->req_lock, flags);
	mdev->read_cnt += e->size >> 9;
	list_del(&e->w.list);
	if (list_empty(&mdev->read_ee))
		wake_up(&mdev->ee_wait);
	if (test_bit(__EE_WAS_ERROR, &e->flags))
		__drbd_chk_io_error(mdev, FALSE);
	spin_unlock_irqrestore(&mdev->req_lock, flags);

	drbd_queue_work(&mdev->data.work, &e->w);
	put_ldev(mdev);
}

static int is_failed_barrier(int ee_flags)
{
	return (ee_flags & (EE_IS_BARRIER|EE_WAS_ERROR|EE_RESUBMITTED))
			== (EE_IS_BARRIER|EE_WAS_ERROR);
}
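/* I.e. true exactly for a barrier request that failed and has not been
 * resubmitted yet: EE_IS_BARRIER and EE_WAS_ERROR set, EE_RESUBMITTED still
 * clear.  drbd_endio_write_sec_final() below sets EE_RESUBMITTED before it
 * re-queues the request, so the retry cannot end up here again. */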

/* writes on behalf of the partner, or resync writes,
 * "submitted" by the receiver, final stage.  */
static void drbd_endio_write_sec_final(struct drbd_epoch_entry *e) __releases(local)
{
	unsigned long flags = 0;
	struct drbd_conf *mdev = e->mdev;
	sector_t e_sector;
	int do_wake;
	int is_syncer_req;
	int do_al_complete_io;

	/* if this is a failed barrier request, disable use of barriers,
	 * and schedule for resubmission */
	if (is_failed_barrier(e->flags)) {
		drbd_bump_write_ordering(mdev, WO_bdev_flush);
		spin_lock_irqsave(&mdev->req_lock, flags);
		list_del(&e->w.list);
		e->flags = (e->flags & ~EE_WAS_ERROR) | EE_RESUBMITTED;
		e->w.cb = w_e_reissue;
		/* put_ldev actually happens below, once we come here again. */
		__release(local);
		spin_unlock_irqrestore(&mdev->req_lock, flags);
		drbd_queue_work(&mdev->data.work, &e->w);
		return;
	}

	D_ASSERT(e->block_id != ID_VACANT);

	/* after we moved e to done_ee,
	 * we may no longer access it,
	 * it may be freed/reused already!
	 * (as soon as we release the req_lock) */
	e_sector = e->sector;
	do_al_complete_io = e->flags & EE_CALL_AL_COMPLETE_IO;
	is_syncer_req = is_syncer_block_id(e->block_id);

	spin_lock_irqsave(&mdev->req_lock, flags);
	mdev->writ_cnt += e->size >> 9;
	list_del(&e->w.list); /* has been on active_ee or sync_ee */
	list_add_tail(&e->w.list, &mdev->done_ee);

	/* No hlist_del_init(&e->colision) here, we did not send the Ack yet,
	 * neither did we wake possibly waiting conflicting requests.
	 * done from "drbd_process_done_ee" within the appropriate w.cb
	 * (e_end_block/e_end_resync_block) or from _drbd_clear_done_ee */

	do_wake = is_syncer_req
		? list_empty(&mdev->sync_ee)
		: list_empty(&mdev->active_ee);

	if (test_bit(__EE_WAS_ERROR, &e->flags))
		__drbd_chk_io_error(mdev, FALSE);
	spin_unlock_irqrestore(&mdev->req_lock, flags);

	if (is_syncer_req)
		drbd_rs_complete_io(mdev, e_sector);

	if (do_wake)
		wake_up(&mdev->ee_wait);

	if (do_al_complete_io)
		drbd_al_complete_io(mdev, e_sector);

	wake_asender(mdev);
	put_ldev(mdev);
}

/* writes on behalf of the partner, or resync writes,
 * "submitted" by the receiver.
 */
void drbd_endio_sec(struct bio *bio, int error)
{
	struct drbd_epoch_entry *e = bio->bi_private;
	struct drbd_conf *mdev = e->mdev;
	int uptodate = bio_flagged(bio, BIO_UPTODATE);
	int is_write = bio_data_dir(bio) == WRITE;

	if (error)
		dev_warn(DEV, "%s: error=%d s=%llus\n",
				is_write ? "write" : "read", error,
				(unsigned long long)e->sector);
	if (!error && !uptodate) {
		dev_warn(DEV, "%s: setting error to -EIO s=%llus\n",
				is_write ? "write" : "read",
				(unsigned long long)e->sector);
		/* strange behavior of some lower level drivers...
		 * fail the request by clearing the uptodate flag,
		 * but do not return any error?! */
		error = -EIO;
	}

	if (error)
		set_bit(__EE_WAS_ERROR, &e->flags);

	bio_put(bio); /* no need for the bio anymore */
	if (atomic_dec_and_test(&e->pending_bios)) {
		if (is_write)
			drbd_endio_write_sec_final(e);
		else
			drbd_endio_read_sec_final(e);
	}
}
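/* Note that one epoch entry may be backed by several bios (its payload is a
 * page chain, cf. drbd_csum_ee() and drbd_submit_ee()); e->pending_bios
 * counts them, and only the completion that drops the count to zero runs
 * one of the *_sec_final handlers above. */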

/* read, readA or write requests on R_PRIMARY coming from drbd_make_request
 */
void drbd_endio_pri(struct bio *bio, int error)
{
	unsigned long flags;
	struct drbd_request *req = bio->bi_private;
	struct drbd_conf *mdev = req->mdev;
	struct bio_and_error m;
	enum drbd_req_event what;
	int uptodate = bio_flagged(bio, BIO_UPTODATE);

	if (error)
		dev_warn(DEV, "p %s: error=%d\n",
			 bio_data_dir(bio) == WRITE ? "write" : "read", error);
	if (!error && !uptodate) {
		dev_warn(DEV, "p %s: setting error to -EIO\n",
			 bio_data_dir(bio) == WRITE ? "write" : "read");
		/* strange behavior of some lower level drivers...
		 * fail the request by clearing the uptodate flag,
		 * but do not return any error?! */
		error = -EIO;
	}

	/* to avoid recursion in __req_mod */
	if (unlikely(error)) {
		what = (bio_data_dir(bio) == WRITE)
			? write_completed_with_error
			: (bio_rw(bio) == READ)
			  ? read_completed_with_error
			  : read_ahead_completed_with_error;
	} else
		what = completed_ok;

	bio_put(req->private_bio);
	req->private_bio = ERR_PTR(error);

	spin_lock_irqsave(&mdev->req_lock, flags);
	__req_mod(req, what, &m);
	spin_unlock_irqrestore(&mdev->req_lock, flags);

	if (m.bio)
		complete_master_bio(mdev, &m);
}

int w_io_error(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	struct drbd_request *req = container_of(w, struct drbd_request, w);

	/* NOTE: mdev->ldev can be NULL by the time we get here! */
	/* D_ASSERT(mdev->ldev->dc.on_io_error != EP_PASS_ON); */

	/* the only way this callback is scheduled is from _req_may_be_done,
	 * when it is done and had a local write error, see comments there */
	drbd_req_free(req);

	return TRUE;
}

int w_read_retry_remote(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	struct drbd_request *req = container_of(w, struct drbd_request, w);

	/* We should not detach for read io-error,
	 * but try to WRITE the P_DATA_REPLY to the failed location,
	 * to give the disk the chance to relocate that block */

	spin_lock_irq(&mdev->req_lock);
	if (cancel ||
	    mdev->state.conn < C_CONNECTED ||
	    mdev->state.pdsk <= D_INCONSISTENT) {
		_req_mod(req, send_canceled);
		spin_unlock_irq(&mdev->req_lock);
		dev_alert(DEV, "WE ARE LOST. Local IO failure, no peer.\n");
		return 1;
	}
	spin_unlock_irq(&mdev->req_lock);

	return w_send_read_req(mdev, w, 0);
}

int w_resync_inactive(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	ERR_IF(cancel) return 1;
	dev_err(DEV, "resync inactive, but callback triggered??\n");
	return 1; /* Simply ignore this! */
}

void drbd_csum_ee(struct drbd_conf *mdev, struct crypto_hash *tfm, struct drbd_epoch_entry *e, void *digest)
{
	struct hash_desc desc;
	struct scatterlist sg;
	struct page *page = e->pages;
	struct page *tmp;
	unsigned len;

	desc.tfm = tfm;
	desc.flags = 0;

	sg_init_table(&sg, 1);
	crypto_hash_init(&desc);

	while ((tmp = page_chain_next(page))) {
		/* all but the last page will be fully used */
		sg_set_page(&sg, page, PAGE_SIZE, 0);
		crypto_hash_update(&desc, &sg, sg.length);
		page = tmp;
	}
	/* and now the last, possibly only partially used page */
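	/* e->size & (PAGE_SIZE - 1) is the length of the tail; a result of 0
	 * means the last page is fully used as well, which is exactly what
	 * the "len ?: PAGE_SIZE" below falls back to. */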
	len = e->size & (PAGE_SIZE - 1);
	sg_set_page(&sg, page, len ?: PAGE_SIZE, 0);
	crypto_hash_update(&desc, &sg, sg.length);
	crypto_hash_final(&desc, digest);
}

void drbd_csum_bio(struct drbd_conf *mdev, struct crypto_hash *tfm, struct bio *bio, void *digest)
{
	struct hash_desc desc;
	struct scatterlist sg;
	struct bio_vec *bvec;
	int i;

	desc.tfm = tfm;
	desc.flags = 0;

	sg_init_table(&sg, 1);
	crypto_hash_init(&desc);

	__bio_for_each_segment(bvec, bio, i, 0) {
		sg_set_page(&sg, bvec->bv_page, bvec->bv_len, bvec->bv_offset);
		crypto_hash_update(&desc, &sg, sg.length);
	}
	crypto_hash_final(&desc, digest);
}

static int w_e_send_csum(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
	int digest_size;
	void *digest;
	int ok;

	D_ASSERT(e->block_id == DRBD_MAGIC + 0xbeef);

	if (unlikely(cancel)) {
		drbd_free_ee(mdev, e);
		return 1;
	}

	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
		digest_size = crypto_hash_digestsize(mdev->csums_tfm);
		digest = kmalloc(digest_size, GFP_NOIO);
		if (digest) {
			drbd_csum_ee(mdev, mdev->csums_tfm, e, digest);

			inc_rs_pending(mdev);
			ok = drbd_send_drequest_csum(mdev,
						     e->sector,
						     e->size,
						     digest,
						     digest_size,
						     P_CSUM_RS_REQUEST);
			kfree(digest);
		} else {
			dev_err(DEV, "kmalloc() of digest failed.\n");
			ok = 0;
		}
	} else
		ok = 1;

	drbd_free_ee(mdev, e);

	if (unlikely(!ok))
		dev_err(DEV, "drbd_send_drequest(..., csum) failed\n");
	return ok;
}

#define GFP_TRY	(__GFP_HIGHMEM | __GFP_NOWARN)

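/* read_for_csum() return convention, as consumed by the switch in
 * w_make_resync_request() below: 0 - no local disk (disk failure);
 * 1 - request submitted; 2 - allocation or submit failed, retry later. */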
static int read_for_csum(struct drbd_conf *mdev, sector_t sector, int size)
{
	struct drbd_epoch_entry *e;

	if (!get_ldev(mdev))
		return 0;

	/* GFP_TRY, because if there is no memory available right now, this may
	 * be rescheduled for later. It is "only" background resync, after all. */
	e = drbd_alloc_ee(mdev, DRBD_MAGIC+0xbeef, sector, size, GFP_TRY);
	if (!e)
		goto fail;

	spin_lock_irq(&mdev->req_lock);
	list_add(&e->w.list, &mdev->read_ee);
	spin_unlock_irq(&mdev->req_lock);

	e->w.cb = w_e_send_csum;
	if (drbd_submit_ee(mdev, e, READ, DRBD_FAULT_RS_RD) == 0)
		return 1;

	drbd_free_ee(mdev, e);
fail:
	put_ldev(mdev);
	return 2;
}

void resync_timer_fn(unsigned long data)
{
	unsigned long flags;
	struct drbd_conf *mdev = (struct drbd_conf *) data;
	int queue;

	spin_lock_irqsave(&mdev->req_lock, flags);

	if (likely(!test_and_clear_bit(STOP_SYNC_TIMER, &mdev->flags))) {
		queue = 1;
		if (mdev->state.conn == C_VERIFY_S)
			mdev->resync_work.cb = w_make_ov_request;
		else
			mdev->resync_work.cb = w_make_resync_request;
	} else {
		queue = 0;
		mdev->resync_work.cb = w_resync_inactive;
	}

	spin_unlock_irqrestore(&mdev->req_lock, flags);

	/* harmless race: list_empty outside data.work.q_lock */
	if (list_empty(&mdev->resync_work.list) && queue)
		drbd_queue_work(&mdev->data.work, &mdev->resync_work);
}

static int calc_resync_rate(struct drbd_conf *mdev)
{
	int d = mdev->data_delay / 1000; /* us -> ms */
	int td = mdev->sync_conf.throttle_th * 100;  /* 0.1s -> ms */
	int hd = mdev->sync_conf.hold_off_th * 100;  /* 0.1s -> ms */
	int cr = mdev->sync_conf.rate;

	return d <= td ? cr :
		d >= hd ? 0 :
		cr + (cr * (td - d) / (hd - td));
}
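/* Worked example for calc_resync_rate(), with hypothetical numbers and
 * assuming sync_conf.rate is in KiB/s: for cr = 10000, throttle_th = 1
 * (td = 100 ms) and hold_off_th = 10 (hd = 1000 ms), a measured
 * data_delay of 550 ms yields
 *	10000 + 10000 * (100 - 550) / (1000 - 100) = 10000 - 5000 = 5000,
 * i.e. the rate falls off linearly from cr at td down to 0 at hd. */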

int w_make_resync_request(struct drbd_conf *mdev,
		struct drbd_work *w, int cancel)
{
	unsigned long bit;
	sector_t sector;
	const sector_t capacity = drbd_get_capacity(mdev->this_bdev);
	int max_segment_size;
	int number, i, size, pe, mx;
	int align, queued, sndbuf;

	if (unlikely(cancel))
		return 1;

	if (unlikely(mdev->state.conn < C_CONNECTED)) {
		dev_err(DEV, "Confused in w_make_resync_request()! cstate < Connected");
		return 0;
	}

	if (mdev->state.conn != C_SYNC_TARGET)
		dev_err(DEV, "%s in w_make_resync_request\n",
			drbd_conn_str(mdev->state.conn));

	if (!get_ldev(mdev)) {
		/* Since we only need to access mdev->resync, a
		   get_ldev_if_state(mdev,D_FAILED) would be sufficient, but
		   continuing resync with a broken disk makes no sense at
		   all */
		dev_err(DEV, "Disk broke down during resync!\n");
		mdev->resync_work.cb = w_resync_inactive;
		return 1;
	}

	/* starting with drbd 8.3.8, we can handle multi-bio EEs,
	 * if it should be necessary */
	max_segment_size = mdev->agreed_pro_version < 94 ?
		queue_max_segment_size(mdev->rq_queue) : DRBD_MAX_SEGMENT_SIZE;

	mdev->c_sync_rate = calc_resync_rate(mdev);
	number = SLEEP_TIME * mdev->c_sync_rate / ((BM_BLOCK_SIZE / 1024) * HZ);
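	/* sanity of the units (assuming c_sync_rate is in KiB/s like the
	 * configured sync rate): with SLEEP_TIME = HZ/10 and a 4 KiB
	 * BM_BLOCK_SIZE, a rate of 10000 KiB/s gives
	 * (HZ/10) * 10000 / (4 * HZ) = 250 requests per 100 ms tick. */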
	pe = atomic_read(&mdev->rs_pending_cnt);

	mutex_lock(&mdev->data.mutex);
	if (mdev->data.socket)
		mx = mdev->data.socket->sk->sk_rcvbuf / sizeof(struct p_block_req);
	else
		mx = 1;
	mutex_unlock(&mdev->data.mutex);

	/* For resync rates >160MB/sec, allow more pending RS requests */
	if (number > mx)
		mx = number;

	/* Limit the number of pending RS requests to no more than the peer's receive buffer */
	if ((pe + number) > mx) {
		number = mx - pe;
	}

	for (i = 0; i < number; i++) {
		/* Stop generating RS requests, when half of the send buffer is filled */
		mutex_lock(&mdev->data.mutex);
		if (mdev->data.socket) {
			queued = mdev->data.socket->sk->sk_wmem_queued;
			sndbuf = mdev->data.socket->sk->sk_sndbuf;
		} else {
			queued = 1;
			sndbuf = 0;
		}
		mutex_unlock(&mdev->data.mutex);
		if (queued > sndbuf / 2)
			goto requeue;

next_sector:
		size = BM_BLOCK_SIZE;
		bit  = drbd_bm_find_next(mdev, mdev->bm_resync_fo);

		if (bit == -1UL) {
			mdev->bm_resync_fo = drbd_bm_bits(mdev);
			mdev->resync_work.cb = w_resync_inactive;
			put_ldev(mdev);
			return 1;
		}

		sector = BM_BIT_TO_SECT(bit);

		if (drbd_try_rs_begin_io(mdev, sector)) {
			mdev->bm_resync_fo = bit;
			goto requeue;
		}
		mdev->bm_resync_fo = bit + 1;

		if (unlikely(drbd_bm_test_bit(mdev, bit) == 0)) {
			drbd_rs_complete_io(mdev, sector);
			goto next_sector;
		}

#if DRBD_MAX_SEGMENT_SIZE > BM_BLOCK_SIZE
		/* try to find some adjacent bits.
		 * we stop if we already have the maximum req size.
		 *
		 * Additionally always align bigger requests, in order to
		 * be prepared for all stripe sizes of software RAIDs.
		 */
		align = 1;
		for (;;) {
			if (size + BM_BLOCK_SIZE > max_segment_size)
				break;

			/* always stay aligned */
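			/* (illustration, assuming BM_BLOCK_SIZE is 4 KiB:
			 * with align == 1 the test below is "sector & 15",
			 * i.e. we only keep merging while the request start
			 * is 16-sector (8 KiB) aligned; the "+3" converts
			 * BM_BLOCK_SIZE units to 512-byte sectors, since
			 * 4 KiB == 1<<3 sectors.) */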
			if (sector & ((1<<(align+3))-1))
				break;

			/* do not cross extent boundaries */
			if (((bit+1) & BM_BLOCKS_PER_BM_EXT_MASK) == 0)
				break;
			/* now, is it actually dirty, after all?
			 * caution, drbd_bm_test_bit is tri-state for some
			 * obscure reason; ( b == 0 ) would get the out-of-band
			 * value (-1) only accidentally right because of the
			 * "oddly sized" adjustment below */
			if (drbd_bm_test_bit(mdev, bit+1) != 1)
				break;
			bit++;
			size += BM_BLOCK_SIZE;
			if ((BM_BLOCK_SIZE << align) <= size)
				align++;
			i++;
		}
		/* if we merged some,
		 * reset the offset to start the next drbd_bm_find_next from */
		if (size > BM_BLOCK_SIZE)
			mdev->bm_resync_fo = bit + 1;
#endif

		/* adjust very last sectors, in case we are oddly sized */
		if (sector + (size>>9) > capacity)
			size = (capacity-sector)<<9;
		if (mdev->agreed_pro_version >= 89 && mdev->csums_tfm) {
			switch (read_for_csum(mdev, sector, size)) {
			case 0: /* Disk failure */
				put_ldev(mdev);
				return 0;
			case 2: /* Allocation failed */
				drbd_rs_complete_io(mdev, sector);
				mdev->bm_resync_fo = BM_SECT_TO_BIT(sector);
				goto requeue;
			/* case 1: everything ok */
			}
		} else {
			inc_rs_pending(mdev);
			if (!drbd_send_drequest(mdev, P_RS_DATA_REQUEST,
					       sector, size, ID_SYNCER)) {
				dev_err(DEV, "drbd_send_drequest() failed, aborting...\n");
				dec_rs_pending(mdev);
				put_ldev(mdev);
				return 0;
			}
		}
	}

	if (mdev->bm_resync_fo >= drbd_bm_bits(mdev)) {
		/* last syncer _request_ was sent,
		 * but the P_RS_DATA_REPLY not yet received.  sync will end (and
		 * next sync group will resume), as soon as we receive the last
		 * resync data block, and the last bit is cleared.
		 * until then resync "work" is "inactive" ...
		 */
		mdev->resync_work.cb = w_resync_inactive;
		put_ldev(mdev);
		return 1;
	}

 requeue:
	mod_timer(&mdev->resync_timer, jiffies + SLEEP_TIME);
	put_ldev(mdev);
	return 1;
}

static int w_make_ov_request(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	int number, i, size;
	sector_t sector;
	const sector_t capacity = drbd_get_capacity(mdev->this_bdev);

	if (unlikely(cancel))
		return 1;

	if (unlikely(mdev->state.conn < C_CONNECTED)) {
		dev_err(DEV, "Confused in w_make_ov_request()! cstate < Connected");
		return 0;
	}

	number = SLEEP_TIME*mdev->sync_conf.rate / ((BM_BLOCK_SIZE/1024)*HZ);
	if (atomic_read(&mdev->rs_pending_cnt) > number)
		goto requeue;

	number -= atomic_read(&mdev->rs_pending_cnt);

	sector = mdev->ov_position;
	for (i = 0; i < number; i++) {
		if (sector >= capacity) {
			mdev->resync_work.cb = w_resync_inactive;
			return 1;
		}

		size = BM_BLOCK_SIZE;

		if (drbd_try_rs_begin_io(mdev, sector)) {
			mdev->ov_position = sector;
			goto requeue;
		}

		if (sector + (size>>9) > capacity)
			size = (capacity-sector)<<9;

		inc_rs_pending(mdev);
		if (!drbd_send_ov_request(mdev, sector, size)) {
			dec_rs_pending(mdev);
			return 0;
		}
		sector += BM_SECT_PER_BIT;
	}
	mdev->ov_position = sector;

 requeue:
	mod_timer(&mdev->resync_timer, jiffies + SLEEP_TIME);
	return 1;
}


int w_ov_finished(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	kfree(w);
	ov_oos_print(mdev);
	drbd_resync_finished(mdev);

	return 1;
}

static int w_resync_finished(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	kfree(w);

	drbd_resync_finished(mdev);

	return 1;
}

int drbd_resync_finished(struct drbd_conf *mdev)
{
	unsigned long db, dt, dbdt;
	unsigned long n_oos;
	union drbd_state os, ns;
	struct drbd_work *w;
	char *khelper_cmd = NULL;

	/* Remove all elements from the resync LRU. Since future actions
	 * might set bits in the (main) bitmap, then the entries in the
	 * resync LRU would be wrong. */
	if (drbd_rs_del_all(mdev)) {
		/* In case this is not possible now, most probably because
		 * there are P_RS_DATA_REPLY Packets lingering on the worker's
		 * queue (or even the read operations for those packets
		 * is not finished by now).   Retry in 100ms. */

		drbd_kick_lo(mdev);
		__set_current_state(TASK_INTERRUPTIBLE);
		schedule_timeout(HZ / 10);
		w = kmalloc(sizeof(struct drbd_work), GFP_ATOMIC);
		if (w) {
			w->cb = w_resync_finished;
			drbd_queue_work(&mdev->data.work, w);
			return 1;
		}
		dev_err(DEV, "Warn failed to drbd_rs_del_all() and to kmalloc(w).\n");
	}

	dt = (jiffies - mdev->rs_start - mdev->rs_paused) / HZ;
	if (dt <= 0)
		dt = 1;
	db = mdev->rs_total;
	dbdt = Bit2KB(db/dt);
	mdev->rs_paused /= HZ;

	if (!get_ldev(mdev))
		goto out;

	spin_lock_irq(&mdev->req_lock);
	os = mdev->state;

	/* This protects us against multiple calls (that can happen in the presence
	   of application IO), and against connectivity loss just before we arrive here. */
	if (os.conn <= C_CONNECTED)
		goto out_unlock;

	ns = os;
	ns.conn = C_CONNECTED;

	dev_info(DEV, "%s done (total %lu sec; paused %lu sec; %lu K/sec)\n",
	     (os.conn == C_VERIFY_S || os.conn == C_VERIFY_T) ?
	     "Online verify " : "Resync",
	     dt + mdev->rs_paused, mdev->rs_paused, dbdt);

	n_oos = drbd_bm_total_weight(mdev);

	if (os.conn == C_VERIFY_S || os.conn == C_VERIFY_T) {
		if (n_oos) {
			dev_alert(DEV, "Online verify found %lu %dk blocks out of sync!\n",
			      n_oos, Bit2KB(1));
			khelper_cmd = "out-of-sync";
		}
	} else {
		D_ASSERT((n_oos - mdev->rs_failed) == 0);

		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T)
			khelper_cmd = "after-resync-target";

		if (mdev->csums_tfm && mdev->rs_total) {
			const unsigned long s = mdev->rs_same_csum;
			const unsigned long t = mdev->rs_total;
			const int ratio =
				(t == 0)     ? 0 :
				(t < 100000) ? ((s*100)/t) : (s/(t/100));
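			/* (the two branches compute the same percentage; for
			 * t >= 100000, s*100 could overflow an unsigned long
			 * on 32 bit, so divide t by 100 instead) */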
			dev_info(DEV, "%u %% had equal check sums, eliminated: %luK; "
			     "transferred %luK total %luK\n",
			     ratio,
			     Bit2KB(mdev->rs_same_csum),
			     Bit2KB(mdev->rs_total - mdev->rs_same_csum),
			     Bit2KB(mdev->rs_total));
		}
	}

	if (mdev->rs_failed) {
		dev_info(DEV, "            %lu failed blocks\n", mdev->rs_failed);

		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) {
			ns.disk = D_INCONSISTENT;
			ns.pdsk = D_UP_TO_DATE;
		} else {
			ns.disk = D_UP_TO_DATE;
			ns.pdsk = D_INCONSISTENT;
		}
	} else {
		ns.disk = D_UP_TO_DATE;
		ns.pdsk = D_UP_TO_DATE;

		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) {
			if (mdev->p_uuid) {
				int i;
				for (i = UI_BITMAP ; i <= UI_HISTORY_END ; i++)
					_drbd_uuid_set(mdev, i, mdev->p_uuid[i]);
				drbd_uuid_set(mdev, UI_BITMAP, mdev->ldev->md.uuid[UI_CURRENT]);
				_drbd_uuid_set(mdev, UI_CURRENT, mdev->p_uuid[UI_CURRENT]);
			} else {
				dev_err(DEV, "mdev->p_uuid is NULL! BUG\n");
			}
		}

		drbd_uuid_set_bm(mdev, 0UL);

		if (mdev->p_uuid) {
			/* Now the two UUID sets are equal, update what we
			 * know of the peer. */
			int i;
			for (i = UI_CURRENT ; i <= UI_HISTORY_END ; i++)
				mdev->p_uuid[i] = mdev->ldev->md.uuid[i];
		}
	}

	_drbd_set_state(mdev, ns, CS_VERBOSE, NULL);
out_unlock:
	spin_unlock_irq(&mdev->req_lock);
	put_ldev(mdev);
out:
	mdev->rs_total  = 0;
	mdev->rs_failed = 0;
	mdev->rs_paused = 0;
	mdev->ov_start_sector = 0;

	if (test_and_clear_bit(WRITE_BM_AFTER_RESYNC, &mdev->flags)) {
		dev_warn(DEV, "Writing the whole bitmap, due to failed kmalloc\n");
		drbd_queue_bitmap_io(mdev, &drbd_bm_write, NULL, "write from resync_finished");
	}

	if (khelper_cmd)
		drbd_khelper(mdev, khelper_cmd);

	return 1;
}

/* helper */
static void move_to_net_ee_or_free(struct drbd_conf *mdev, struct drbd_epoch_entry *e)
{
	if (drbd_ee_has_active_page(e)) {
		/* This might happen if sendpage() has not finished */
		spin_lock_irq(&mdev->req_lock);
		list_add_tail(&e->w.list, &mdev->net_ee);
		spin_unlock_irq(&mdev->req_lock);
	} else
		drbd_free_ee(mdev, e);
}

/**
 * w_e_end_data_req() - Worker callback, to send a P_DATA_REPLY packet in response to a P_DATA_REQUEST
 * @mdev:	DRBD device.
 * @w:		work object.
 * @cancel:	The connection will be closed anyways
 */
int w_e_end_data_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
	int ok;

	if (unlikely(cancel)) {
		drbd_free_ee(mdev, e);
		dec_unacked(mdev);
		return 1;
	}

	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
		ok = drbd_send_block(mdev, P_DATA_REPLY, e);
	} else {
		if (__ratelimit(&drbd_ratelimit_state))
			dev_err(DEV, "Sending NegDReply. sector=%llus.\n",
			    (unsigned long long)e->sector);

		ok = drbd_send_ack(mdev, P_NEG_DREPLY, e);
	}

	dec_unacked(mdev);

	move_to_net_ee_or_free(mdev, e);

	if (unlikely(!ok))
		dev_err(DEV, "drbd_send_block() failed\n");
	return ok;
}

/**
 * w_e_end_rsdata_req() - Worker callback to send a P_RS_DATA_REPLY packet in response to a P_RS_DATA_REQUEST
898b411b363SPhilipp Reisner  * @mdev:	DRBD device.
899b411b363SPhilipp Reisner  * @w:		work object.
900b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyways
901b411b363SPhilipp Reisner  */
902b411b363SPhilipp Reisner int w_e_end_rsdata_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
903b411b363SPhilipp Reisner {
904b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
905b411b363SPhilipp Reisner 	int ok;
906b411b363SPhilipp Reisner 
907b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
908b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
909b411b363SPhilipp Reisner 		dec_unacked(mdev);
910b411b363SPhilipp Reisner 		return 1;
911b411b363SPhilipp Reisner 	}
912b411b363SPhilipp Reisner 
913b411b363SPhilipp Reisner 	if (get_ldev_if_state(mdev, D_FAILED)) {
914b411b363SPhilipp Reisner 		drbd_rs_complete_io(mdev, e->sector);
915b411b363SPhilipp Reisner 		put_ldev(mdev);
916b411b363SPhilipp Reisner 	}
917b411b363SPhilipp Reisner 
91845bb912bSLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
919b411b363SPhilipp Reisner 		if (likely(mdev->state.pdsk >= D_INCONSISTENT)) {
920b411b363SPhilipp Reisner 			inc_rs_pending(mdev);
921b411b363SPhilipp Reisner 			ok = drbd_send_block(mdev, P_RS_DATA_REPLY, e);
922b411b363SPhilipp Reisner 		} else {
923b411b363SPhilipp Reisner 			if (__ratelimit(&drbd_ratelimit_state))
924b411b363SPhilipp Reisner 				dev_err(DEV, "Not sending RSDataReply, "
925b411b363SPhilipp Reisner 				    "partner DISKLESS!\n");
926b411b363SPhilipp Reisner 			ok = 1;
927b411b363SPhilipp Reisner 		}
928b411b363SPhilipp Reisner 	} else {
929b411b363SPhilipp Reisner 		if (__ratelimit(&drbd_ratelimit_state))
930b411b363SPhilipp Reisner 			dev_err(DEV, "Sending NegRSDReply. sector %llus.\n",
931b411b363SPhilipp Reisner 			    (unsigned long long)e->sector);
932b411b363SPhilipp Reisner 
933b411b363SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_NEG_RS_DREPLY, e);
934b411b363SPhilipp Reisner 
935b411b363SPhilipp Reisner 		/* update resync data with failure */
936b411b363SPhilipp Reisner 		drbd_rs_failed_io(mdev, e->sector, e->size);
937b411b363SPhilipp Reisner 	}
938b411b363SPhilipp Reisner 
939b411b363SPhilipp Reisner 	dec_unacked(mdev);
940b411b363SPhilipp Reisner 
941b411b363SPhilipp Reisner 	move_to_net_ee_or_free(mdev, e);
942b411b363SPhilipp Reisner 
943b411b363SPhilipp Reisner 	if (unlikely(!ok))
944b411b363SPhilipp Reisner 		dev_err(DEV, "drbd_send_block() failed\n");
945b411b363SPhilipp Reisner 	return ok;
946b411b363SPhilipp Reisner }
947b411b363SPhilipp Reisner 
948b411b363SPhilipp Reisner int w_e_end_csum_rs_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
949b411b363SPhilipp Reisner {
950b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
951b411b363SPhilipp Reisner 	struct digest_info *di;
952b411b363SPhilipp Reisner 	int digest_size;
953b411b363SPhilipp Reisner 	void *digest = NULL;
954b411b363SPhilipp Reisner 	int ok, eq = 0;
955b411b363SPhilipp Reisner 
956b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
957b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
958b411b363SPhilipp Reisner 		dec_unacked(mdev);
959b411b363SPhilipp Reisner 		return 1;
960b411b363SPhilipp Reisner 	}
961b411b363SPhilipp Reisner 
962b411b363SPhilipp Reisner 	drbd_rs_complete_io(mdev, e->sector);
963b411b363SPhilipp Reisner 
964b411b363SPhilipp Reisner 	di = (struct digest_info *)(unsigned long)e->block_id;
965b411b363SPhilipp Reisner 
96645bb912bSLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
967b411b363SPhilipp Reisner 		/* quick hack to try to avoid a race against reconfiguration.
968b411b363SPhilipp Reisner 		 * a real fix would be much more involved,
969b411b363SPhilipp Reisner 		 * introducing more locking mechanisms */
970b411b363SPhilipp Reisner 		if (mdev->csums_tfm) {
971b411b363SPhilipp Reisner 			digest_size = crypto_hash_digestsize(mdev->csums_tfm);
972b411b363SPhilipp Reisner 			D_ASSERT(digest_size == di->digest_size);
973b411b363SPhilipp Reisner 			digest = kmalloc(digest_size, GFP_NOIO);
974b411b363SPhilipp Reisner 		}
975b411b363SPhilipp Reisner 		if (digest) {
97645bb912bSLars Ellenberg 			drbd_csum_ee(mdev, mdev->csums_tfm, e, digest);
977b411b363SPhilipp Reisner 			eq = !memcmp(digest, di->digest, digest_size);
978b411b363SPhilipp Reisner 			kfree(digest);
979b411b363SPhilipp Reisner 		}
980b411b363SPhilipp Reisner 
981b411b363SPhilipp Reisner 		if (eq) {
982b411b363SPhilipp Reisner 			drbd_set_in_sync(mdev, e->sector, e->size);
983676396d5SLars Ellenberg 			/* rs_same_csums unit is BM_BLOCK_SIZE */
984676396d5SLars Ellenberg 			mdev->rs_same_csum += e->size >> BM_BLOCK_SHIFT;
985b411b363SPhilipp Reisner 			ok = drbd_send_ack(mdev, P_RS_IS_IN_SYNC, e);
986b411b363SPhilipp Reisner 		} else {
987b411b363SPhilipp Reisner 			inc_rs_pending(mdev);
988b411b363SPhilipp Reisner 			e->block_id = ID_SYNCER;
989b411b363SPhilipp Reisner 			ok = drbd_send_block(mdev, P_RS_DATA_REPLY, e);
990b411b363SPhilipp Reisner 		}
991b411b363SPhilipp Reisner 	} else {
992b411b363SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_NEG_RS_DREPLY, e);
993b411b363SPhilipp Reisner 		if (__ratelimit(&drbd_ratelimit_state))
994b411b363SPhilipp Reisner 			dev_err(DEV, "Sending NegDReply. I guess it gets messy.\n");
995b411b363SPhilipp Reisner 	}
996b411b363SPhilipp Reisner 
997b411b363SPhilipp Reisner 	dec_unacked(mdev);
998b411b363SPhilipp Reisner 
999b411b363SPhilipp Reisner 	kfree(di);
1000b411b363SPhilipp Reisner 
1001b411b363SPhilipp Reisner 	move_to_net_ee_or_free(mdev, e);
1002b411b363SPhilipp Reisner 
1003b411b363SPhilipp Reisner 	if (unlikely(!ok))
1004b411b363SPhilipp Reisner 		dev_err(DEV, "drbd_send_block/ack() failed\n");
1005b411b363SPhilipp Reisner 	return ok;
1006b411b363SPhilipp Reisner }
1007b411b363SPhilipp Reisner 
1008b411b363SPhilipp Reisner int w_e_end_ov_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1009b411b363SPhilipp Reisner {
1010b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
1011b411b363SPhilipp Reisner 	int digest_size;
1012b411b363SPhilipp Reisner 	void *digest;
1013b411b363SPhilipp Reisner 	int ok = 1;
1014b411b363SPhilipp Reisner 
1015b411b363SPhilipp Reisner 	if (unlikely(cancel))
1016b411b363SPhilipp Reisner 		goto out;
1017b411b363SPhilipp Reisner 
101845bb912bSLars Ellenberg 	if (unlikely((e->flags & EE_WAS_ERROR) != 0))
1019b411b363SPhilipp Reisner 		goto out;
1020b411b363SPhilipp Reisner 
1021b411b363SPhilipp Reisner 	digest_size = crypto_hash_digestsize(mdev->verify_tfm);
1022b411b363SPhilipp Reisner 	/* FIXME if this allocation fails, online verify will not terminate! */
1023b411b363SPhilipp Reisner 	digest = kmalloc(digest_size, GFP_NOIO);
1024b411b363SPhilipp Reisner 	if (digest) {
102545bb912bSLars Ellenberg 		drbd_csum_ee(mdev, mdev->verify_tfm, e, digest);
1026b411b363SPhilipp Reisner 		inc_rs_pending(mdev);
1027b411b363SPhilipp Reisner 		ok = drbd_send_drequest_csum(mdev, e->sector, e->size,
1028b411b363SPhilipp Reisner 					     digest, digest_size, P_OV_REPLY);
1029b411b363SPhilipp Reisner 		if (!ok)
1030b411b363SPhilipp Reisner 			dec_rs_pending(mdev);
1031b411b363SPhilipp Reisner 		kfree(digest);
1032b411b363SPhilipp Reisner 	}
1033b411b363SPhilipp Reisner 
1034b411b363SPhilipp Reisner out:
1035b411b363SPhilipp Reisner 	drbd_free_ee(mdev, e);
1036b411b363SPhilipp Reisner 
1037b411b363SPhilipp Reisner 	dec_unacked(mdev);
1038b411b363SPhilipp Reisner 
1039b411b363SPhilipp Reisner 	return ok;
1040b411b363SPhilipp Reisner }
1041b411b363SPhilipp Reisner 
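/* Online verify handshake, as a sketch: the node that received
 * P_OV_REQUEST reads its local block, hashes it with verify_tfm and
 * ships only the digest in P_OV_REPLY (w_e_end_ov_req above); the
 * requesting node hashes its own copy, compares the two digests and
 * answers with P_OV_RESULT carrying ID_IN_SYNC or ID_OUT_OF_SYNC
 * (w_e_end_ov_reply below).  Block payloads never cross the wire. */
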
1042b411b363SPhilipp Reisner void drbd_ov_oos_found(struct drbd_conf *mdev, sector_t sector, int size)
1043b411b363SPhilipp Reisner {
1044b411b363SPhilipp Reisner 	if (mdev->ov_last_oos_start + mdev->ov_last_oos_size == sector) {
1045b411b363SPhilipp Reisner 		mdev->ov_last_oos_size += size >> 9;
1046b411b363SPhilipp Reisner 	} else {
1047b411b363SPhilipp Reisner 		mdev->ov_last_oos_start = sector;
1048b411b363SPhilipp Reisner 		mdev->ov_last_oos_size = size >> 9;
1049b411b363SPhilipp Reisner 	}
1050b411b363SPhilipp Reisner 	drbd_set_out_of_sync(mdev, sector, size);
1051b411b363SPhilipp Reisner 	set_bit(WRITE_BM_AFTER_RESYNC, &mdev->flags);
1052b411b363SPhilipp Reisner }
1053b411b363SPhilipp Reisner 
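/* Example of the coalescing above (made-up sectors): three adjacent
 * 4 KiB blocks found out of sync at sectors 1000, 1008 and 1016 grow
 * one range instead of three: start=1000 with size 8, then 16, then 24
 * (in 512 byte sectors), which ov_oos_print() can report as a single
 * line. */
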
1054b411b363SPhilipp Reisner int w_e_end_ov_reply(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1055b411b363SPhilipp Reisner {
1056b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
1057b411b363SPhilipp Reisner 	struct digest_info *di;
1058b411b363SPhilipp Reisner 	int digest_size;
1059b411b363SPhilipp Reisner 	void *digest;
1060b411b363SPhilipp Reisner 	int ok, eq = 0;
1061b411b363SPhilipp Reisner 
1062b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1063b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
1064b411b363SPhilipp Reisner 		dec_unacked(mdev);
1065b411b363SPhilipp Reisner 		return 1;
1066b411b363SPhilipp Reisner 	}
1067b411b363SPhilipp Reisner 
1068b411b363SPhilipp Reisner 	/* after "cancel", because after drbd_disconnect/drbd_rs_cancel_all
1069b411b363SPhilipp Reisner 	 * the resync lru has been cleaned up already */
1070b411b363SPhilipp Reisner 	drbd_rs_complete_io(mdev, e->sector);
1071b411b363SPhilipp Reisner 
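	/* Sketch of where di comes from: on the receive side the digest_info
	 * allocated for the peer's digest was stashed in e->block_id (see
	 * receive_DataRequest() in drbd_receiver.c), so it is cast back here
	 * and kfree()d further down once the comparison is done. */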
1072b411b363SPhilipp Reisner 	di = (struct digest_info *)(unsigned long)e->block_id;
1073b411b363SPhilipp Reisner 
107445bb912bSLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
1075b411b363SPhilipp Reisner 		digest_size = crypto_hash_digestsize(mdev->verify_tfm);
1076b411b363SPhilipp Reisner 		digest = kmalloc(digest_size, GFP_NOIO);
1077b411b363SPhilipp Reisner 		if (digest) {
107845bb912bSLars Ellenberg 			drbd_csum_ee(mdev, mdev->verify_tfm, e, digest);
1079b411b363SPhilipp Reisner 
1080b411b363SPhilipp Reisner 			D_ASSERT(digest_size == di->digest_size);
1081b411b363SPhilipp Reisner 			eq = !memcmp(digest, di->digest, digest_size);
1082b411b363SPhilipp Reisner 			kfree(digest);
1083b411b363SPhilipp Reisner 		}
1084b411b363SPhilipp Reisner 	} else {
1085b411b363SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_NEG_RS_DREPLY, e);
1086b411b363SPhilipp Reisner 		if (__ratelimit(&drbd_ratelimit_state))
1087b411b363SPhilipp Reisner 			dev_err(DEV, "Sending NegDReply. I guess it gets messy.\n");
1088b411b363SPhilipp Reisner 	}
1089b411b363SPhilipp Reisner 
1090b411b363SPhilipp Reisner 	dec_unacked(mdev);
1091b411b363SPhilipp Reisner 
1092b411b363SPhilipp Reisner 	kfree(di);
1093b411b363SPhilipp Reisner 
1094b411b363SPhilipp Reisner 	if (!eq)
1095b411b363SPhilipp Reisner 		drbd_ov_oos_found(mdev, e->sector, e->size);
1096b411b363SPhilipp Reisner 	else
1097b411b363SPhilipp Reisner 		ov_oos_print(mdev);
1098b411b363SPhilipp Reisner 
1099b411b363SPhilipp Reisner 	ok = drbd_send_ack_ex(mdev, P_OV_RESULT, e->sector, e->size,
1100b411b363SPhilipp Reisner 			      eq ? ID_IN_SYNC : ID_OUT_OF_SYNC);
1101b411b363SPhilipp Reisner 
1102b411b363SPhilipp Reisner 	drbd_free_ee(mdev, e);
1103b411b363SPhilipp Reisner 
1104b411b363SPhilipp Reisner 	if (--mdev->ov_left == 0) {
1105b411b363SPhilipp Reisner 		ov_oos_print(mdev);
1106b411b363SPhilipp Reisner 		drbd_resync_finished(mdev);
1107b411b363SPhilipp Reisner 	}
1108b411b363SPhilipp Reisner 
1109b411b363SPhilipp Reisner 	return ok;
1110b411b363SPhilipp Reisner }
1111b411b363SPhilipp Reisner 
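/* Accounting sketch (assuming ov_left was primed with the number of
 * blocks to verify when the run started): each reply handled above
 * decrements it; the final one flushes the pending out-of-sync report
 * and finishes the run via drbd_resync_finished(). */
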
1112b411b363SPhilipp Reisner int w_prev_work_done(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1113b411b363SPhilipp Reisner {
1114b411b363SPhilipp Reisner 	struct drbd_wq_barrier *b = container_of(w, struct drbd_wq_barrier, w);
1115b411b363SPhilipp Reisner 	complete(&b->done);
1116b411b363SPhilipp Reisner 	return 1;
1117b411b363SPhilipp Reisner }
1118b411b363SPhilipp Reisner 
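/* Usage sketch for the barrier above (cf. drbd_flush_workqueue() in
 * drbd_receiver.c): queue it and wait until the worker has drained
 * everything submitted before it:
 *
 *	struct drbd_wq_barrier b;
 *	b.w.cb = w_prev_work_done;
 *	init_completion(&b.done);
 *	drbd_queue_work(&mdev->data.work, &b.w);
 *	wait_for_completion(&b.done);
 */
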
1119b411b363SPhilipp Reisner int w_send_barrier(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1120b411b363SPhilipp Reisner {
1121b411b363SPhilipp Reisner 	struct drbd_tl_epoch *b = container_of(w, struct drbd_tl_epoch, w);
1122b411b363SPhilipp Reisner 	struct p_barrier *p = &mdev->data.sbuf.barrier;
1123b411b363SPhilipp Reisner 	int ok = 1;
1124b411b363SPhilipp Reisner 
1125b411b363SPhilipp Reisner 	/* Really avoid racing with tl_clear: w.cb may have been referenced
1126b411b363SPhilipp Reisner 	 * just before it was reassigned and re-queued, so double check that.
1127b411b363SPhilipp Reisner 	 * Actually this race is harmless, since we only try to send the
1128b411b363SPhilipp Reisner 	 * barrier packet here and otherwise do nothing with the object.
1129b411b363SPhilipp Reisner 	 * But compare with the head of w_clear_epoch. */
1130b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->req_lock);
1131b411b363SPhilipp Reisner 	if (w->cb != w_send_barrier || mdev->state.conn < C_CONNECTED)
1132b411b363SPhilipp Reisner 		cancel = 1;
1133b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->req_lock);
1134b411b363SPhilipp Reisner 	if (cancel)
1135b411b363SPhilipp Reisner 		return 1;
1136b411b363SPhilipp Reisner 
1137b411b363SPhilipp Reisner 	if (!drbd_get_data_sock(mdev))
1138b411b363SPhilipp Reisner 		return 0;
1139b411b363SPhilipp Reisner 	p->barrier = b->br_number;
1140b411b363SPhilipp Reisner 	/* inc_ap_pending was done where this was queued.
1141b411b363SPhilipp Reisner 	 * dec_ap_pending will be done in got_BarrierAck
1142b411b363SPhilipp Reisner 	 * or (on connection loss) in w_clear_epoch.  */
1143b411b363SPhilipp Reisner 	ok = _drbd_send_cmd(mdev, mdev->data.socket, P_BARRIER,
1144b411b363SPhilipp Reisner 				(struct p_header *)p, sizeof(*p), 0);
1145b411b363SPhilipp Reisner 	drbd_put_data_sock(mdev);
1146b411b363SPhilipp Reisner 
1147b411b363SPhilipp Reisner 	return ok;
1148b411b363SPhilipp Reisner }
1149b411b363SPhilipp Reisner 
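/* Protocol sketch: the peer finishes all writes of the epoch, then
 * answers with P_BARRIER_ACK carrying the same br_number;
 * got_BarrierAck() in drbd_receiver.c matches it and performs the
 * dec_ap_pending() mentioned in the comment above. */
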
1150b411b363SPhilipp Reisner int w_send_write_hint(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1151b411b363SPhilipp Reisner {
1152b411b363SPhilipp Reisner 	if (cancel)
1153b411b363SPhilipp Reisner 		return 1;
1154b411b363SPhilipp Reisner 	return drbd_send_short_cmd(mdev, P_UNPLUG_REMOTE);
1155b411b363SPhilipp Reisner }
1156b411b363SPhilipp Reisner 
1157b411b363SPhilipp Reisner /**
1158b411b363SPhilipp Reisner  * w_send_dblock() - Worker callback to send a P_DATA packet in order to mirror a write request
1159b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1160b411b363SPhilipp Reisner  * @w:		work object.
1161b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyway
1162b411b363SPhilipp Reisner  */
1163b411b363SPhilipp Reisner int w_send_dblock(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1164b411b363SPhilipp Reisner {
1165b411b363SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
1166b411b363SPhilipp Reisner 	int ok;
1167b411b363SPhilipp Reisner 
1168b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1169b411b363SPhilipp Reisner 		req_mod(req, send_canceled);
1170b411b363SPhilipp Reisner 		return 1;
1171b411b363SPhilipp Reisner 	}
1172b411b363SPhilipp Reisner 
1173b411b363SPhilipp Reisner 	ok = drbd_send_dblock(mdev, req);
1174b411b363SPhilipp Reisner 	req_mod(req, ok ? handed_over_to_network : send_failed);
1175b411b363SPhilipp Reisner 
1176b411b363SPhilipp Reisner 	return ok;
1177b411b363SPhilipp Reisner }
1178b411b363SPhilipp Reisner 
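/* The req_mod() calls above feed the request state machine in
 * drbd_req.c (sketch): send_canceled and send_failed terminate the
 * network phase of the request, while handed_over_to_network leaves it
 * pending until the peer's ack arrives. */
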
1179b411b363SPhilipp Reisner /**
1180b411b363SPhilipp Reisner  * w_send_read_req() - Worker callback to send a read request (P_DATA_REQUEST) packet
1181b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1182b411b363SPhilipp Reisner  * @w:		work object.
1183b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyway
1184b411b363SPhilipp Reisner  */
1185b411b363SPhilipp Reisner int w_send_read_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1186b411b363SPhilipp Reisner {
1187b411b363SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
1188b411b363SPhilipp Reisner 	int ok;
1189b411b363SPhilipp Reisner 
1190b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1191b411b363SPhilipp Reisner 		req_mod(req, send_canceled);
1192b411b363SPhilipp Reisner 		return 1;
1193b411b363SPhilipp Reisner 	}
1194b411b363SPhilipp Reisner 
1195b411b363SPhilipp Reisner 	ok = drbd_send_drequest(mdev, P_DATA_REQUEST, req->sector, req->size,
1196b411b363SPhilipp Reisner 				(unsigned long)req);
1197b411b363SPhilipp Reisner 
1198b411b363SPhilipp Reisner 	if (!ok) {
1199b411b363SPhilipp Reisner 		/* ?? we set C_TIMEOUT or C_BROKEN_PIPE in drbd_send();
1200b411b363SPhilipp Reisner 		 * so this is probably redundant */
1201b411b363SPhilipp Reisner 		if (mdev->state.conn >= C_CONNECTED)
1202b411b363SPhilipp Reisner 			drbd_force_state(mdev, NS(conn, C_NETWORK_FAILURE));
1203b411b363SPhilipp Reisner 	}
1204b411b363SPhilipp Reisner 	req_mod(req, ok ? handed_over_to_network : send_failed);
1205b411b363SPhilipp Reisner 
1206b411b363SPhilipp Reisner 	return ok;
1207b411b363SPhilipp Reisner }
1208b411b363SPhilipp Reisner 
1209b411b363SPhilipp Reisner static int _drbd_may_sync_now(struct drbd_conf *mdev)
1210b411b363SPhilipp Reisner {
1211b411b363SPhilipp Reisner 	struct drbd_conf *odev = mdev;
1212b411b363SPhilipp Reisner 
1213b411b363SPhilipp Reisner 	while (1) {
1214b411b363SPhilipp Reisner 		if (odev->sync_conf.after == -1)
1215b411b363SPhilipp Reisner 			return 1;
1216b411b363SPhilipp Reisner 		odev = minor_to_mdev(odev->sync_conf.after);
1217b411b363SPhilipp Reisner 		ERR_IF(!odev) return 1;
1218b411b363SPhilipp Reisner 		if ((odev->state.conn >= C_SYNC_SOURCE &&
1219b411b363SPhilipp Reisner 		     odev->state.conn <= C_PAUSED_SYNC_T) ||
1220b411b363SPhilipp Reisner 		    odev->state.aftr_isp || odev->state.peer_isp ||
1221b411b363SPhilipp Reisner 		    odev->state.user_isp)
1222b411b363SPhilipp Reisner 			return 0;
1223b411b363SPhilipp Reisner 	}
1224b411b363SPhilipp Reisner }
1225b411b363SPhilipp Reisner 
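/* Example (hypothetical minors): with sync-after configured as
 * 2 -> 1 -> 0 -> (-1), minor 2 may resync only while neither minor 1
 * nor minor 0 is between C_SYNC_SOURCE and C_PAUSED_SYNC_T or paused
 * via aftr_isp/peer_isp/user_isp; the loop above walks the chain until
 * after == -1. */
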
1226b411b363SPhilipp Reisner /**
1227b411b363SPhilipp Reisner  * _drbd_pause_after() - Pause resync on all devices that may not resync now
1228b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1229b411b363SPhilipp Reisner  *
1230b411b363SPhilipp Reisner  * Called from process context only (admin command and after_state_ch).
1231b411b363SPhilipp Reisner  */
1232b411b363SPhilipp Reisner static int _drbd_pause_after(struct drbd_conf *mdev)
1233b411b363SPhilipp Reisner {
1234b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1235b411b363SPhilipp Reisner 	int i, rv = 0;
1236b411b363SPhilipp Reisner 
1237b411b363SPhilipp Reisner 	for (i = 0; i < minor_count; i++) {
1238b411b363SPhilipp Reisner 		odev = minor_to_mdev(i);
1239b411b363SPhilipp Reisner 		if (!odev)
1240b411b363SPhilipp Reisner 			continue;
1241b411b363SPhilipp Reisner 		if (odev->state.conn == C_STANDALONE && odev->state.disk == D_DISKLESS)
1242b411b363SPhilipp Reisner 			continue;
1243b411b363SPhilipp Reisner 		if (!_drbd_may_sync_now(odev))
1244b411b363SPhilipp Reisner 			rv |= (__drbd_set_state(_NS(odev, aftr_isp, 1), CS_HARD, NULL)
1245b411b363SPhilipp Reisner 			       != SS_NOTHING_TO_DO);
1246b411b363SPhilipp Reisner 	}
1247b411b363SPhilipp Reisner 
1248b411b363SPhilipp Reisner 	return rv;
1249b411b363SPhilipp Reisner }
1250b411b363SPhilipp Reisner 
1251b411b363SPhilipp Reisner /**
1252b411b363SPhilipp Reisner  * _drbd_resume_next() - Resume resync on all devices that may resync now
1253b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1254b411b363SPhilipp Reisner  *
1255b411b363SPhilipp Reisner  * Called from process context only (admin command and worker).
1256b411b363SPhilipp Reisner  */
1257b411b363SPhilipp Reisner static int _drbd_resume_next(struct drbd_conf *mdev)
1258b411b363SPhilipp Reisner {
1259b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1260b411b363SPhilipp Reisner 	int i, rv = 0;
1261b411b363SPhilipp Reisner 
1262b411b363SPhilipp Reisner 	for (i = 0; i < minor_count; i++) {
1263b411b363SPhilipp Reisner 		odev = minor_to_mdev(i);
1264b411b363SPhilipp Reisner 		if (!odev)
1265b411b363SPhilipp Reisner 			continue;
1266b411b363SPhilipp Reisner 		if (odev->state.conn == C_STANDALONE && odev->state.disk == D_DISKLESS)
1267b411b363SPhilipp Reisner 			continue;
1268b411b363SPhilipp Reisner 		if (odev->state.aftr_isp) {
1269b411b363SPhilipp Reisner 			if (_drbd_may_sync_now(odev))
1270b411b363SPhilipp Reisner 				rv |= (__drbd_set_state(_NS(odev, aftr_isp, 0),
1271b411b363SPhilipp Reisner 							CS_HARD, NULL)
1272b411b363SPhilipp Reisner 				       != SS_NOTHING_TO_DO);
1273b411b363SPhilipp Reisner 		}
1274b411b363SPhilipp Reisner 	}
1275b411b363SPhilipp Reisner 	return rv;
1276b411b363SPhilipp Reisner }
1277b411b363SPhilipp Reisner 
1278b411b363SPhilipp Reisner void resume_next_sg(struct drbd_conf *mdev)
1279b411b363SPhilipp Reisner {
1280b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1281b411b363SPhilipp Reisner 	_drbd_resume_next(mdev);
1282b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1283b411b363SPhilipp Reisner }
1284b411b363SPhilipp Reisner 
1285b411b363SPhilipp Reisner void suspend_other_sg(struct drbd_conf *mdev)
1286b411b363SPhilipp Reisner {
1287b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1288b411b363SPhilipp Reisner 	_drbd_pause_after(mdev);
1289b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1290b411b363SPhilipp Reisner }
1291b411b363SPhilipp Reisner 
1292b411b363SPhilipp Reisner static int sync_after_error(struct drbd_conf *mdev, int o_minor)
1293b411b363SPhilipp Reisner {
1294b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1295b411b363SPhilipp Reisner 
1296b411b363SPhilipp Reisner 	if (o_minor == -1)
1297b411b363SPhilipp Reisner 		return NO_ERROR;
1298b411b363SPhilipp Reisner 	if (o_minor < -1 || minor_to_mdev(o_minor) == NULL)
1299b411b363SPhilipp Reisner 		return ERR_SYNC_AFTER;
1300b411b363SPhilipp Reisner 
1301b411b363SPhilipp Reisner 	/* check for loops */
1302b411b363SPhilipp Reisner 	odev = minor_to_mdev(o_minor);
1303b411b363SPhilipp Reisner 	while (1) {
1304b411b363SPhilipp Reisner 		if (odev == mdev)
1305b411b363SPhilipp Reisner 			return ERR_SYNC_AFTER_CYCLE;
1306b411b363SPhilipp Reisner 
1307b411b363SPhilipp Reisner 		/* dependency chain ends here, no cycles. */
1308b411b363SPhilipp Reisner 		if (odev->sync_conf.after == -1)
1309b411b363SPhilipp Reisner 			return NO_ERROR;
1310b411b363SPhilipp Reisner 
1311b411b363SPhilipp Reisner 		/* follow the dependency chain */
1312b411b363SPhilipp Reisner 		odev = minor_to_mdev(odev->sync_conf.after);
1313b411b363SPhilipp Reisner 	}
1314b411b363SPhilipp Reisner }
1315b411b363SPhilipp Reisner 
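/* Cycle example: asking minor 0 to sync after minor 1 while minor 1
 * already syncs after minor 0 walks 1 -> 0, hits mdev itself and
 * returns ERR_SYNC_AFTER_CYCLE before the new value is ever stored. */
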
1316b411b363SPhilipp Reisner int drbd_alter_sa(struct drbd_conf *mdev, int na)
1317b411b363SPhilipp Reisner {
1318b411b363SPhilipp Reisner 	int changes;
1319b411b363SPhilipp Reisner 	int retcode;
1320b411b363SPhilipp Reisner 
1321b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1322b411b363SPhilipp Reisner 	retcode = sync_after_error(mdev, na);
1323b411b363SPhilipp Reisner 	if (retcode == NO_ERROR) {
1324b411b363SPhilipp Reisner 		mdev->sync_conf.after = na;
1325b411b363SPhilipp Reisner 		do {
1326b411b363SPhilipp Reisner 			changes  = _drbd_pause_after(mdev);
1327b411b363SPhilipp Reisner 			changes |= _drbd_resume_next(mdev);
1328b411b363SPhilipp Reisner 		} while (changes);
1329b411b363SPhilipp Reisner 	}
1330b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1331b411b363SPhilipp Reisner 	return retcode;
1332b411b363SPhilipp Reisner }
1333b411b363SPhilipp Reisner 
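/* Why drbd_alter_sa() loops (sketch): a single dependency change can
 * both pause this device and unpause others, and each resulting state
 * change may cascade further along the chains; iterating until neither
 * _drbd_pause_after() nor _drbd_resume_next() reports a change settles
 * all minors at a fixed point. */
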
1334309d1608SPhilipp Reisner static void ping_peer(struct drbd_conf *mdev)
1335309d1608SPhilipp Reisner {
1336309d1608SPhilipp Reisner 	clear_bit(GOT_PING_ACK, &mdev->flags);
1337309d1608SPhilipp Reisner 	request_ping(mdev);
1338309d1608SPhilipp Reisner 	wait_event(mdev->misc_wait,
1339309d1608SPhilipp Reisner 		   test_bit(GOT_PING_ACK, &mdev->flags) || mdev->state.conn < C_CONNECTED);
1340309d1608SPhilipp Reisner }
1341309d1608SPhilipp Reisner 
1342b411b363SPhilipp Reisner /**
1343b411b363SPhilipp Reisner  * drbd_start_resync() - Start the resync process
1344b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1345b411b363SPhilipp Reisner  * @side:	Either C_SYNC_SOURCE or C_SYNC_TARGET
1346b411b363SPhilipp Reisner  *
1347b411b363SPhilipp Reisner  * This function might bring you directly into one of the
1348b411b363SPhilipp Reisner  * C_PAUSED_SYNC_* states.
1349b411b363SPhilipp Reisner  */
1350b411b363SPhilipp Reisner void drbd_start_resync(struct drbd_conf *mdev, enum drbd_conns side)
1351b411b363SPhilipp Reisner {
1352b411b363SPhilipp Reisner 	union drbd_state ns;
1353b411b363SPhilipp Reisner 	int r;
1354b411b363SPhilipp Reisner 
1355b411b363SPhilipp Reisner 	if (mdev->state.conn >= C_SYNC_SOURCE) {
1356b411b363SPhilipp Reisner 		dev_err(DEV, "Resync already running!\n");
1357b411b363SPhilipp Reisner 		return;
1358b411b363SPhilipp Reisner 	}
1359b411b363SPhilipp Reisner 
1360b411b363SPhilipp Reisner 	/* In case a previous resync run was aborted by an IO error/detach on the peer. */
1361b411b363SPhilipp Reisner 	drbd_rs_cancel_all(mdev);
1362b411b363SPhilipp Reisner 
1363b411b363SPhilipp Reisner 	if (side == C_SYNC_TARGET) {
1364b411b363SPhilipp Reisner 		/* Since application IO was locked out during C_WF_BITMAP_T and
1365b411b363SPhilipp Reisner 		   C_WF_SYNC_UUID we are still unmodified. Becoming C_SYNC_TARGET
1366b411b363SPhilipp Reisner 		   will make the data inconsistent, so let the handler veto first. */
1367b411b363SPhilipp Reisner 		r = drbd_khelper(mdev, "before-resync-target");
1368b411b363SPhilipp Reisner 		r = (r >> 8) & 0xff;
1369b411b363SPhilipp Reisner 		if (r > 0) {
1370b411b363SPhilipp Reisner 			dev_info(DEV, "before-resync-target handler returned %d, "
1371b411b363SPhilipp Reisner 			     "dropping connection.\n", r);
1372b411b363SPhilipp Reisner 			drbd_force_state(mdev, NS(conn, C_DISCONNECTING));
1373b411b363SPhilipp Reisner 			return;
1374b411b363SPhilipp Reisner 		}
1375b411b363SPhilipp Reisner 	}
1376b411b363SPhilipp Reisner 
1377b411b363SPhilipp Reisner 	drbd_state_lock(mdev);
1378b411b363SPhilipp Reisner 
1379b411b363SPhilipp Reisner 	if (!get_ldev_if_state(mdev, D_NEGOTIATING)) {
1380b411b363SPhilipp Reisner 		drbd_state_unlock(mdev);
1381b411b363SPhilipp Reisner 		return;
1382b411b363SPhilipp Reisner 	}
1383b411b363SPhilipp Reisner 
1384b411b363SPhilipp Reisner 	if (side == C_SYNC_TARGET) {
1385b411b363SPhilipp Reisner 		mdev->bm_resync_fo = 0;
1386b411b363SPhilipp Reisner 	} else /* side == C_SYNC_SOURCE */ {
1387b411b363SPhilipp Reisner 		u64 uuid;
1388b411b363SPhilipp Reisner 
1389b411b363SPhilipp Reisner 		get_random_bytes(&uuid, sizeof(u64));
1390b411b363SPhilipp Reisner 		drbd_uuid_set(mdev, UI_BITMAP, uuid);
1391b411b363SPhilipp Reisner 		drbd_send_sync_uuid(mdev, uuid);
1392b411b363SPhilipp Reisner 
1393b411b363SPhilipp Reisner 		D_ASSERT(mdev->state.disk == D_UP_TO_DATE);
1394b411b363SPhilipp Reisner 	}
1395b411b363SPhilipp Reisner 
1396b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1397b411b363SPhilipp Reisner 	ns = mdev->state;
1398b411b363SPhilipp Reisner 
1399b411b363SPhilipp Reisner 	ns.aftr_isp = !_drbd_may_sync_now(mdev);
1400b411b363SPhilipp Reisner 
1401b411b363SPhilipp Reisner 	ns.conn = side;
1402b411b363SPhilipp Reisner 
1403b411b363SPhilipp Reisner 	if (side == C_SYNC_TARGET)
1404b411b363SPhilipp Reisner 		ns.disk = D_INCONSISTENT;
1405b411b363SPhilipp Reisner 	else /* side == C_SYNC_SOURCE */
1406b411b363SPhilipp Reisner 		ns.pdsk = D_INCONSISTENT;
1407b411b363SPhilipp Reisner 
1408b411b363SPhilipp Reisner 	r = __drbd_set_state(mdev, ns, CS_VERBOSE, NULL);
1409b411b363SPhilipp Reisner 	ns = mdev->state;
1410b411b363SPhilipp Reisner 
1411b411b363SPhilipp Reisner 	if (ns.conn < C_CONNECTED)
1412b411b363SPhilipp Reisner 		r = SS_UNKNOWN_ERROR;
1413b411b363SPhilipp Reisner 
1414b411b363SPhilipp Reisner 	if (r == SS_SUCCESS) {
1415b411b363SPhilipp Reisner 		mdev->rs_total     =
1416b411b363SPhilipp Reisner 		mdev->rs_mark_left = drbd_bm_total_weight(mdev);
1417b411b363SPhilipp Reisner 		mdev->rs_failed    = 0;
1418b411b363SPhilipp Reisner 		mdev->rs_paused    = 0;
1419b411b363SPhilipp Reisner 		mdev->rs_start     =
1420b411b363SPhilipp Reisner 		mdev->rs_mark_time = jiffies;
1421b411b363SPhilipp Reisner 		mdev->rs_same_csum = 0;
1422b411b363SPhilipp Reisner 		_drbd_pause_after(mdev);
1423b411b363SPhilipp Reisner 	}
1424b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1425b411b363SPhilipp Reisner 	put_ldev(mdev);
1426b411b363SPhilipp Reisner 
1427b411b363SPhilipp Reisner 	if (r == SS_SUCCESS) {
1428b411b363SPhilipp Reisner 		dev_info(DEV, "Began resync as %s (will sync %lu KB [%lu bits set]).\n",
1429b411b363SPhilipp Reisner 		     drbd_conn_str(ns.conn),
1430b411b363SPhilipp Reisner 		     (unsigned long) mdev->rs_total << (BM_BLOCK_SHIFT-10),
1431b411b363SPhilipp Reisner 		     (unsigned long) mdev->rs_total);
1432b411b363SPhilipp Reisner 
1433b411b363SPhilipp Reisner 		if (mdev->rs_total == 0) {
1434b411b363SPhilipp Reisner 			/* Peer still reachable? Beware of failing before-resync-target handlers! */
1435309d1608SPhilipp Reisner 			ping_peer(mdev);
1436b411b363SPhilipp Reisner 			drbd_resync_finished(mdev);
1437b411b363SPhilipp Reisner 		}
1438b411b363SPhilipp Reisner 
1439b411b363SPhilipp Reisner 		/* ns.conn may already be != mdev->state.conn,
1440b411b363SPhilipp Reisner 		 * we may have been paused in between, or become paused until
1441b411b363SPhilipp Reisner 		 * the timer triggers.
1442b411b363SPhilipp Reisner 		 * No matter, that is handled in resync_timer_fn() */
1443b411b363SPhilipp Reisner 		if (ns.conn == C_SYNC_TARGET)
1444b411b363SPhilipp Reisner 			mod_timer(&mdev->resync_timer, jiffies);
1445b411b363SPhilipp Reisner 
1446b411b363SPhilipp Reisner 		drbd_md_sync(mdev);
1447b411b363SPhilipp Reisner 	}
1448d0c3f60fSPhilipp Reisner 	drbd_state_unlock(mdev);
1449b411b363SPhilipp Reisner }
1450b411b363SPhilipp Reisner 
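/* Unit conversion in the dev_info above (illustrative): rs_total
 * counts bitmap bits, one bit per BM_BLOCK_SIZE = 4 KiB block, so
 * shifting by BM_BLOCK_SHIFT - 10 = 2 turns bits into KB; e.g.
 * 1024 bits set -> 1024 << 2 = 4096 KB to sync. */
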
1451b411b363SPhilipp Reisner int drbd_worker(struct drbd_thread *thi)
1452b411b363SPhilipp Reisner {
1453b411b363SPhilipp Reisner 	struct drbd_conf *mdev = thi->mdev;
1454b411b363SPhilipp Reisner 	struct drbd_work *w = NULL;
1455b411b363SPhilipp Reisner 	LIST_HEAD(work_list);
1456b411b363SPhilipp Reisner 	int intr = 0;
1457b411b363SPhilipp Reisner 
1458b411b363SPhilipp Reisner 	sprintf(current->comm, "drbd%d_worker", mdev_to_minor(mdev));
1459b411b363SPhilipp Reisner 
1460b411b363SPhilipp Reisner 	while (get_t_state(thi) == Running) {
1461b411b363SPhilipp Reisner 		drbd_thread_current_set_cpu(mdev);
1462b411b363SPhilipp Reisner 
1463b411b363SPhilipp Reisner 		if (down_trylock(&mdev->data.work.s)) {
1464b411b363SPhilipp Reisner 			mutex_lock(&mdev->data.mutex);
1465b411b363SPhilipp Reisner 			if (mdev->data.socket && !mdev->net_conf->no_cork)
1466b411b363SPhilipp Reisner 				drbd_tcp_uncork(mdev->data.socket);
1467b411b363SPhilipp Reisner 			mutex_unlock(&mdev->data.mutex);
1468b411b363SPhilipp Reisner 
1469b411b363SPhilipp Reisner 			intr = down_interruptible(&mdev->data.work.s);
1470b411b363SPhilipp Reisner 
1471b411b363SPhilipp Reisner 			mutex_lock(&mdev->data.mutex);
1472b411b363SPhilipp Reisner 			if (mdev->data.socket && !mdev->net_conf->no_cork)
1473b411b363SPhilipp Reisner 				drbd_tcp_cork(mdev->data.socket);
1474b411b363SPhilipp Reisner 			mutex_unlock(&mdev->data.mutex);
1475b411b363SPhilipp Reisner 		}
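		/* Rationale for the cork dance above (sketch): while work is
		 * pending the data socket stays corked so consecutive packets
		 * coalesce into fewer TCP segments; only when the queue runs
		 * dry do we uncork to flush buffered data before sleeping on
		 * the work semaphore, and cork again after waking up. */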
1476b411b363SPhilipp Reisner 
1477b411b363SPhilipp Reisner 		if (intr) {
1478b411b363SPhilipp Reisner 			D_ASSERT(intr == -EINTR);
1479b411b363SPhilipp Reisner 			flush_signals(current);
1480b411b363SPhilipp Reisner 			ERR_IF (get_t_state(thi) == Running)
1481b411b363SPhilipp Reisner 				continue;
1482b411b363SPhilipp Reisner 			break;
1483b411b363SPhilipp Reisner 		}
1484b411b363SPhilipp Reisner 
1485b411b363SPhilipp Reisner 		if (get_t_state(thi) != Running)
1486b411b363SPhilipp Reisner 			break;
1487b411b363SPhilipp Reisner 		/* With this break, we have done a down() but not consumed
1488b411b363SPhilipp Reisner 		   the entry from the list. The cleanup code takes care of
1489b411b363SPhilipp Reisner 		   this...   */
1490b411b363SPhilipp Reisner 
1491b411b363SPhilipp Reisner 		w = NULL;
1492b411b363SPhilipp Reisner 		spin_lock_irq(&mdev->data.work.q_lock);
1493b411b363SPhilipp Reisner 		ERR_IF(list_empty(&mdev->data.work.q)) {
1494b411b363SPhilipp Reisner 			/* something terribly wrong in our logic.
1495b411b363SPhilipp Reisner 			 * we were able to down() the semaphore,
1496b411b363SPhilipp Reisner 			 * but the list is empty... doh.
1497b411b363SPhilipp Reisner 			 *
1498b411b363SPhilipp Reisner 			 * what is the best thing to do now?
1499b411b363SPhilipp Reisner 			 * try again from scratch, restarting the receiver,
1500b411b363SPhilipp Reisner 			 * asender, whatnot? could break even more ugly,
1501b411b363SPhilipp Reisner 			 * e.g. when we are primary, but no good local data.
1502b411b363SPhilipp Reisner 			 *
1503b411b363SPhilipp Reisner 			 * I'll try to get away just starting over this loop.
1504b411b363SPhilipp Reisner 			 */
1505b411b363SPhilipp Reisner 			spin_unlock_irq(&mdev->data.work.q_lock);
1506b411b363SPhilipp Reisner 			continue;
1507b411b363SPhilipp Reisner 		}
1508b411b363SPhilipp Reisner 		w = list_entry(mdev->data.work.q.next, struct drbd_work, list);
1509b411b363SPhilipp Reisner 		list_del_init(&w->list);
1510b411b363SPhilipp Reisner 		spin_unlock_irq(&mdev->data.work.q_lock);
1511b411b363SPhilipp Reisner 
1512b411b363SPhilipp Reisner 		if (!w->cb(mdev, w, mdev->state.conn < C_CONNECTED)) {
1513b411b363SPhilipp Reisner 			/* dev_warn(DEV, "worker: a callback failed! \n"); */
1514b411b363SPhilipp Reisner 			if (mdev->state.conn >= C_CONNECTED)
1515b411b363SPhilipp Reisner 				drbd_force_state(mdev,
1516b411b363SPhilipp Reisner 						NS(conn, C_NETWORK_FAILURE));
1517b411b363SPhilipp Reisner 		}
1518b411b363SPhilipp Reisner 	}
1519b411b363SPhilipp Reisner 	D_ASSERT(test_bit(DEVICE_DYING, &mdev->flags));
1520b411b363SPhilipp Reisner 	D_ASSERT(test_bit(CONFIG_PENDING, &mdev->flags));
1521b411b363SPhilipp Reisner 
1522b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->data.work.q_lock);
1524b411b363SPhilipp Reisner 	while (!list_empty(&mdev->data.work.q)) {
1525b411b363SPhilipp Reisner 		list_splice_init(&mdev->data.work.q, &work_list);
1526b411b363SPhilipp Reisner 		spin_unlock_irq(&mdev->data.work.q_lock);
1527b411b363SPhilipp Reisner 
1528b411b363SPhilipp Reisner 		while (!list_empty(&work_list)) {
1529b411b363SPhilipp Reisner 			w = list_entry(work_list.next, struct drbd_work, list);
1530b411b363SPhilipp Reisner 			list_del_init(&w->list);
1531b411b363SPhilipp Reisner 			w->cb(mdev, w, 1);
1533b411b363SPhilipp Reisner 		}
1534b411b363SPhilipp Reisner 
1535b411b363SPhilipp Reisner 		spin_lock_irq(&mdev->data.work.q_lock);
1536b411b363SPhilipp Reisner 	}
1537b411b363SPhilipp Reisner 	sema_init(&mdev->data.work.s, 0);
1538b411b363SPhilipp Reisner 	/* DANGEROUS race: if someone queued work while holding the spinlock
1539b411b363SPhilipp Reisner 	 * but called up() outside of it, we could see an up() on the
1540b411b363SPhilipp Reisner 	 * semaphore without a corresponding list entry.
1541b411b363SPhilipp Reisner 	 * So don't do that.
1542b411b363SPhilipp Reisner 	 */
1543b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->data.work.q_lock);
1544b411b363SPhilipp Reisner 
1545b411b363SPhilipp Reisner 	D_ASSERT(mdev->state.disk == D_DISKLESS && mdev->state.conn == C_STANDALONE);
1546b411b363SPhilipp Reisner 	/* _drbd_set_state only uses stop_nowait.
1547b411b363SPhilipp Reisner 	 * wait here for the Exiting receiver. */
1548b411b363SPhilipp Reisner 	drbd_thread_stop(&mdev->receiver);
1549b411b363SPhilipp Reisner 	drbd_mdev_cleanup(mdev);
1550b411b363SPhilipp Reisner 
1551b411b363SPhilipp Reisner 	dev_info(DEV, "worker terminated\n");
1552b411b363SPhilipp Reisner 
1553b411b363SPhilipp Reisner 	clear_bit(DEVICE_DYING, &mdev->flags);
1554b411b363SPhilipp Reisner 	clear_bit(CONFIG_PENDING, &mdev->flags);
1555b411b363SPhilipp Reisner 	wake_up(&mdev->state_wait);
1556b411b363SPhilipp Reisner 
1557b411b363SPhilipp Reisner 	return 0;
1558b411b363SPhilipp Reisner }
1559