xref: /openbmc/linux/drivers/block/drbd/drbd_worker.c (revision c5a91619)
/*
   drbd_worker.c

   This file is part of DRBD by Philipp Reisner and Lars Ellenberg.

   Copyright (C) 2001-2008, LINBIT Information Technologies GmbH.
   Copyright (C) 1999-2008, Philipp Reisner <philipp.reisner@linbit.com>.
   Copyright (C) 2002-2008, Lars Ellenberg <lars.ellenberg@linbit.com>.

   drbd is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   drbd is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with drbd; see the file COPYING.  If not, write to
   the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.

 */

#include <linux/module.h>
#include <linux/drbd.h>
#include <linux/sched.h>
#include <linux/wait.h>
#include <linux/mm.h>
#include <linux/memcontrol.h>
#include <linux/mm_inline.h>
#include <linux/slab.h>
#include <linux/random.h>
#include <linux/string.h>
#include <linux/scatterlist.h>

#include "drbd_int.h"
#include "drbd_req.h"

static int w_make_ov_request(struct drbd_conf *mdev, struct drbd_work *w, int cancel);
static int w_make_resync_request(struct drbd_conf *mdev,
				 struct drbd_work *w, int cancel);


/* endio handlers:
 *   drbd_md_io_complete (defined here)
 *   drbd_endio_pri (defined here)
 *   drbd_endio_sec (defined here)
 *   bm_async_io_complete (defined in drbd_bitmap.c)
 *
 * For all these callbacks, note the following:
 * The callbacks will be called in irq context by the IDE drivers,
 * and in Softirqs/Tasklets/BH context by the SCSI drivers.
 * Try to get the locking right :)
 *
 */

/* About the global_state_lock
   Each state transition on a device holds a read lock. In case we have
   to evaluate the sync-after dependencies, we grab a write lock, because
   we need stable states on all devices for that.  */
rwlock_t global_state_lock;
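/*
 * Illustrative sketch (not driver code; the names below are hypothetical
 * stand-ins for the real call sites in drbd_main.c):
 *
 *	read_lock(&global_state_lock);		// one device changes state
 *	rv = validate_state_change(mdev, os, ns);
 *	read_unlock(&global_state_lock);
 *
 *	write_lock_irq(&global_state_lock);	// sync-after evaluation,
 *	reevaluate_sync_after(mdev);		// needs all devices stable
 *	write_unlock_irq(&global_state_lock);
 */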

/* used for synchronous meta data and bitmap IO
 * submitted by drbd_md_sync_page_io()
 */
void drbd_md_io_complete(struct bio *bio, int error)
{
	struct drbd_md_io *md_io;

	md_io = (struct drbd_md_io *)bio->bi_private;
	md_io->error = error;

	complete(&md_io->event);
}

/* reads on behalf of the partner,
 * "submitted" by the receiver
 */
void drbd_endio_read_sec_final(struct drbd_epoch_entry *e) __releases(local)
{
	unsigned long flags = 0;
	struct drbd_conf *mdev = e->mdev;

	D_ASSERT(e->block_id != ID_VACANT);

	spin_lock_irqsave(&mdev->req_lock, flags);
	mdev->read_cnt += e->size >> 9;
	list_del(&e->w.list);
	if (list_empty(&mdev->read_ee))
		wake_up(&mdev->ee_wait);
	if (test_bit(__EE_WAS_ERROR, &e->flags))
		__drbd_chk_io_error(mdev, false);
	spin_unlock_irqrestore(&mdev->req_lock, flags);

	drbd_queue_work(&mdev->data.work, &e->w);
	put_ldev(mdev);
}

/* writes on behalf of the partner, or resync writes,
 * "submitted" by the receiver, final stage.  */
static void drbd_endio_write_sec_final(struct drbd_epoch_entry *e) __releases(local)
{
	unsigned long flags = 0;
	struct drbd_conf *mdev = e->mdev;
	sector_t e_sector;
	int do_wake;
	int is_syncer_req;
	int do_al_complete_io;

	D_ASSERT(e->block_id != ID_VACANT);

	/* after we moved e to done_ee,
	 * we may no longer access it,
	 * it may be freed/reused already!
	 * (as soon as we release the req_lock) */
	e_sector = e->sector;
	do_al_complete_io = e->flags & EE_CALL_AL_COMPLETE_IO;
	is_syncer_req = is_syncer_block_id(e->block_id);

	spin_lock_irqsave(&mdev->req_lock, flags);
	mdev->writ_cnt += e->size >> 9;
	list_del(&e->w.list); /* has been on active_ee or sync_ee */
	list_add_tail(&e->w.list, &mdev->done_ee);

	/* No hlist_del_init(&e->colision) here, we did not send the Ack yet,
	 * neither did we wake possibly waiting conflicting requests.
	 * done from "drbd_process_done_ee" within the appropriate w.cb
	 * (e_end_block/e_end_resync_block) or from _drbd_clear_done_ee */

	do_wake = is_syncer_req
		? list_empty(&mdev->sync_ee)
		: list_empty(&mdev->active_ee);

	if (test_bit(__EE_WAS_ERROR, &e->flags))
		__drbd_chk_io_error(mdev, false);
	spin_unlock_irqrestore(&mdev->req_lock, flags);

	if (is_syncer_req)
		drbd_rs_complete_io(mdev, e_sector);

	if (do_wake)
		wake_up(&mdev->ee_wait);

	if (do_al_complete_io)
		drbd_al_complete_io(mdev, e_sector);

	wake_asender(mdev);
	put_ldev(mdev);
}

/* writes on behalf of the partner, or resync writes,
 * "submitted" by the receiver.
 */
void drbd_endio_sec(struct bio *bio, int error)
{
	struct drbd_epoch_entry *e = bio->bi_private;
	struct drbd_conf *mdev = e->mdev;
	int uptodate = bio_flagged(bio, BIO_UPTODATE);
	int is_write = bio_data_dir(bio) == WRITE;

	if (error && __ratelimit(&drbd_ratelimit_state))
		dev_warn(DEV, "%s: error=%d s=%llus\n",
				is_write ? "write" : "read", error,
				(unsigned long long)e->sector);
	if (!error && !uptodate) {
		if (__ratelimit(&drbd_ratelimit_state))
			dev_warn(DEV, "%s: setting error to -EIO s=%llus\n",
					is_write ? "write" : "read",
					(unsigned long long)e->sector);
		/* strange behavior of some lower level drivers...
		 * fail the request by clearing the uptodate flag,
		 * but do not return any error?! */
		error = -EIO;
	}

	if (error)
		set_bit(__EE_WAS_ERROR, &e->flags);

	bio_put(bio); /* no need for the bio anymore */
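	/* One epoch entry may have been split into several bios by
	 * drbd_submit_ee(); pending_bios counts them, so only the last
	 * completing bio runs the final stage below. */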
	if (atomic_dec_and_test(&e->pending_bios)) {
		if (is_write)
			drbd_endio_write_sec_final(e);
		else
			drbd_endio_read_sec_final(e);
	}
}

/* read, readA or write requests on R_PRIMARY coming from drbd_make_request
 */
void drbd_endio_pri(struct bio *bio, int error)
{
	unsigned long flags;
	struct drbd_request *req = bio->bi_private;
	struct drbd_conf *mdev = req->mdev;
	struct bio_and_error m;
	enum drbd_req_event what;
	int uptodate = bio_flagged(bio, BIO_UPTODATE);

	if (!error && !uptodate) {
		dev_warn(DEV, "p %s: setting error to -EIO\n",
			 bio_data_dir(bio) == WRITE ? "write" : "read");
		/* strange behavior of some lower level drivers...
		 * fail the request by clearing the uptodate flag,
		 * but do not return any error?! */
		error = -EIO;
	}

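	/* Note: bio_rw() below distinguishes READ from READA (read-ahead);
	 * a failed read-ahead is reported back to the upper layers but does
	 * not feed into DRBD's disk error handling the way a failed read
	 * or write does. */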
	/* to avoid recursion in __req_mod */
	if (unlikely(error)) {
		what = (bio_data_dir(bio) == WRITE)
			? write_completed_with_error
			: (bio_rw(bio) == READ)
			  ? read_completed_with_error
			  : read_ahead_completed_with_error;
	} else
		what = completed_ok;

	bio_put(req->private_bio);
	req->private_bio = ERR_PTR(error);

	/* not req_mod(), we need irqsave here! */
	spin_lock_irqsave(&mdev->req_lock, flags);
	__req_mod(req, what, &m);
	spin_unlock_irqrestore(&mdev->req_lock, flags);

	if (m.bio)
		complete_master_bio(mdev, &m);
}

int w_read_retry_remote(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	struct drbd_request *req = container_of(w, struct drbd_request, w);

	/* We should not detach for read io-error,
	 * but try to WRITE the P_DATA_REPLY to the failed location,
	 * to give the disk the chance to relocate that block */

	spin_lock_irq(&mdev->req_lock);
	if (cancel || mdev->state.pdsk != D_UP_TO_DATE) {
		_req_mod(req, read_retry_remote_canceled);
		spin_unlock_irq(&mdev->req_lock);
		return 1;
	}
	spin_unlock_irq(&mdev->req_lock);

	return w_send_read_req(mdev, w, 0);
}

void drbd_csum_ee(struct drbd_conf *mdev, struct crypto_hash *tfm, struct drbd_epoch_entry *e, void *digest)
{
	struct hash_desc desc;
	struct scatterlist sg;
	struct page *page = e->pages;
	struct page *tmp;
	unsigned len;

	desc.tfm = tfm;
	desc.flags = 0;

	sg_init_table(&sg, 1);
	crypto_hash_init(&desc);

	while ((tmp = page_chain_next(page))) {
		/* all but the last page will be fully used */
		sg_set_page(&sg, page, PAGE_SIZE, 0);
		crypto_hash_update(&desc, &sg, sg.length);
		page = tmp;
	}
	/* and now the last, possibly only partially used page */
	len = e->size & (PAGE_SIZE - 1);
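	/* if e->size happens to be a PAGE_SIZE multiple, len is 0 and the
	 * ?: below falls back to hashing the full last page */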
	sg_set_page(&sg, page, len ?: PAGE_SIZE, 0);
	crypto_hash_update(&desc, &sg, sg.length);
	crypto_hash_final(&desc, digest);
}

void drbd_csum_bio(struct drbd_conf *mdev, struct crypto_hash *tfm, struct bio *bio, void *digest)
{
	struct hash_desc desc;
	struct scatterlist sg;
	struct bio_vec *bvec;
	int i;

	desc.tfm = tfm;
	desc.flags = 0;

	sg_init_table(&sg, 1);
	crypto_hash_init(&desc);

	__bio_for_each_segment(bvec, bio, i, 0) {
		sg_set_page(&sg, bvec->bv_page, bvec->bv_len, bvec->bv_offset);
		crypto_hash_update(&desc, &sg, sg.length);
	}
	crypto_hash_final(&desc, digest);
}
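
/*
 * Usage note (illustrative): both checksum helpers expect "digest" to
 * hold crypto_hash_digestsize(tfm) bytes, which is how the callers in
 * this file (w_e_send_csum, w_e_end_csum_rs_req, w_e_end_ov_req)
 * allocate it:
 *
 *	digest = kmalloc(crypto_hash_digestsize(tfm), GFP_NOIO);
 *	if (digest)
 *		drbd_csum_ee(mdev, tfm, e, digest);
 */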

static int w_e_send_csum(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
	int digest_size;
	void *digest;
	int ok;

	D_ASSERT(e->block_id == DRBD_MAGIC + 0xbeef);

	if (unlikely(cancel)) {
		drbd_free_ee(mdev, e);
		return 1;
	}

	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
		digest_size = crypto_hash_digestsize(mdev->csums_tfm);
		digest = kmalloc(digest_size, GFP_NOIO);
		if (digest) {
			drbd_csum_ee(mdev, mdev->csums_tfm, e, digest);

			inc_rs_pending(mdev);
			ok = drbd_send_drequest_csum(mdev,
						     e->sector,
						     e->size,
						     digest,
						     digest_size,
						     P_CSUM_RS_REQUEST);
			kfree(digest);
		} else {
			dev_err(DEV, "kmalloc() of digest failed.\n");
			ok = 0;
		}
	} else
		ok = 1;

	drbd_free_ee(mdev, e);

	if (unlikely(!ok))
		dev_err(DEV, "drbd_send_drequest(..., csum) failed\n");
	return ok;
}

#define GFP_TRY	(__GFP_HIGHMEM | __GFP_NOWARN)

static int read_for_csum(struct drbd_conf *mdev, sector_t sector, int size)
{
	struct drbd_epoch_entry *e;

	if (!get_ldev(mdev))
		return -EIO;

	if (drbd_rs_should_slow_down(mdev, sector))
		goto defer;

	/* GFP_TRY, because if there is no memory available right now, this may
	 * be rescheduled for later. It is "only" background resync, after all. */
	e = drbd_alloc_ee(mdev, DRBD_MAGIC+0xbeef, sector, size, GFP_TRY);
	if (!e)
		goto defer;

	e->w.cb = w_e_send_csum;
	spin_lock_irq(&mdev->req_lock);
	list_add(&e->w.list, &mdev->read_ee);
	spin_unlock_irq(&mdev->req_lock);

	atomic_add(size >> 9, &mdev->rs_sect_ev);
	if (drbd_submit_ee(mdev, e, READ, DRBD_FAULT_RS_RD) == 0)
		return 0;

	/* If it failed because of ENOMEM, retry should help.  If it failed
	 * because bio_add_page failed (probably broken lower level driver),
	 * retry may or may not help.
	 * If it does not, you may need to force disconnect. */
	spin_lock_irq(&mdev->req_lock);
	list_del(&e->w.list);
	spin_unlock_irq(&mdev->req_lock);

	drbd_free_ee(mdev, e);
defer:
	put_ldev(mdev);
	return -EAGAIN;
}

int w_resync_timer(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	switch (mdev->state.conn) {
	case C_VERIFY_S:
		w_make_ov_request(mdev, w, cancel);
		break;
	case C_SYNC_TARGET:
		w_make_resync_request(mdev, w, cancel);
		break;
	}

	return 1;
}

void resync_timer_fn(unsigned long data)
{
	struct drbd_conf *mdev = (struct drbd_conf *) data;

	if (list_empty(&mdev->resync_work.list))
		drbd_queue_work(&mdev->data.work, &mdev->resync_work);
}

static void fifo_set(struct fifo_buffer *fb, int value)
{
	int i;

	for (i = 0; i < fb->size; i++)
		fb->values[i] = value;
}

static int fifo_push(struct fifo_buffer *fb, int value)
{
	int ov;

	ov = fb->values[fb->head_index];
	fb->values[fb->head_index++] = value;

	if (fb->head_index >= fb->size)
		fb->head_index = 0;

	return ov;
}

static void fifo_add_val(struct fifo_buffer *fb, int value)
{
	int i;

	for (i = 0; i < fb->size; i++)
		fb->values[i] += value;
}
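
/*
 * Worked example (illustrative, not driver code): with a plan buffer of
 * size 3 holding {4, 4, 4}, fifo_push(fb, 0) returns the oldest value 4
 * (the correction to apply in this step) and leaves {4, 4, 0}, oldest
 * first; fifo_add_val(fb, 1) then yields {5, 5, 1}.  drbd_rs_controller()
 * below uses exactly this pair to spread one correction over "steps"
 * future invocations.
 */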

static int drbd_rs_controller(struct drbd_conf *mdev)
{
	unsigned int sect_in;  /* Number of sectors that came in since the last turn */
	unsigned int want;     /* The number of sectors we want in the proxy */
	int req_sect; /* Number of sectors to request in this turn */
	int correction; /* Number of sectors more we need in the proxy */
	int cps; /* correction per invocation of drbd_rs_controller() */
	int steps; /* Number of time steps to plan ahead */
	int curr_corr;
	int max_sect;

	sect_in = atomic_xchg(&mdev->rs_sect_in, 0); /* Number of sectors that came in */
	mdev->rs_in_flight -= sect_in;

	spin_lock(&mdev->peer_seq_lock); /* get an atomic view on mdev->rs_plan_s */

	steps = mdev->rs_plan_s.size; /* (mdev->sync_conf.c_plan_ahead * 10 * SLEEP_TIME) / HZ; */

	if (mdev->rs_in_flight + sect_in == 0) { /* At start of resync */
		want = ((mdev->sync_conf.rate * 2 * SLEEP_TIME) / HZ) * steps;
	} else { /* normal path */
		want = mdev->sync_conf.c_fill_target ? mdev->sync_conf.c_fill_target :
			sect_in * mdev->sync_conf.c_delay_target * HZ / (SLEEP_TIME * 10);
	}

	correction = want - mdev->rs_in_flight - mdev->rs_planed;

	/* Plan ahead */
	cps = correction / steps;
	fifo_add_val(&mdev->rs_plan_s, cps);
	mdev->rs_planed += cps * steps;

	/* What we do in this step */
	curr_corr = fifo_push(&mdev->rs_plan_s, 0);
	spin_unlock(&mdev->peer_seq_lock);
	mdev->rs_planed -= curr_corr;

	req_sect = sect_in + curr_corr;
	if (req_sect < 0)
		req_sect = 0;

	max_sect = (mdev->sync_conf.c_max_rate * 2 * SLEEP_TIME) / HZ;
	if (req_sect > max_sect)
		req_sect = max_sect;

	/*
	dev_warn(DEV, "si=%u if=%d wa=%u co=%d st=%d cps=%d pl=%d cc=%d rs=%d\n",
		 sect_in, mdev->rs_in_flight, want, correction,
		 steps, cps, mdev->rs_planed, curr_corr, req_sect);
	*/

	return req_sect;
}
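
/*
 * Worked example (illustrative; assumes SLEEP_TIME == HZ/10, i.e. one
 * invocation per 100ms): with c_fill_target = 1000 sectors and
 * rs_in_flight + rs_planed = 800, correction = 200; with steps = 10,
 * cps = 20 is added to every plan slot, so the deficit is made up over
 * the next second instead of in a single burst.
 */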

static int drbd_rs_number_requests(struct drbd_conf *mdev)
{
	int number;
	if (mdev->rs_plan_s.size) { /* mdev->sync_conf.c_plan_ahead */
		number = drbd_rs_controller(mdev) >> (BM_BLOCK_SHIFT - 9);
		mdev->c_sync_rate = number * HZ * (BM_BLOCK_SIZE / 1024) / SLEEP_TIME;
	} else {
		mdev->c_sync_rate = mdev->sync_conf.rate;
		number = SLEEP_TIME * mdev->c_sync_rate / ((BM_BLOCK_SIZE / 1024) * HZ);
	}

	/* ignore the amount of pending requests, the resync controller should
	 * throttle down to incoming reply rate soon enough anyways. */
	return number;
}
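
/*
 * Unit check (illustrative; assumes BM_BLOCK_SIZE == 4 KiB and
 * SLEEP_TIME == HZ/10): c_sync_rate is in KiB/s and each request covers
 * one 4 KiB bitmap block, so the fixed-rate branch above works out to
 * number = rate / 40 requests per 100ms slice; e.g. 10000 KiB/s yields
 * 250 requests per invocation.
 */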

static int w_make_resync_request(struct drbd_conf *mdev,
				 struct drbd_work *w, int cancel)
{
	unsigned long bit;
	sector_t sector;
	const sector_t capacity = drbd_get_capacity(mdev->this_bdev);
	int max_bio_size;
	int number, rollback_i, size;
	int align, queued, sndbuf;
	int i = 0;

	if (unlikely(cancel))
		return 1;

	if (mdev->rs_total == 0) {
		/* empty resync? */
		drbd_resync_finished(mdev);
		return 1;
	}

	if (!get_ldev(mdev)) {
		/* Since we only need to access mdev->resync a
		   get_ldev_if_state(mdev,D_FAILED) would be sufficient, but
		   to continue resync with a broken disk makes no sense at
		   all */
		dev_err(DEV, "Disk broke down during resync!\n");
		return 1;
	}

	/* starting with drbd 8.3.8, we can handle multi-bio EEs,
	 * if it should be necessary */
	max_bio_size =
		mdev->agreed_pro_version < 94 ? queue_max_hw_sectors(mdev->rq_queue) << 9 :
		mdev->agreed_pro_version < 95 ?	DRBD_MAX_SIZE_H80_PACKET : DRBD_MAX_BIO_SIZE;

	number = drbd_rs_number_requests(mdev);
	if (number == 0)
		goto requeue;

	for (i = 0; i < number; i++) {
		/* Stop generating RS requests, when half of the send buffer is filled */
		mutex_lock(&mdev->data.mutex);
		if (mdev->data.socket) {
			queued = mdev->data.socket->sk->sk_wmem_queued;
			sndbuf = mdev->data.socket->sk->sk_sndbuf;
		} else {
			queued = 1;
			sndbuf = 0;
		}
		mutex_unlock(&mdev->data.mutex);
		if (queued > sndbuf / 2)
			goto requeue;

next_sector:
		size = BM_BLOCK_SIZE;
		bit  = drbd_bm_find_next(mdev, mdev->bm_resync_fo);

		if (bit == DRBD_END_OF_BITMAP) {
			mdev->bm_resync_fo = drbd_bm_bits(mdev);
			put_ldev(mdev);
			return 1;
		}

		sector = BM_BIT_TO_SECT(bit);

		if (drbd_rs_should_slow_down(mdev, sector) ||
		    drbd_try_rs_begin_io(mdev, sector)) {
			mdev->bm_resync_fo = bit;
			goto requeue;
		}
		mdev->bm_resync_fo = bit + 1;

		if (unlikely(drbd_bm_test_bit(mdev, bit) == 0)) {
			drbd_rs_complete_io(mdev, sector);
			goto next_sector;
		}

#if DRBD_MAX_BIO_SIZE > BM_BLOCK_SIZE
		/* try to find some adjacent bits.
		 * we stop if we have already the maximum req size.
		 *
		 * Additionally always align bigger requests, in order to
		 * be prepared for all stripe sizes of software RAIDs.
		 */
		align = 1;
		rollback_i = i;
		for (;;) {
			if (size + BM_BLOCK_SIZE > max_bio_size)
				break;

			/* Be always aligned */
			if (sector & ((1<<(align+3))-1))
				break;
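			/* The mask requires the start sector to be aligned
			 * to 1 << (align+3) sectors: BM_BLOCK_SIZE is 8
			 * sectors (1 << 3), and align is bumped each time
			 * the request size crosses the next power of two.
			 * E.g. with align == 1 the start must be 16-sector
			 * (8 KiB) aligned before the request grows. */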

			/* do not cross extent boundaries */
			if (((bit+1) & BM_BLOCKS_PER_BM_EXT_MASK) == 0)
				break;
			/* now, is it actually dirty, after all?
			 * caution, drbd_bm_test_bit is tri-state for some
			 * obscure reason; ( b == 0 ) would get the out-of-band
			 * only accidentally right because of the "oddly sized"
			 * adjustment below */
			if (drbd_bm_test_bit(mdev, bit+1) != 1)
				break;
			bit++;
			size += BM_BLOCK_SIZE;
			if ((BM_BLOCK_SIZE << align) <= size)
				align++;
			i++;
		}
		/* if we merged some,
		 * reset the offset to start the next drbd_bm_find_next from */
		if (size > BM_BLOCK_SIZE)
			mdev->bm_resync_fo = bit + 1;
#endif

		/* adjust very last sectors, in case we are oddly sized */
		if (sector + (size>>9) > capacity)
			size = (capacity-sector)<<9;
		if (mdev->agreed_pro_version >= 89 && mdev->csums_tfm) {
			switch (read_for_csum(mdev, sector, size)) {
			case -EIO: /* Disk failure */
				put_ldev(mdev);
				return 0;
			case -EAGAIN: /* allocation failed, or ldev busy */
				drbd_rs_complete_io(mdev, sector);
				mdev->bm_resync_fo = BM_SECT_TO_BIT(sector);
				i = rollback_i;
				goto requeue;
			case 0:
				/* everything ok */
				break;
			default:
				BUG();
			}
		} else {
			inc_rs_pending(mdev);
			if (!drbd_send_drequest(mdev, P_RS_DATA_REQUEST,
					       sector, size, ID_SYNCER)) {
				dev_err(DEV, "drbd_send_drequest() failed, aborting...\n");
				dec_rs_pending(mdev);
				put_ldev(mdev);
				return 0;
			}
		}
	}

	if (mdev->bm_resync_fo >= drbd_bm_bits(mdev)) {
		/* last syncer _request_ was sent,
		 * but the P_RS_DATA_REPLY not yet received.  sync will end (and
		 * next sync group will resume), as soon as we receive the last
		 * resync data block, and the last bit is cleared.
		 * until then resync "work" is "inactive" ...
		 */
		put_ldev(mdev);
		return 1;
	}

 requeue:
	mdev->rs_in_flight += (i << (BM_BLOCK_SHIFT - 9));
	mod_timer(&mdev->resync_timer, jiffies + SLEEP_TIME);
	put_ldev(mdev);
	return 1;
}

static int w_make_ov_request(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	int number, i, size;
	sector_t sector;
	const sector_t capacity = drbd_get_capacity(mdev->this_bdev);

	if (unlikely(cancel))
		return 1;

	number = drbd_rs_number_requests(mdev);

	sector = mdev->ov_position;
	for (i = 0; i < number; i++) {
		if (sector >= capacity) {
			return 1;
		}

		size = BM_BLOCK_SIZE;

		if (drbd_rs_should_slow_down(mdev, sector) ||
		    drbd_try_rs_begin_io(mdev, sector)) {
			mdev->ov_position = sector;
			goto requeue;
		}

		if (sector + (size>>9) > capacity)
			size = (capacity-sector)<<9;

		inc_rs_pending(mdev);
		if (!drbd_send_ov_request(mdev, sector, size)) {
			dec_rs_pending(mdev);
			return 0;
		}
		sector += BM_SECT_PER_BIT;
	}
	mdev->ov_position = sector;

 requeue:
	mdev->rs_in_flight += (i << (BM_BLOCK_SHIFT - 9));
	mod_timer(&mdev->resync_timer, jiffies + SLEEP_TIME);
	return 1;
}


void start_resync_timer_fn(unsigned long data)
{
	struct drbd_conf *mdev = (struct drbd_conf *) data;

	drbd_queue_work(&mdev->data.work, &mdev->start_resync_work);
}

int w_start_resync(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	if (atomic_read(&mdev->unacked_cnt) || atomic_read(&mdev->rs_pending_cnt)) {
		dev_warn(DEV, "w_start_resync later...\n");
		mdev->start_resync_timer.expires = jiffies + HZ/10;
		add_timer(&mdev->start_resync_timer);
		return 1;
	}

	drbd_start_resync(mdev, C_SYNC_SOURCE);
	clear_bit(AHEAD_TO_SYNC_SOURCE, &mdev->current_epoch->flags);
	return 1;
}

int w_ov_finished(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	kfree(w);
	ov_oos_print(mdev);
	drbd_resync_finished(mdev);

	return 1;
}

static int w_resync_finished(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	kfree(w);

	drbd_resync_finished(mdev);

	return 1;
}

static void ping_peer(struct drbd_conf *mdev)
{
	clear_bit(GOT_PING_ACK, &mdev->flags);
	request_ping(mdev);
	wait_event(mdev->misc_wait,
		   test_bit(GOT_PING_ACK, &mdev->flags) || mdev->state.conn < C_CONNECTED);
}

int drbd_resync_finished(struct drbd_conf *mdev)
{
	unsigned long db, dt, dbdt;
	unsigned long n_oos;
	union drbd_state os, ns;
	struct drbd_work *w;
	char *khelper_cmd = NULL;
	int verify_done = 0;

	/* Remove all elements from the resync LRU. Since future actions
	 * might set bits in the (main) bitmap, then the entries in the
	 * resync LRU would be wrong. */
	if (drbd_rs_del_all(mdev)) {
		/* In case this is not possible now, most probably because
		 * there are P_RS_DATA_REPLY Packets lingering on the worker's
		 * queue (or even the read operations for those packets
		 * is not finished by now).   Retry in 100ms. */

		schedule_timeout_interruptible(HZ / 10);
		w = kmalloc(sizeof(struct drbd_work), GFP_ATOMIC);
		if (w) {
			w->cb = w_resync_finished;
			drbd_queue_work(&mdev->data.work, w);
			return 1;
		}
		dev_err(DEV, "Warn failed to drbd_rs_del_all() and to kmalloc(w).\n");
	}

	dt = (jiffies - mdev->rs_start - mdev->rs_paused) / HZ;
	if (dt <= 0)
		dt = 1;
	db = mdev->rs_total;
	dbdt = Bit2KB(db/dt);
	mdev->rs_paused /= HZ;

	if (!get_ldev(mdev))
		goto out;

	ping_peer(mdev);

	spin_lock_irq(&mdev->req_lock);
	os = mdev->state;

	verify_done = (os.conn == C_VERIFY_S || os.conn == C_VERIFY_T);

	/* This protects us against multiple calls (that can happen in the presence
	   of application IO), and against connectivity loss just before we arrive here. */
	if (os.conn <= C_CONNECTED)
		goto out_unlock;

	ns = os;
	ns.conn = C_CONNECTED;

	dev_info(DEV, "%s done (total %lu sec; paused %lu sec; %lu K/sec)\n",
	     verify_done ? "Online verify " : "Resync",
	     dt + mdev->rs_paused, mdev->rs_paused, dbdt);

	n_oos = drbd_bm_total_weight(mdev);

	if (os.conn == C_VERIFY_S || os.conn == C_VERIFY_T) {
		if (n_oos) {
			dev_alert(DEV, "Online verify found %lu %dk block out of sync!\n",
			      n_oos, Bit2KB(1));
			khelper_cmd = "out-of-sync";
		}
	} else {
		D_ASSERT((n_oos - mdev->rs_failed) == 0);

		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T)
			khelper_cmd = "after-resync-target";

		if (mdev->csums_tfm && mdev->rs_total) {
			const unsigned long s = mdev->rs_same_csum;
			const unsigned long t = mdev->rs_total;
			const int ratio =
				(t == 0)     ? 0 :
			(t < 100000) ? ((s*100)/t) : (s/(t/100));
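			/* for large t, s/(t/100) presumably avoids
			 * overflowing (s*100) in unsigned long arithmetic
			 * on 32-bit, at the cost of some precision */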
			dev_info(DEV, "%u %% had equal check sums, eliminated: %luK; "
			     "transferred %luK total %luK\n",
			     ratio,
			     Bit2KB(mdev->rs_same_csum),
			     Bit2KB(mdev->rs_total - mdev->rs_same_csum),
			     Bit2KB(mdev->rs_total));
		}
	}

	if (mdev->rs_failed) {
		dev_info(DEV, "            %lu failed blocks\n", mdev->rs_failed);

		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) {
			ns.disk = D_INCONSISTENT;
			ns.pdsk = D_UP_TO_DATE;
		} else {
			ns.disk = D_UP_TO_DATE;
			ns.pdsk = D_INCONSISTENT;
		}
	} else {
		ns.disk = D_UP_TO_DATE;
		ns.pdsk = D_UP_TO_DATE;

		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) {
			if (mdev->p_uuid) {
				int i;
				for (i = UI_BITMAP ; i <= UI_HISTORY_END ; i++)
					_drbd_uuid_set(mdev, i, mdev->p_uuid[i]);
				drbd_uuid_set(mdev, UI_BITMAP, mdev->ldev->md.uuid[UI_CURRENT]);
				_drbd_uuid_set(mdev, UI_CURRENT, mdev->p_uuid[UI_CURRENT]);
			} else {
				dev_err(DEV, "mdev->p_uuid is NULL! BUG\n");
			}
		}

		if (!(os.conn == C_VERIFY_S || os.conn == C_VERIFY_T)) {
			/* for verify runs, we don't update uuids here,
			 * so there would be nothing to report. */
			drbd_uuid_set_bm(mdev, 0UL);
			drbd_print_uuids(mdev, "updated UUIDs");
			if (mdev->p_uuid) {
				/* Now the two UUID sets are equal, update what we
				 * know of the peer. */
				int i;
				for (i = UI_CURRENT ; i <= UI_HISTORY_END ; i++)
					mdev->p_uuid[i] = mdev->ldev->md.uuid[i];
			}
		}
	}

	_drbd_set_state(mdev, ns, CS_VERBOSE, NULL);
out_unlock:
	spin_unlock_irq(&mdev->req_lock);
	put_ldev(mdev);
out:
	mdev->rs_total  = 0;
	mdev->rs_failed = 0;
	mdev->rs_paused = 0;
	if (verify_done)
		mdev->ov_start_sector = 0;

	drbd_md_sync(mdev);

	if (khelper_cmd)
		drbd_khelper(mdev, khelper_cmd);

	return 1;
}

/* helper */
static void move_to_net_ee_or_free(struct drbd_conf *mdev, struct drbd_epoch_entry *e)
{
	if (drbd_ee_has_active_page(e)) {
		/* This might happen if sendpage() has not finished */
		int i = (e->size + PAGE_SIZE -1) >> PAGE_SHIFT;
		atomic_add(i, &mdev->pp_in_use_by_net);
		atomic_sub(i, &mdev->pp_in_use);
		spin_lock_irq(&mdev->req_lock);
		list_add_tail(&e->w.list, &mdev->net_ee);
		spin_unlock_irq(&mdev->req_lock);
		wake_up(&drbd_pp_wait);
	} else
		drbd_free_ee(mdev, e);
}

/**
 * w_e_end_data_req() - Worker callback, to send a P_DATA_REPLY packet in response to a P_DATA_REQUEST
 * @mdev:	DRBD device.
 * @w:		work object.
 * @cancel:	The connection will be closed anyways
 */
int w_e_end_data_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
	int ok;

	if (unlikely(cancel)) {
		drbd_free_ee(mdev, e);
		dec_unacked(mdev);
		return 1;
	}

	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
		ok = drbd_send_block(mdev, P_DATA_REPLY, e);
	} else {
		if (__ratelimit(&drbd_ratelimit_state))
			dev_err(DEV, "Sending NegDReply. sector=%llus.\n",
			    (unsigned long long)e->sector);

		ok = drbd_send_ack(mdev, P_NEG_DREPLY, e);
	}

	dec_unacked(mdev);

	move_to_net_ee_or_free(mdev, e);

	if (unlikely(!ok))
		dev_err(DEV, "drbd_send_block() failed\n");
	return ok;
}

/**
 * w_e_end_rsdata_req() - Worker callback to send a P_RS_DATA_REPLY packet in response to a P_RS_DATA_REQUEST
 * @mdev:	DRBD device.
 * @w:		work object.
 * @cancel:	The connection will be closed anyways
 */
int w_e_end_rsdata_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
{
	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
	int ok;

	if (unlikely(cancel)) {
		drbd_free_ee(mdev, e);
		dec_unacked(mdev);
		return 1;
	}

	if (get_ldev_if_state(mdev, D_FAILED)) {
		drbd_rs_complete_io(mdev, e->sector);
		put_ldev(mdev);
	}

	if (mdev->state.conn == C_AHEAD) {
		ok = drbd_send_ack(mdev, P_RS_CANCEL, e);
	} else if (likely((e->flags & EE_WAS_ERROR) == 0)) {
		if (likely(mdev->state.pdsk >= D_INCONSISTENT)) {
			inc_rs_pending(mdev);
			ok = drbd_send_block(mdev, P_RS_DATA_REPLY, e);
		} else {
			if (__ratelimit(&drbd_ratelimit_state))
				dev_err(DEV, "Not sending RSDataReply, "
				    "partner DISKLESS!\n");
			ok = 1;
		}
	} else {
		if (__ratelimit(&drbd_ratelimit_state))
			dev_err(DEV, "Sending NegRSDReply. sector %llus.\n",
			    (unsigned long long)e->sector);

		ok = drbd_send_ack(mdev, P_NEG_RS_DREPLY, e);

		/* update resync data with failure */
		drbd_rs_failed_io(mdev, e->sector, e->size);
	}

	dec_unacked(mdev);

	move_to_net_ee_or_free(mdev, e);

	if (unlikely(!ok))
		dev_err(DEV, "drbd_send_block() failed\n");
	return ok;
}
1011b411b363SPhilipp Reisner 
1012b411b363SPhilipp Reisner int w_e_end_csum_rs_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1013b411b363SPhilipp Reisner {
1014b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
1015b411b363SPhilipp Reisner 	struct digest_info *di;
1016b411b363SPhilipp Reisner 	int digest_size;
1017b411b363SPhilipp Reisner 	void *digest = NULL;
1018b411b363SPhilipp Reisner 	int ok, eq = 0;
1019b411b363SPhilipp Reisner 
1020b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1021b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
1022b411b363SPhilipp Reisner 		dec_unacked(mdev);
1023b411b363SPhilipp Reisner 		return 1;
1024b411b363SPhilipp Reisner 	}
1025b411b363SPhilipp Reisner 
10261d53f09eSLars Ellenberg 	if (get_ldev(mdev)) {
1027b411b363SPhilipp Reisner 		drbd_rs_complete_io(mdev, e->sector);
10281d53f09eSLars Ellenberg 		put_ldev(mdev);
10291d53f09eSLars Ellenberg 	}
1030b411b363SPhilipp Reisner 
103185719573SPhilipp Reisner 	di = e->digest;
1032b411b363SPhilipp Reisner 
103345bb912bSLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
1034b411b363SPhilipp Reisner 		/* quick hack to try to avoid a race against reconfiguration.
1035b411b363SPhilipp Reisner 		 * a real fix would be much more involved,
1036b411b363SPhilipp Reisner 		 * introducing more locking mechanisms */
1037b411b363SPhilipp Reisner 		if (mdev->csums_tfm) {
1038b411b363SPhilipp Reisner 			digest_size = crypto_hash_digestsize(mdev->csums_tfm);
1039b411b363SPhilipp Reisner 			D_ASSERT(digest_size == di->digest_size);
1040b411b363SPhilipp Reisner 			digest = kmalloc(digest_size, GFP_NOIO);
1041b411b363SPhilipp Reisner 		}
1042b411b363SPhilipp Reisner 		if (digest) {
104345bb912bSLars Ellenberg 			drbd_csum_ee(mdev, mdev->csums_tfm, e, digest);
1044b411b363SPhilipp Reisner 			eq = !memcmp(digest, di->digest, digest_size);
1045b411b363SPhilipp Reisner 			kfree(digest);
1046b411b363SPhilipp Reisner 		}
1047b411b363SPhilipp Reisner 
1048b411b363SPhilipp Reisner 		if (eq) {
1049b411b363SPhilipp Reisner 			drbd_set_in_sync(mdev, e->sector, e->size);
1050676396d5SLars Ellenberg 			/* rs_same_csums unit is BM_BLOCK_SIZE */
1051676396d5SLars Ellenberg 			mdev->rs_same_csum += e->size >> BM_BLOCK_SHIFT;
1052b411b363SPhilipp Reisner 			ok = drbd_send_ack(mdev, P_RS_IS_IN_SYNC, e);
1053b411b363SPhilipp Reisner 		} else {
1054b411b363SPhilipp Reisner 			inc_rs_pending(mdev);
1055204bba99SPhilipp Reisner 			e->block_id = ID_SYNCER; /* By setting block_id, digest pointer becomes invalid! */
1056204bba99SPhilipp Reisner 			e->flags &= ~EE_HAS_DIGEST; /* This e no longer has a digest pointer */
1057204bba99SPhilipp Reisner 			kfree(di);
1058b411b363SPhilipp Reisner 			ok = drbd_send_block(mdev, P_RS_DATA_REPLY, e);
1059b411b363SPhilipp Reisner 		}
1060b411b363SPhilipp Reisner 	} else {
1061b411b363SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_NEG_RS_DREPLY, e);
1062b411b363SPhilipp Reisner 		if (__ratelimit(&drbd_ratelimit_state))
1063b411b363SPhilipp Reisner 			dev_err(DEV, "Sending NegRSDReply. I guess it gets messy.\n");
1064b411b363SPhilipp Reisner 	}
1065b411b363SPhilipp Reisner 
1066b411b363SPhilipp Reisner 	dec_unacked(mdev);
1067b411b363SPhilipp Reisner 	move_to_net_ee_or_free(mdev, e);
1068b411b363SPhilipp Reisner 
1069b411b363SPhilipp Reisner 	if (unlikely(!ok))
1070b411b363SPhilipp Reisner 		dev_err(DEV, "drbd_send_block/ack() failed\n");
1071b411b363SPhilipp Reisner 	return ok;
1072b411b363SPhilipp Reisner }
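
#if 0
/* Hedged arithmetic sketch (not compiled): rs_same_csum above is
 * accounted in BM_BLOCK_SIZE units.  Assuming the usual
 * BM_BLOCK_SHIFT of 12 (4 KiB bitmap granularity), an
 * equal-checksum 32 KiB epoch entry adds 8 such units. */
static unsigned int example_same_csum_units(struct drbd_epoch_entry *e)
{
	return e->size >> BM_BLOCK_SHIFT;	/* e.g. 32768 >> 12 == 8 */
}
#endif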
1073b411b363SPhilipp Reisner 
1074b411b363SPhilipp Reisner int w_e_end_ov_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1075b411b363SPhilipp Reisner {
1076b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
1077b411b363SPhilipp Reisner 	int digest_size;
1078b411b363SPhilipp Reisner 	void *digest;
1079b411b363SPhilipp Reisner 	int ok = 1;
1080b411b363SPhilipp Reisner 
1081b411b363SPhilipp Reisner 	if (unlikely(cancel))
1082b411b363SPhilipp Reisner 		goto out;
1083b411b363SPhilipp Reisner 
108445bb912bSLars Ellenberg 	if (unlikely((e->flags & EE_WAS_ERROR) != 0))
1085b411b363SPhilipp Reisner 		goto out;
1086b411b363SPhilipp Reisner 
1087b411b363SPhilipp Reisner 	digest_size = crypto_hash_digestsize(mdev->verify_tfm);
1088b411b363SPhilipp Reisner 	/* FIXME if this allocation fails, online verify will not terminate! */
1089b411b363SPhilipp Reisner 	digest = kmalloc(digest_size, GFP_NOIO);
1090b411b363SPhilipp Reisner 	if (digest) {
109145bb912bSLars Ellenberg 		drbd_csum_ee(mdev, mdev->verify_tfm, e, digest);
1092b411b363SPhilipp Reisner 		inc_rs_pending(mdev);
1093b411b363SPhilipp Reisner 		ok = drbd_send_drequest_csum(mdev, e->sector, e->size,
1094b411b363SPhilipp Reisner 					     digest, digest_size, P_OV_REPLY);
1095b411b363SPhilipp Reisner 		if (!ok)
1096b411b363SPhilipp Reisner 			dec_rs_pending(mdev);
1097b411b363SPhilipp Reisner 		kfree(digest);
1098b411b363SPhilipp Reisner 	}
1099b411b363SPhilipp Reisner 
1100b411b363SPhilipp Reisner out:
1101b411b363SPhilipp Reisner 	drbd_free_ee(mdev, e);
1102b411b363SPhilipp Reisner 
1103b411b363SPhilipp Reisner 	dec_unacked(mdev);
1104b411b363SPhilipp Reisner 
1105b411b363SPhilipp Reisner 	return ok;
1106b411b363SPhilipp Reisner }
1107b411b363SPhilipp Reisner 
1108b411b363SPhilipp Reisner void drbd_ov_oos_found(struct drbd_conf *mdev, sector_t sector, int size)
1109b411b363SPhilipp Reisner {
1110b411b363SPhilipp Reisner 	if (mdev->ov_last_oos_start + mdev->ov_last_oos_size == sector) {
1111b411b363SPhilipp Reisner 		mdev->ov_last_oos_size += size>>9;
1112b411b363SPhilipp Reisner 	} else {
1113b411b363SPhilipp Reisner 		mdev->ov_last_oos_start = sector;
1114b411b363SPhilipp Reisner 		mdev->ov_last_oos_size = size>>9;
1115b411b363SPhilipp Reisner 	}
1116b411b363SPhilipp Reisner 	drbd_set_out_of_sync(mdev, sector, size);
1117b411b363SPhilipp Reisner }
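
#if 0
/* Hedged usage sketch (not compiled): adjacent out-of-sync blocks
 * found by online verify coalesce into a single reported range.
 * The sector numbers are made up for illustration; 4096 bytes are
 * 8 sectors of 512 bytes. */
static void example_ov_oos_merge(struct drbd_conf *mdev)
{
	drbd_ov_oos_found(mdev, 1000, 4096);	/* opens a range: 8 sectors at 1000 */
	drbd_ov_oos_found(mdev, 1008, 4096);	/* adjacent: the range grows to 16 sectors */
	drbd_ov_oos_found(mdev, 5000, 4096);	/* not adjacent: starts a new range */
}
#endif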
1118b411b363SPhilipp Reisner 
1119b411b363SPhilipp Reisner int w_e_end_ov_reply(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1120b411b363SPhilipp Reisner {
1121b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
1122b411b363SPhilipp Reisner 	struct digest_info *di;
1123b411b363SPhilipp Reisner 	int digest_size;
1124b411b363SPhilipp Reisner 	void *digest;
1125b411b363SPhilipp Reisner 	int ok, eq = 0;
1126b411b363SPhilipp Reisner 
1127b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1128b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
1129b411b363SPhilipp Reisner 		dec_unacked(mdev);
1130b411b363SPhilipp Reisner 		return 1;
1131b411b363SPhilipp Reisner 	}
1132b411b363SPhilipp Reisner 
1133b411b363SPhilipp Reisner 	/* after "cancel", because after drbd_disconnect/drbd_rs_cancel_all
1134b411b363SPhilipp Reisner 	 * the resync lru has been cleaned up already */
11351d53f09eSLars Ellenberg 	if (get_ldev(mdev)) {
1136b411b363SPhilipp Reisner 		drbd_rs_complete_io(mdev, e->sector);
11371d53f09eSLars Ellenberg 		put_ldev(mdev);
11381d53f09eSLars Ellenberg 	}
1139b411b363SPhilipp Reisner 
114085719573SPhilipp Reisner 	di = e->digest;
1141b411b363SPhilipp Reisner 
114245bb912bSLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
1143b411b363SPhilipp Reisner 		digest_size = crypto_hash_digestsize(mdev->verify_tfm);
1144b411b363SPhilipp Reisner 		digest = kmalloc(digest_size, GFP_NOIO);
1145b411b363SPhilipp Reisner 		if (digest) {
114645bb912bSLars Ellenberg 			drbd_csum_ee(mdev, mdev->verify_tfm, e, digest);
1147b411b363SPhilipp Reisner 
1148b411b363SPhilipp Reisner 			D_ASSERT(digest_size == di->digest_size);
1149b411b363SPhilipp Reisner 			eq = !memcmp(digest, di->digest, digest_size);
1150b411b363SPhilipp Reisner 			kfree(digest);
1151b411b363SPhilipp Reisner 		}
1152b411b363SPhilipp Reisner 	} else {
1153b411b363SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_NEG_RS_DREPLY, e);
1154b411b363SPhilipp Reisner 		if (__ratelimit(&drbd_ratelimit_state))
1155b411b363SPhilipp Reisner 			dev_err(DEV, "Sending NegRSDReply. I guess it gets messy.\n");
1156b411b363SPhilipp Reisner 	}
1157b411b363SPhilipp Reisner 
1158b411b363SPhilipp Reisner 	dec_unacked(mdev);
1159b411b363SPhilipp Reisner 	if (!eq)
1160b411b363SPhilipp Reisner 		drbd_ov_oos_found(mdev, e->sector, e->size);
1161b411b363SPhilipp Reisner 	else
1162b411b363SPhilipp Reisner 		ov_oos_print(mdev);
1163b411b363SPhilipp Reisner 
1164b411b363SPhilipp Reisner 	ok = drbd_send_ack_ex(mdev, P_OV_RESULT, e->sector, e->size,
1165b411b363SPhilipp Reisner 			      eq ? ID_IN_SYNC : ID_OUT_OF_SYNC);
1166b411b363SPhilipp Reisner 
1167b411b363SPhilipp Reisner 	drbd_free_ee(mdev, e);
1168b411b363SPhilipp Reisner 
1169ea5442afSLars Ellenberg 	--mdev->ov_left;
1170ea5442afSLars Ellenberg 
1171ea5442afSLars Ellenberg 	/* let's advance progress step marks only for every other megabyte */
1172ea5442afSLars Ellenberg 	if ((mdev->ov_left & 0x200) == 0x200)
1173ea5442afSLars Ellenberg 		drbd_advance_rs_marks(mdev, mdev->ov_left);
1174ea5442afSLars Ellenberg 
1175ea5442afSLars Ellenberg 	if (mdev->ov_left == 0) {
1176b411b363SPhilipp Reisner 		ov_oos_print(mdev);
1177b411b363SPhilipp Reisner 		drbd_resync_finished(mdev);
1178b411b363SPhilipp Reisner 	}
1179b411b363SPhilipp Reisner 
1180b411b363SPhilipp Reisner 	return ok;
1181b411b363SPhilipp Reisner }
1182b411b363SPhilipp Reisner 
1183b411b363SPhilipp Reisner int w_prev_work_done(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1184b411b363SPhilipp Reisner {
1185b411b363SPhilipp Reisner 	struct drbd_wq_barrier *b = container_of(w, struct drbd_wq_barrier, w);
1186b411b363SPhilipp Reisner 	complete(&b->done);
1187b411b363SPhilipp Reisner 	return 1;
1188b411b363SPhilipp Reisner }
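
#if 0
/* Hedged usage sketch (not compiled): w_prev_work_done is the
 * completion half of a work-queue flush.  A caller queues a
 * drbd_wq_barrier and sleeps until the worker has processed
 * everything queued before it.  drbd_queue_work() is assumed to be
 * the queueing helper from drbd_int.h. */
static void example_flush_worker(struct drbd_conf *mdev)
{
	struct drbd_wq_barrier b;

	b.w.cb = w_prev_work_done;
	init_completion(&b.done);
	drbd_queue_work(&mdev->data.work, &b.w);
	wait_for_completion(&b.done);
}
#endif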
1189b411b363SPhilipp Reisner 
1190b411b363SPhilipp Reisner int w_send_barrier(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1191b411b363SPhilipp Reisner {
1192b411b363SPhilipp Reisner 	struct drbd_tl_epoch *b = container_of(w, struct drbd_tl_epoch, w);
1193b411b363SPhilipp Reisner 	struct p_barrier *p = &mdev->data.sbuf.barrier;
1194b411b363SPhilipp Reisner 	int ok = 1;
1195b411b363SPhilipp Reisner 
1196b411b363SPhilipp Reisner 	/* really avoid racing with tl_clear.  w.cb may have been referenced
1197b411b363SPhilipp Reisner 	 * just before it was reassigned and re-queued, so double check that.
1198b411b363SPhilipp Reisner 	 * actually, this race was harmless, since we only try to send the
1199b411b363SPhilipp Reisner 	 * barrier packet here, and otherwise do nothing with the object.
1200b411b363SPhilipp Reisner 	 * but compare with the head of w_clear_epoch */
1201b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->req_lock);
1202b411b363SPhilipp Reisner 	if (w->cb != w_send_barrier || mdev->state.conn < C_CONNECTED)
1203b411b363SPhilipp Reisner 		cancel = 1;
1204b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->req_lock);
1205b411b363SPhilipp Reisner 	if (cancel)
1206b411b363SPhilipp Reisner 		return 1;
1207b411b363SPhilipp Reisner 
1208b411b363SPhilipp Reisner 	if (!drbd_get_data_sock(mdev))
1209b411b363SPhilipp Reisner 		return 0;
1210b411b363SPhilipp Reisner 	p->barrier = b->br_number;
1211b411b363SPhilipp Reisner 	/* inc_ap_pending was done where this was queued.
1212b411b363SPhilipp Reisner 	 * dec_ap_pending will be done in got_BarrierAck
1213b411b363SPhilipp Reisner 	 * or (on connection loss) in w_clear_epoch.  */
1214b411b363SPhilipp Reisner 	ok = _drbd_send_cmd(mdev, mdev->data.socket, P_BARRIER,
12150b70a13dSPhilipp Reisner 				(struct p_header80 *)p, sizeof(*p), 0);
1216b411b363SPhilipp Reisner 	drbd_put_data_sock(mdev);
1217b411b363SPhilipp Reisner 
1218b411b363SPhilipp Reisner 	return ok;
1219b411b363SPhilipp Reisner }
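
#if 0
/* Hedged sketch (not compiled) of the ap_pending accounting around
 * a barrier: the reference is taken where the barrier work is
 * queued and dropped either by got_BarrierAck() on the normal path
 * or by w_clear_epoch() on connection loss; w_send_barrier() itself
 * never touches it. */
static void example_barrier_accounting(struct drbd_conf *mdev)
{
	inc_ap_pending(mdev);	/* where the barrier work is queued */
	/* ... w_send_barrier() runs, P_BARRIER goes out ... */
	dec_ap_pending(mdev);	/* got_BarrierAck() or w_clear_epoch() */
}
#endif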
1220b411b363SPhilipp Reisner 
1221b411b363SPhilipp Reisner int w_send_write_hint(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1222b411b363SPhilipp Reisner {
1223b411b363SPhilipp Reisner 	if (cancel)
1224b411b363SPhilipp Reisner 		return 1;
1225b411b363SPhilipp Reisner 	return drbd_send_short_cmd(mdev, P_UNPLUG_REMOTE);
1226b411b363SPhilipp Reisner }
1227b411b363SPhilipp Reisner 
122873a01a18SPhilipp Reisner int w_send_oos(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
122973a01a18SPhilipp Reisner {
123073a01a18SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
123173a01a18SPhilipp Reisner 	int ok;
123273a01a18SPhilipp Reisner 
123373a01a18SPhilipp Reisner 	if (unlikely(cancel)) {
123473a01a18SPhilipp Reisner 		req_mod(req, send_canceled);
123573a01a18SPhilipp Reisner 		return 1;
123673a01a18SPhilipp Reisner 	}
123773a01a18SPhilipp Reisner 
123873a01a18SPhilipp Reisner 	ok = drbd_send_oos(mdev, req);
123973a01a18SPhilipp Reisner 	req_mod(req, oos_handed_to_network);
124073a01a18SPhilipp Reisner 
124173a01a18SPhilipp Reisner 	return ok;
124273a01a18SPhilipp Reisner }
124373a01a18SPhilipp Reisner 
1244b411b363SPhilipp Reisner /**
1245b411b363SPhilipp Reisner  * w_send_dblock() - Worker callback to send a P_DATA packet in order to mirror a write request
1246b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1247b411b363SPhilipp Reisner  * @w:		work object.
1248b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyway
1249b411b363SPhilipp Reisner  */
1250b411b363SPhilipp Reisner int w_send_dblock(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1251b411b363SPhilipp Reisner {
1252b411b363SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
1253b411b363SPhilipp Reisner 	int ok;
1254b411b363SPhilipp Reisner 
1255b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1256b411b363SPhilipp Reisner 		req_mod(req, send_canceled);
1257b411b363SPhilipp Reisner 		return 1;
1258b411b363SPhilipp Reisner 	}
1259b411b363SPhilipp Reisner 
1260b411b363SPhilipp Reisner 	ok = drbd_send_dblock(mdev, req);
1261b411b363SPhilipp Reisner 	req_mod(req, ok ? handed_over_to_network : send_failed);
1262b411b363SPhilipp Reisner 
1263b411b363SPhilipp Reisner 	return ok;
1264b411b363SPhilipp Reisner }
1265b411b363SPhilipp Reisner 
1266b411b363SPhilipp Reisner /**
1267b411b363SPhilipp Reisner  * w_send_read_req() - Worker callback to send a read request (P_DATA_REQUEST) packet
1268b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1269b411b363SPhilipp Reisner  * @w:		work object.
1270b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyway
1271b411b363SPhilipp Reisner  */
1272b411b363SPhilipp Reisner int w_send_read_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1273b411b363SPhilipp Reisner {
1274b411b363SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
1275b411b363SPhilipp Reisner 	int ok;
1276b411b363SPhilipp Reisner 
1277b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1278b411b363SPhilipp Reisner 		req_mod(req, send_canceled);
1279b411b363SPhilipp Reisner 		return 1;
1280b411b363SPhilipp Reisner 	}
1281b411b363SPhilipp Reisner 
1282b411b363SPhilipp Reisner 	ok = drbd_send_drequest(mdev, P_DATA_REQUEST, req->sector, req->size,
1283b411b363SPhilipp Reisner 				(unsigned long)req);
1284b411b363SPhilipp Reisner 
1285b411b363SPhilipp Reisner 	if (!ok) {
1286b411b363SPhilipp Reisner 		/* ?? we set C_TIMEOUT or C_BROKEN_PIPE in drbd_send();
1287b411b363SPhilipp Reisner 		 * so this is probably redundant */
1288b411b363SPhilipp Reisner 		if (mdev->state.conn >= C_CONNECTED)
1289b411b363SPhilipp Reisner 			drbd_force_state(mdev, NS(conn, C_NETWORK_FAILURE));
1290b411b363SPhilipp Reisner 	}
1291b411b363SPhilipp Reisner 	req_mod(req, ok ? handed_over_to_network : send_failed);
1292b411b363SPhilipp Reisner 
1293b411b363SPhilipp Reisner 	return ok;
1294b411b363SPhilipp Reisner }
1295b411b363SPhilipp Reisner 
1296265be2d0SPhilipp Reisner int w_restart_disk_io(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1297265be2d0SPhilipp Reisner {
1298265be2d0SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
1299265be2d0SPhilipp Reisner 
13000778286aSPhilipp Reisner 	if (bio_data_dir(req->master_bio) == WRITE && req->rq_state & RQ_IN_ACT_LOG)
1301265be2d0SPhilipp Reisner 		drbd_al_begin_io(mdev, req->sector);
1302265be2d0SPhilipp Reisner 	/* Calling drbd_al_begin_io() out of the worker might deadlock
1303265be2d0SPhilipp Reisner 	   in theory. In practice it cannot deadlock, since this path is
1304265be2d0SPhilipp Reisner 	   only used when unfreezing IO. All the extents of the requests
1305265be2d0SPhilipp Reisner 	   that made it into the TL are already active */
1306265be2d0SPhilipp Reisner 
1307265be2d0SPhilipp Reisner 	drbd_req_make_private_bio(req, req->master_bio);
1308265be2d0SPhilipp Reisner 	req->private_bio->bi_bdev = mdev->ldev->backing_bdev;
1309265be2d0SPhilipp Reisner 	generic_make_request(req->private_bio);
1310265be2d0SPhilipp Reisner 
1311265be2d0SPhilipp Reisner 	return 1;
1312265be2d0SPhilipp Reisner }
1313265be2d0SPhilipp Reisner 
1314b411b363SPhilipp Reisner static int _drbd_may_sync_now(struct drbd_conf *mdev)
1315b411b363SPhilipp Reisner {
1316b411b363SPhilipp Reisner 	struct drbd_conf *odev = mdev;
1317b411b363SPhilipp Reisner 
1318b411b363SPhilipp Reisner 	while (1) {
1319b411b363SPhilipp Reisner 		if (odev->sync_conf.after == -1)
1320b411b363SPhilipp Reisner 			return 1;
1321b411b363SPhilipp Reisner 		odev = minor_to_mdev(odev->sync_conf.after);
1322b411b363SPhilipp Reisner 		ERR_IF(!odev) return 1;
1323b411b363SPhilipp Reisner 		if ((odev->state.conn >= C_SYNC_SOURCE &&
1324b411b363SPhilipp Reisner 		     odev->state.conn <= C_PAUSED_SYNC_T) ||
1325b411b363SPhilipp Reisner 		    odev->state.aftr_isp || odev->state.peer_isp ||
1326b411b363SPhilipp Reisner 		    odev->state.user_isp)
1327b411b363SPhilipp Reisner 			return 0;
1328b411b363SPhilipp Reisner 	}
1329b411b363SPhilipp Reisner }
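
#if 0
/* Hedged sketch (not compiled): with a sync-after chain of
 * minor 2 -> minor 1 -> minor 0, _drbd_may_sync_now() for minor 2
 * follows sync_conf.after until it reaches the chain end (-1) or
 * finds an ancestor that is resyncing or suspended, in which case
 * the answer is 0.  Minor numbers are made up for illustration. */
static int example_chain_may_sync(void)
{
	struct drbd_conf *odev = minor_to_mdev(2);

	return odev ? _drbd_may_sync_now(odev) : 1;
}
#endif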
1330b411b363SPhilipp Reisner 
1331b411b363SPhilipp Reisner /**
1332b411b363SPhilipp Reisner  * _drbd_pause_after() - Pause resync on all devices that may not resync now
1333b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1334b411b363SPhilipp Reisner  *
1335b411b363SPhilipp Reisner  * Called from process context only (admin command and after_state_ch).
1336b411b363SPhilipp Reisner  */
1337b411b363SPhilipp Reisner static int _drbd_pause_after(struct drbd_conf *mdev)
1338b411b363SPhilipp Reisner {
1339b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1340b411b363SPhilipp Reisner 	int i, rv = 0;
1341b411b363SPhilipp Reisner 
1342b411b363SPhilipp Reisner 	for (i = 0; i < minor_count; i++) {
1343b411b363SPhilipp Reisner 		odev = minor_to_mdev(i);
1344b411b363SPhilipp Reisner 		if (!odev)
1345b411b363SPhilipp Reisner 			continue;
1346b411b363SPhilipp Reisner 		if (odev->state.conn == C_STANDALONE && odev->state.disk == D_DISKLESS)
1347b411b363SPhilipp Reisner 			continue;
1348b411b363SPhilipp Reisner 		if (!_drbd_may_sync_now(odev))
1349b411b363SPhilipp Reisner 			rv |= (__drbd_set_state(_NS(odev, aftr_isp, 1), CS_HARD, NULL)
1350b411b363SPhilipp Reisner 			       != SS_NOTHING_TO_DO);
1351b411b363SPhilipp Reisner 	}
1352b411b363SPhilipp Reisner 
1353b411b363SPhilipp Reisner 	return rv;
1354b411b363SPhilipp Reisner }
1355b411b363SPhilipp Reisner 
1356b411b363SPhilipp Reisner /**
1357b411b363SPhilipp Reisner  * _drbd_resume_next() - Resume resync on all devices that may resync now
1358b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1359b411b363SPhilipp Reisner  *
1360b411b363SPhilipp Reisner  * Called from process context only (admin command and worker).
1361b411b363SPhilipp Reisner  */
1362b411b363SPhilipp Reisner static int _drbd_resume_next(struct drbd_conf *mdev)
1363b411b363SPhilipp Reisner {
1364b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1365b411b363SPhilipp Reisner 	int i, rv = 0;
1366b411b363SPhilipp Reisner 
1367b411b363SPhilipp Reisner 	for (i = 0; i < minor_count; i++) {
1368b411b363SPhilipp Reisner 		odev = minor_to_mdev(i);
1369b411b363SPhilipp Reisner 		if (!odev)
1370b411b363SPhilipp Reisner 			continue;
1371b411b363SPhilipp Reisner 		if (odev->state.conn == C_STANDALONE && odev->state.disk == D_DISKLESS)
1372b411b363SPhilipp Reisner 			continue;
1373b411b363SPhilipp Reisner 		if (odev->state.aftr_isp) {
1374b411b363SPhilipp Reisner 			if (_drbd_may_sync_now(odev))
1375b411b363SPhilipp Reisner 				rv |= (__drbd_set_state(_NS(odev, aftr_isp, 0),
1376b411b363SPhilipp Reisner 							CS_HARD, NULL)
1377b411b363SPhilipp Reisner 				       != SS_NOTHING_TO_DO) ;
1378b411b363SPhilipp Reisner 		}
1379b411b363SPhilipp Reisner 	}
1380b411b363SPhilipp Reisner 	return rv;
1381b411b363SPhilipp Reisner }
1382b411b363SPhilipp Reisner 
1383b411b363SPhilipp Reisner void resume_next_sg(struct drbd_conf *mdev)
1384b411b363SPhilipp Reisner {
1385b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1386b411b363SPhilipp Reisner 	_drbd_resume_next(mdev);
1387b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1388b411b363SPhilipp Reisner }
1389b411b363SPhilipp Reisner 
1390b411b363SPhilipp Reisner void suspend_other_sg(struct drbd_conf *mdev)
1391b411b363SPhilipp Reisner {
1392b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1393b411b363SPhilipp Reisner 	_drbd_pause_after(mdev);
1394b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1395b411b363SPhilipp Reisner }
1396b411b363SPhilipp Reisner 
1397b411b363SPhilipp Reisner static int sync_after_error(struct drbd_conf *mdev, int o_minor)
1398b411b363SPhilipp Reisner {
1399b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1400b411b363SPhilipp Reisner 
1401b411b363SPhilipp Reisner 	if (o_minor == -1)
1402b411b363SPhilipp Reisner 		return NO_ERROR;
1403b411b363SPhilipp Reisner 	if (o_minor < -1 || minor_to_mdev(o_minor) == NULL)
1404b411b363SPhilipp Reisner 		return ERR_SYNC_AFTER;
1405b411b363SPhilipp Reisner 
1406b411b363SPhilipp Reisner 	/* check for loops */
1407b411b363SPhilipp Reisner 	odev = minor_to_mdev(o_minor);
1408b411b363SPhilipp Reisner 	while (1) {
1409b411b363SPhilipp Reisner 		if (odev == mdev)
1410b411b363SPhilipp Reisner 			return ERR_SYNC_AFTER_CYCLE;
1411b411b363SPhilipp Reisner 
1412b411b363SPhilipp Reisner 		/* dependency chain ends here, no cycles. */
1413b411b363SPhilipp Reisner 		if (odev->sync_conf.after == -1)
1414b411b363SPhilipp Reisner 			return NO_ERROR;
1415b411b363SPhilipp Reisner 
1416b411b363SPhilipp Reisner 		/* follow the dependency chain */
1417b411b363SPhilipp Reisner 		odev = minor_to_mdev(odev->sync_conf.after);
1418b411b363SPhilipp Reisner 	}
1419b411b363SPhilipp Reisner }
1420b411b363SPhilipp Reisner 
1421b411b363SPhilipp Reisner int drbd_alter_sa(struct drbd_conf *mdev, int na)
1422b411b363SPhilipp Reisner {
1423b411b363SPhilipp Reisner 	int changes;
1424b411b363SPhilipp Reisner 	int retcode;
1425b411b363SPhilipp Reisner 
1426b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1427b411b363SPhilipp Reisner 	retcode = sync_after_error(mdev, na);
1428b411b363SPhilipp Reisner 	if (retcode == NO_ERROR) {
1429b411b363SPhilipp Reisner 		mdev->sync_conf.after = na;
1430b411b363SPhilipp Reisner 		do {
1431b411b363SPhilipp Reisner 			changes  = _drbd_pause_after(mdev);
1432b411b363SPhilipp Reisner 			changes |= _drbd_resume_next(mdev);
1433b411b363SPhilipp Reisner 		} while (changes);
1434b411b363SPhilipp Reisner 	}
1435b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1436b411b363SPhilipp Reisner 	return retcode;
1437b411b363SPhilipp Reisner }
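
#if 0
/* Hedged usage sketch (not compiled): drbd_alter_sa() rejects
 * dependency cycles up front.  If minor 1 is already configured to
 * sync after minor 0, pointing minor 0 back at minor 1 returns
 * ERR_SYNC_AFTER_CYCLE and leaves sync_conf.after untouched; on
 * success, the pause/resume fixpoint loop above re-evaluates the
 * whole chain until nothing changes any more. */
static int example_reject_cycle(struct drbd_conf *mdev0)
{
	return drbd_alter_sa(mdev0, 1);	/* ERR_SYNC_AFTER_CYCLE in the setup above */
}
#endif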
1438b411b363SPhilipp Reisner 
14399bd28d3cSLars Ellenberg void drbd_rs_controller_reset(struct drbd_conf *mdev)
14409bd28d3cSLars Ellenberg {
14419bd28d3cSLars Ellenberg 	atomic_set(&mdev->rs_sect_in, 0);
14429bd28d3cSLars Ellenberg 	atomic_set(&mdev->rs_sect_ev, 0);
14439bd28d3cSLars Ellenberg 	mdev->rs_in_flight = 0;
14449bd28d3cSLars Ellenberg 	mdev->rs_planed = 0;
14459bd28d3cSLars Ellenberg 	spin_lock(&mdev->peer_seq_lock);
14469bd28d3cSLars Ellenberg 	fifo_set(&mdev->rs_plan_s, 0);
14479bd28d3cSLars Ellenberg 	spin_unlock(&mdev->peer_seq_lock);
14489bd28d3cSLars Ellenberg }
14499bd28d3cSLars Ellenberg 
1450b411b363SPhilipp Reisner /**
1451b411b363SPhilipp Reisner  * drbd_start_resync() - Start the resync process
1452b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1453b411b363SPhilipp Reisner  * @side:	Either C_SYNC_SOURCE or C_SYNC_TARGET
1454b411b363SPhilipp Reisner  *
1455b411b363SPhilipp Reisner  * This function might bring you directly into one of the
1456b411b363SPhilipp Reisner  * C_PAUSED_SYNC_* states.
1457b411b363SPhilipp Reisner  */
1458b411b363SPhilipp Reisner void drbd_start_resync(struct drbd_conf *mdev, enum drbd_conns side)
1459b411b363SPhilipp Reisner {
1460b411b363SPhilipp Reisner 	union drbd_state ns;
1461b411b363SPhilipp Reisner 	int r;
1462b411b363SPhilipp Reisner 
1463c4752ef1SPhilipp Reisner 	if (mdev->state.conn >= C_SYNC_SOURCE && mdev->state.conn < C_AHEAD) {
1464b411b363SPhilipp Reisner 		dev_err(DEV, "Resync already running!\n");
1465b411b363SPhilipp Reisner 		return;
1466b411b363SPhilipp Reisner 	}
1467b411b363SPhilipp Reisner 
146859817f4fSPhilipp Reisner 	if (mdev->state.conn < C_AHEAD) {
1469b411b363SPhilipp Reisner 		/* In case a previous resync run was aborted by an IO error/detach on the peer. */
1470b411b363SPhilipp Reisner 		drbd_rs_cancel_all(mdev);
147159817f4fSPhilipp Reisner 		/* This should be done when we abort the resync. We definitely do not
147259817f4fSPhilipp Reisner 		   want to have this for connections going back and forth between
147359817f4fSPhilipp Reisner 		   Ahead/Behind and SyncSource/SyncTarget */
147459817f4fSPhilipp Reisner 	}
1475b411b363SPhilipp Reisner 
1476b411b363SPhilipp Reisner 	if (side == C_SYNC_TARGET) {
1477b411b363SPhilipp Reisner 		/* Since application IO was locked out during C_WF_BITMAP_T and
1478b411b363SPhilipp Reisner 		   C_WF_SYNC_UUID we are still unmodified. Before going to C_SYNC_TARGET
1479b411b363SPhilipp Reisner 		   we ask the before-resync-target handler whether we may make the data inconsistent. */
1480b411b363SPhilipp Reisner 		r = drbd_khelper(mdev, "before-resync-target");
1481b411b363SPhilipp Reisner 		r = (r >> 8) & 0xff;
1482b411b363SPhilipp Reisner 		if (r > 0) {
1483b411b363SPhilipp Reisner 			dev_info(DEV, "before-resync-target handler returned %d, "
1484b411b363SPhilipp Reisner 			     "dropping connection.\n", r);
1485b411b363SPhilipp Reisner 			drbd_force_state(mdev, NS(conn, C_DISCONNECTING));
1486b411b363SPhilipp Reisner 			return;
1487b411b363SPhilipp Reisner 		}
148809b9e797SPhilipp Reisner 	} else /* C_SYNC_SOURCE */ {
148909b9e797SPhilipp Reisner 		r = drbd_khelper(mdev, "before-resync-source");
149009b9e797SPhilipp Reisner 		r = (r >> 8) & 0xff;
149109b9e797SPhilipp Reisner 		if (r > 0) {
149209b9e797SPhilipp Reisner 			if (r == 3) {
149309b9e797SPhilipp Reisner 				dev_info(DEV, "before-resync-source handler returned %d, "
149409b9e797SPhilipp Reisner 					 "ignoring. Old userland tools?\n", r);
149509b9e797SPhilipp Reisner 			} else {
149609b9e797SPhilipp Reisner 				dev_info(DEV, "before-resync-source handler returned %d, "
149709b9e797SPhilipp Reisner 					 "dropping connection.\n", r);
149809b9e797SPhilipp Reisner 				drbd_force_state(mdev, NS(conn, C_DISCONNECTING));
149909b9e797SPhilipp Reisner 				return;
150009b9e797SPhilipp Reisner 			}
150109b9e797SPhilipp Reisner 		}
1502b411b363SPhilipp Reisner 	}
1503b411b363SPhilipp Reisner 
1504b411b363SPhilipp Reisner 	drbd_state_lock(mdev);
1505b411b363SPhilipp Reisner 
1506b411b363SPhilipp Reisner 	if (!get_ldev_if_state(mdev, D_NEGOTIATING)) {
1507b411b363SPhilipp Reisner 		drbd_state_unlock(mdev);
1508b411b363SPhilipp Reisner 		return;
1509b411b363SPhilipp Reisner 	}
1510b411b363SPhilipp Reisner 
1511b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1512b411b363SPhilipp Reisner 	ns = mdev->state;
1513b411b363SPhilipp Reisner 
1514b411b363SPhilipp Reisner 	ns.aftr_isp = !_drbd_may_sync_now(mdev);
1515b411b363SPhilipp Reisner 
1516b411b363SPhilipp Reisner 	ns.conn = side;
1517b411b363SPhilipp Reisner 
1518b411b363SPhilipp Reisner 	if (side == C_SYNC_TARGET)
1519b411b363SPhilipp Reisner 		ns.disk = D_INCONSISTENT;
1520b411b363SPhilipp Reisner 	else /* side == C_SYNC_SOURCE */
1521b411b363SPhilipp Reisner 		ns.pdsk = D_INCONSISTENT;
1522b411b363SPhilipp Reisner 
1523b411b363SPhilipp Reisner 	r = __drbd_set_state(mdev, ns, CS_VERBOSE, NULL);
1524b411b363SPhilipp Reisner 	ns = mdev->state;
1525b411b363SPhilipp Reisner 
1526b411b363SPhilipp Reisner 	if (ns.conn < C_CONNECTED)
1527b411b363SPhilipp Reisner 		r = SS_UNKNOWN_ERROR;
1528b411b363SPhilipp Reisner 
1529b411b363SPhilipp Reisner 	if (r == SS_SUCCESS) {
15301d7734a0SLars Ellenberg 		unsigned long tw = drbd_bm_total_weight(mdev);
15311d7734a0SLars Ellenberg 		unsigned long now = jiffies;
15321d7734a0SLars Ellenberg 		int i;
15331d7734a0SLars Ellenberg 
1534b411b363SPhilipp Reisner 		mdev->rs_failed    = 0;
1535b411b363SPhilipp Reisner 		mdev->rs_paused    = 0;
1536b411b363SPhilipp Reisner 		mdev->rs_same_csum = 0;
15370f0601f4SLars Ellenberg 		mdev->rs_last_events = 0;
15380f0601f4SLars Ellenberg 		mdev->rs_last_sect_ev = 0;
15391d7734a0SLars Ellenberg 		mdev->rs_total     = tw;
15401d7734a0SLars Ellenberg 		mdev->rs_start     = now;
15411d7734a0SLars Ellenberg 		for (i = 0; i < DRBD_SYNC_MARKS; i++) {
15421d7734a0SLars Ellenberg 			mdev->rs_mark_left[i] = tw;
15431d7734a0SLars Ellenberg 			mdev->rs_mark_time[i] = now;
15441d7734a0SLars Ellenberg 		}
1545b411b363SPhilipp Reisner 		_drbd_pause_after(mdev);
1546b411b363SPhilipp Reisner 	}
1547b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
15485a22db89SLars Ellenberg 
15496c922ed5SLars Ellenberg 	if (r == SS_SUCCESS) {
15506c922ed5SLars Ellenberg 		dev_info(DEV, "Began resync as %s (will sync %lu KB [%lu bits set]).\n",
15516c922ed5SLars Ellenberg 		     drbd_conn_str(ns.conn),
15526c922ed5SLars Ellenberg 		     (unsigned long) mdev->rs_total << (BM_BLOCK_SHIFT-10),
15536c922ed5SLars Ellenberg 		     (unsigned long) mdev->rs_total);
15545a22db89SLars Ellenberg 		if (side == C_SYNC_TARGET)
15555a22db89SLars Ellenberg 			mdev->bm_resync_fo = 0;
15565a22db89SLars Ellenberg 
15575a22db89SLars Ellenberg 		/* Since protocol 96, we must serialize drbd_gen_and_send_sync_uuid
15585a22db89SLars Ellenberg 		 * with w_send_oos, or the sync target will get confused as to
15595a22db89SLars Ellenberg 		 * how many bits to resync.  We cannot always do that, because for an
15605a22db89SLars Ellenberg 		 * empty resync and protocol < 95, we need to do it here, as we call
15615a22db89SLars Ellenberg 		 * drbd_resync_finished from here in that case.
15625a22db89SLars Ellenberg 		 * We drbd_gen_and_send_sync_uuid here for protocol < 96,
15635a22db89SLars Ellenberg 		 * and from after_state_ch otherwise. */
15645a22db89SLars Ellenberg 		if (side == C_SYNC_SOURCE && mdev->agreed_pro_version < 96)
15655a22db89SLars Ellenberg 			drbd_gen_and_send_sync_uuid(mdev);
1566b411b363SPhilipp Reisner 
1567af85e8e8SLars Ellenberg 		if (mdev->agreed_pro_version < 95 && mdev->rs_total == 0) {
1568af85e8e8SLars Ellenberg 			/* This still has a race (about when exactly the peers
1569af85e8e8SLars Ellenberg 			 * detect connection loss) that can lead to a full sync
1570af85e8e8SLars Ellenberg 			 * on next handshake. In 8.3.9 we fixed this with explicit
1571af85e8e8SLars Ellenberg 			 * resync-finished notifications, but the fix
1572af85e8e8SLars Ellenberg 			 * introduces a protocol change.  Sleeping for some
1573af85e8e8SLars Ellenberg 			 * time longer than the ping interval + timeout on the
1574af85e8e8SLars Ellenberg 			 * SyncSource, to give the SyncTarget the chance to
1575af85e8e8SLars Ellenberg 			 * detect connection loss, then waiting for a ping
1576af85e8e8SLars Ellenberg 			 * response (implicit in drbd_resync_finished) reduces
1577af85e8e8SLars Ellenberg 			 * the race considerably, but does not solve it. */
1578af85e8e8SLars Ellenberg 			if (side == C_SYNC_SOURCE)
1579af85e8e8SLars Ellenberg 				schedule_timeout_interruptible(
1580af85e8e8SLars Ellenberg 					mdev->net_conf->ping_int * HZ +
1581af85e8e8SLars Ellenberg 					mdev->net_conf->ping_timeo*HZ/9);
1582b411b363SPhilipp Reisner 			drbd_resync_finished(mdev);
1583b411b363SPhilipp Reisner 		}
1584b411b363SPhilipp Reisner 
15859bd28d3cSLars Ellenberg 		drbd_rs_controller_reset(mdev);
1586b411b363SPhilipp Reisner 		/* ns.conn may already be != mdev->state.conn,
1587b411b363SPhilipp Reisner 		 * we may have been paused in between, or become paused until
1588b411b363SPhilipp Reisner 		 * the timer triggers.
1589b411b363SPhilipp Reisner 		 * No matter, that is handled in resync_timer_fn() */
1590b411b363SPhilipp Reisner 		if (ns.conn == C_SYNC_TARGET)
1591b411b363SPhilipp Reisner 			mod_timer(&mdev->resync_timer, jiffies);
1592b411b363SPhilipp Reisner 
1593b411b363SPhilipp Reisner 		drbd_md_sync(mdev);
1594b411b363SPhilipp Reisner 	}
15955a22db89SLars Ellenberg 	put_ldev(mdev);
1596d0c3f60fSPhilipp Reisner 	drbd_state_unlock(mdev);
1597b411b363SPhilipp Reisner }
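
#if 0
/* Hedged usage sketch (not compiled): an "invalidate" style admin
 * request ends up starting a resync with the local disk as target;
 * as the kernel-doc above notes, the device may land directly in
 * C_PAUSED_SYNC_T if a sync-after dependency or the peer pauses us. */
static void example_invalidate_path(struct drbd_conf *mdev)
{
	drbd_start_resync(mdev, C_SYNC_TARGET);
}
#endif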
1598b411b363SPhilipp Reisner 
1599b411b363SPhilipp Reisner int drbd_worker(struct drbd_thread *thi)
1600b411b363SPhilipp Reisner {
1601b411b363SPhilipp Reisner 	struct drbd_conf *mdev = thi->mdev;
1602b411b363SPhilipp Reisner 	struct drbd_work *w = NULL;
1603b411b363SPhilipp Reisner 	LIST_HEAD(work_list);
1604b411b363SPhilipp Reisner 	int intr = 0, i;
1605b411b363SPhilipp Reisner 
1606b411b363SPhilipp Reisner 	sprintf(current->comm, "drbd%d_worker", mdev_to_minor(mdev));
1607b411b363SPhilipp Reisner 
1608b411b363SPhilipp Reisner 	while (get_t_state(thi) == Running) {
1609b411b363SPhilipp Reisner 		drbd_thread_current_set_cpu(mdev);
1610b411b363SPhilipp Reisner 
1611b411b363SPhilipp Reisner 		if (down_trylock(&mdev->data.work.s)) {
1612b411b363SPhilipp Reisner 			mutex_lock(&mdev->data.mutex);
1613b411b363SPhilipp Reisner 			if (mdev->data.socket && !mdev->net_conf->no_cork)
1614b411b363SPhilipp Reisner 				drbd_tcp_uncork(mdev->data.socket);
1615b411b363SPhilipp Reisner 			mutex_unlock(&mdev->data.mutex);
1616b411b363SPhilipp Reisner 
1617b411b363SPhilipp Reisner 			intr = down_interruptible(&mdev->data.work.s);
1618b411b363SPhilipp Reisner 
1619b411b363SPhilipp Reisner 			mutex_lock(&mdev->data.mutex);
1620b411b363SPhilipp Reisner 			if (mdev->data.socket  && !mdev->net_conf->no_cork)
1621b411b363SPhilipp Reisner 				drbd_tcp_cork(mdev->data.socket);
1622b411b363SPhilipp Reisner 			mutex_unlock(&mdev->data.mutex);
1623b411b363SPhilipp Reisner 		}
1624b411b363SPhilipp Reisner 
1625b411b363SPhilipp Reisner 		if (intr) {
1626b411b363SPhilipp Reisner 			D_ASSERT(intr == -EINTR);
1627b411b363SPhilipp Reisner 			flush_signals(current);
1628b411b363SPhilipp Reisner 			ERR_IF (get_t_state(thi) == Running)
1629b411b363SPhilipp Reisner 				continue;
1630b411b363SPhilipp Reisner 			break;
1631b411b363SPhilipp Reisner 		}
1632b411b363SPhilipp Reisner 
1633b411b363SPhilipp Reisner 		if (get_t_state(thi) != Running)
1634b411b363SPhilipp Reisner 			break;
1635b411b363SPhilipp Reisner 		/* With this break, we have done a down() but not consumed
1636b411b363SPhilipp Reisner 		   the entry from the list. The cleanup code takes care of
1637b411b363SPhilipp Reisner 		   this...   */
1638b411b363SPhilipp Reisner 
1639b411b363SPhilipp Reisner 		w = NULL;
1640b411b363SPhilipp Reisner 		spin_lock_irq(&mdev->data.work.q_lock);
1641b411b363SPhilipp Reisner 		ERR_IF(list_empty(&mdev->data.work.q)) {
1642b411b363SPhilipp Reisner 			/* something terribly wrong in our logic.
1643b411b363SPhilipp Reisner 			 * we were able to down() the semaphore,
1644b411b363SPhilipp Reisner 			 * but the list is empty... doh.
1645b411b363SPhilipp Reisner 			 *
1646b411b363SPhilipp Reisner 			 * what is the best thing to do now?
1647b411b363SPhilipp Reisner 			 * try again from scratch, restarting the receiver,
1648b411b363SPhilipp Reisner 			 * asender, whatnot? That could break even more badly,
1649b411b363SPhilipp Reisner 			 * e.g. when we are primary but have no good local data.
1650b411b363SPhilipp Reisner 			 *
1651b411b363SPhilipp Reisner 			 * I'll try to get away just starting over this loop.
1652b411b363SPhilipp Reisner 			 */
1653b411b363SPhilipp Reisner 			spin_unlock_irq(&mdev->data.work.q_lock);
1654b411b363SPhilipp Reisner 			continue;
1655b411b363SPhilipp Reisner 		}
1656b411b363SPhilipp Reisner 		w = list_entry(mdev->data.work.q.next, struct drbd_work, list);
1657b411b363SPhilipp Reisner 		list_del_init(&w->list);
1658b411b363SPhilipp Reisner 		spin_unlock_irq(&mdev->data.work.q_lock);
1659b411b363SPhilipp Reisner 
1660b411b363SPhilipp Reisner 		if (!w->cb(mdev, w, mdev->state.conn < C_CONNECTED)) {
1661b411b363SPhilipp Reisner 			/* dev_warn(DEV, "worker: a callback failed! \n"); */
1662b411b363SPhilipp Reisner 			if (mdev->state.conn >= C_CONNECTED)
1663b411b363SPhilipp Reisner 				drbd_force_state(mdev,
1664b411b363SPhilipp Reisner 						NS(conn, C_NETWORK_FAILURE));
1665b411b363SPhilipp Reisner 		}
1666b411b363SPhilipp Reisner 	}
1667b411b363SPhilipp Reisner 	D_ASSERT(test_bit(DEVICE_DYING, &mdev->flags));
1668b411b363SPhilipp Reisner 	D_ASSERT(test_bit(CONFIG_PENDING, &mdev->flags));
1669b411b363SPhilipp Reisner 
1670b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->data.work.q_lock);
1671b411b363SPhilipp Reisner 	i = 0;
1672b411b363SPhilipp Reisner 	while (!list_empty(&mdev->data.work.q)) {
1673b411b363SPhilipp Reisner 		list_splice_init(&mdev->data.work.q, &work_list);
1674b411b363SPhilipp Reisner 		spin_unlock_irq(&mdev->data.work.q_lock);
1675b411b363SPhilipp Reisner 
1676b411b363SPhilipp Reisner 		while (!list_empty(&work_list)) {
1677b411b363SPhilipp Reisner 			w = list_entry(work_list.next, struct drbd_work, list);
1678b411b363SPhilipp Reisner 			list_del_init(&w->list);
1679b411b363SPhilipp Reisner 			w->cb(mdev, w, 1);
1680b411b363SPhilipp Reisner 			i++; /* dead debugging code */
1681b411b363SPhilipp Reisner 		}
1682b411b363SPhilipp Reisner 
1683b411b363SPhilipp Reisner 		spin_lock_irq(&mdev->data.work.q_lock);
1684b411b363SPhilipp Reisner 	}
1685b411b363SPhilipp Reisner 	sema_init(&mdev->data.work.s, 0);
1686b411b363SPhilipp Reisner 	/* DANGEROUS race: if someone did queue his work within the spinlock,
1687b411b363SPhilipp Reisner 	 * but up() ed outside the spinlock, we could get an up() on the
1688b411b363SPhilipp Reisner 	 * semaphore without corresponding list entry.
1689b411b363SPhilipp Reisner 	 * So don't do that.
1690b411b363SPhilipp Reisner 	 */
1691b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->data.work.q_lock);
1692b411b363SPhilipp Reisner 
1693b411b363SPhilipp Reisner 	D_ASSERT(mdev->state.disk == D_DISKLESS && mdev->state.conn == C_STANDALONE);
1694b411b363SPhilipp Reisner 	/* _drbd_set_state only uses stop_nowait.
1695b411b363SPhilipp Reisner 	 * wait here for the Exiting receiver. */
1696b411b363SPhilipp Reisner 	drbd_thread_stop(&mdev->receiver);
1697b411b363SPhilipp Reisner 	drbd_mdev_cleanup(mdev);
1698b411b363SPhilipp Reisner 
1699b411b363SPhilipp Reisner 	dev_info(DEV, "worker terminated\n");
1700b411b363SPhilipp Reisner 
1701b411b363SPhilipp Reisner 	clear_bit(DEVICE_DYING, &mdev->flags);
1702b411b363SPhilipp Reisner 	clear_bit(CONFIG_PENDING, &mdev->flags);
1703b411b363SPhilipp Reisner 	wake_up(&mdev->state_wait);
1704b411b363SPhilipp Reisner 
1705b411b363SPhilipp Reisner 	return 0;
1706b411b363SPhilipp Reisner }
1707