xref: /openbmc/linux/drivers/block/drbd/drbd_worker.c (revision 010f6e67)
1b411b363SPhilipp Reisner /*
2b411b363SPhilipp Reisner    drbd_worker.c
3b411b363SPhilipp Reisner 
4b411b363SPhilipp Reisner    This file is part of DRBD by Philipp Reisner and Lars Ellenberg.
5b411b363SPhilipp Reisner 
6b411b363SPhilipp Reisner    Copyright (C) 2001-2008, LINBIT Information Technologies GmbH.
7b411b363SPhilipp Reisner    Copyright (C) 1999-2008, Philipp Reisner <philipp.reisner@linbit.com>.
8b411b363SPhilipp Reisner    Copyright (C) 2002-2008, Lars Ellenberg <lars.ellenberg@linbit.com>.
9b411b363SPhilipp Reisner 
10b411b363SPhilipp Reisner    drbd is free software; you can redistribute it and/or modify
11b411b363SPhilipp Reisner    it under the terms of the GNU General Public License as published by
12b411b363SPhilipp Reisner    the Free Software Foundation; either version 2, or (at your option)
13b411b363SPhilipp Reisner    any later version.
14b411b363SPhilipp Reisner 
15b411b363SPhilipp Reisner    drbd is distributed in the hope that it will be useful,
16b411b363SPhilipp Reisner    but WITHOUT ANY WARRANTY; without even the implied warranty of
17b411b363SPhilipp Reisner    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
18b411b363SPhilipp Reisner    GNU General Public License for more details.
19b411b363SPhilipp Reisner 
20b411b363SPhilipp Reisner    You should have received a copy of the GNU General Public License
21b411b363SPhilipp Reisner    along with drbd; see the file COPYING.  If not, write to
22b411b363SPhilipp Reisner    the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.
23b411b363SPhilipp Reisner 
24b411b363SPhilipp Reisner  */
25b411b363SPhilipp Reisner 
26b411b363SPhilipp Reisner #include <linux/module.h>
27b411b363SPhilipp Reisner #include <linux/drbd.h>
28b411b363SPhilipp Reisner #include <linux/sched.h>
29b411b363SPhilipp Reisner #include <linux/wait.h>
30b411b363SPhilipp Reisner #include <linux/mm.h>
31b411b363SPhilipp Reisner #include <linux/memcontrol.h>
32b411b363SPhilipp Reisner #include <linux/mm_inline.h>
33b411b363SPhilipp Reisner #include <linux/slab.h>
34b411b363SPhilipp Reisner #include <linux/random.h>
35b411b363SPhilipp Reisner #include <linux/string.h>
36b411b363SPhilipp Reisner #include <linux/scatterlist.h>
37b411b363SPhilipp Reisner 
38b411b363SPhilipp Reisner #include "drbd_int.h"
39b411b363SPhilipp Reisner #include "drbd_req.h"
40b411b363SPhilipp Reisner 
41b411b363SPhilipp Reisner static int w_make_ov_request(struct drbd_conf *mdev, struct drbd_work *w, int cancel);
429d77a5feSPhilipp Reisner static int w_make_resync_request(struct drbd_conf *mdev,
439d77a5feSPhilipp Reisner 				 struct drbd_work *w, int cancel);
44b411b363SPhilipp Reisner 
45b411b363SPhilipp Reisner 
46b411b363SPhilipp Reisner 
47c5a91619SAndreas Gruenbacher /* endio handlers:
48c5a91619SAndreas Gruenbacher  *   drbd_md_io_complete (defined here)
49c5a91619SAndreas Gruenbacher  *   drbd_endio_pri (defined here)
50c5a91619SAndreas Gruenbacher  *   drbd_endio_sec (defined here)
51c5a91619SAndreas Gruenbacher  *   bm_async_io_complete (defined in drbd_bitmap.c)
52c5a91619SAndreas Gruenbacher  *
53b411b363SPhilipp Reisner  * For all these callbacks, note the following:
54b411b363SPhilipp Reisner  * The callbacks will be called in irq context by the IDE drivers,
55b411b363SPhilipp Reisner  * and in Softirqs/Tasklets/BH context by the SCSI drivers.
56b411b363SPhilipp Reisner  * Try to get the locking right :)
57b411b363SPhilipp Reisner  *
58b411b363SPhilipp Reisner  */
59b411b363SPhilipp Reisner 
60b411b363SPhilipp Reisner 
61b411b363SPhilipp Reisner /* About the global_state_lock
62b411b363SPhilipp Reisner    Each state transition on a device holds a read lock. In case we have
63b411b363SPhilipp Reisner    to evaluate the sync after dependencies, we grab a write lock, because
64b411b363SPhilipp Reisner    we need stable states on all devices for that.  */
65b411b363SPhilipp Reisner rwlock_t global_state_lock;
66b411b363SPhilipp Reisner 
67b411b363SPhilipp Reisner /* used for synchronous meta data and bitmap IO
68b411b363SPhilipp Reisner  * submitted by drbd_md_sync_page_io()
69b411b363SPhilipp Reisner  */
70b411b363SPhilipp Reisner void drbd_md_io_complete(struct bio *bio, int error)
71b411b363SPhilipp Reisner {
72b411b363SPhilipp Reisner 	struct drbd_md_io *md_io;
73b411b363SPhilipp Reisner 
74b411b363SPhilipp Reisner 	md_io = (struct drbd_md_io *)bio->bi_private;
75b411b363SPhilipp Reisner 	md_io->error = error;
76b411b363SPhilipp Reisner 
77b411b363SPhilipp Reisner 	complete(&md_io->event);
78b411b363SPhilipp Reisner }
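/* The submitting side (drbd_md_sync_page_io and friends) is synchronous:
 * roughly, it sets up a local struct drbd_md_io (completion + error code),
 * points bio->bi_private at it, submits the bio and then sleeps in
 * wait_for_completion() until this callback records the error and
 * completes the event. */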
79b411b363SPhilipp Reisner 
80b411b363SPhilipp Reisner /* reads on behalf of the partner,
81b411b363SPhilipp Reisner  * "submitted" by the receiver
82b411b363SPhilipp Reisner  */
8345bb912bSLars Ellenberg void drbd_endio_read_sec_final(struct drbd_epoch_entry *e) __releases(local)
84b411b363SPhilipp Reisner {
85b411b363SPhilipp Reisner 	unsigned long flags = 0;
8645bb912bSLars Ellenberg 	struct drbd_conf *mdev = e->mdev;
87b411b363SPhilipp Reisner 
88b411b363SPhilipp Reisner 	spin_lock_irqsave(&mdev->req_lock, flags);
89010f6e67SAndreas Gruenbacher 	mdev->read_cnt += e->i.size >> 9;
90b411b363SPhilipp Reisner 	list_del(&e->w.list);
91b411b363SPhilipp Reisner 	if (list_empty(&mdev->read_ee))
92b411b363SPhilipp Reisner 		wake_up(&mdev->ee_wait);
9345bb912bSLars Ellenberg 	if (test_bit(__EE_WAS_ERROR, &e->flags))
9481e84650SAndreas Gruenbacher 		__drbd_chk_io_error(mdev, false);
95b411b363SPhilipp Reisner 	spin_unlock_irqrestore(&mdev->req_lock, flags);
96b411b363SPhilipp Reisner 
97b411b363SPhilipp Reisner 	drbd_queue_work(&mdev->data.work, &e->w);
98b411b363SPhilipp Reisner 	put_ldev(mdev);
99b411b363SPhilipp Reisner }
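/* Note: no real work is done here in (soft)irq context.  The epoch entry
 * is handed to the worker thread via mdev->data.work, which invokes
 * e->w.cb later, e.g. w_e_send_csum for checksum-based resync reads
 * queued by read_for_csum() below, or w_e_end_data_req for reads done on
 * behalf of a peer P_DATA_REQUEST. */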
100b411b363SPhilipp Reisner 
101b411b363SPhilipp Reisner /* writes on behalf of the partner, or resync writes,
10245bb912bSLars Ellenberg  * "submitted" by the receiver, final stage.  */
10345bb912bSLars Ellenberg static void drbd_endio_write_sec_final(struct drbd_epoch_entry *e) __releases(local)
104b411b363SPhilipp Reisner {
105b411b363SPhilipp Reisner 	unsigned long flags = 0;
10645bb912bSLars Ellenberg 	struct drbd_conf *mdev = e->mdev;
107b411b363SPhilipp Reisner 	sector_t e_sector;
108b411b363SPhilipp Reisner 	int do_wake;
109579b57edSAndreas Gruenbacher 	u64 block_id;
110b411b363SPhilipp Reisner 	int do_al_complete_io;
111b411b363SPhilipp Reisner 
112b411b363SPhilipp Reisner 	/* after we moved e to done_ee,
113b411b363SPhilipp Reisner 	 * we may no longer access it,
114b411b363SPhilipp Reisner 	 * it may be freed/reused already!
115b411b363SPhilipp Reisner 	 * (as soon as we release the req_lock) */
116010f6e67SAndreas Gruenbacher 	e_sector = e->i.sector;
117b411b363SPhilipp Reisner 	do_al_complete_io = e->flags & EE_CALL_AL_COMPLETE_IO;
118579b57edSAndreas Gruenbacher 	block_id = e->block_id;
119b411b363SPhilipp Reisner 
12045bb912bSLars Ellenberg 	spin_lock_irqsave(&mdev->req_lock, flags);
121010f6e67SAndreas Gruenbacher 	mdev->writ_cnt += e->i.size >> 9;
122b411b363SPhilipp Reisner 	list_del(&e->w.list); /* has been on active_ee or sync_ee */
123b411b363SPhilipp Reisner 	list_add_tail(&e->w.list, &mdev->done_ee);
124b411b363SPhilipp Reisner 
12524c4830cSBart Van Assche 	/* No hlist_del_init(&e->collision) here, we did not send the Ack yet,
126b411b363SPhilipp Reisner 	 * neither did we wake possibly waiting conflicting requests.
127b411b363SPhilipp Reisner 	 * done from "drbd_process_done_ee" within the appropriate w.cb
128b411b363SPhilipp Reisner 	 * (e_end_block/e_end_resync_block) or from _drbd_clear_done_ee */
129b411b363SPhilipp Reisner 
130579b57edSAndreas Gruenbacher 	do_wake = list_empty(block_id == ID_SYNCER ? &mdev->sync_ee : &mdev->active_ee);
131b411b363SPhilipp Reisner 
13245bb912bSLars Ellenberg 	if (test_bit(__EE_WAS_ERROR, &e->flags))
13381e84650SAndreas Gruenbacher 		__drbd_chk_io_error(mdev, false);
134b411b363SPhilipp Reisner 	spin_unlock_irqrestore(&mdev->req_lock, flags);
135b411b363SPhilipp Reisner 
136579b57edSAndreas Gruenbacher 	if (block_id == ID_SYNCER)
137b411b363SPhilipp Reisner 		drbd_rs_complete_io(mdev, e_sector);
138b411b363SPhilipp Reisner 
139b411b363SPhilipp Reisner 	if (do_wake)
140b411b363SPhilipp Reisner 		wake_up(&mdev->ee_wait);
141b411b363SPhilipp Reisner 
142b411b363SPhilipp Reisner 	if (do_al_complete_io)
143b411b363SPhilipp Reisner 		drbd_al_complete_io(mdev, e_sector);
144b411b363SPhilipp Reisner 
145b411b363SPhilipp Reisner 	wake_asender(mdev);
146b411b363SPhilipp Reisner 	put_ldev(mdev);
14745bb912bSLars Ellenberg }
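/* Once the entry is on done_ee and req_lock is dropped, the asender may
 * process and free it at any time; that is why sector, block_id and the
 * AL flag were copied to locals above (see the comment there).  do_wake
 * only triggers when the source list (sync_ee for resync writes,
 * active_ee for peer writes) has just become empty, which is the
 * condition the ee_wait waiters (e.g. drbd_wait_ee_list_empty()) are
 * interested in. */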
148b411b363SPhilipp Reisner 
14945bb912bSLars Ellenberg /* writes on behalf of the partner, or resync writes,
15045bb912bSLars Ellenberg  * "submitted" by the receiver.
15145bb912bSLars Ellenberg  */
15245bb912bSLars Ellenberg void drbd_endio_sec(struct bio *bio, int error)
15345bb912bSLars Ellenberg {
15445bb912bSLars Ellenberg 	struct drbd_epoch_entry *e = bio->bi_private;
15545bb912bSLars Ellenberg 	struct drbd_conf *mdev = e->mdev;
15645bb912bSLars Ellenberg 	int uptodate = bio_flagged(bio, BIO_UPTODATE);
15745bb912bSLars Ellenberg 	int is_write = bio_data_dir(bio) == WRITE;
15845bb912bSLars Ellenberg 
15907194272SLars Ellenberg 	if (error && __ratelimit(&drbd_ratelimit_state))
16045bb912bSLars Ellenberg 		dev_warn(DEV, "%s: error=%d s=%llus\n",
16145bb912bSLars Ellenberg 				is_write ? "write" : "read", error,
162010f6e67SAndreas Gruenbacher 				(unsigned long long)e->i.sector);
16345bb912bSLars Ellenberg 	if (!error && !uptodate) {
16407194272SLars Ellenberg 		if (__ratelimit(&drbd_ratelimit_state))
16545bb912bSLars Ellenberg 			dev_warn(DEV, "%s: setting error to -EIO s=%llus\n",
16645bb912bSLars Ellenberg 					is_write ? "write" : "read",
167010f6e67SAndreas Gruenbacher 					(unsigned long long)e->i.sector);
16845bb912bSLars Ellenberg 		/* strange behavior of some lower level drivers...
16945bb912bSLars Ellenberg 		 * fail the request by clearing the uptodate flag,
17045bb912bSLars Ellenberg 		 * but do not return any error?! */
17145bb912bSLars Ellenberg 		error = -EIO;
17245bb912bSLars Ellenberg 	}
17345bb912bSLars Ellenberg 
17445bb912bSLars Ellenberg 	if (error)
17545bb912bSLars Ellenberg 		set_bit(__EE_WAS_ERROR, &e->flags);
17645bb912bSLars Ellenberg 
17745bb912bSLars Ellenberg 	bio_put(bio); /* no need for the bio anymore */
17845bb912bSLars Ellenberg 	if (atomic_dec_and_test(&e->pending_bios)) {
17945bb912bSLars Ellenberg 		if (is_write)
18045bb912bSLars Ellenberg 			drbd_endio_write_sec_final(e);
18145bb912bSLars Ellenberg 		else
18245bb912bSLars Ellenberg 			drbd_endio_read_sec_final(e);
18345bb912bSLars Ellenberg 	}
184b411b363SPhilipp Reisner }
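/* One epoch entry may be backed by a chain of pages and thus be split
 * over several bios (see drbd_submit_ee); e->pending_bios counts them,
 * and only the bio that drops the count to zero runs the final
 * per-direction handler above. */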
185b411b363SPhilipp Reisner 
186b411b363SPhilipp Reisner /* read, readA or write requests on R_PRIMARY coming from drbd_make_request
187b411b363SPhilipp Reisner  */
188b411b363SPhilipp Reisner void drbd_endio_pri(struct bio *bio, int error)
189b411b363SPhilipp Reisner {
190a115413dSLars Ellenberg 	unsigned long flags;
191b411b363SPhilipp Reisner 	struct drbd_request *req = bio->bi_private;
192b411b363SPhilipp Reisner 	struct drbd_conf *mdev = req->mdev;
193a115413dSLars Ellenberg 	struct bio_and_error m;
194b411b363SPhilipp Reisner 	enum drbd_req_event what;
195b411b363SPhilipp Reisner 	int uptodate = bio_flagged(bio, BIO_UPTODATE);
196b411b363SPhilipp Reisner 
197b411b363SPhilipp Reisner 	if (!error && !uptodate) {
198b411b363SPhilipp Reisner 		dev_warn(DEV, "p %s: setting error to -EIO\n",
199b411b363SPhilipp Reisner 			 bio_data_dir(bio) == WRITE ? "write" : "read");
200b411b363SPhilipp Reisner 		/* strange behavior of some lower level drivers...
201b411b363SPhilipp Reisner 		 * fail the request by clearing the uptodate flag,
202b411b363SPhilipp Reisner 		 * but do not return any error?! */
203b411b363SPhilipp Reisner 		error = -EIO;
204b411b363SPhilipp Reisner 	}
205b411b363SPhilipp Reisner 
206b411b363SPhilipp Reisner 	/* to avoid recursion in __req_mod */
207b411b363SPhilipp Reisner 	if (unlikely(error)) {
208b411b363SPhilipp Reisner 		what = (bio_data_dir(bio) == WRITE)
209b411b363SPhilipp Reisner 			? write_completed_with_error
2105c3c7e64SLars Ellenberg 			: (bio_rw(bio) == READ)
211b411b363SPhilipp Reisner 			  ? read_completed_with_error
212b411b363SPhilipp Reisner 			  : read_ahead_completed_with_error;
213b411b363SPhilipp Reisner 	} else
214b411b363SPhilipp Reisner 		what = completed_ok;
215b411b363SPhilipp Reisner 
216b411b363SPhilipp Reisner 	bio_put(req->private_bio);
217b411b363SPhilipp Reisner 	req->private_bio = ERR_PTR(error);
218b411b363SPhilipp Reisner 
219a115413dSLars Ellenberg 	/* not req_mod(), we need irqsave here! */
220a115413dSLars Ellenberg 	spin_lock_irqsave(&mdev->req_lock, flags);
221a115413dSLars Ellenberg 	__req_mod(req, what, &m);
222a115413dSLars Ellenberg 	spin_unlock_irqrestore(&mdev->req_lock, flags);
223a115413dSLars Ellenberg 
224a115413dSLars Ellenberg 	if (m.bio)
225a115413dSLars Ellenberg 		complete_master_bio(mdev, &m);
226b411b363SPhilipp Reisner }
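/* __req_mod() runs under req_lock and does not complete the master bio
 * itself; if the request is done it reports that through struct
 * bio_and_error, and complete_master_bio() is called only after the lock
 * has been dropped. */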
227b411b363SPhilipp Reisner 
228b411b363SPhilipp Reisner int w_read_retry_remote(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
229b411b363SPhilipp Reisner {
230b411b363SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
231b411b363SPhilipp Reisner 
232b411b363SPhilipp Reisner 	/* We should not detach for read io-error,
233b411b363SPhilipp Reisner 	 * but try to WRITE the P_DATA_REPLY to the failed location,
234b411b363SPhilipp Reisner 	 * to give the disk the chance to relocate that block */
235b411b363SPhilipp Reisner 
236b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->req_lock);
237d255e5ffSLars Ellenberg 	if (cancel || mdev->state.pdsk != D_UP_TO_DATE) {
238d255e5ffSLars Ellenberg 		_req_mod(req, read_retry_remote_canceled);
239b411b363SPhilipp Reisner 		spin_unlock_irq(&mdev->req_lock);
240b411b363SPhilipp Reisner 		return 1;
241b411b363SPhilipp Reisner 	}
242b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->req_lock);
243b411b363SPhilipp Reisner 
244b411b363SPhilipp Reisner 	return w_send_read_req(mdev, w, 0);
245b411b363SPhilipp Reisner }
246b411b363SPhilipp Reisner 
24745bb912bSLars Ellenberg void drbd_csum_ee(struct drbd_conf *mdev, struct crypto_hash *tfm, struct drbd_epoch_entry *e, void *digest)
24845bb912bSLars Ellenberg {
24945bb912bSLars Ellenberg 	struct hash_desc desc;
25045bb912bSLars Ellenberg 	struct scatterlist sg;
25145bb912bSLars Ellenberg 	struct page *page = e->pages;
25245bb912bSLars Ellenberg 	struct page *tmp;
25345bb912bSLars Ellenberg 	unsigned len;
25445bb912bSLars Ellenberg 
25545bb912bSLars Ellenberg 	desc.tfm = tfm;
25645bb912bSLars Ellenberg 	desc.flags = 0;
25745bb912bSLars Ellenberg 
25845bb912bSLars Ellenberg 	sg_init_table(&sg, 1);
25945bb912bSLars Ellenberg 	crypto_hash_init(&desc);
26045bb912bSLars Ellenberg 
26145bb912bSLars Ellenberg 	while ((tmp = page_chain_next(page))) {
26245bb912bSLars Ellenberg 		/* all but the last page will be fully used */
26345bb912bSLars Ellenberg 		sg_set_page(&sg, page, PAGE_SIZE, 0);
26445bb912bSLars Ellenberg 		crypto_hash_update(&desc, &sg, sg.length);
26545bb912bSLars Ellenberg 		page = tmp;
26645bb912bSLars Ellenberg 	}
26745bb912bSLars Ellenberg 	/* and now the last, possibly only partially used page */
268010f6e67SAndreas Gruenbacher 	len = e->i.size & (PAGE_SIZE - 1);
26945bb912bSLars Ellenberg 	sg_set_page(&sg, page, len ?: PAGE_SIZE, 0);
27045bb912bSLars Ellenberg 	crypto_hash_update(&desc, &sg, sg.length);
27145bb912bSLars Ellenberg 	crypto_hash_final(&desc, digest);
27245bb912bSLars Ellenberg }
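/* The page chain is hashed with a single-entry scatterlist that is
 * re-pointed at each page: every page except the last is hashed in full,
 * the last one only up to e->i.size modulo PAGE_SIZE bytes, with
 * "len ?: PAGE_SIZE" covering entries whose size is an exact multiple of
 * PAGE_SIZE. */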
27345bb912bSLars Ellenberg 
27445bb912bSLars Ellenberg void drbd_csum_bio(struct drbd_conf *mdev, struct crypto_hash *tfm, struct bio *bio, void *digest)
275b411b363SPhilipp Reisner {
276b411b363SPhilipp Reisner 	struct hash_desc desc;
277b411b363SPhilipp Reisner 	struct scatterlist sg;
278b411b363SPhilipp Reisner 	struct bio_vec *bvec;
279b411b363SPhilipp Reisner 	int i;
280b411b363SPhilipp Reisner 
281b411b363SPhilipp Reisner 	desc.tfm = tfm;
282b411b363SPhilipp Reisner 	desc.flags = 0;
283b411b363SPhilipp Reisner 
284b411b363SPhilipp Reisner 	sg_init_table(&sg, 1);
285b411b363SPhilipp Reisner 	crypto_hash_init(&desc);
286b411b363SPhilipp Reisner 
287b411b363SPhilipp Reisner 	__bio_for_each_segment(bvec, bio, i, 0) {
288b411b363SPhilipp Reisner 		sg_set_page(&sg, bvec->bv_page, bvec->bv_len, bvec->bv_offset);
289b411b363SPhilipp Reisner 		crypto_hash_update(&desc, &sg, sg.length);
290b411b363SPhilipp Reisner 	}
291b411b363SPhilipp Reisner 	crypto_hash_final(&desc, digest);
292b411b363SPhilipp Reisner }
293b411b363SPhilipp Reisner 
29453ea4331SLars Ellenberg /* TODO merge common code with w_e_end_ov_req */
29553ea4331SLars Ellenberg int w_e_send_csum(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
296b411b363SPhilipp Reisner {
297b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
298b411b363SPhilipp Reisner 	int digest_size;
299b411b363SPhilipp Reisner 	void *digest;
30053ea4331SLars Ellenberg 	int ok = 1;
301b411b363SPhilipp Reisner 
30253ea4331SLars Ellenberg 	if (unlikely(cancel))
30353ea4331SLars Ellenberg 		goto out;
304b411b363SPhilipp Reisner 
30553ea4331SLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) != 0))
30653ea4331SLars Ellenberg 		goto out;
30753ea4331SLars Ellenberg 
308b411b363SPhilipp Reisner 	digest_size = crypto_hash_digestsize(mdev->csums_tfm);
309b411b363SPhilipp Reisner 	digest = kmalloc(digest_size, GFP_NOIO);
310b411b363SPhilipp Reisner 	if (digest) {
311010f6e67SAndreas Gruenbacher 		sector_t sector = e->i.sector;
312010f6e67SAndreas Gruenbacher 		unsigned int size = e->i.size;
31345bb912bSLars Ellenberg 		drbd_csum_ee(mdev, mdev->csums_tfm, e, digest);
31453ea4331SLars Ellenberg 		/* Free e and pages before send.
31553ea4331SLars Ellenberg 		 * In case we block on congestion, we could otherwise run into
31653ea4331SLars Ellenberg 		 * some distributed deadlock, if the other side blocks on
31753ea4331SLars Ellenberg 		 * congestion as well, because our receiver blocks in
31853ea4331SLars Ellenberg 		 * drbd_pp_alloc due to pp_in_use > max_buffers. */
31953ea4331SLars Ellenberg 		drbd_free_ee(mdev, e);
32053ea4331SLars Ellenberg 		e = NULL;
321b411b363SPhilipp Reisner 		inc_rs_pending(mdev);
32253ea4331SLars Ellenberg 		ok = drbd_send_drequest_csum(mdev, sector, size,
32353ea4331SLars Ellenberg 					     digest, digest_size,
324b411b363SPhilipp Reisner 					     P_CSUM_RS_REQUEST);
325b411b363SPhilipp Reisner 		kfree(digest);
326b411b363SPhilipp Reisner 	} else {
327b411b363SPhilipp Reisner 		dev_err(DEV, "kmalloc() of digest failed.\n");
328b411b363SPhilipp Reisner 		ok = 0;
329b411b363SPhilipp Reisner 	}
330b411b363SPhilipp Reisner 
33153ea4331SLars Ellenberg out:
33253ea4331SLars Ellenberg 	if (e)
333b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
334b411b363SPhilipp Reisner 
335b411b363SPhilipp Reisner 	if (unlikely(!ok))
336b411b363SPhilipp Reisner 		dev_err(DEV, "drbd_send_drequest(..., csum) failed\n");
337b411b363SPhilipp Reisner 	return ok;
338b411b363SPhilipp Reisner }
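/* As with all worker callbacks, a return value of 0 is treated as a
 * failure by the worker thread; while connected it then forces the
 * connection into C_NETWORK_FAILURE.  So failing to allocate or send the
 * checksum request here ends up tearing down the link rather than leaving
 * the resync silently stalled. */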
339b411b363SPhilipp Reisner 
340b411b363SPhilipp Reisner #define GFP_TRY	(__GFP_HIGHMEM | __GFP_NOWARN)
341b411b363SPhilipp Reisner 
342b411b363SPhilipp Reisner static int read_for_csum(struct drbd_conf *mdev, sector_t sector, int size)
343b411b363SPhilipp Reisner {
344b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e;
345b411b363SPhilipp Reisner 
346b411b363SPhilipp Reisner 	if (!get_ldev(mdev))
34780a40e43SLars Ellenberg 		return -EIO;
348b411b363SPhilipp Reisner 
349e3555d85SPhilipp Reisner 	if (drbd_rs_should_slow_down(mdev, sector))
3500f0601f4SLars Ellenberg 		goto defer;
3510f0601f4SLars Ellenberg 
352b411b363SPhilipp Reisner 	/* GFP_TRY, because if there is no memory available right now, this may
353b411b363SPhilipp Reisner 	 * be rescheduled for later. It is "only" background resync, after all. */
3549a8e7753SAndreas Gruenbacher 	e = drbd_alloc_ee(mdev, ID_SYNCER /* unused */, sector, size, GFP_TRY);
35545bb912bSLars Ellenberg 	if (!e)
35680a40e43SLars Ellenberg 		goto defer;
357b411b363SPhilipp Reisner 
35880a40e43SLars Ellenberg 	e->w.cb = w_e_send_csum;
359b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->req_lock);
360b411b363SPhilipp Reisner 	list_add(&e->w.list, &mdev->read_ee);
361b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->req_lock);
362b411b363SPhilipp Reisner 
3630f0601f4SLars Ellenberg 	atomic_add(size >> 9, &mdev->rs_sect_ev);
36445bb912bSLars Ellenberg 	if (drbd_submit_ee(mdev, e, READ, DRBD_FAULT_RS_RD) == 0)
36580a40e43SLars Ellenberg 		return 0;
36645bb912bSLars Ellenberg 
36710f6d992SLars Ellenberg 	/* If it failed because of ENOMEM, retry should help.  If it failed
36810f6d992SLars Ellenberg 	 * because bio_add_page failed (probably broken lower level driver),
36910f6d992SLars Ellenberg 	 * retry may or may not help.
37010f6d992SLars Ellenberg 	 * If it does not, you may need to force disconnect. */
37122cc37a9SLars Ellenberg 	spin_lock_irq(&mdev->req_lock);
37222cc37a9SLars Ellenberg 	list_del(&e->w.list);
37322cc37a9SLars Ellenberg 	spin_unlock_irq(&mdev->req_lock);
37422cc37a9SLars Ellenberg 
37545bb912bSLars Ellenberg 	drbd_free_ee(mdev, e);
37680a40e43SLars Ellenberg defer:
37745bb912bSLars Ellenberg 	put_ldev(mdev);
37880a40e43SLars Ellenberg 	return -EAGAIN;
379b411b363SPhilipp Reisner }
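/* Return convention, interpreted by w_make_resync_request() below:
 * 0 means the read was queued, -EAGAIN means "defer" (throttled, ee
 * allocation failed, or drbd_submit_ee failed; the sector is retried on a
 * later timer tick), -EIO means we have no usable local disk. */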
380b411b363SPhilipp Reisner 
381794abb75SPhilipp Reisner int w_resync_timer(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
382794abb75SPhilipp Reisner {
383794abb75SPhilipp Reisner 	switch (mdev->state.conn) {
384794abb75SPhilipp Reisner 	case C_VERIFY_S:
385794abb75SPhilipp Reisner 		w_make_ov_request(mdev, w, cancel);
386794abb75SPhilipp Reisner 		break;
387794abb75SPhilipp Reisner 	case C_SYNC_TARGET:
388794abb75SPhilipp Reisner 		w_make_resync_request(mdev, w, cancel);
389794abb75SPhilipp Reisner 		break;
390794abb75SPhilipp Reisner 	}
391794abb75SPhilipp Reisner 
392794abb75SPhilipp Reisner 	return 1;
393794abb75SPhilipp Reisner }
394794abb75SPhilipp Reisner 
395b411b363SPhilipp Reisner void resync_timer_fn(unsigned long data)
396b411b363SPhilipp Reisner {
397b411b363SPhilipp Reisner 	struct drbd_conf *mdev = (struct drbd_conf *) data;
398b411b363SPhilipp Reisner 
399794abb75SPhilipp Reisner 	if (list_empty(&mdev->resync_work.list))
400b411b363SPhilipp Reisner 		drbd_queue_work(&mdev->data.work, &mdev->resync_work);
401b411b363SPhilipp Reisner }
402b411b363SPhilipp Reisner 
403778f271dSPhilipp Reisner static void fifo_set(struct fifo_buffer *fb, int value)
404778f271dSPhilipp Reisner {
405778f271dSPhilipp Reisner 	int i;
406778f271dSPhilipp Reisner 
407778f271dSPhilipp Reisner 	for (i = 0; i < fb->size; i++)
408f10f2623SPhilipp Reisner 		fb->values[i] = value;
409778f271dSPhilipp Reisner }
410778f271dSPhilipp Reisner 
411778f271dSPhilipp Reisner static int fifo_push(struct fifo_buffer *fb, int value)
412778f271dSPhilipp Reisner {
413778f271dSPhilipp Reisner 	int ov;
414778f271dSPhilipp Reisner 
415778f271dSPhilipp Reisner 	ov = fb->values[fb->head_index];
416778f271dSPhilipp Reisner 	fb->values[fb->head_index++] = value;
417778f271dSPhilipp Reisner 
418778f271dSPhilipp Reisner 	if (fb->head_index >= fb->size)
419778f271dSPhilipp Reisner 		fb->head_index = 0;
420778f271dSPhilipp Reisner 
421778f271dSPhilipp Reisner 	return ov;
422778f271dSPhilipp Reisner }
423778f271dSPhilipp Reisner 
424778f271dSPhilipp Reisner static void fifo_add_val(struct fifo_buffer *fb, int value)
425778f271dSPhilipp Reisner {
426778f271dSPhilipp Reisner 	int i;
427778f271dSPhilipp Reisner 
428778f271dSPhilipp Reisner 	for (i = 0; i < fb->size; i++)
429778f271dSPhilipp Reisner 		fb->values[i] += value;
430778f271dSPhilipp Reisner }
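/* rs_plan_s is a small ring buffer with one slot per SLEEP_TIME step of
 * the plan-ahead window: fifo_add_val() spreads a correction evenly over
 * all future slots, fifo_push(fb, 0) consumes the amount planned for the
 * current step while planning 0 for the slot now furthest in the future,
 * and fifo_set() (re)initializes all slots. */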
431778f271dSPhilipp Reisner 
4329d77a5feSPhilipp Reisner static int drbd_rs_controller(struct drbd_conf *mdev)
433778f271dSPhilipp Reisner {
434778f271dSPhilipp Reisner 	unsigned int sect_in;  /* Number of sectors that came in since the last turn */
435778f271dSPhilipp Reisner 	unsigned int want;     /* The number of sectors we want in the proxy */
436778f271dSPhilipp Reisner 	int req_sect; /* Number of sectors to request in this turn */
437778f271dSPhilipp Reisner 	int correction; /* Number of sectors more we need in the proxy*/
438778f271dSPhilipp Reisner 	int cps; /* correction per invocation of drbd_rs_controller() */
439778f271dSPhilipp Reisner 	int steps; /* Number of time steps to plan ahead */
440778f271dSPhilipp Reisner 	int curr_corr;
441778f271dSPhilipp Reisner 	int max_sect;
442778f271dSPhilipp Reisner 
443778f271dSPhilipp Reisner 	sect_in = atomic_xchg(&mdev->rs_sect_in, 0); /* Number of sectors that came in */
444778f271dSPhilipp Reisner 	mdev->rs_in_flight -= sect_in;
445778f271dSPhilipp Reisner 
446778f271dSPhilipp Reisner 	spin_lock(&mdev->peer_seq_lock); /* get an atomic view on mdev->rs_plan_s */
447778f271dSPhilipp Reisner 
448778f271dSPhilipp Reisner 	steps = mdev->rs_plan_s.size; /* (mdev->sync_conf.c_plan_ahead * 10 * SLEEP_TIME) / HZ; */
449778f271dSPhilipp Reisner 
450778f271dSPhilipp Reisner 	if (mdev->rs_in_flight + sect_in == 0) { /* At start of resync */
451778f271dSPhilipp Reisner 		want = ((mdev->sync_conf.rate * 2 * SLEEP_TIME) / HZ) * steps;
452778f271dSPhilipp Reisner 	} else { /* normal path */
453778f271dSPhilipp Reisner 		want = mdev->sync_conf.c_fill_target ? mdev->sync_conf.c_fill_target :
454778f271dSPhilipp Reisner 			sect_in * mdev->sync_conf.c_delay_target * HZ / (SLEEP_TIME * 10);
455778f271dSPhilipp Reisner 	}
456778f271dSPhilipp Reisner 
457778f271dSPhilipp Reisner 	correction = want - mdev->rs_in_flight - mdev->rs_planed;
458778f271dSPhilipp Reisner 
459778f271dSPhilipp Reisner 	/* Plan ahead */
460778f271dSPhilipp Reisner 	cps = correction / steps;
461778f271dSPhilipp Reisner 	fifo_add_val(&mdev->rs_plan_s, cps);
462778f271dSPhilipp Reisner 	mdev->rs_planed += cps * steps;
463778f271dSPhilipp Reisner 
464778f271dSPhilipp Reisner 	/* What we do in this step */
465778f271dSPhilipp Reisner 	curr_corr = fifo_push(&mdev->rs_plan_s, 0);
466778f271dSPhilipp Reisner 	spin_unlock(&mdev->peer_seq_lock);
467778f271dSPhilipp Reisner 	mdev->rs_planed -= curr_corr;
468778f271dSPhilipp Reisner 
469778f271dSPhilipp Reisner 	req_sect = sect_in + curr_corr;
470778f271dSPhilipp Reisner 	if (req_sect < 0)
471778f271dSPhilipp Reisner 		req_sect = 0;
472778f271dSPhilipp Reisner 
473778f271dSPhilipp Reisner 	max_sect = (mdev->sync_conf.c_max_rate * 2 * SLEEP_TIME) / HZ;
474778f271dSPhilipp Reisner 	if (req_sect > max_sect)
475778f271dSPhilipp Reisner 		req_sect = max_sect;
476778f271dSPhilipp Reisner 
477778f271dSPhilipp Reisner 	/*
478778f271dSPhilipp Reisner 	dev_warn(DEV, "si=%u if=%d wa=%u co=%d st=%d cps=%d pl=%d cc=%d rs=%d\n",
479778f271dSPhilipp Reisner 		 sect_in, mdev->rs_in_flight, want, correction,
480778f271dSPhilipp Reisner 		 steps, cps, mdev->rs_planed, curr_corr, req_sect);
481778f271dSPhilipp Reisner 	*/
482778f271dSPhilipp Reisner 
483778f271dSPhilipp Reisner 	return req_sect;
484778f271dSPhilipp Reisner }
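/* All quantities above are 512-byte sectors per SLEEP_TIME step, while
 * the configured rates are in KiB/s; hence the "* 2" (KiB -> sectors) and
 * "* SLEEP_TIME / HZ" (per second -> per step) conversions.  Assuming
 * SLEEP_TIME is HZ/10 (a 100ms step), a c_max_rate of 10240 KiB/s, for
 * example, caps req_sect at 10240 * 2 / 10 = 2048 sectors, i.e. 1 MiB per
 * step or 10 MiB/s. */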
485778f271dSPhilipp Reisner 
4869d77a5feSPhilipp Reisner static int drbd_rs_number_requests(struct drbd_conf *mdev)
487e65f440dSLars Ellenberg {
488e65f440dSLars Ellenberg 	int number;
489e65f440dSLars Ellenberg 	if (mdev->rs_plan_s.size) { /* mdev->sync_conf.c_plan_ahead */
490e65f440dSLars Ellenberg 		number = drbd_rs_controller(mdev) >> (BM_BLOCK_SHIFT - 9);
491e65f440dSLars Ellenberg 		mdev->c_sync_rate = number * HZ * (BM_BLOCK_SIZE / 1024) / SLEEP_TIME;
492e65f440dSLars Ellenberg 	} else {
493e65f440dSLars Ellenberg 		mdev->c_sync_rate = mdev->sync_conf.rate;
494e65f440dSLars Ellenberg 		number = SLEEP_TIME * mdev->c_sync_rate  / ((BM_BLOCK_SIZE / 1024) * HZ);
495e65f440dSLars Ellenberg 	}
496e65f440dSLars Ellenberg 
497e65f440dSLars Ellenberg 	/* ignore the amount of pending requests, the resync controller should
498e65f440dSLars Ellenberg 	 * throttle down to incoming reply rate soon enough anyways. */
499e65f440dSLars Ellenberg 	return number;
500e65f440dSLars Ellenberg }
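/* "number" is in units of one resync request, i.e. one BM_BLOCK_SIZE
 * (4 KiB) bitmap block: the controller output in sectors is shifted down
 * by (BM_BLOCK_SHIFT - 9), and the fixed-rate path converts the
 * configured rate in KiB/s into requests per step.  For example, assuming
 * the 100ms SLEEP_TIME, rate = 400 KiB/s yields 400 / (4 * 10) = 10
 * requests, i.e. 40 KiB, per step. */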
501e65f440dSLars Ellenberg 
5029d77a5feSPhilipp Reisner static int w_make_resync_request(struct drbd_conf *mdev,
503b411b363SPhilipp Reisner 				 struct drbd_work *w, int cancel)
504b411b363SPhilipp Reisner {
505b411b363SPhilipp Reisner 	unsigned long bit;
506b411b363SPhilipp Reisner 	sector_t sector;
507b411b363SPhilipp Reisner 	const sector_t capacity = drbd_get_capacity(mdev->this_bdev);
5081816a2b4SLars Ellenberg 	int max_bio_size;
509e65f440dSLars Ellenberg 	int number, rollback_i, size;
510b411b363SPhilipp Reisner 	int align, queued, sndbuf;
5110f0601f4SLars Ellenberg 	int i = 0;
512b411b363SPhilipp Reisner 
513b411b363SPhilipp Reisner 	if (unlikely(cancel))
514b411b363SPhilipp Reisner 		return 1;
515b411b363SPhilipp Reisner 
516af85e8e8SLars Ellenberg 	if (mdev->rs_total == 0) {
517af85e8e8SLars Ellenberg 		/* empty resync? */
518af85e8e8SLars Ellenberg 		drbd_resync_finished(mdev);
519af85e8e8SLars Ellenberg 		return 1;
520af85e8e8SLars Ellenberg 	}
521af85e8e8SLars Ellenberg 
522b411b363SPhilipp Reisner 	if (!get_ldev(mdev)) {
523b411b363SPhilipp Reisner 		/* Since we only need to access mdev->rsync, a
524b411b363SPhilipp Reisner 		   get_ldev_if_state(mdev, D_FAILED) would be sufficient, but
525b411b363SPhilipp Reisner 		   to continue resync with a broken disk makes no sense at
526b411b363SPhilipp Reisner 		   all */
527b411b363SPhilipp Reisner 		dev_err(DEV, "Disk broke down during resync!\n");
528b411b363SPhilipp Reisner 		return 1;
529b411b363SPhilipp Reisner 	}
530b411b363SPhilipp Reisner 
5310cfdd247SPhilipp Reisner 	max_bio_size = queue_max_hw_sectors(mdev->rq_queue) << 9;
532e65f440dSLars Ellenberg 	number = drbd_rs_number_requests(mdev);
533e65f440dSLars Ellenberg 	if (number == 0)
5340f0601f4SLars Ellenberg 		goto requeue;
535b411b363SPhilipp Reisner 
536b411b363SPhilipp Reisner 	for (i = 0; i < number; i++) {
537b411b363SPhilipp Reisner 		/* Stop generating RS requests, when half of the send buffer is filled */
538b411b363SPhilipp Reisner 		mutex_lock(&mdev->data.mutex);
539b411b363SPhilipp Reisner 		if (mdev->data.socket) {
540b411b363SPhilipp Reisner 			queued = mdev->data.socket->sk->sk_wmem_queued;
541b411b363SPhilipp Reisner 			sndbuf = mdev->data.socket->sk->sk_sndbuf;
542b411b363SPhilipp Reisner 		} else {
543b411b363SPhilipp Reisner 			queued = 1;
544b411b363SPhilipp Reisner 			sndbuf = 0;
545b411b363SPhilipp Reisner 		}
546b411b363SPhilipp Reisner 		mutex_unlock(&mdev->data.mutex);
547b411b363SPhilipp Reisner 		if (queued > sndbuf / 2)
548b411b363SPhilipp Reisner 			goto requeue;
549b411b363SPhilipp Reisner 
550b411b363SPhilipp Reisner next_sector:
551b411b363SPhilipp Reisner 		size = BM_BLOCK_SIZE;
552b411b363SPhilipp Reisner 		bit  = drbd_bm_find_next(mdev, mdev->bm_resync_fo);
553b411b363SPhilipp Reisner 
5544b0715f0SLars Ellenberg 		if (bit == DRBD_END_OF_BITMAP) {
555b411b363SPhilipp Reisner 			mdev->bm_resync_fo = drbd_bm_bits(mdev);
556b411b363SPhilipp Reisner 			put_ldev(mdev);
557b411b363SPhilipp Reisner 			return 1;
558b411b363SPhilipp Reisner 		}
559b411b363SPhilipp Reisner 
560b411b363SPhilipp Reisner 		sector = BM_BIT_TO_SECT(bit);
561b411b363SPhilipp Reisner 
562e3555d85SPhilipp Reisner 		if (drbd_rs_should_slow_down(mdev, sector) ||
563e3555d85SPhilipp Reisner 		    drbd_try_rs_begin_io(mdev, sector)) {
564b411b363SPhilipp Reisner 			mdev->bm_resync_fo = bit;
565b411b363SPhilipp Reisner 			goto requeue;
566b411b363SPhilipp Reisner 		}
567b411b363SPhilipp Reisner 		mdev->bm_resync_fo = bit + 1;
568b411b363SPhilipp Reisner 
569b411b363SPhilipp Reisner 		if (unlikely(drbd_bm_test_bit(mdev, bit) == 0)) {
570b411b363SPhilipp Reisner 			drbd_rs_complete_io(mdev, sector);
571b411b363SPhilipp Reisner 			goto next_sector;
572b411b363SPhilipp Reisner 		}
573b411b363SPhilipp Reisner 
5741816a2b4SLars Ellenberg #if DRBD_MAX_BIO_SIZE > BM_BLOCK_SIZE
575b411b363SPhilipp Reisner 		/* try to find some adjacent bits.
576b411b363SPhilipp Reisner 		 * we stop if we have already the maximum req size.
577b411b363SPhilipp Reisner 		 *
578b411b363SPhilipp Reisner 		 * Additionally always align bigger requests, in order to
579b411b363SPhilipp Reisner 		 * be prepared for all stripe sizes of software RAIDs.
580b411b363SPhilipp Reisner 		 */
581b411b363SPhilipp Reisner 		align = 1;
582d207450cSPhilipp Reisner 		rollback_i = i;
583b411b363SPhilipp Reisner 		for (;;) {
5841816a2b4SLars Ellenberg 			if (size + BM_BLOCK_SIZE > max_bio_size)
585b411b363SPhilipp Reisner 				break;
586b411b363SPhilipp Reisner 
587b411b363SPhilipp Reisner 			/* Be always aligned */
588b411b363SPhilipp Reisner 			if (sector & ((1<<(align+3))-1))
589b411b363SPhilipp Reisner 				break;
590b411b363SPhilipp Reisner 
591b411b363SPhilipp Reisner 			/* do not cross extent boundaries */
592b411b363SPhilipp Reisner 			if (((bit+1) & BM_BLOCKS_PER_BM_EXT_MASK) == 0)
593b411b363SPhilipp Reisner 				break;
594b411b363SPhilipp Reisner 			/* now, is it actually dirty, after all?
595b411b363SPhilipp Reisner 			 * caution, drbd_bm_test_bit is tri-state for some
596b411b363SPhilipp Reisner 			 * obscure reason; ( b == 0 ) would get the out-of-band
597b411b363SPhilipp Reisner 			 * only accidentally right because of the "oddly sized"
598b411b363SPhilipp Reisner 			 * adjustment below */
599b411b363SPhilipp Reisner 			if (drbd_bm_test_bit(mdev, bit+1) != 1)
600b411b363SPhilipp Reisner 				break;
601b411b363SPhilipp Reisner 			bit++;
602b411b363SPhilipp Reisner 			size += BM_BLOCK_SIZE;
603b411b363SPhilipp Reisner 			if ((BM_BLOCK_SIZE << align) <= size)
604b411b363SPhilipp Reisner 				align++;
605b411b363SPhilipp Reisner 			i++;
606b411b363SPhilipp Reisner 		}
607b411b363SPhilipp Reisner 		/* if we merged some,
608b411b363SPhilipp Reisner 		 * reset the offset to start the next drbd_bm_find_next from */
609b411b363SPhilipp Reisner 		if (size > BM_BLOCK_SIZE)
610b411b363SPhilipp Reisner 			mdev->bm_resync_fo = bit + 1;
611b411b363SPhilipp Reisner #endif
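		/* "align" counts the merged request size in BM_BLOCK_SIZE
		 * units as a power of two; since one 4 KiB block is 8 (1<<3)
		 * sectors, the "sector & ((1<<(align+3))-1)" test above only
		 * lets the request grow while it stays aligned to its own
		 * size. */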
612b411b363SPhilipp Reisner 
613b411b363SPhilipp Reisner 		/* adjust very last sectors, in case we are oddly sized */
614b411b363SPhilipp Reisner 		if (sector + (size>>9) > capacity)
615b411b363SPhilipp Reisner 			size = (capacity-sector)<<9;
616b411b363SPhilipp Reisner 		if (mdev->agreed_pro_version >= 89 && mdev->csums_tfm) {
617b411b363SPhilipp Reisner 			switch (read_for_csum(mdev, sector, size)) {
61880a40e43SLars Ellenberg 			case -EIO: /* Disk failure */
619b411b363SPhilipp Reisner 				put_ldev(mdev);
620b411b363SPhilipp Reisner 				return 0;
62180a40e43SLars Ellenberg 			case -EAGAIN: /* allocation failed, or ldev busy */
622b411b363SPhilipp Reisner 				drbd_rs_complete_io(mdev, sector);
623b411b363SPhilipp Reisner 				mdev->bm_resync_fo = BM_SECT_TO_BIT(sector);
624d207450cSPhilipp Reisner 				i = rollback_i;
625b411b363SPhilipp Reisner 				goto requeue;
62680a40e43SLars Ellenberg 			case 0:
62780a40e43SLars Ellenberg 				/* everything ok */
62880a40e43SLars Ellenberg 				break;
62980a40e43SLars Ellenberg 			default:
63080a40e43SLars Ellenberg 				BUG();
631b411b363SPhilipp Reisner 			}
632b411b363SPhilipp Reisner 		} else {
633b411b363SPhilipp Reisner 			inc_rs_pending(mdev);
634b411b363SPhilipp Reisner 			if (!drbd_send_drequest(mdev, P_RS_DATA_REQUEST,
635b411b363SPhilipp Reisner 					       sector, size, ID_SYNCER)) {
636b411b363SPhilipp Reisner 				dev_err(DEV, "drbd_send_drequest() failed, aborting...\n");
637b411b363SPhilipp Reisner 				dec_rs_pending(mdev);
638b411b363SPhilipp Reisner 				put_ldev(mdev);
639b411b363SPhilipp Reisner 				return 0;
640b411b363SPhilipp Reisner 			}
641b411b363SPhilipp Reisner 		}
642b411b363SPhilipp Reisner 	}
643b411b363SPhilipp Reisner 
644b411b363SPhilipp Reisner 	if (mdev->bm_resync_fo >= drbd_bm_bits(mdev)) {
645b411b363SPhilipp Reisner 		/* last syncer _request_ was sent,
646b411b363SPhilipp Reisner 		 * but the P_RS_DATA_REPLY not yet received.  sync will end (and
647b411b363SPhilipp Reisner 		 * next sync group will resume), as soon as we receive the last
648b411b363SPhilipp Reisner 		 * resync data block, and the last bit is cleared.
649b411b363SPhilipp Reisner 		 * until then resync "work" is "inactive" ...
650b411b363SPhilipp Reisner 		 */
651b411b363SPhilipp Reisner 		put_ldev(mdev);
652b411b363SPhilipp Reisner 		return 1;
653b411b363SPhilipp Reisner 	}
654b411b363SPhilipp Reisner 
655b411b363SPhilipp Reisner  requeue:
656778f271dSPhilipp Reisner 	mdev->rs_in_flight += (i << (BM_BLOCK_SHIFT - 9));
657b411b363SPhilipp Reisner 	mod_timer(&mdev->resync_timer, jiffies + SLEEP_TIME);
658b411b363SPhilipp Reisner 	put_ldev(mdev);
659b411b363SPhilipp Reisner 	return 1;
660b411b363SPhilipp Reisner }
661b411b363SPhilipp Reisner 
662b411b363SPhilipp Reisner static int w_make_ov_request(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
663b411b363SPhilipp Reisner {
664b411b363SPhilipp Reisner 	int number, i, size;
665b411b363SPhilipp Reisner 	sector_t sector;
666b411b363SPhilipp Reisner 	const sector_t capacity = drbd_get_capacity(mdev->this_bdev);
667b411b363SPhilipp Reisner 
668b411b363SPhilipp Reisner 	if (unlikely(cancel))
669b411b363SPhilipp Reisner 		return 1;
670b411b363SPhilipp Reisner 
6712649f080SLars Ellenberg 	number = drbd_rs_number_requests(mdev);
672b411b363SPhilipp Reisner 
673b411b363SPhilipp Reisner 	sector = mdev->ov_position;
674b411b363SPhilipp Reisner 	for (i = 0; i < number; i++) {
675b411b363SPhilipp Reisner 		if (sector >= capacity) {
676b411b363SPhilipp Reisner 			return 1;
677b411b363SPhilipp Reisner 		}
678b411b363SPhilipp Reisner 
679b411b363SPhilipp Reisner 		size = BM_BLOCK_SIZE;
680b411b363SPhilipp Reisner 
681e3555d85SPhilipp Reisner 		if (drbd_rs_should_slow_down(mdev, sector) ||
682e3555d85SPhilipp Reisner 		    drbd_try_rs_begin_io(mdev, sector)) {
683b411b363SPhilipp Reisner 			mdev->ov_position = sector;
684b411b363SPhilipp Reisner 			goto requeue;
685b411b363SPhilipp Reisner 		}
686b411b363SPhilipp Reisner 
687b411b363SPhilipp Reisner 		if (sector + (size>>9) > capacity)
688b411b363SPhilipp Reisner 			size = (capacity-sector)<<9;
689b411b363SPhilipp Reisner 
690b411b363SPhilipp Reisner 		inc_rs_pending(mdev);
691b411b363SPhilipp Reisner 		if (!drbd_send_ov_request(mdev, sector, size)) {
692b411b363SPhilipp Reisner 			dec_rs_pending(mdev);
693b411b363SPhilipp Reisner 			return 0;
694b411b363SPhilipp Reisner 		}
695b411b363SPhilipp Reisner 		sector += BM_SECT_PER_BIT;
696b411b363SPhilipp Reisner 	}
697b411b363SPhilipp Reisner 	mdev->ov_position = sector;
698b411b363SPhilipp Reisner 
699b411b363SPhilipp Reisner  requeue:
7002649f080SLars Ellenberg 	mdev->rs_in_flight += (i << (BM_BLOCK_SHIFT - 9));
701b411b363SPhilipp Reisner 	mod_timer(&mdev->resync_timer, jiffies + SLEEP_TIME);
702b411b363SPhilipp Reisner 	return 1;
703b411b363SPhilipp Reisner }
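/* Online verify uses the same pacing as resync (drbd_rs_number_requests()
 * and rs_in_flight), but walks the device linearly from ov_position
 * instead of scanning the bitmap, since every block has to be checked. */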
704b411b363SPhilipp Reisner 
705c4752ef1SPhilipp Reisner 
706370a43e7SPhilipp Reisner void start_resync_timer_fn(unsigned long data)
707370a43e7SPhilipp Reisner {
708370a43e7SPhilipp Reisner 	struct drbd_conf *mdev = (struct drbd_conf *) data;
709370a43e7SPhilipp Reisner 
710370a43e7SPhilipp Reisner 	drbd_queue_work(&mdev->data.work, &mdev->start_resync_work);
711370a43e7SPhilipp Reisner }
712370a43e7SPhilipp Reisner 
713c4752ef1SPhilipp Reisner int w_start_resync(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
714c4752ef1SPhilipp Reisner {
715370a43e7SPhilipp Reisner 	if (atomic_read(&mdev->unacked_cnt) || atomic_read(&mdev->rs_pending_cnt)) {
716370a43e7SPhilipp Reisner 		dev_warn(DEV, "w_start_resync later...\n");
717370a43e7SPhilipp Reisner 		mdev->start_resync_timer.expires = jiffies + HZ/10;
718370a43e7SPhilipp Reisner 		add_timer(&mdev->start_resync_timer);
719370a43e7SPhilipp Reisner 		return 1;
720370a43e7SPhilipp Reisner 	}
721c4752ef1SPhilipp Reisner 
722370a43e7SPhilipp Reisner 	drbd_start_resync(mdev, C_SYNC_SOURCE);
723370a43e7SPhilipp Reisner 	clear_bit(AHEAD_TO_SYNC_SOURCE, &mdev->current_epoch->flags);
724c4752ef1SPhilipp Reisner 	return 1;
725c4752ef1SPhilipp Reisner }
726c4752ef1SPhilipp Reisner 
727b411b363SPhilipp Reisner int w_ov_finished(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
728b411b363SPhilipp Reisner {
729b411b363SPhilipp Reisner 	kfree(w);
730b411b363SPhilipp Reisner 	ov_oos_print(mdev);
731b411b363SPhilipp Reisner 	drbd_resync_finished(mdev);
732b411b363SPhilipp Reisner 
733b411b363SPhilipp Reisner 	return 1;
734b411b363SPhilipp Reisner }
735b411b363SPhilipp Reisner 
736b411b363SPhilipp Reisner static int w_resync_finished(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
737b411b363SPhilipp Reisner {
738b411b363SPhilipp Reisner 	kfree(w);
739b411b363SPhilipp Reisner 
740b411b363SPhilipp Reisner 	drbd_resync_finished(mdev);
741b411b363SPhilipp Reisner 
742b411b363SPhilipp Reisner 	return 1;
743b411b363SPhilipp Reisner }
744b411b363SPhilipp Reisner 
745af85e8e8SLars Ellenberg static void ping_peer(struct drbd_conf *mdev)
746af85e8e8SLars Ellenberg {
747af85e8e8SLars Ellenberg 	clear_bit(GOT_PING_ACK, &mdev->flags);
748af85e8e8SLars Ellenberg 	request_ping(mdev);
749af85e8e8SLars Ellenberg 	wait_event(mdev->misc_wait,
750af85e8e8SLars Ellenberg 		   test_bit(GOT_PING_ACK, &mdev->flags) || mdev->state.conn < C_CONNECTED);
751af85e8e8SLars Ellenberg }
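/* Blocks until a ping ack arrives or the connection drops below
 * C_CONNECTED; drbd_resync_finished() calls this before taking req_lock
 * to finalize the post-resync state. */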
752af85e8e8SLars Ellenberg 
753b411b363SPhilipp Reisner int drbd_resync_finished(struct drbd_conf *mdev)
754b411b363SPhilipp Reisner {
755b411b363SPhilipp Reisner 	unsigned long db, dt, dbdt;
756b411b363SPhilipp Reisner 	unsigned long n_oos;
757b411b363SPhilipp Reisner 	union drbd_state os, ns;
758b411b363SPhilipp Reisner 	struct drbd_work *w;
759b411b363SPhilipp Reisner 	char *khelper_cmd = NULL;
76026525618SLars Ellenberg 	int verify_done = 0;
761b411b363SPhilipp Reisner 
762b411b363SPhilipp Reisner 	/* Remove all elements from the resync LRU. Since future actions
763b411b363SPhilipp Reisner 	 * might set bits in the (main) bitmap, then the entries in the
764b411b363SPhilipp Reisner 	 * resync LRU would be wrong. */
765b411b363SPhilipp Reisner 	if (drbd_rs_del_all(mdev)) {
766b411b363SPhilipp Reisner 		/* In case this is not possible now, most probably because
767b411b363SPhilipp Reisner 		 * there are P_RS_DATA_REPLY Packets lingering on the worker's
768b411b363SPhilipp Reisner 		 * queue (or even the read operations for those packets
769b411b363SPhilipp Reisner 		 * is not finished by now).   Retry in 100ms. */
770b411b363SPhilipp Reisner 
77120ee6390SPhilipp Reisner 		schedule_timeout_interruptible(HZ / 10);
772b411b363SPhilipp Reisner 		w = kmalloc(sizeof(struct drbd_work), GFP_ATOMIC);
773b411b363SPhilipp Reisner 		if (w) {
774b411b363SPhilipp Reisner 			w->cb = w_resync_finished;
775b411b363SPhilipp Reisner 			drbd_queue_work(&mdev->data.work, w);
776b411b363SPhilipp Reisner 			return 1;
777b411b363SPhilipp Reisner 		}
778b411b363SPhilipp Reisner 		dev_err(DEV, "Warn failed to drbd_rs_del_all() and to kmalloc(w).\n");
779b411b363SPhilipp Reisner 	}
780b411b363SPhilipp Reisner 
781b411b363SPhilipp Reisner 	dt = (jiffies - mdev->rs_start - mdev->rs_paused) / HZ;
782b411b363SPhilipp Reisner 	if (dt <= 0)
783b411b363SPhilipp Reisner 		dt = 1;
784b411b363SPhilipp Reisner 	db = mdev->rs_total;
785b411b363SPhilipp Reisner 	dbdt = Bit2KB(db/dt);
786b411b363SPhilipp Reisner 	mdev->rs_paused /= HZ;
787b411b363SPhilipp Reisner 
788b411b363SPhilipp Reisner 	if (!get_ldev(mdev))
789b411b363SPhilipp Reisner 		goto out;
790b411b363SPhilipp Reisner 
791af85e8e8SLars Ellenberg 	ping_peer(mdev);
792af85e8e8SLars Ellenberg 
793b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->req_lock);
794b411b363SPhilipp Reisner 	os = mdev->state;
795b411b363SPhilipp Reisner 
79626525618SLars Ellenberg 	verify_done = (os.conn == C_VERIFY_S || os.conn == C_VERIFY_T);
79726525618SLars Ellenberg 
798b411b363SPhilipp Reisner 	/* This protects us against multiple calls (that can happen in the presence
799b411b363SPhilipp Reisner 	   of application IO), and against connectivity loss just before we arrive here. */
800b411b363SPhilipp Reisner 	if (os.conn <= C_CONNECTED)
801b411b363SPhilipp Reisner 		goto out_unlock;
802b411b363SPhilipp Reisner 
803b411b363SPhilipp Reisner 	ns = os;
804b411b363SPhilipp Reisner 	ns.conn = C_CONNECTED;
805b411b363SPhilipp Reisner 
806b411b363SPhilipp Reisner 	dev_info(DEV, "%s done (total %lu sec; paused %lu sec; %lu K/sec)\n",
80726525618SLars Ellenberg 	     verify_done ? "Online verify " : "Resync",
808b411b363SPhilipp Reisner 	     dt + mdev->rs_paused, mdev->rs_paused, dbdt);
809b411b363SPhilipp Reisner 
810b411b363SPhilipp Reisner 	n_oos = drbd_bm_total_weight(mdev);
811b411b363SPhilipp Reisner 
812b411b363SPhilipp Reisner 	if (os.conn == C_VERIFY_S || os.conn == C_VERIFY_T) {
813b411b363SPhilipp Reisner 		if (n_oos) {
814b411b363SPhilipp Reisner 			dev_alert(DEV, "Online verify found %lu %dk block out of sync!\n",
815b411b363SPhilipp Reisner 			      n_oos, Bit2KB(1));
816b411b363SPhilipp Reisner 			khelper_cmd = "out-of-sync";
817b411b363SPhilipp Reisner 		}
818b411b363SPhilipp Reisner 	} else {
819b411b363SPhilipp Reisner 		D_ASSERT((n_oos - mdev->rs_failed) == 0);
820b411b363SPhilipp Reisner 
821b411b363SPhilipp Reisner 		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T)
822b411b363SPhilipp Reisner 			khelper_cmd = "after-resync-target";
823b411b363SPhilipp Reisner 
824b411b363SPhilipp Reisner 		if (mdev->csums_tfm && mdev->rs_total) {
825b411b363SPhilipp Reisner 			const unsigned long s = mdev->rs_same_csum;
826b411b363SPhilipp Reisner 			const unsigned long t = mdev->rs_total;
827b411b363SPhilipp Reisner 			const int ratio =
828b411b363SPhilipp Reisner 				(t == 0)     ? 0 :
829b411b363SPhilipp Reisner 			(t < 100000) ? ((s*100)/t) : (s/(t/100));
830b411b363SPhilipp Reisner 			dev_info(DEV, "%u %% had equal checksums, eliminated: %luK; "
831b411b363SPhilipp Reisner 			     "transferred %luK total %luK\n",
832b411b363SPhilipp Reisner 			     ratio,
833b411b363SPhilipp Reisner 			     Bit2KB(mdev->rs_same_csum),
834b411b363SPhilipp Reisner 			     Bit2KB(mdev->rs_total - mdev->rs_same_csum),
835b411b363SPhilipp Reisner 			     Bit2KB(mdev->rs_total));
836b411b363SPhilipp Reisner 		}
837b411b363SPhilipp Reisner 	}
838b411b363SPhilipp Reisner 
839b411b363SPhilipp Reisner 	if (mdev->rs_failed) {
840b411b363SPhilipp Reisner 		dev_info(DEV, "            %lu failed blocks\n", mdev->rs_failed);
841b411b363SPhilipp Reisner 
842b411b363SPhilipp Reisner 		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) {
843b411b363SPhilipp Reisner 			ns.disk = D_INCONSISTENT;
844b411b363SPhilipp Reisner 			ns.pdsk = D_UP_TO_DATE;
845b411b363SPhilipp Reisner 		} else {
846b411b363SPhilipp Reisner 			ns.disk = D_UP_TO_DATE;
847b411b363SPhilipp Reisner 			ns.pdsk = D_INCONSISTENT;
848b411b363SPhilipp Reisner 		}
849b411b363SPhilipp Reisner 	} else {
850b411b363SPhilipp Reisner 		ns.disk = D_UP_TO_DATE;
851b411b363SPhilipp Reisner 		ns.pdsk = D_UP_TO_DATE;
852b411b363SPhilipp Reisner 
853b411b363SPhilipp Reisner 		if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) {
854b411b363SPhilipp Reisner 			if (mdev->p_uuid) {
855b411b363SPhilipp Reisner 				int i;
856b411b363SPhilipp Reisner 				for (i = UI_BITMAP ; i <= UI_HISTORY_END ; i++)
857b411b363SPhilipp Reisner 					_drbd_uuid_set(mdev, i, mdev->p_uuid[i]);
858b411b363SPhilipp Reisner 				drbd_uuid_set(mdev, UI_BITMAP, mdev->ldev->md.uuid[UI_CURRENT]);
859b411b363SPhilipp Reisner 				_drbd_uuid_set(mdev, UI_CURRENT, mdev->p_uuid[UI_CURRENT]);
860b411b363SPhilipp Reisner 			} else {
861b411b363SPhilipp Reisner 				dev_err(DEV, "mdev->p_uuid is NULL! BUG\n");
862b411b363SPhilipp Reisner 			}
863b411b363SPhilipp Reisner 		}
864b411b363SPhilipp Reisner 
86562b0da3aSLars Ellenberg 		if (!(os.conn == C_VERIFY_S || os.conn == C_VERIFY_T)) {
86662b0da3aSLars Ellenberg 			/* for verify runs, we don't update uuids here,
86762b0da3aSLars Ellenberg 			 * so there would be nothing to report. */
868b411b363SPhilipp Reisner 			drbd_uuid_set_bm(mdev, 0UL);
86962b0da3aSLars Ellenberg 			drbd_print_uuids(mdev, "updated UUIDs");
870b411b363SPhilipp Reisner 			if (mdev->p_uuid) {
871b411b363SPhilipp Reisner 				/* Now the two UUID sets are equal, update what we
872b411b363SPhilipp Reisner 				 * know of the peer. */
873b411b363SPhilipp Reisner 				int i;
874b411b363SPhilipp Reisner 				for (i = UI_CURRENT ; i <= UI_HISTORY_END ; i++)
875b411b363SPhilipp Reisner 					mdev->p_uuid[i] = mdev->ldev->md.uuid[i];
876b411b363SPhilipp Reisner 			}
877b411b363SPhilipp Reisner 		}
87862b0da3aSLars Ellenberg 	}
879b411b363SPhilipp Reisner 
880b411b363SPhilipp Reisner 	_drbd_set_state(mdev, ns, CS_VERBOSE, NULL);
881b411b363SPhilipp Reisner out_unlock:
882b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->req_lock);
883b411b363SPhilipp Reisner 	put_ldev(mdev);
884b411b363SPhilipp Reisner out:
885b411b363SPhilipp Reisner 	mdev->rs_total  = 0;
886b411b363SPhilipp Reisner 	mdev->rs_failed = 0;
887b411b363SPhilipp Reisner 	mdev->rs_paused = 0;
88826525618SLars Ellenberg 	if (verify_done)
889b411b363SPhilipp Reisner 		mdev->ov_start_sector = 0;
890b411b363SPhilipp Reisner 
89113d42685SLars Ellenberg 	drbd_md_sync(mdev);
89213d42685SLars Ellenberg 
893b411b363SPhilipp Reisner 	if (khelper_cmd)
894b411b363SPhilipp Reisner 		drbd_khelper(mdev, khelper_cmd);
895b411b363SPhilipp Reisner 
896b411b363SPhilipp Reisner 	return 1;
897b411b363SPhilipp Reisner }
898b411b363SPhilipp Reisner 
899b411b363SPhilipp Reisner /* helper */
900b411b363SPhilipp Reisner static void move_to_net_ee_or_free(struct drbd_conf *mdev, struct drbd_epoch_entry *e)
901b411b363SPhilipp Reisner {
90245bb912bSLars Ellenberg 	if (drbd_ee_has_active_page(e)) {
903b411b363SPhilipp Reisner 		/* This might happen if sendpage() has not finished */
904010f6e67SAndreas Gruenbacher 		int i = (e->i.size + PAGE_SIZE -1) >> PAGE_SHIFT;
905435f0740SLars Ellenberg 		atomic_add(i, &mdev->pp_in_use_by_net);
906435f0740SLars Ellenberg 		atomic_sub(i, &mdev->pp_in_use);
907b411b363SPhilipp Reisner 		spin_lock_irq(&mdev->req_lock);
908b411b363SPhilipp Reisner 		list_add_tail(&e->w.list, &mdev->net_ee);
909b411b363SPhilipp Reisner 		spin_unlock_irq(&mdev->req_lock);
910435f0740SLars Ellenberg 		wake_up(&drbd_pp_wait);
911b411b363SPhilipp Reisner 	} else
912b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
913b411b363SPhilipp Reisner }
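/* Pages that may still be referenced by the network stack (sendpage() in
 * flight) cannot be recycled yet: the entry is parked on net_ee and its
 * pages are re-accounted from pp_in_use to pp_in_use_by_net, so the
 * drbd_pp_alloc()/max_buffers accounting mentioned above stays correct. */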
914b411b363SPhilipp Reisner 
915b411b363SPhilipp Reisner /**
916b411b363SPhilipp Reisner  * w_e_end_data_req() - Worker callback, to send a P_DATA_REPLY packet in response to a P_DATA_REQUEST
917b411b363SPhilipp Reisner  * @mdev:	DRBD device.
918b411b363SPhilipp Reisner  * @w:		work object.
919b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyways
920b411b363SPhilipp Reisner  */
921b411b363SPhilipp Reisner int w_e_end_data_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
922b411b363SPhilipp Reisner {
923b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
924b411b363SPhilipp Reisner 	int ok;
925b411b363SPhilipp Reisner 
926b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
927b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
928b411b363SPhilipp Reisner 		dec_unacked(mdev);
929b411b363SPhilipp Reisner 		return 1;
930b411b363SPhilipp Reisner 	}
931b411b363SPhilipp Reisner 
93245bb912bSLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
933b411b363SPhilipp Reisner 		ok = drbd_send_block(mdev, P_DATA_REPLY, e);
934b411b363SPhilipp Reisner 	} else {
935b411b363SPhilipp Reisner 		if (__ratelimit(&drbd_ratelimit_state))
936b411b363SPhilipp Reisner 			dev_err(DEV, "Sending NegDReply. sector=%llus.\n",
937010f6e67SAndreas Gruenbacher 			    (unsigned long long)e->i.sector);
938b411b363SPhilipp Reisner 
939b411b363SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_NEG_DREPLY, e);
940b411b363SPhilipp Reisner 	}
941b411b363SPhilipp Reisner 
942b411b363SPhilipp Reisner 	dec_unacked(mdev);
943b411b363SPhilipp Reisner 
944b411b363SPhilipp Reisner 	move_to_net_ee_or_free(mdev, e);
945b411b363SPhilipp Reisner 
946b411b363SPhilipp Reisner 	if (unlikely(!ok))
947b411b363SPhilipp Reisner 		dev_err(DEV, "drbd_send_block() failed\n");
948b411b363SPhilipp Reisner 	return ok;
949b411b363SPhilipp Reisner }
950b411b363SPhilipp Reisner 
951b411b363SPhilipp Reisner /**
952b411b363SPhilipp Reisner  * w_e_end_rsdata_req() - Worker callback to send a P_RS_DATA_REPLY packet in response to a P_RS_DATA_REQUESTRS
953b411b363SPhilipp Reisner  * @mdev:	DRBD device.
954b411b363SPhilipp Reisner  * @w:		work object.
955b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyways
956b411b363SPhilipp Reisner  */
957b411b363SPhilipp Reisner int w_e_end_rsdata_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
958b411b363SPhilipp Reisner {
959b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
960b411b363SPhilipp Reisner 	int ok;
961b411b363SPhilipp Reisner 
962b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
963b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
964b411b363SPhilipp Reisner 		dec_unacked(mdev);
965b411b363SPhilipp Reisner 		return 1;
966b411b363SPhilipp Reisner 	}
967b411b363SPhilipp Reisner 
968b411b363SPhilipp Reisner 	if (get_ldev_if_state(mdev, D_FAILED)) {
969010f6e67SAndreas Gruenbacher 		drbd_rs_complete_io(mdev, e->i.sector);
970b411b363SPhilipp Reisner 		put_ldev(mdev);
971b411b363SPhilipp Reisner 	}
972b411b363SPhilipp Reisner 
973d612d309SPhilipp Reisner 	if (mdev->state.conn == C_AHEAD) {
974d612d309SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_RS_CANCEL, e);
975d612d309SPhilipp Reisner 	} else if (likely((e->flags & EE_WAS_ERROR) == 0)) {
976b411b363SPhilipp Reisner 		if (likely(mdev->state.pdsk >= D_INCONSISTENT)) {
977b411b363SPhilipp Reisner 			inc_rs_pending(mdev);
978b411b363SPhilipp Reisner 			ok = drbd_send_block(mdev, P_RS_DATA_REPLY, e);
979b411b363SPhilipp Reisner 		} else {
980b411b363SPhilipp Reisner 			if (__ratelimit(&drbd_ratelimit_state))
981b411b363SPhilipp Reisner 				dev_err(DEV, "Not sending RSDataReply, "
982b411b363SPhilipp Reisner 				    "partner DISKLESS!\n");
983b411b363SPhilipp Reisner 			ok = 1;
984b411b363SPhilipp Reisner 		}
985b411b363SPhilipp Reisner 	} else {
986b411b363SPhilipp Reisner 		if (__ratelimit(&drbd_ratelimit_state))
987b411b363SPhilipp Reisner 			dev_err(DEV, "Sending NegRSDReply. sector %llus.\n",
988010f6e67SAndreas Gruenbacher 			    (unsigned long long)e->i.sector);
989b411b363SPhilipp Reisner 
990b411b363SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_NEG_RS_DREPLY, e);
991b411b363SPhilipp Reisner 
992b411b363SPhilipp Reisner 		/* update resync data with failure */
993010f6e67SAndreas Gruenbacher 		drbd_rs_failed_io(mdev, e->i.sector, e->i.size);
994b411b363SPhilipp Reisner 	}
995b411b363SPhilipp Reisner 
996b411b363SPhilipp Reisner 	dec_unacked(mdev);
997b411b363SPhilipp Reisner 
998b411b363SPhilipp Reisner 	move_to_net_ee_or_free(mdev, e);
999b411b363SPhilipp Reisner 
1000b411b363SPhilipp Reisner 	if (unlikely(!ok))
1001b411b363SPhilipp Reisner 		dev_err(DEV, "drbd_send_block() failed\n");
1002b411b363SPhilipp Reisner 	return ok;
1003b411b363SPhilipp Reisner }
1004b411b363SPhilipp Reisner 
1005b411b363SPhilipp Reisner int w_e_end_csum_rs_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1006b411b363SPhilipp Reisner {
1007b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
1008b411b363SPhilipp Reisner 	struct digest_info *di;
1009b411b363SPhilipp Reisner 	int digest_size;
1010b411b363SPhilipp Reisner 	void *digest = NULL;
1011b411b363SPhilipp Reisner 	int ok, eq = 0;
1012b411b363SPhilipp Reisner 
1013b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1014b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
1015b411b363SPhilipp Reisner 		dec_unacked(mdev);
1016b411b363SPhilipp Reisner 		return 1;
1017b411b363SPhilipp Reisner 	}
1018b411b363SPhilipp Reisner 
10191d53f09eSLars Ellenberg 	if (get_ldev(mdev)) {
1020010f6e67SAndreas Gruenbacher 		drbd_rs_complete_io(mdev, e->i.sector);
10211d53f09eSLars Ellenberg 		put_ldev(mdev);
10221d53f09eSLars Ellenberg 	}
1023b411b363SPhilipp Reisner 
102485719573SPhilipp Reisner 	di = e->digest;
1025b411b363SPhilipp Reisner 
102645bb912bSLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
1027b411b363SPhilipp Reisner 		/* quick hack to try to avoid a race against reconfiguration.
1028b411b363SPhilipp Reisner 		 * a real fix would be much more involved,
1029b411b363SPhilipp Reisner 		 * introducing more locking mechanisms */
1030b411b363SPhilipp Reisner 		if (mdev->csums_tfm) {
1031b411b363SPhilipp Reisner 			digest_size = crypto_hash_digestsize(mdev->csums_tfm);
1032b411b363SPhilipp Reisner 			D_ASSERT(digest_size == di->digest_size);
1033b411b363SPhilipp Reisner 			digest = kmalloc(digest_size, GFP_NOIO);
1034b411b363SPhilipp Reisner 		}
1035b411b363SPhilipp Reisner 		if (digest) {
103645bb912bSLars Ellenberg 			drbd_csum_ee(mdev, mdev->csums_tfm, e, digest);
1037b411b363SPhilipp Reisner 			eq = !memcmp(digest, di->digest, digest_size);
1038b411b363SPhilipp Reisner 			kfree(digest);
1039b411b363SPhilipp Reisner 		}
1040b411b363SPhilipp Reisner 
1041b411b363SPhilipp Reisner 		if (eq) {
1042010f6e67SAndreas Gruenbacher 			drbd_set_in_sync(mdev, e->i.sector, e->i.size);
1043676396d5SLars Ellenberg 			/* rs_same_csums unit is BM_BLOCK_SIZE */
1044010f6e67SAndreas Gruenbacher 			mdev->rs_same_csum += e->i.size >> BM_BLOCK_SHIFT;
1045b411b363SPhilipp Reisner 			ok = drbd_send_ack(mdev, P_RS_IS_IN_SYNC, e);
1046b411b363SPhilipp Reisner 		} else {
1047b411b363SPhilipp Reisner 			inc_rs_pending(mdev);
1048204bba99SPhilipp Reisner 			e->block_id = ID_SYNCER; /* By setting block_id, digest pointer becomes invalid! */
1049204bba99SPhilipp Reisner 			e->flags &= ~EE_HAS_DIGEST; /* This e no longer has a digest pointer */
1050204bba99SPhilipp Reisner 			kfree(di);
1051b411b363SPhilipp Reisner 			ok = drbd_send_block(mdev, P_RS_DATA_REPLY, e);
1052b411b363SPhilipp Reisner 		}
1053b411b363SPhilipp Reisner 	} else {
1054b411b363SPhilipp Reisner 		ok = drbd_send_ack(mdev, P_NEG_RS_DREPLY, e);
1055b411b363SPhilipp Reisner 		if (__ratelimit(&drbd_ratelimit_state))
1056b411b363SPhilipp Reisner 			dev_err(DEV, "Sending NegDReply. I guess it gets messy.\n");
1057b411b363SPhilipp Reisner 	}
1058b411b363SPhilipp Reisner 
1059b411b363SPhilipp Reisner 	dec_unacked(mdev);
1060b411b363SPhilipp Reisner 	move_to_net_ee_or_free(mdev, e);
1061b411b363SPhilipp Reisner 
1062b411b363SPhilipp Reisner 	if (unlikely(!ok))
1063b411b363SPhilipp Reisner 		dev_err(DEV, "drbd_send_block/ack() failed\n");
1064b411b363SPhilipp Reisner 	return ok;
1065b411b363SPhilipp Reisner }
1066b411b363SPhilipp Reisner 
106753ea4331SLars Ellenberg /* TODO merge common code with w_e_send_csum */
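/**
 * w_e_end_ov_req() - Worker callback to answer an online verify request
 * @mdev:	DRBD device.
 * @w:		work object.
 * @cancel:	The connection will be closed anyways
 *
 * Computes a digest over the block just read (a zeroed digest on read error)
 * and sends it to the peer in a P_OV_REPLY packet.
 */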
1068b411b363SPhilipp Reisner int w_e_end_ov_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1069b411b363SPhilipp Reisner {
1070b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
1071010f6e67SAndreas Gruenbacher 	sector_t sector = e->i.sector;
1072010f6e67SAndreas Gruenbacher 	unsigned int size = e->i.size;
1073b411b363SPhilipp Reisner 	int digest_size;
1074b411b363SPhilipp Reisner 	void *digest;
1075b411b363SPhilipp Reisner 	int ok = 1;
1076b411b363SPhilipp Reisner 
1077b411b363SPhilipp Reisner 	if (unlikely(cancel))
1078b411b363SPhilipp Reisner 		goto out;
1079b411b363SPhilipp Reisner 
1080b411b363SPhilipp Reisner 	digest_size = crypto_hash_digestsize(mdev->verify_tfm);
1081b411b363SPhilipp Reisner 	digest = kmalloc(digest_size, GFP_NOIO);
10828f21420eSPhilipp Reisner 	if (!digest) {
10838f21420eSPhilipp Reisner 		ok = 0;	/* terminate the connection in case the allocation failed */
10848f21420eSPhilipp Reisner 		goto out;
10858f21420eSPhilipp Reisner 	}
10868f21420eSPhilipp Reisner 
10878f21420eSPhilipp Reisner 	if (likely(!(e->flags & EE_WAS_ERROR)))
108845bb912bSLars Ellenberg 		drbd_csum_ee(mdev, mdev->verify_tfm, e, digest);
10898f21420eSPhilipp Reisner 	else
10908f21420eSPhilipp Reisner 		memset(digest, 0, digest_size);
10918f21420eSPhilipp Reisner 
109253ea4331SLars Ellenberg 	/* Free e and pages before send.
109353ea4331SLars Ellenberg 	 * In case we block on congestion, we could otherwise run into
109453ea4331SLars Ellenberg 	 * some distributed deadlock, if the other side blocks on
109553ea4331SLars Ellenberg 	 * congestion as well, because our receiver blocks in
109653ea4331SLars Ellenberg 	 * drbd_pp_alloc due to pp_in_use > max_buffers. */
109753ea4331SLars Ellenberg 	drbd_free_ee(mdev, e);
109853ea4331SLars Ellenberg 	e = NULL;
1099b411b363SPhilipp Reisner 	inc_rs_pending(mdev);
110053ea4331SLars Ellenberg 	ok = drbd_send_drequest_csum(mdev, sector, size,
110153ea4331SLars Ellenberg 				     digest, digest_size,
110253ea4331SLars Ellenberg 				     P_OV_REPLY);
1103b411b363SPhilipp Reisner 	if (!ok)
1104b411b363SPhilipp Reisner 		dec_rs_pending(mdev);
1105b411b363SPhilipp Reisner 	kfree(digest);
1106b411b363SPhilipp Reisner 
1107b411b363SPhilipp Reisner out:
110853ea4331SLars Ellenberg 	if (e)
1109b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
1110b411b363SPhilipp Reisner 	dec_unacked(mdev);
1111b411b363SPhilipp Reisner 	return ok;
1112b411b363SPhilipp Reisner }
1113b411b363SPhilipp Reisner 
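/* Record an out-of-sync block found by online verify: extend the currently
 * tracked contiguous range if possible, otherwise start a new one, and mark
 * the block as out of sync in the bitmap. */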
1114b411b363SPhilipp Reisner void drbd_ov_oos_found(struct drbd_conf *mdev, sector_t sector, int size)
1115b411b363SPhilipp Reisner {
1116b411b363SPhilipp Reisner 	if (mdev->ov_last_oos_start + mdev->ov_last_oos_size == sector) {
1117b411b363SPhilipp Reisner 		mdev->ov_last_oos_size += size>>9;
1118b411b363SPhilipp Reisner 	} else {
1119b411b363SPhilipp Reisner 		mdev->ov_last_oos_start = sector;
1120b411b363SPhilipp Reisner 		mdev->ov_last_oos_size = size>>9;
1121b411b363SPhilipp Reisner 	}
1122b411b363SPhilipp Reisner 	drbd_set_out_of_sync(mdev, sector, size);
1123b411b363SPhilipp Reisner }
1124b411b363SPhilipp Reisner 
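/**
 * w_e_end_ov_reply() - Worker callback to process an online verify reply
 * @mdev:	DRBD device.
 * @w:		work object.
 * @cancel:	The connection will be closed anyways
 *
 * Compares the peer's digest with one computed over the local block, records
 * mismatches via drbd_ov_oos_found(), acknowledges with P_OV_RESULT and
 * finishes the verify run once the last block has been processed.
 */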
1125b411b363SPhilipp Reisner int w_e_end_ov_reply(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1126b411b363SPhilipp Reisner {
1127b411b363SPhilipp Reisner 	struct drbd_epoch_entry *e = container_of(w, struct drbd_epoch_entry, w);
1128b411b363SPhilipp Reisner 	struct digest_info *di;
1129b411b363SPhilipp Reisner 	void *digest;
1130010f6e67SAndreas Gruenbacher 	sector_t sector = e->i.sector;
1131010f6e67SAndreas Gruenbacher 	unsigned int size = e->i.size;
113253ea4331SLars Ellenberg 	int digest_size;
1133b411b363SPhilipp Reisner 	int ok, eq = 0;
1134b411b363SPhilipp Reisner 
1135b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1136b411b363SPhilipp Reisner 		drbd_free_ee(mdev, e);
1137b411b363SPhilipp Reisner 		dec_unacked(mdev);
1138b411b363SPhilipp Reisner 		return 1;
1139b411b363SPhilipp Reisner 	}
1140b411b363SPhilipp Reisner 
1141b411b363SPhilipp Reisner 	/* after "cancel", because after drbd_disconnect/drbd_rs_cancel_all
1142b411b363SPhilipp Reisner 	 * the resync lru has been cleaned up already */
11431d53f09eSLars Ellenberg 	if (get_ldev(mdev)) {
1144010f6e67SAndreas Gruenbacher 		drbd_rs_complete_io(mdev, e->i.sector);
11451d53f09eSLars Ellenberg 		put_ldev(mdev);
11461d53f09eSLars Ellenberg 	}
1147b411b363SPhilipp Reisner 
114885719573SPhilipp Reisner 	di = e->digest;
1149b411b363SPhilipp Reisner 
115045bb912bSLars Ellenberg 	if (likely((e->flags & EE_WAS_ERROR) == 0)) {
1151b411b363SPhilipp Reisner 		digest_size = crypto_hash_digestsize(mdev->verify_tfm);
1152b411b363SPhilipp Reisner 		digest = kmalloc(digest_size, GFP_NOIO);
1153b411b363SPhilipp Reisner 		if (digest) {
115445bb912bSLars Ellenberg 			drbd_csum_ee(mdev, mdev->verify_tfm, e, digest);
1155b411b363SPhilipp Reisner 
1156b411b363SPhilipp Reisner 			D_ASSERT(digest_size == di->digest_size);
1157b411b363SPhilipp Reisner 			eq = !memcmp(digest, di->digest, digest_size);
1158b411b363SPhilipp Reisner 			kfree(digest);
1159b411b363SPhilipp Reisner 		}
1160b411b363SPhilipp Reisner 	}
1161b411b363SPhilipp Reisner 
116253ea4331SLars Ellenberg 	/* Free e and pages before send.
116353ea4331SLars Ellenberg 	 * In case we block on congestion, we could otherwise run into
116453ea4331SLars Ellenberg 	 * some distributed deadlock, if the other side blocks on
116553ea4331SLars Ellenberg 	 * congestion as well, because our receiver blocks in
116653ea4331SLars Ellenberg 	 * drbd_pp_alloc due to pp_in_use > max_buffers. */
116753ea4331SLars Ellenberg 	drbd_free_ee(mdev, e);
1168b411b363SPhilipp Reisner 	if (!eq)
116953ea4331SLars Ellenberg 		drbd_ov_oos_found(mdev, sector, size);
1170b411b363SPhilipp Reisner 	else
1171b411b363SPhilipp Reisner 		ov_oos_print(mdev);
1172b411b363SPhilipp Reisner 
117353ea4331SLars Ellenberg 	ok = drbd_send_ack_ex(mdev, P_OV_RESULT, sector, size,
1174b411b363SPhilipp Reisner 			      eq ? ID_IN_SYNC : ID_OUT_OF_SYNC);
1175b411b363SPhilipp Reisner 
117653ea4331SLars Ellenberg 	dec_unacked(mdev);
1177b411b363SPhilipp Reisner 
1178ea5442afSLars Ellenberg 	--mdev->ov_left;
1179ea5442afSLars Ellenberg 
1180ea5442afSLars Ellenberg 	/* let's advance progress step marks only for every other megabyte */
1181ea5442afSLars Ellenberg 	if ((mdev->ov_left & 0x200) == 0x200)
1182ea5442afSLars Ellenberg 		drbd_advance_rs_marks(mdev, mdev->ov_left);
1183ea5442afSLars Ellenberg 
1184ea5442afSLars Ellenberg 	if (mdev->ov_left == 0) {
1185b411b363SPhilipp Reisner 		ov_oos_print(mdev);
1186b411b363SPhilipp Reisner 		drbd_resync_finished(mdev);
1187b411b363SPhilipp Reisner 	}
1188b411b363SPhilipp Reisner 
1189b411b363SPhilipp Reisner 	return ok;
1190b411b363SPhilipp Reisner }
1191b411b363SPhilipp Reisner 
1192b411b363SPhilipp Reisner int w_prev_work_done(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1193b411b363SPhilipp Reisner {
1194b411b363SPhilipp Reisner 	struct drbd_wq_barrier *b = container_of(w, struct drbd_wq_barrier, w);
1195b411b363SPhilipp Reisner 	complete(&b->done);
1196b411b363SPhilipp Reisner 	return 1;
1197b411b363SPhilipp Reisner }
1198b411b363SPhilipp Reisner 
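/* Worker callback to send a P_BARRIER packet closing the current epoch. */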
1199b411b363SPhilipp Reisner int w_send_barrier(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1200b411b363SPhilipp Reisner {
1201b411b363SPhilipp Reisner 	struct drbd_tl_epoch *b = container_of(w, struct drbd_tl_epoch, w);
1202b411b363SPhilipp Reisner 	struct p_barrier *p = &mdev->data.sbuf.barrier;
1203b411b363SPhilipp Reisner 	int ok = 1;
1204b411b363SPhilipp Reisner 
1205b411b363SPhilipp Reisner 	/* really avoid racing with tl_clear.  w.cb may have been referenced
1206b411b363SPhilipp Reisner 	 * just before it was reassigned and re-queued, so double check that.
1207b411b363SPhilipp Reisner 	 * actually, this race was harmless, since we only try to send the
1208b411b363SPhilipp Reisner 	 * barrier packet here, and otherwise do nothing with the object.
1209b411b363SPhilipp Reisner 	 * but compare with the head of w_clear_epoch */
1210b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->req_lock);
1211b411b363SPhilipp Reisner 	if (w->cb != w_send_barrier || mdev->state.conn < C_CONNECTED)
1212b411b363SPhilipp Reisner 		cancel = 1;
1213b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->req_lock);
1214b411b363SPhilipp Reisner 	if (cancel)
1215b411b363SPhilipp Reisner 		return 1;
1216b411b363SPhilipp Reisner 
1217b411b363SPhilipp Reisner 	if (!drbd_get_data_sock(mdev))
1218b411b363SPhilipp Reisner 		return 0;
1219b411b363SPhilipp Reisner 	p->barrier = b->br_number;
1220b411b363SPhilipp Reisner 	/* inc_ap_pending was done where this was queued.
1221b411b363SPhilipp Reisner 	 * dec_ap_pending will be done in got_BarrierAck
1222b411b363SPhilipp Reisner 	 * or (on connection loss) in w_clear_epoch.  */
1223b411b363SPhilipp Reisner 	ok = _drbd_send_cmd(mdev, mdev->data.socket, P_BARRIER,
12240b70a13dSPhilipp Reisner 				(struct p_header80 *)p, sizeof(*p), 0);
1225b411b363SPhilipp Reisner 	drbd_put_data_sock(mdev);
1226b411b363SPhilipp Reisner 
1227b411b363SPhilipp Reisner 	return ok;
1228b411b363SPhilipp Reisner }
1229b411b363SPhilipp Reisner 
1230b411b363SPhilipp Reisner int w_send_write_hint(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1231b411b363SPhilipp Reisner {
1232b411b363SPhilipp Reisner 	if (cancel)
1233b411b363SPhilipp Reisner 		return 1;
1234b411b363SPhilipp Reisner 	return drbd_send_short_cmd(mdev, P_UNPLUG_REMOTE);
1235b411b363SPhilipp Reisner }
1236b411b363SPhilipp Reisner 
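/* Worker callback to send an out-of-sync notification (drbd_send_oos) for a
 * write request instead of mirroring its data. */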
123773a01a18SPhilipp Reisner int w_send_oos(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
123873a01a18SPhilipp Reisner {
123973a01a18SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
124073a01a18SPhilipp Reisner 	int ok;
124173a01a18SPhilipp Reisner 
124273a01a18SPhilipp Reisner 	if (unlikely(cancel)) {
124373a01a18SPhilipp Reisner 		req_mod(req, send_canceled);
124473a01a18SPhilipp Reisner 		return 1;
124573a01a18SPhilipp Reisner 	}
124673a01a18SPhilipp Reisner 
124773a01a18SPhilipp Reisner 	ok = drbd_send_oos(mdev, req);
124873a01a18SPhilipp Reisner 	req_mod(req, oos_handed_to_network);
124973a01a18SPhilipp Reisner 
125073a01a18SPhilipp Reisner 	return ok;
125173a01a18SPhilipp Reisner }
125273a01a18SPhilipp Reisner 
1253b411b363SPhilipp Reisner /**
1254b411b363SPhilipp Reisner  * w_send_dblock() - Worker callback to send a P_DATA packet in order to mirror a write request
1255b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1256b411b363SPhilipp Reisner  * @w:		work object.
1257b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyways
1258b411b363SPhilipp Reisner  */
1259b411b363SPhilipp Reisner int w_send_dblock(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1260b411b363SPhilipp Reisner {
1261b411b363SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
1262b411b363SPhilipp Reisner 	int ok;
1263b411b363SPhilipp Reisner 
1264b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1265b411b363SPhilipp Reisner 		req_mod(req, send_canceled);
1266b411b363SPhilipp Reisner 		return 1;
1267b411b363SPhilipp Reisner 	}
1268b411b363SPhilipp Reisner 
1269b411b363SPhilipp Reisner 	ok = drbd_send_dblock(mdev, req);
1270b411b363SPhilipp Reisner 	req_mod(req, ok ? handed_over_to_network : send_failed);
1271b411b363SPhilipp Reisner 
1272b411b363SPhilipp Reisner 	return ok;
1273b411b363SPhilipp Reisner }
1274b411b363SPhilipp Reisner 
1275b411b363SPhilipp Reisner /**
1276b411b363SPhilipp Reisner  * w_send_read_req() - Worker callback to send a read request (P_DATA_REQUEST) packet
1277b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1278b411b363SPhilipp Reisner  * @w:		work object.
1279b411b363SPhilipp Reisner  * @cancel:	The connection will be closed anyways
1280b411b363SPhilipp Reisner  */
1281b411b363SPhilipp Reisner int w_send_read_req(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1282b411b363SPhilipp Reisner {
1283b411b363SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
1284b411b363SPhilipp Reisner 	int ok;
1285b411b363SPhilipp Reisner 
1286b411b363SPhilipp Reisner 	if (unlikely(cancel)) {
1287b411b363SPhilipp Reisner 		req_mod(req, send_canceled);
1288b411b363SPhilipp Reisner 		return 1;
1289b411b363SPhilipp Reisner 	}
1290b411b363SPhilipp Reisner 
1291ace652acSAndreas Gruenbacher 	ok = drbd_send_drequest(mdev, P_DATA_REQUEST, req->i.sector, req->i.size,
1292b411b363SPhilipp Reisner 				(unsigned long)req);
1293b411b363SPhilipp Reisner 
1294b411b363SPhilipp Reisner 	if (!ok) {
1295b411b363SPhilipp Reisner 		/* ?? we set C_TIMEOUT or C_BROKEN_PIPE in drbd_send();
1296b411b363SPhilipp Reisner 		 * so this is probably redundant */
1297b411b363SPhilipp Reisner 		if (mdev->state.conn >= C_CONNECTED)
1298b411b363SPhilipp Reisner 			drbd_force_state(mdev, NS(conn, C_NETWORK_FAILURE));
1299b411b363SPhilipp Reisner 	}
1300b411b363SPhilipp Reisner 	req_mod(req, ok ? handed_over_to_network : send_failed);
1301b411b363SPhilipp Reisner 
1302b411b363SPhilipp Reisner 	return ok;
1303b411b363SPhilipp Reisner }
1304b411b363SPhilipp Reisner 
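/* Worker callback to resubmit a request's private bio to the local backing
 * device; only used when unfreezing IO. */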
1305265be2d0SPhilipp Reisner int w_restart_disk_io(struct drbd_conf *mdev, struct drbd_work *w, int cancel)
1306265be2d0SPhilipp Reisner {
1307265be2d0SPhilipp Reisner 	struct drbd_request *req = container_of(w, struct drbd_request, w);
1308265be2d0SPhilipp Reisner 
13090778286aSPhilipp Reisner 	if (bio_data_dir(req->master_bio) == WRITE && req->rq_state & RQ_IN_ACT_LOG)
1310ace652acSAndreas Gruenbacher 		drbd_al_begin_io(mdev, req->i.sector);
1311265be2d0SPhilipp Reisner 	/* Calling drbd_al_begin_io() out of the worker might deadlock
1312265be2d0SPhilipp Reisner 	   theoretically. Practically it cannot deadlock, since this is
1313265be2d0SPhilipp Reisner 	   only used when unfreezing IOs. All the extents of the requests
1314265be2d0SPhilipp Reisner 	   that made it into the TL are already active */
1315265be2d0SPhilipp Reisner 
1316265be2d0SPhilipp Reisner 	drbd_req_make_private_bio(req, req->master_bio);
1317265be2d0SPhilipp Reisner 	req->private_bio->bi_bdev = mdev->ldev->backing_bdev;
1318265be2d0SPhilipp Reisner 	generic_make_request(req->private_bio);
1319265be2d0SPhilipp Reisner 
1320265be2d0SPhilipp Reisner 	return 1;
1321265be2d0SPhilipp Reisner }
1322265be2d0SPhilipp Reisner 
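/* Follow the sync-after dependency chain; returns 0 if any device this one
 * depends on is currently resyncing or has one of its pause flags set,
 * 1 otherwise. */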
1323b411b363SPhilipp Reisner static int _drbd_may_sync_now(struct drbd_conf *mdev)
1324b411b363SPhilipp Reisner {
1325b411b363SPhilipp Reisner 	struct drbd_conf *odev = mdev;
1326b411b363SPhilipp Reisner 
1327b411b363SPhilipp Reisner 	while (1) {
1328b411b363SPhilipp Reisner 		if (odev->sync_conf.after == -1)
1329b411b363SPhilipp Reisner 			return 1;
1330b411b363SPhilipp Reisner 		odev = minor_to_mdev(odev->sync_conf.after);
1331b411b363SPhilipp Reisner 		ERR_IF(!odev) return 1;
1332b411b363SPhilipp Reisner 		if ((odev->state.conn >= C_SYNC_SOURCE &&
1333b411b363SPhilipp Reisner 		     odev->state.conn <= C_PAUSED_SYNC_T) ||
1334b411b363SPhilipp Reisner 		    odev->state.aftr_isp || odev->state.peer_isp ||
1335b411b363SPhilipp Reisner 		    odev->state.user_isp)
1336b411b363SPhilipp Reisner 			return 0;
1337b411b363SPhilipp Reisner 	}
1338b411b363SPhilipp Reisner }
1339b411b363SPhilipp Reisner 
1340b411b363SPhilipp Reisner /**
1341b411b363SPhilipp Reisner  * _drbd_pause_after() - Pause resync on all devices that may not resync now
1342b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1343b411b363SPhilipp Reisner  *
1344b411b363SPhilipp Reisner  * Called from process context only (admin command and after_state_ch).
1345b411b363SPhilipp Reisner  */
1346b411b363SPhilipp Reisner static int _drbd_pause_after(struct drbd_conf *mdev)
1347b411b363SPhilipp Reisner {
1348b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1349b411b363SPhilipp Reisner 	int i, rv = 0;
1350b411b363SPhilipp Reisner 
1351b411b363SPhilipp Reisner 	for (i = 0; i < minor_count; i++) {
1352b411b363SPhilipp Reisner 		odev = minor_to_mdev(i);
1353b411b363SPhilipp Reisner 		if (!odev)
1354b411b363SPhilipp Reisner 			continue;
1355b411b363SPhilipp Reisner 		if (odev->state.conn == C_STANDALONE && odev->state.disk == D_DISKLESS)
1356b411b363SPhilipp Reisner 			continue;
1357b411b363SPhilipp Reisner 		if (!_drbd_may_sync_now(odev))
1358b411b363SPhilipp Reisner 			rv |= (__drbd_set_state(_NS(odev, aftr_isp, 1), CS_HARD, NULL)
1359b411b363SPhilipp Reisner 			       != SS_NOTHING_TO_DO);
1360b411b363SPhilipp Reisner 	}
1361b411b363SPhilipp Reisner 
1362b411b363SPhilipp Reisner 	return rv;
1363b411b363SPhilipp Reisner }
1364b411b363SPhilipp Reisner 
1365b411b363SPhilipp Reisner /**
1366b411b363SPhilipp Reisner  * _drbd_resume_next() - Resume resync on all devices that may resync now
1367b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1368b411b363SPhilipp Reisner  *
1369b411b363SPhilipp Reisner  * Called from process context only (admin command and worker).
1370b411b363SPhilipp Reisner  */
1371b411b363SPhilipp Reisner static int _drbd_resume_next(struct drbd_conf *mdev)
1372b411b363SPhilipp Reisner {
1373b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1374b411b363SPhilipp Reisner 	int i, rv = 0;
1375b411b363SPhilipp Reisner 
1376b411b363SPhilipp Reisner 	for (i = 0; i < minor_count; i++) {
1377b411b363SPhilipp Reisner 		odev = minor_to_mdev(i);
1378b411b363SPhilipp Reisner 		if (!odev)
1379b411b363SPhilipp Reisner 			continue;
1380b411b363SPhilipp Reisner 		if (odev->state.conn == C_STANDALONE && odev->state.disk == D_DISKLESS)
1381b411b363SPhilipp Reisner 			continue;
1382b411b363SPhilipp Reisner 		if (odev->state.aftr_isp) {
1383b411b363SPhilipp Reisner 			if (_drbd_may_sync_now(odev))
1384b411b363SPhilipp Reisner 				rv |= (__drbd_set_state(_NS(odev, aftr_isp, 0),
1385b411b363SPhilipp Reisner 							CS_HARD, NULL)
1386b411b363SPhilipp Reisner 				       != SS_NOTHING_TO_DO);
1387b411b363SPhilipp Reisner 		}
1388b411b363SPhilipp Reisner 	}
1389b411b363SPhilipp Reisner 	return rv;
1390b411b363SPhilipp Reisner }
1391b411b363SPhilipp Reisner 
1392b411b363SPhilipp Reisner void resume_next_sg(struct drbd_conf *mdev)
1393b411b363SPhilipp Reisner {
1394b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1395b411b363SPhilipp Reisner 	_drbd_resume_next(mdev);
1396b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1397b411b363SPhilipp Reisner }
1398b411b363SPhilipp Reisner 
1399b411b363SPhilipp Reisner void suspend_other_sg(struct drbd_conf *mdev)
1400b411b363SPhilipp Reisner {
1401b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1402b411b363SPhilipp Reisner 	_drbd_pause_after(mdev);
1403b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1404b411b363SPhilipp Reisner }
1405b411b363SPhilipp Reisner 
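/* Validate a new sync-after dependency: -1 means "no dependency"; unknown
 * minors are rejected with ERR_SYNC_AFTER, dependency cycles with
 * ERR_SYNC_AFTER_CYCLE. */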
1406b411b363SPhilipp Reisner static int sync_after_error(struct drbd_conf *mdev, int o_minor)
1407b411b363SPhilipp Reisner {
1408b411b363SPhilipp Reisner 	struct drbd_conf *odev;
1409b411b363SPhilipp Reisner 
1410b411b363SPhilipp Reisner 	if (o_minor == -1)
1411b411b363SPhilipp Reisner 		return NO_ERROR;
1412b411b363SPhilipp Reisner 	if (o_minor < -1 || minor_to_mdev(o_minor) == NULL)
1413b411b363SPhilipp Reisner 		return ERR_SYNC_AFTER;
1414b411b363SPhilipp Reisner 
1415b411b363SPhilipp Reisner 	/* check for loops */
1416b411b363SPhilipp Reisner 	odev = minor_to_mdev(o_minor);
1417b411b363SPhilipp Reisner 	while (1) {
1418b411b363SPhilipp Reisner 		if (odev == mdev)
1419b411b363SPhilipp Reisner 			return ERR_SYNC_AFTER_CYCLE;
1420b411b363SPhilipp Reisner 
1421b411b363SPhilipp Reisner 		/* dependency chain ends here, no cycles. */
1422b411b363SPhilipp Reisner 		if (odev->sync_conf.after == -1)
1423b411b363SPhilipp Reisner 			return NO_ERROR;
1424b411b363SPhilipp Reisner 
1425b411b363SPhilipp Reisner 		/* follow the dependency chain */
1426b411b363SPhilipp Reisner 		odev = minor_to_mdev(odev->sync_conf.after);
1427b411b363SPhilipp Reisner 	}
1428b411b363SPhilipp Reisner }
1429b411b363SPhilipp Reisner 
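/* Change the sync-after dependency under global_state_lock and iterate
 * pause/resume until the set of paused resyncs is stable. */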
1430b411b363SPhilipp Reisner int drbd_alter_sa(struct drbd_conf *mdev, int na)
1431b411b363SPhilipp Reisner {
1432b411b363SPhilipp Reisner 	int changes;
1433b411b363SPhilipp Reisner 	int retcode;
1434b411b363SPhilipp Reisner 
1435b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1436b411b363SPhilipp Reisner 	retcode = sync_after_error(mdev, na);
1437b411b363SPhilipp Reisner 	if (retcode == NO_ERROR) {
1438b411b363SPhilipp Reisner 		mdev->sync_conf.after = na;
1439b411b363SPhilipp Reisner 		do {
1440b411b363SPhilipp Reisner 			changes  = _drbd_pause_after(mdev);
1441b411b363SPhilipp Reisner 			changes |= _drbd_resume_next(mdev);
1442b411b363SPhilipp Reisner 		} while (changes);
1443b411b363SPhilipp Reisner 	}
1444b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
1445b411b363SPhilipp Reisner 	return retcode;
1446b411b363SPhilipp Reisner }
1447b411b363SPhilipp Reisner 
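/* Reset the resync rate controller state: sector counters, in-flight
 * accounting and the plan FIFO. */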
14489bd28d3cSLars Ellenberg void drbd_rs_controller_reset(struct drbd_conf *mdev)
14499bd28d3cSLars Ellenberg {
14509bd28d3cSLars Ellenberg 	atomic_set(&mdev->rs_sect_in, 0);
14519bd28d3cSLars Ellenberg 	atomic_set(&mdev->rs_sect_ev, 0);
14529bd28d3cSLars Ellenberg 	mdev->rs_in_flight = 0;
14539bd28d3cSLars Ellenberg 	mdev->rs_planed = 0;
14549bd28d3cSLars Ellenberg 	spin_lock(&mdev->peer_seq_lock);
14559bd28d3cSLars Ellenberg 	fifo_set(&mdev->rs_plan_s, 0);
14569bd28d3cSLars Ellenberg 	spin_unlock(&mdev->peer_seq_lock);
14579bd28d3cSLars Ellenberg }
14589bd28d3cSLars Ellenberg 
1459b411b363SPhilipp Reisner /**
1460b411b363SPhilipp Reisner  * drbd_start_resync() - Start the resync process
1461b411b363SPhilipp Reisner  * @mdev:	DRBD device.
1462b411b363SPhilipp Reisner  * @side:	Either C_SYNC_SOURCE or C_SYNC_TARGET
1463b411b363SPhilipp Reisner  *
1464b411b363SPhilipp Reisner  * This function might bring you directly into one of the
1465b411b363SPhilipp Reisner  * C_PAUSED_SYNC_* states.
1466b411b363SPhilipp Reisner  */
1467b411b363SPhilipp Reisner void drbd_start_resync(struct drbd_conf *mdev, enum drbd_conns side)
1468b411b363SPhilipp Reisner {
1469b411b363SPhilipp Reisner 	union drbd_state ns;
1470b411b363SPhilipp Reisner 	int r;
1471b411b363SPhilipp Reisner 
1472c4752ef1SPhilipp Reisner 	if (mdev->state.conn >= C_SYNC_SOURCE && mdev->state.conn < C_AHEAD) {
1473b411b363SPhilipp Reisner 		dev_err(DEV, "Resync already running!\n");
1474b411b363SPhilipp Reisner 		return;
1475b411b363SPhilipp Reisner 	}
1476b411b363SPhilipp Reisner 
147759817f4fSPhilipp Reisner 	if (mdev->state.conn < C_AHEAD) {
1478b411b363SPhilipp Reisner 		/* In case a previous resync run was aborted by an IO error/detach on the peer. */
1479b411b363SPhilipp Reisner 		drbd_rs_cancel_all(mdev);
148059817f4fSPhilipp Reisner 		/* This should be done when we abort the resync. We definitely do not
148159817f4fSPhilipp Reisner 		   want to have this for connections going back and forth between
148259817f4fSPhilipp Reisner 		   Ahead/Behind and SyncSource/SyncTarget */
148359817f4fSPhilipp Reisner 	}
1484b411b363SPhilipp Reisner 
1485b411b363SPhilipp Reisner 	if (side == C_SYNC_TARGET) {
1486b411b363SPhilipp Reisner 		/* Since application IO was locked out during C_WF_BITMAP_T and
1487b411b363SPhilipp Reisner 		   C_WF_SYNC_UUID we are still unmodified. Before going to C_SYNC_TARGET
1488b411b363SPhilipp Reisner 		   we ask the before-resync-target handler whether we may make the data inconsistent. */
1489b411b363SPhilipp Reisner 		r = drbd_khelper(mdev, "before-resync-target");
1490b411b363SPhilipp Reisner 		r = (r >> 8) & 0xff;
1491b411b363SPhilipp Reisner 		if (r > 0) {
1492b411b363SPhilipp Reisner 			dev_info(DEV, "before-resync-target handler returned %d, "
1493b411b363SPhilipp Reisner 			     "dropping connection.\n", r);
1494b411b363SPhilipp Reisner 			drbd_force_state(mdev, NS(conn, C_DISCONNECTING));
1495b411b363SPhilipp Reisner 			return;
1496b411b363SPhilipp Reisner 		}
149709b9e797SPhilipp Reisner 	} else /* C_SYNC_SOURCE */ {
149809b9e797SPhilipp Reisner 		r = drbd_khelper(mdev, "before-resync-source");
149909b9e797SPhilipp Reisner 		r = (r >> 8) & 0xff;
150009b9e797SPhilipp Reisner 		if (r > 0) {
150109b9e797SPhilipp Reisner 			if (r == 3) {
150209b9e797SPhilipp Reisner 				dev_info(DEV, "before-resync-source handler returned %d, "
150309b9e797SPhilipp Reisner 					 "ignoring. Old userland tools?\n", r);
150409b9e797SPhilipp Reisner 			} else {
150509b9e797SPhilipp Reisner 				dev_info(DEV, "before-resync-source handler returned %d, "
150609b9e797SPhilipp Reisner 					 "dropping connection.\n", r);
150709b9e797SPhilipp Reisner 				drbd_force_state(mdev, NS(conn, C_DISCONNECTING));
150809b9e797SPhilipp Reisner 				return;
150909b9e797SPhilipp Reisner 			}
151009b9e797SPhilipp Reisner 		}
1511b411b363SPhilipp Reisner 	}
1512b411b363SPhilipp Reisner 
1513b411b363SPhilipp Reisner 	drbd_state_lock(mdev);
1514b411b363SPhilipp Reisner 
1515b411b363SPhilipp Reisner 	if (!get_ldev_if_state(mdev, D_NEGOTIATING)) {
1516b411b363SPhilipp Reisner 		drbd_state_unlock(mdev);
1517b411b363SPhilipp Reisner 		return;
1518b411b363SPhilipp Reisner 	}
1519b411b363SPhilipp Reisner 
1520b411b363SPhilipp Reisner 	write_lock_irq(&global_state_lock);
1521b411b363SPhilipp Reisner 	ns = mdev->state;
1522b411b363SPhilipp Reisner 
1523b411b363SPhilipp Reisner 	ns.aftr_isp = !_drbd_may_sync_now(mdev);
1524b411b363SPhilipp Reisner 
1525b411b363SPhilipp Reisner 	ns.conn = side;
1526b411b363SPhilipp Reisner 
1527b411b363SPhilipp Reisner 	if (side == C_SYNC_TARGET)
1528b411b363SPhilipp Reisner 		ns.disk = D_INCONSISTENT;
1529b411b363SPhilipp Reisner 	else /* side == C_SYNC_SOURCE */
1530b411b363SPhilipp Reisner 		ns.pdsk = D_INCONSISTENT;
1531b411b363SPhilipp Reisner 
1532b411b363SPhilipp Reisner 	r = __drbd_set_state(mdev, ns, CS_VERBOSE, NULL);
1533b411b363SPhilipp Reisner 	ns = mdev->state;
1534b411b363SPhilipp Reisner 
1535b411b363SPhilipp Reisner 	if (ns.conn < C_CONNECTED)
1536b411b363SPhilipp Reisner 		r = SS_UNKNOWN_ERROR;
1537b411b363SPhilipp Reisner 
1538b411b363SPhilipp Reisner 	if (r == SS_SUCCESS) {
15391d7734a0SLars Ellenberg 		unsigned long tw = drbd_bm_total_weight(mdev);
15401d7734a0SLars Ellenberg 		unsigned long now = jiffies;
15411d7734a0SLars Ellenberg 		int i;
15421d7734a0SLars Ellenberg 
1543b411b363SPhilipp Reisner 		mdev->rs_failed    = 0;
1544b411b363SPhilipp Reisner 		mdev->rs_paused    = 0;
1545b411b363SPhilipp Reisner 		mdev->rs_same_csum = 0;
15460f0601f4SLars Ellenberg 		mdev->rs_last_events = 0;
15470f0601f4SLars Ellenberg 		mdev->rs_last_sect_ev = 0;
15481d7734a0SLars Ellenberg 		mdev->rs_total     = tw;
15491d7734a0SLars Ellenberg 		mdev->rs_start     = now;
15501d7734a0SLars Ellenberg 		for (i = 0; i < DRBD_SYNC_MARKS; i++) {
15511d7734a0SLars Ellenberg 			mdev->rs_mark_left[i] = tw;
15521d7734a0SLars Ellenberg 			mdev->rs_mark_time[i] = now;
15531d7734a0SLars Ellenberg 		}
1554b411b363SPhilipp Reisner 		_drbd_pause_after(mdev);
1555b411b363SPhilipp Reisner 	}
1556b411b363SPhilipp Reisner 	write_unlock_irq(&global_state_lock);
15575a22db89SLars Ellenberg 
15586c922ed5SLars Ellenberg 	if (r == SS_SUCCESS) {
15596c922ed5SLars Ellenberg 		dev_info(DEV, "Began resync as %s (will sync %lu KB [%lu bits set]).\n",
15606c922ed5SLars Ellenberg 		     drbd_conn_str(ns.conn),
15616c922ed5SLars Ellenberg 		     (unsigned long) mdev->rs_total << (BM_BLOCK_SHIFT-10),
15626c922ed5SLars Ellenberg 		     (unsigned long) mdev->rs_total);
15635a22db89SLars Ellenberg 		if (side == C_SYNC_TARGET)
15645a22db89SLars Ellenberg 			mdev->bm_resync_fo = 0;
15655a22db89SLars Ellenberg 
15665a22db89SLars Ellenberg 		/* Since protocol 96, we must serialize drbd_gen_and_send_sync_uuid
15675a22db89SLars Ellenberg 		 * with w_send_oos, or the sync target will get confused as to
15685a22db89SLars Ellenberg 		 * how many bits to resync.  We cannot always do that, because for an
15695a22db89SLars Ellenberg 		 * empty resync and protocol < 95, we need to do it here, as we call
15705a22db89SLars Ellenberg 		 * drbd_resync_finished from here in that case.
15715a22db89SLars Ellenberg 		 * We call drbd_gen_and_send_sync_uuid() here for protocol < 96,
15725a22db89SLars Ellenberg 		 * and from after_state_ch otherwise. */
15735a22db89SLars Ellenberg 		if (side == C_SYNC_SOURCE && mdev->agreed_pro_version < 96)
15745a22db89SLars Ellenberg 			drbd_gen_and_send_sync_uuid(mdev);
1575b411b363SPhilipp Reisner 
1576af85e8e8SLars Ellenberg 		if (mdev->agreed_pro_version < 95 && mdev->rs_total == 0) {
1577af85e8e8SLars Ellenberg 			/* This still has a race (about when exactly the peers
1578af85e8e8SLars Ellenberg 			 * detect connection loss) that can lead to a full sync
1579af85e8e8SLars Ellenberg 			 * on next handshake. In 8.3.9 we fixed this with explicit
1580af85e8e8SLars Ellenberg 			 * resync-finished notifications, but the fix
1581af85e8e8SLars Ellenberg 			 * introduces a protocol change.  Sleeping for some
1582af85e8e8SLars Ellenberg 			 * time longer than the ping interval + timeout on the
1583af85e8e8SLars Ellenberg 			 * SyncSource, to give the SyncTarget the chance to
1584af85e8e8SLars Ellenberg 			 * detect connection loss, then waiting for a ping
1585af85e8e8SLars Ellenberg 			 * response (implicit in drbd_resync_finished) reduces
1586af85e8e8SLars Ellenberg 			 * the race considerably, but does not solve it. */
1587af85e8e8SLars Ellenberg 			if (side == C_SYNC_SOURCE)
1588af85e8e8SLars Ellenberg 				schedule_timeout_interruptible(
1589af85e8e8SLars Ellenberg 					mdev->net_conf->ping_int * HZ +
1590af85e8e8SLars Ellenberg 					mdev->net_conf->ping_timeo*HZ/9);
1591b411b363SPhilipp Reisner 			drbd_resync_finished(mdev);
1592b411b363SPhilipp Reisner 		}
1593b411b363SPhilipp Reisner 
15949bd28d3cSLars Ellenberg 		drbd_rs_controller_reset(mdev);
1595b411b363SPhilipp Reisner 		/* ns.conn may already be != mdev->state.conn,
1596b411b363SPhilipp Reisner 		 * we may have been paused in between, or become paused until
1597b411b363SPhilipp Reisner 		 * the timer triggers.
1598b411b363SPhilipp Reisner 		 * No matter, that is handled in resync_timer_fn() */
1599b411b363SPhilipp Reisner 		if (ns.conn == C_SYNC_TARGET)
1600b411b363SPhilipp Reisner 			mod_timer(&mdev->resync_timer, jiffies);
1601b411b363SPhilipp Reisner 
1602b411b363SPhilipp Reisner 		drbd_md_sync(mdev);
1603b411b363SPhilipp Reisner 	}
16045a22db89SLars Ellenberg 	put_ldev(mdev);
1605d0c3f60fSPhilipp Reisner 	drbd_state_unlock(mdev);
1606b411b363SPhilipp Reisner }
1607b411b363SPhilipp Reisner 
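/**
 * drbd_worker() - Main loop of the per-device worker thread
 * @thi:	DRBD thread object.
 *
 * Waits on the data.work semaphore (uncorking the data socket while idle and
 * corking it again before processing), runs the queued work callbacks, and
 * forces C_NETWORK_FAILURE if a callback fails while connected.  On exit it
 * cancels all remaining work, stops the receiver and cleans up the device.
 */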
1608b411b363SPhilipp Reisner int drbd_worker(struct drbd_thread *thi)
1609b411b363SPhilipp Reisner {
1610b411b363SPhilipp Reisner 	struct drbd_conf *mdev = thi->mdev;
1611b411b363SPhilipp Reisner 	struct drbd_work *w = NULL;
1612b411b363SPhilipp Reisner 	LIST_HEAD(work_list);
1613b411b363SPhilipp Reisner 	int intr = 0, i;
1614b411b363SPhilipp Reisner 
1615b411b363SPhilipp Reisner 	sprintf(current->comm, "drbd%d_worker", mdev_to_minor(mdev));
1616b411b363SPhilipp Reisner 
1617b411b363SPhilipp Reisner 	while (get_t_state(thi) == Running) {
1618b411b363SPhilipp Reisner 		drbd_thread_current_set_cpu(mdev);
1619b411b363SPhilipp Reisner 
1620b411b363SPhilipp Reisner 		if (down_trylock(&mdev->data.work.s)) {
1621b411b363SPhilipp Reisner 			mutex_lock(&mdev->data.mutex);
1622b411b363SPhilipp Reisner 			if (mdev->data.socket && !mdev->net_conf->no_cork)
1623b411b363SPhilipp Reisner 				drbd_tcp_uncork(mdev->data.socket);
1624b411b363SPhilipp Reisner 			mutex_unlock(&mdev->data.mutex);
1625b411b363SPhilipp Reisner 
1626b411b363SPhilipp Reisner 			intr = down_interruptible(&mdev->data.work.s);
1627b411b363SPhilipp Reisner 
1628b411b363SPhilipp Reisner 			mutex_lock(&mdev->data.mutex);
1629b411b363SPhilipp Reisner 			if (mdev->data.socket  && !mdev->net_conf->no_cork)
1630b411b363SPhilipp Reisner 				drbd_tcp_cork(mdev->data.socket);
1631b411b363SPhilipp Reisner 			mutex_unlock(&mdev->data.mutex);
1632b411b363SPhilipp Reisner 		}
1633b411b363SPhilipp Reisner 
1634b411b363SPhilipp Reisner 		if (intr) {
1635b411b363SPhilipp Reisner 			D_ASSERT(intr == -EINTR);
1636b411b363SPhilipp Reisner 			flush_signals(current);
1637b411b363SPhilipp Reisner 			ERR_IF (get_t_state(thi) == Running)
1638b411b363SPhilipp Reisner 				continue;
1639b411b363SPhilipp Reisner 			break;
1640b411b363SPhilipp Reisner 		}
1641b411b363SPhilipp Reisner 
1642b411b363SPhilipp Reisner 		if (get_t_state(thi) != Running)
1643b411b363SPhilipp Reisner 			break;
1644b411b363SPhilipp Reisner 		/* With this break, we have done a down() but not consumed
1645b411b363SPhilipp Reisner 		   the entry from the list. The cleanup code takes care of
1646b411b363SPhilipp Reisner 		   this...   */
1647b411b363SPhilipp Reisner 
1648b411b363SPhilipp Reisner 		w = NULL;
1649b411b363SPhilipp Reisner 		spin_lock_irq(&mdev->data.work.q_lock);
1650b411b363SPhilipp Reisner 		ERR_IF(list_empty(&mdev->data.work.q)) {
1651b411b363SPhilipp Reisner 			/* something terribly wrong in our logic.
1652b411b363SPhilipp Reisner 			 * we were able to down() the semaphore,
1653b411b363SPhilipp Reisner 			 * but the list is empty... doh.
1654b411b363SPhilipp Reisner 			 *
1655b411b363SPhilipp Reisner 			 * what is the best thing to do now?
1656b411b363SPhilipp Reisner 			 * try again from scratch, restarting the receiver,
1657b411b363SPhilipp Reisner 			 * asender, whatnot? could break even more ugly,
1658b411b363SPhilipp Reisner 			 * e.g. when we are primary, but no good local data.
1659b411b363SPhilipp Reisner 			 *
1660b411b363SPhilipp Reisner 			 * I'll try to get away just starting over this loop.
1661b411b363SPhilipp Reisner 			 */
1662b411b363SPhilipp Reisner 			spin_unlock_irq(&mdev->data.work.q_lock);
1663b411b363SPhilipp Reisner 			continue;
1664b411b363SPhilipp Reisner 		}
1665b411b363SPhilipp Reisner 		w = list_entry(mdev->data.work.q.next, struct drbd_work, list);
1666b411b363SPhilipp Reisner 		list_del_init(&w->list);
1667b411b363SPhilipp Reisner 		spin_unlock_irq(&mdev->data.work.q_lock);
1668b411b363SPhilipp Reisner 
1669b411b363SPhilipp Reisner 		if (!w->cb(mdev, w, mdev->state.conn < C_CONNECTED)) {
1670b411b363SPhilipp Reisner 			/* dev_warn(DEV, "worker: a callback failed! \n"); */
1671b411b363SPhilipp Reisner 			if (mdev->state.conn >= C_CONNECTED)
1672b411b363SPhilipp Reisner 				drbd_force_state(mdev,
1673b411b363SPhilipp Reisner 						NS(conn, C_NETWORK_FAILURE));
1674b411b363SPhilipp Reisner 		}
1675b411b363SPhilipp Reisner 	}
1676b411b363SPhilipp Reisner 	D_ASSERT(test_bit(DEVICE_DYING, &mdev->flags));
1677b411b363SPhilipp Reisner 	D_ASSERT(test_bit(CONFIG_PENDING, &mdev->flags));
1678b411b363SPhilipp Reisner 
1679b411b363SPhilipp Reisner 	spin_lock_irq(&mdev->data.work.q_lock);
1680b411b363SPhilipp Reisner 	i = 0;
1681b411b363SPhilipp Reisner 	while (!list_empty(&mdev->data.work.q)) {
1682b411b363SPhilipp Reisner 		list_splice_init(&mdev->data.work.q, &work_list);
1683b411b363SPhilipp Reisner 		spin_unlock_irq(&mdev->data.work.q_lock);
1684b411b363SPhilipp Reisner 
1685b411b363SPhilipp Reisner 		while (!list_empty(&work_list)) {
1686b411b363SPhilipp Reisner 			w = list_entry(work_list.next, struct drbd_work, list);
1687b411b363SPhilipp Reisner 			list_del_init(&w->list);
1688b411b363SPhilipp Reisner 			w->cb(mdev, w, 1);
1689b411b363SPhilipp Reisner 			i++; /* dead debugging code */
1690b411b363SPhilipp Reisner 		}
1691b411b363SPhilipp Reisner 
1692b411b363SPhilipp Reisner 		spin_lock_irq(&mdev->data.work.q_lock);
1693b411b363SPhilipp Reisner 	}
1694b411b363SPhilipp Reisner 	sema_init(&mdev->data.work.s, 0);
1695b411b363SPhilipp Reisner 	/* DANGEROUS race: if someone queued their work within the spinlock,
1696b411b363SPhilipp Reisner 	 * but up()ed outside the spinlock, we could get an up() on the
1697b411b363SPhilipp Reisner 	 * semaphore without a corresponding list entry.
1698b411b363SPhilipp Reisner 	 * So don't do that.
1699b411b363SPhilipp Reisner 	 */
1700b411b363SPhilipp Reisner 	spin_unlock_irq(&mdev->data.work.q_lock);
1701b411b363SPhilipp Reisner 
1702b411b363SPhilipp Reisner 	D_ASSERT(mdev->state.disk == D_DISKLESS && mdev->state.conn == C_STANDALONE);
1703b411b363SPhilipp Reisner 	/* _drbd_set_state only uses stop_nowait.
1704b411b363SPhilipp Reisner 	 * wait here for the Exiting receiver. */
1705b411b363SPhilipp Reisner 	drbd_thread_stop(&mdev->receiver);
1706b411b363SPhilipp Reisner 	drbd_mdev_cleanup(mdev);
1707b411b363SPhilipp Reisner 
1708b411b363SPhilipp Reisner 	dev_info(DEV, "worker terminated\n");
1709b411b363SPhilipp Reisner 
1710b411b363SPhilipp Reisner 	clear_bit(DEVICE_DYING, &mdev->flags);
1711b411b363SPhilipp Reisner 	clear_bit(CONFIG_PENDING, &mdev->flags);
1712b411b363SPhilipp Reisner 	wake_up(&mdev->state_wait);
1713b411b363SPhilipp Reisner 
1714b411b363SPhilipp Reisner 	return 0;
1715b411b363SPhilipp Reisner }
1716