1b411b363SPhilipp Reisner /* 2b411b363SPhilipp Reisner drbd_worker.c 3b411b363SPhilipp Reisner 4b411b363SPhilipp Reisner This file is part of DRBD by Philipp Reisner and Lars Ellenberg. 5b411b363SPhilipp Reisner 6b411b363SPhilipp Reisner Copyright (C) 2001-2008, LINBIT Information Technologies GmbH. 7b411b363SPhilipp Reisner Copyright (C) 1999-2008, Philipp Reisner <philipp.reisner@linbit.com>. 8b411b363SPhilipp Reisner Copyright (C) 2002-2008, Lars Ellenberg <lars.ellenberg@linbit.com>. 9b411b363SPhilipp Reisner 10b411b363SPhilipp Reisner drbd is free software; you can redistribute it and/or modify 11b411b363SPhilipp Reisner it under the terms of the GNU General Public License as published by 12b411b363SPhilipp Reisner the Free Software Foundation; either version 2, or (at your option) 13b411b363SPhilipp Reisner any later version. 14b411b363SPhilipp Reisner 15b411b363SPhilipp Reisner drbd is distributed in the hope that it will be useful, 16b411b363SPhilipp Reisner but WITHOUT ANY WARRANTY; without even the implied warranty of 17b411b363SPhilipp Reisner MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 18b411b363SPhilipp Reisner GNU General Public License for more details. 19b411b363SPhilipp Reisner 20b411b363SPhilipp Reisner You should have received a copy of the GNU General Public License 21b411b363SPhilipp Reisner along with drbd; see the file COPYING. If not, write to 22b411b363SPhilipp Reisner the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. 23b411b363SPhilipp Reisner 24b411b363SPhilipp Reisner */ 25b411b363SPhilipp Reisner 26b411b363SPhilipp Reisner #include <linux/module.h> 27b411b363SPhilipp Reisner #include <linux/drbd.h> 28b411b363SPhilipp Reisner #include <linux/sched.h> 29b411b363SPhilipp Reisner #include <linux/wait.h> 30b411b363SPhilipp Reisner #include <linux/mm.h> 31b411b363SPhilipp Reisner #include <linux/memcontrol.h> 32b411b363SPhilipp Reisner #include <linux/mm_inline.h> 33b411b363SPhilipp Reisner #include <linux/slab.h> 34b411b363SPhilipp Reisner #include <linux/random.h> 35b411b363SPhilipp Reisner #include <linux/string.h> 36b411b363SPhilipp Reisner #include <linux/scatterlist.h> 37b411b363SPhilipp Reisner 38b411b363SPhilipp Reisner #include "drbd_int.h" 39b411b363SPhilipp Reisner #include "drbd_req.h" 40b411b363SPhilipp Reisner 4100d56944SPhilipp Reisner static int w_make_ov_request(struct drbd_work *w, int cancel); 42b411b363SPhilipp Reisner 43b411b363SPhilipp Reisner 44c5a91619SAndreas Gruenbacher /* endio handlers: 45c5a91619SAndreas Gruenbacher * drbd_md_io_complete (defined here) 46fcefa62eSAndreas Gruenbacher * drbd_request_endio (defined here) 47fcefa62eSAndreas Gruenbacher * drbd_peer_request_endio (defined here) 48c5a91619SAndreas Gruenbacher * bm_async_io_complete (defined in drbd_bitmap.c) 49c5a91619SAndreas Gruenbacher * 50b411b363SPhilipp Reisner * For all these callbacks, note the following: 51b411b363SPhilipp Reisner * The callbacks will be called in irq context by the IDE drivers, 52b411b363SPhilipp Reisner * and in Softirqs/Tasklets/BH context by the SCSI drivers. 53b411b363SPhilipp Reisner * Try to get the locking right :) 54b411b363SPhilipp Reisner * 55b411b363SPhilipp Reisner */ 56b411b363SPhilipp Reisner 57b411b363SPhilipp Reisner 58b411b363SPhilipp Reisner /* About the global_state_lock 59b411b363SPhilipp Reisner Each state transition on an device holds a read lock. In case we have 6095f8efd0SAndreas Gruenbacher to evaluate the resync after dependencies, we grab a write lock, because 61b411b363SPhilipp Reisner we need stable states on all devices for that. */ 62b411b363SPhilipp Reisner rwlock_t global_state_lock; 63b411b363SPhilipp Reisner 64b411b363SPhilipp Reisner /* used for synchronous meta data and bitmap IO 65b411b363SPhilipp Reisner * submitted by drbd_md_sync_page_io() 66b411b363SPhilipp Reisner */ 67b411b363SPhilipp Reisner void drbd_md_io_complete(struct bio *bio, int error) 68b411b363SPhilipp Reisner { 69b411b363SPhilipp Reisner struct drbd_md_io *md_io; 70cdfda633SPhilipp Reisner struct drbd_conf *mdev; 71b411b363SPhilipp Reisner 72b411b363SPhilipp Reisner md_io = (struct drbd_md_io *)bio->bi_private; 73cdfda633SPhilipp Reisner mdev = container_of(md_io, struct drbd_conf, md_io); 74cdfda633SPhilipp Reisner 75b411b363SPhilipp Reisner md_io->error = error; 76b411b363SPhilipp Reisner 770cfac5ddSPhilipp Reisner /* We grabbed an extra reference in _drbd_md_sync_page_io() to be able 780cfac5ddSPhilipp Reisner * to timeout on the lower level device, and eventually detach from it. 790cfac5ddSPhilipp Reisner * If this io completion runs after that timeout expired, this 800cfac5ddSPhilipp Reisner * drbd_md_put_buffer() may allow us to finally try and re-attach. 810cfac5ddSPhilipp Reisner * During normal operation, this only puts that extra reference 820cfac5ddSPhilipp Reisner * down to 1 again. 830cfac5ddSPhilipp Reisner * Make sure we first drop the reference, and only then signal 840cfac5ddSPhilipp Reisner * completion, or we may (in drbd_al_read_log()) cycle so fast into the 850cfac5ddSPhilipp Reisner * next drbd_md_sync_page_io(), that we trigger the 860cfac5ddSPhilipp Reisner * ASSERT(atomic_read(&mdev->md_io_in_use) == 1) there. 870cfac5ddSPhilipp Reisner */ 880cfac5ddSPhilipp Reisner drbd_md_put_buffer(mdev); 89cdfda633SPhilipp Reisner md_io->done = 1; 90cdfda633SPhilipp Reisner wake_up(&mdev->misc_wait); 91cdfda633SPhilipp Reisner bio_put(bio); 92cdfda633SPhilipp Reisner put_ldev(mdev); 93b411b363SPhilipp Reisner } 94b411b363SPhilipp Reisner 95b411b363SPhilipp Reisner /* reads on behalf of the partner, 96b411b363SPhilipp Reisner * "submitted" by the receiver 97b411b363SPhilipp Reisner */ 98db830c46SAndreas Gruenbacher void drbd_endio_read_sec_final(struct drbd_peer_request *peer_req) __releases(local) 99b411b363SPhilipp Reisner { 100b411b363SPhilipp Reisner unsigned long flags = 0; 101a21e9298SPhilipp Reisner struct drbd_conf *mdev = peer_req->w.mdev; 102b411b363SPhilipp Reisner 10387eeee41SPhilipp Reisner spin_lock_irqsave(&mdev->tconn->req_lock, flags); 104db830c46SAndreas Gruenbacher mdev->read_cnt += peer_req->i.size >> 9; 105db830c46SAndreas Gruenbacher list_del(&peer_req->w.list); 106b411b363SPhilipp Reisner if (list_empty(&mdev->read_ee)) 107b411b363SPhilipp Reisner wake_up(&mdev->ee_wait); 108db830c46SAndreas Gruenbacher if (test_bit(__EE_WAS_ERROR, &peer_req->flags)) 10981e84650SAndreas Gruenbacher __drbd_chk_io_error(mdev, false); 11087eeee41SPhilipp Reisner spin_unlock_irqrestore(&mdev->tconn->req_lock, flags); 111b411b363SPhilipp Reisner 112db830c46SAndreas Gruenbacher drbd_queue_work(&mdev->tconn->data.work, &peer_req->w); 113b411b363SPhilipp Reisner put_ldev(mdev); 114b411b363SPhilipp Reisner } 115b411b363SPhilipp Reisner 116b411b363SPhilipp Reisner /* writes on behalf of the partner, or resync writes, 11745bb912bSLars Ellenberg * "submitted" by the receiver, final stage. */ 118db830c46SAndreas Gruenbacher static void drbd_endio_write_sec_final(struct drbd_peer_request *peer_req) __releases(local) 119b411b363SPhilipp Reisner { 120b411b363SPhilipp Reisner unsigned long flags = 0; 121a21e9298SPhilipp Reisner struct drbd_conf *mdev = peer_req->w.mdev; 122181286adSLars Ellenberg struct drbd_interval i; 123b411b363SPhilipp Reisner int do_wake; 124579b57edSAndreas Gruenbacher u64 block_id; 125b411b363SPhilipp Reisner int do_al_complete_io; 126b411b363SPhilipp Reisner 127db830c46SAndreas Gruenbacher /* after we moved peer_req to done_ee, 128b411b363SPhilipp Reisner * we may no longer access it, 129b411b363SPhilipp Reisner * it may be freed/reused already! 130b411b363SPhilipp Reisner * (as soon as we release the req_lock) */ 131181286adSLars Ellenberg i = peer_req->i; 132db830c46SAndreas Gruenbacher do_al_complete_io = peer_req->flags & EE_CALL_AL_COMPLETE_IO; 133db830c46SAndreas Gruenbacher block_id = peer_req->block_id; 134b411b363SPhilipp Reisner 13587eeee41SPhilipp Reisner spin_lock_irqsave(&mdev->tconn->req_lock, flags); 136db830c46SAndreas Gruenbacher mdev->writ_cnt += peer_req->i.size >> 9; 137db830c46SAndreas Gruenbacher list_del(&peer_req->w.list); /* has been on active_ee or sync_ee */ 138db830c46SAndreas Gruenbacher list_add_tail(&peer_req->w.list, &mdev->done_ee); 139b411b363SPhilipp Reisner 140bb3bfe96SAndreas Gruenbacher /* 1415e472264SAndreas Gruenbacher * Do not remove from the write_requests tree here: we did not send the 142bb3bfe96SAndreas Gruenbacher * Ack yet and did not wake possibly waiting conflicting requests. 143bb3bfe96SAndreas Gruenbacher * Removed from the tree from "drbd_process_done_ee" within the 144bb3bfe96SAndreas Gruenbacher * appropriate w.cb (e_end_block/e_end_resync_block) or from 145bb3bfe96SAndreas Gruenbacher * _drbd_clear_done_ee. 146bb3bfe96SAndreas Gruenbacher */ 147b411b363SPhilipp Reisner 148579b57edSAndreas Gruenbacher do_wake = list_empty(block_id == ID_SYNCER ? &mdev->sync_ee : &mdev->active_ee); 149b411b363SPhilipp Reisner 150db830c46SAndreas Gruenbacher if (test_bit(__EE_WAS_ERROR, &peer_req->flags)) 15181e84650SAndreas Gruenbacher __drbd_chk_io_error(mdev, false); 15287eeee41SPhilipp Reisner spin_unlock_irqrestore(&mdev->tconn->req_lock, flags); 153b411b363SPhilipp Reisner 154579b57edSAndreas Gruenbacher if (block_id == ID_SYNCER) 155181286adSLars Ellenberg drbd_rs_complete_io(mdev, i.sector); 156b411b363SPhilipp Reisner 157b411b363SPhilipp Reisner if (do_wake) 158b411b363SPhilipp Reisner wake_up(&mdev->ee_wait); 159b411b363SPhilipp Reisner 160b411b363SPhilipp Reisner if (do_al_complete_io) 161181286adSLars Ellenberg drbd_al_complete_io(mdev, &i); 162b411b363SPhilipp Reisner 1630625ac19SPhilipp Reisner wake_asender(mdev->tconn); 164b411b363SPhilipp Reisner put_ldev(mdev); 16545bb912bSLars Ellenberg } 166b411b363SPhilipp Reisner 16745bb912bSLars Ellenberg /* writes on behalf of the partner, or resync writes, 16845bb912bSLars Ellenberg * "submitted" by the receiver. 16945bb912bSLars Ellenberg */ 170fcefa62eSAndreas Gruenbacher void drbd_peer_request_endio(struct bio *bio, int error) 17145bb912bSLars Ellenberg { 172db830c46SAndreas Gruenbacher struct drbd_peer_request *peer_req = bio->bi_private; 173a21e9298SPhilipp Reisner struct drbd_conf *mdev = peer_req->w.mdev; 17445bb912bSLars Ellenberg int uptodate = bio_flagged(bio, BIO_UPTODATE); 17545bb912bSLars Ellenberg int is_write = bio_data_dir(bio) == WRITE; 17645bb912bSLars Ellenberg 17707194272SLars Ellenberg if (error && __ratelimit(&drbd_ratelimit_state)) 17845bb912bSLars Ellenberg dev_warn(DEV, "%s: error=%d s=%llus\n", 17945bb912bSLars Ellenberg is_write ? "write" : "read", error, 180db830c46SAndreas Gruenbacher (unsigned long long)peer_req->i.sector); 18145bb912bSLars Ellenberg if (!error && !uptodate) { 18207194272SLars Ellenberg if (__ratelimit(&drbd_ratelimit_state)) 18345bb912bSLars Ellenberg dev_warn(DEV, "%s: setting error to -EIO s=%llus\n", 18445bb912bSLars Ellenberg is_write ? "write" : "read", 185db830c46SAndreas Gruenbacher (unsigned long long)peer_req->i.sector); 18645bb912bSLars Ellenberg /* strange behavior of some lower level drivers... 18745bb912bSLars Ellenberg * fail the request by clearing the uptodate flag, 18845bb912bSLars Ellenberg * but do not return any error?! */ 18945bb912bSLars Ellenberg error = -EIO; 19045bb912bSLars Ellenberg } 19145bb912bSLars Ellenberg 19245bb912bSLars Ellenberg if (error) 193db830c46SAndreas Gruenbacher set_bit(__EE_WAS_ERROR, &peer_req->flags); 19445bb912bSLars Ellenberg 19545bb912bSLars Ellenberg bio_put(bio); /* no need for the bio anymore */ 196db830c46SAndreas Gruenbacher if (atomic_dec_and_test(&peer_req->pending_bios)) { 19745bb912bSLars Ellenberg if (is_write) 198db830c46SAndreas Gruenbacher drbd_endio_write_sec_final(peer_req); 19945bb912bSLars Ellenberg else 200db830c46SAndreas Gruenbacher drbd_endio_read_sec_final(peer_req); 20145bb912bSLars Ellenberg } 202b411b363SPhilipp Reisner } 203b411b363SPhilipp Reisner 204b411b363SPhilipp Reisner /* read, readA or write requests on R_PRIMARY coming from drbd_make_request 205b411b363SPhilipp Reisner */ 206fcefa62eSAndreas Gruenbacher void drbd_request_endio(struct bio *bio, int error) 207b411b363SPhilipp Reisner { 208a115413dSLars Ellenberg unsigned long flags; 209b411b363SPhilipp Reisner struct drbd_request *req = bio->bi_private; 210a21e9298SPhilipp Reisner struct drbd_conf *mdev = req->w.mdev; 211a115413dSLars Ellenberg struct bio_and_error m; 212b411b363SPhilipp Reisner enum drbd_req_event what; 213b411b363SPhilipp Reisner int uptodate = bio_flagged(bio, BIO_UPTODATE); 214b411b363SPhilipp Reisner 215b411b363SPhilipp Reisner if (!error && !uptodate) { 216b411b363SPhilipp Reisner dev_warn(DEV, "p %s: setting error to -EIO\n", 217b411b363SPhilipp Reisner bio_data_dir(bio) == WRITE ? "write" : "read"); 218b411b363SPhilipp Reisner /* strange behavior of some lower level drivers... 219b411b363SPhilipp Reisner * fail the request by clearing the uptodate flag, 220b411b363SPhilipp Reisner * but do not return any error?! */ 221b411b363SPhilipp Reisner error = -EIO; 222b411b363SPhilipp Reisner } 223b411b363SPhilipp Reisner 224b411b363SPhilipp Reisner /* to avoid recursion in __req_mod */ 225b411b363SPhilipp Reisner if (unlikely(error)) { 226b411b363SPhilipp Reisner what = (bio_data_dir(bio) == WRITE) 2278554df1cSAndreas Gruenbacher ? WRITE_COMPLETED_WITH_ERROR 2285c3c7e64SLars Ellenberg : (bio_rw(bio) == READ) 2298554df1cSAndreas Gruenbacher ? READ_COMPLETED_WITH_ERROR 2308554df1cSAndreas Gruenbacher : READ_AHEAD_COMPLETED_WITH_ERROR; 231b411b363SPhilipp Reisner } else 2328554df1cSAndreas Gruenbacher what = COMPLETED_OK; 233b411b363SPhilipp Reisner 234b411b363SPhilipp Reisner bio_put(req->private_bio); 235b411b363SPhilipp Reisner req->private_bio = ERR_PTR(error); 236b411b363SPhilipp Reisner 237a115413dSLars Ellenberg /* not req_mod(), we need irqsave here! */ 23887eeee41SPhilipp Reisner spin_lock_irqsave(&mdev->tconn->req_lock, flags); 239a115413dSLars Ellenberg __req_mod(req, what, &m); 24087eeee41SPhilipp Reisner spin_unlock_irqrestore(&mdev->tconn->req_lock, flags); 241a115413dSLars Ellenberg 242a115413dSLars Ellenberg if (m.bio) 243a115413dSLars Ellenberg complete_master_bio(mdev, &m); 244b411b363SPhilipp Reisner } 245b411b363SPhilipp Reisner 24699920dc5SAndreas Gruenbacher int w_read_retry_remote(struct drbd_work *w, int cancel) 247b411b363SPhilipp Reisner { 248b411b363SPhilipp Reisner struct drbd_request *req = container_of(w, struct drbd_request, w); 24900d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 250b411b363SPhilipp Reisner 251b411b363SPhilipp Reisner /* We should not detach for read io-error, 252b411b363SPhilipp Reisner * but try to WRITE the P_DATA_REPLY to the failed location, 253b411b363SPhilipp Reisner * to give the disk the chance to relocate that block */ 254b411b363SPhilipp Reisner 25587eeee41SPhilipp Reisner spin_lock_irq(&mdev->tconn->req_lock); 256d255e5ffSLars Ellenberg if (cancel || mdev->state.pdsk != D_UP_TO_DATE) { 2578554df1cSAndreas Gruenbacher _req_mod(req, READ_RETRY_REMOTE_CANCELED); 25887eeee41SPhilipp Reisner spin_unlock_irq(&mdev->tconn->req_lock); 25999920dc5SAndreas Gruenbacher return 0; 260b411b363SPhilipp Reisner } 26187eeee41SPhilipp Reisner spin_unlock_irq(&mdev->tconn->req_lock); 262b411b363SPhilipp Reisner 26300d56944SPhilipp Reisner return w_send_read_req(w, 0); 264b411b363SPhilipp Reisner } 265b411b363SPhilipp Reisner 266f6ffca9fSAndreas Gruenbacher void drbd_csum_ee(struct drbd_conf *mdev, struct crypto_hash *tfm, 267db830c46SAndreas Gruenbacher struct drbd_peer_request *peer_req, void *digest) 26845bb912bSLars Ellenberg { 26945bb912bSLars Ellenberg struct hash_desc desc; 27045bb912bSLars Ellenberg struct scatterlist sg; 271db830c46SAndreas Gruenbacher struct page *page = peer_req->pages; 27245bb912bSLars Ellenberg struct page *tmp; 27345bb912bSLars Ellenberg unsigned len; 27445bb912bSLars Ellenberg 27545bb912bSLars Ellenberg desc.tfm = tfm; 27645bb912bSLars Ellenberg desc.flags = 0; 27745bb912bSLars Ellenberg 27845bb912bSLars Ellenberg sg_init_table(&sg, 1); 27945bb912bSLars Ellenberg crypto_hash_init(&desc); 28045bb912bSLars Ellenberg 28145bb912bSLars Ellenberg while ((tmp = page_chain_next(page))) { 28245bb912bSLars Ellenberg /* all but the last page will be fully used */ 28345bb912bSLars Ellenberg sg_set_page(&sg, page, PAGE_SIZE, 0); 28445bb912bSLars Ellenberg crypto_hash_update(&desc, &sg, sg.length); 28545bb912bSLars Ellenberg page = tmp; 28645bb912bSLars Ellenberg } 28745bb912bSLars Ellenberg /* and now the last, possibly only partially used page */ 288db830c46SAndreas Gruenbacher len = peer_req->i.size & (PAGE_SIZE - 1); 28945bb912bSLars Ellenberg sg_set_page(&sg, page, len ?: PAGE_SIZE, 0); 29045bb912bSLars Ellenberg crypto_hash_update(&desc, &sg, sg.length); 29145bb912bSLars Ellenberg crypto_hash_final(&desc, digest); 29245bb912bSLars Ellenberg } 29345bb912bSLars Ellenberg 29445bb912bSLars Ellenberg void drbd_csum_bio(struct drbd_conf *mdev, struct crypto_hash *tfm, struct bio *bio, void *digest) 295b411b363SPhilipp Reisner { 296b411b363SPhilipp Reisner struct hash_desc desc; 297b411b363SPhilipp Reisner struct scatterlist sg; 298b411b363SPhilipp Reisner struct bio_vec *bvec; 299b411b363SPhilipp Reisner int i; 300b411b363SPhilipp Reisner 301b411b363SPhilipp Reisner desc.tfm = tfm; 302b411b363SPhilipp Reisner desc.flags = 0; 303b411b363SPhilipp Reisner 304b411b363SPhilipp Reisner sg_init_table(&sg, 1); 305b411b363SPhilipp Reisner crypto_hash_init(&desc); 306b411b363SPhilipp Reisner 307b411b363SPhilipp Reisner __bio_for_each_segment(bvec, bio, i, 0) { 308b411b363SPhilipp Reisner sg_set_page(&sg, bvec->bv_page, bvec->bv_len, bvec->bv_offset); 309b411b363SPhilipp Reisner crypto_hash_update(&desc, &sg, sg.length); 310b411b363SPhilipp Reisner } 311b411b363SPhilipp Reisner crypto_hash_final(&desc, digest); 312b411b363SPhilipp Reisner } 313b411b363SPhilipp Reisner 3149676c760SLars Ellenberg /* MAYBE merge common code with w_e_end_ov_req */ 31599920dc5SAndreas Gruenbacher static int w_e_send_csum(struct drbd_work *w, int cancel) 316b411b363SPhilipp Reisner { 31700d56944SPhilipp Reisner struct drbd_peer_request *peer_req = container_of(w, struct drbd_peer_request, w); 31800d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 319b411b363SPhilipp Reisner int digest_size; 320b411b363SPhilipp Reisner void *digest; 32199920dc5SAndreas Gruenbacher int err = 0; 322b411b363SPhilipp Reisner 32353ea4331SLars Ellenberg if (unlikely(cancel)) 32453ea4331SLars Ellenberg goto out; 325b411b363SPhilipp Reisner 3269676c760SLars Ellenberg if (unlikely((peer_req->flags & EE_WAS_ERROR) != 0)) 32753ea4331SLars Ellenberg goto out; 32853ea4331SLars Ellenberg 329f399002eSLars Ellenberg digest_size = crypto_hash_digestsize(mdev->tconn->csums_tfm); 330b411b363SPhilipp Reisner digest = kmalloc(digest_size, GFP_NOIO); 331b411b363SPhilipp Reisner if (digest) { 332db830c46SAndreas Gruenbacher sector_t sector = peer_req->i.sector; 333db830c46SAndreas Gruenbacher unsigned int size = peer_req->i.size; 334f399002eSLars Ellenberg drbd_csum_ee(mdev, mdev->tconn->csums_tfm, peer_req, digest); 3359676c760SLars Ellenberg /* Free peer_req and pages before send. 33653ea4331SLars Ellenberg * In case we block on congestion, we could otherwise run into 33753ea4331SLars Ellenberg * some distributed deadlock, if the other side blocks on 33853ea4331SLars Ellenberg * congestion as well, because our receiver blocks in 339c37c8ecfSAndreas Gruenbacher * drbd_alloc_pages due to pp_in_use > max_buffers. */ 3403967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 341db830c46SAndreas Gruenbacher peer_req = NULL; 342b411b363SPhilipp Reisner inc_rs_pending(mdev); 34399920dc5SAndreas Gruenbacher err = drbd_send_drequest_csum(mdev, sector, size, 34453ea4331SLars Ellenberg digest, digest_size, 345b411b363SPhilipp Reisner P_CSUM_RS_REQUEST); 346b411b363SPhilipp Reisner kfree(digest); 347b411b363SPhilipp Reisner } else { 348b411b363SPhilipp Reisner dev_err(DEV, "kmalloc() of digest failed.\n"); 34999920dc5SAndreas Gruenbacher err = -ENOMEM; 350b411b363SPhilipp Reisner } 351b411b363SPhilipp Reisner 35253ea4331SLars Ellenberg out: 353db830c46SAndreas Gruenbacher if (peer_req) 3543967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 355b411b363SPhilipp Reisner 35699920dc5SAndreas Gruenbacher if (unlikely(err)) 357b411b363SPhilipp Reisner dev_err(DEV, "drbd_send_drequest(..., csum) failed\n"); 35899920dc5SAndreas Gruenbacher return err; 359b411b363SPhilipp Reisner } 360b411b363SPhilipp Reisner 361b411b363SPhilipp Reisner #define GFP_TRY (__GFP_HIGHMEM | __GFP_NOWARN) 362b411b363SPhilipp Reisner 363b411b363SPhilipp Reisner static int read_for_csum(struct drbd_conf *mdev, sector_t sector, int size) 364b411b363SPhilipp Reisner { 365db830c46SAndreas Gruenbacher struct drbd_peer_request *peer_req; 366b411b363SPhilipp Reisner 367b411b363SPhilipp Reisner if (!get_ldev(mdev)) 36880a40e43SLars Ellenberg return -EIO; 369b411b363SPhilipp Reisner 370e3555d85SPhilipp Reisner if (drbd_rs_should_slow_down(mdev, sector)) 3710f0601f4SLars Ellenberg goto defer; 3720f0601f4SLars Ellenberg 373b411b363SPhilipp Reisner /* GFP_TRY, because if there is no memory available right now, this may 374b411b363SPhilipp Reisner * be rescheduled for later. It is "only" background resync, after all. */ 3750db55363SAndreas Gruenbacher peer_req = drbd_alloc_peer_req(mdev, ID_SYNCER /* unused */, sector, 3760db55363SAndreas Gruenbacher size, GFP_TRY); 377db830c46SAndreas Gruenbacher if (!peer_req) 37880a40e43SLars Ellenberg goto defer; 379b411b363SPhilipp Reisner 380db830c46SAndreas Gruenbacher peer_req->w.cb = w_e_send_csum; 38187eeee41SPhilipp Reisner spin_lock_irq(&mdev->tconn->req_lock); 382db830c46SAndreas Gruenbacher list_add(&peer_req->w.list, &mdev->read_ee); 38387eeee41SPhilipp Reisner spin_unlock_irq(&mdev->tconn->req_lock); 384b411b363SPhilipp Reisner 3850f0601f4SLars Ellenberg atomic_add(size >> 9, &mdev->rs_sect_ev); 386fbe29decSAndreas Gruenbacher if (drbd_submit_peer_request(mdev, peer_req, READ, DRBD_FAULT_RS_RD) == 0) 38780a40e43SLars Ellenberg return 0; 38845bb912bSLars Ellenberg 38910f6d992SLars Ellenberg /* If it failed because of ENOMEM, retry should help. If it failed 39010f6d992SLars Ellenberg * because bio_add_page failed (probably broken lower level driver), 39110f6d992SLars Ellenberg * retry may or may not help. 39210f6d992SLars Ellenberg * If it does not, you may need to force disconnect. */ 39387eeee41SPhilipp Reisner spin_lock_irq(&mdev->tconn->req_lock); 394db830c46SAndreas Gruenbacher list_del(&peer_req->w.list); 39587eeee41SPhilipp Reisner spin_unlock_irq(&mdev->tconn->req_lock); 39622cc37a9SLars Ellenberg 3973967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 39880a40e43SLars Ellenberg defer: 39945bb912bSLars Ellenberg put_ldev(mdev); 40080a40e43SLars Ellenberg return -EAGAIN; 401b411b363SPhilipp Reisner } 402b411b363SPhilipp Reisner 40399920dc5SAndreas Gruenbacher int w_resync_timer(struct drbd_work *w, int cancel) 404794abb75SPhilipp Reisner { 40500d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 406794abb75SPhilipp Reisner switch (mdev->state.conn) { 407794abb75SPhilipp Reisner case C_VERIFY_S: 40800d56944SPhilipp Reisner w_make_ov_request(w, cancel); 409794abb75SPhilipp Reisner break; 410794abb75SPhilipp Reisner case C_SYNC_TARGET: 41100d56944SPhilipp Reisner w_make_resync_request(w, cancel); 412794abb75SPhilipp Reisner break; 413794abb75SPhilipp Reisner } 414794abb75SPhilipp Reisner 41599920dc5SAndreas Gruenbacher return 0; 416794abb75SPhilipp Reisner } 417794abb75SPhilipp Reisner 418b411b363SPhilipp Reisner void resync_timer_fn(unsigned long data) 419b411b363SPhilipp Reisner { 420b411b363SPhilipp Reisner struct drbd_conf *mdev = (struct drbd_conf *) data; 421b411b363SPhilipp Reisner 422794abb75SPhilipp Reisner if (list_empty(&mdev->resync_work.list)) 423e42325a5SPhilipp Reisner drbd_queue_work(&mdev->tconn->data.work, &mdev->resync_work); 424b411b363SPhilipp Reisner } 425b411b363SPhilipp Reisner 426778f271dSPhilipp Reisner static void fifo_set(struct fifo_buffer *fb, int value) 427778f271dSPhilipp Reisner { 428778f271dSPhilipp Reisner int i; 429778f271dSPhilipp Reisner 430778f271dSPhilipp Reisner for (i = 0; i < fb->size; i++) 431f10f2623SPhilipp Reisner fb->values[i] = value; 432778f271dSPhilipp Reisner } 433778f271dSPhilipp Reisner 434778f271dSPhilipp Reisner static int fifo_push(struct fifo_buffer *fb, int value) 435778f271dSPhilipp Reisner { 436778f271dSPhilipp Reisner int ov; 437778f271dSPhilipp Reisner 438778f271dSPhilipp Reisner ov = fb->values[fb->head_index]; 439778f271dSPhilipp Reisner fb->values[fb->head_index++] = value; 440778f271dSPhilipp Reisner 441778f271dSPhilipp Reisner if (fb->head_index >= fb->size) 442778f271dSPhilipp Reisner fb->head_index = 0; 443778f271dSPhilipp Reisner 444778f271dSPhilipp Reisner return ov; 445778f271dSPhilipp Reisner } 446778f271dSPhilipp Reisner 447778f271dSPhilipp Reisner static void fifo_add_val(struct fifo_buffer *fb, int value) 448778f271dSPhilipp Reisner { 449778f271dSPhilipp Reisner int i; 450778f271dSPhilipp Reisner 451778f271dSPhilipp Reisner for (i = 0; i < fb->size; i++) 452778f271dSPhilipp Reisner fb->values[i] += value; 453778f271dSPhilipp Reisner } 454778f271dSPhilipp Reisner 4559958c857SPhilipp Reisner struct fifo_buffer *fifo_alloc(int fifo_size) 4569958c857SPhilipp Reisner { 4579958c857SPhilipp Reisner struct fifo_buffer *fb; 4589958c857SPhilipp Reisner 4599958c857SPhilipp Reisner fb = kzalloc(sizeof(struct fifo_buffer) + sizeof(int) * fifo_size, GFP_KERNEL); 4609958c857SPhilipp Reisner if (!fb) 4619958c857SPhilipp Reisner return NULL; 4629958c857SPhilipp Reisner 4639958c857SPhilipp Reisner fb->head_index = 0; 4649958c857SPhilipp Reisner fb->size = fifo_size; 4659958c857SPhilipp Reisner fb->total = 0; 4669958c857SPhilipp Reisner 4679958c857SPhilipp Reisner return fb; 4689958c857SPhilipp Reisner } 4699958c857SPhilipp Reisner 4709d77a5feSPhilipp Reisner static int drbd_rs_controller(struct drbd_conf *mdev) 471778f271dSPhilipp Reisner { 472daeda1ccSPhilipp Reisner struct disk_conf *dc; 473778f271dSPhilipp Reisner unsigned int sect_in; /* Number of sectors that came in since the last turn */ 474778f271dSPhilipp Reisner unsigned int want; /* The number of sectors we want in the proxy */ 475778f271dSPhilipp Reisner int req_sect; /* Number of sectors to request in this turn */ 476778f271dSPhilipp Reisner int correction; /* Number of sectors more we need in the proxy*/ 477778f271dSPhilipp Reisner int cps; /* correction per invocation of drbd_rs_controller() */ 478778f271dSPhilipp Reisner int steps; /* Number of time steps to plan ahead */ 479778f271dSPhilipp Reisner int curr_corr; 480778f271dSPhilipp Reisner int max_sect; 481813472ceSPhilipp Reisner struct fifo_buffer *plan; 482778f271dSPhilipp Reisner 483778f271dSPhilipp Reisner sect_in = atomic_xchg(&mdev->rs_sect_in, 0); /* Number of sectors that came in */ 484778f271dSPhilipp Reisner mdev->rs_in_flight -= sect_in; 485778f271dSPhilipp Reisner 486daeda1ccSPhilipp Reisner dc = rcu_dereference(mdev->ldev->disk_conf); 487813472ceSPhilipp Reisner plan = rcu_dereference(mdev->rs_plan_s); 488778f271dSPhilipp Reisner 489813472ceSPhilipp Reisner steps = plan->size; /* (dc->c_plan_ahead * 10 * SLEEP_TIME) / HZ; */ 490778f271dSPhilipp Reisner 491778f271dSPhilipp Reisner if (mdev->rs_in_flight + sect_in == 0) { /* At start of resync */ 492daeda1ccSPhilipp Reisner want = ((dc->resync_rate * 2 * SLEEP_TIME) / HZ) * steps; 493778f271dSPhilipp Reisner } else { /* normal path */ 494daeda1ccSPhilipp Reisner want = dc->c_fill_target ? dc->c_fill_target : 495daeda1ccSPhilipp Reisner sect_in * dc->c_delay_target * HZ / (SLEEP_TIME * 10); 496778f271dSPhilipp Reisner } 497778f271dSPhilipp Reisner 498813472ceSPhilipp Reisner correction = want - mdev->rs_in_flight - plan->total; 499778f271dSPhilipp Reisner 500778f271dSPhilipp Reisner /* Plan ahead */ 501778f271dSPhilipp Reisner cps = correction / steps; 502813472ceSPhilipp Reisner fifo_add_val(plan, cps); 503813472ceSPhilipp Reisner plan->total += cps * steps; 504778f271dSPhilipp Reisner 505778f271dSPhilipp Reisner /* What we do in this step */ 506813472ceSPhilipp Reisner curr_corr = fifo_push(plan, 0); 507813472ceSPhilipp Reisner plan->total -= curr_corr; 508778f271dSPhilipp Reisner 509778f271dSPhilipp Reisner req_sect = sect_in + curr_corr; 510778f271dSPhilipp Reisner if (req_sect < 0) 511778f271dSPhilipp Reisner req_sect = 0; 512778f271dSPhilipp Reisner 513daeda1ccSPhilipp Reisner max_sect = (dc->c_max_rate * 2 * SLEEP_TIME) / HZ; 514778f271dSPhilipp Reisner if (req_sect > max_sect) 515778f271dSPhilipp Reisner req_sect = max_sect; 516778f271dSPhilipp Reisner 517778f271dSPhilipp Reisner /* 518778f271dSPhilipp Reisner dev_warn(DEV, "si=%u if=%d wa=%u co=%d st=%d cps=%d pl=%d cc=%d rs=%d\n", 519778f271dSPhilipp Reisner sect_in, mdev->rs_in_flight, want, correction, 520778f271dSPhilipp Reisner steps, cps, mdev->rs_planed, curr_corr, req_sect); 521778f271dSPhilipp Reisner */ 522778f271dSPhilipp Reisner 523778f271dSPhilipp Reisner return req_sect; 524778f271dSPhilipp Reisner } 525778f271dSPhilipp Reisner 5269d77a5feSPhilipp Reisner static int drbd_rs_number_requests(struct drbd_conf *mdev) 527e65f440dSLars Ellenberg { 528e65f440dSLars Ellenberg int number; 529813472ceSPhilipp Reisner 530813472ceSPhilipp Reisner rcu_read_lock(); 531813472ceSPhilipp Reisner if (rcu_dereference(mdev->rs_plan_s)->size) { 532e65f440dSLars Ellenberg number = drbd_rs_controller(mdev) >> (BM_BLOCK_SHIFT - 9); 533e65f440dSLars Ellenberg mdev->c_sync_rate = number * HZ * (BM_BLOCK_SIZE / 1024) / SLEEP_TIME; 534e65f440dSLars Ellenberg } else { 535daeda1ccSPhilipp Reisner mdev->c_sync_rate = rcu_dereference(mdev->ldev->disk_conf)->resync_rate; 536e65f440dSLars Ellenberg number = SLEEP_TIME * mdev->c_sync_rate / ((BM_BLOCK_SIZE / 1024) * HZ); 537e65f440dSLars Ellenberg } 538813472ceSPhilipp Reisner rcu_read_unlock(); 539e65f440dSLars Ellenberg 540e65f440dSLars Ellenberg /* ignore the amount of pending requests, the resync controller should 541e65f440dSLars Ellenberg * throttle down to incoming reply rate soon enough anyways. */ 542e65f440dSLars Ellenberg return number; 543e65f440dSLars Ellenberg } 544e65f440dSLars Ellenberg 54599920dc5SAndreas Gruenbacher int w_make_resync_request(struct drbd_work *w, int cancel) 546b411b363SPhilipp Reisner { 54700d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 548b411b363SPhilipp Reisner unsigned long bit; 549b411b363SPhilipp Reisner sector_t sector; 550b411b363SPhilipp Reisner const sector_t capacity = drbd_get_capacity(mdev->this_bdev); 5511816a2b4SLars Ellenberg int max_bio_size; 552e65f440dSLars Ellenberg int number, rollback_i, size; 553b411b363SPhilipp Reisner int align, queued, sndbuf; 5540f0601f4SLars Ellenberg int i = 0; 555b411b363SPhilipp Reisner 556b411b363SPhilipp Reisner if (unlikely(cancel)) 55799920dc5SAndreas Gruenbacher return 0; 558b411b363SPhilipp Reisner 559af85e8e8SLars Ellenberg if (mdev->rs_total == 0) { 560af85e8e8SLars Ellenberg /* empty resync? */ 561af85e8e8SLars Ellenberg drbd_resync_finished(mdev); 56299920dc5SAndreas Gruenbacher return 0; 563af85e8e8SLars Ellenberg } 564af85e8e8SLars Ellenberg 565b411b363SPhilipp Reisner if (!get_ldev(mdev)) { 566b411b363SPhilipp Reisner /* Since we only need to access mdev->rsync a 567b411b363SPhilipp Reisner get_ldev_if_state(mdev,D_FAILED) would be sufficient, but 568b411b363SPhilipp Reisner to continue resync with a broken disk makes no sense at 569b411b363SPhilipp Reisner all */ 570b411b363SPhilipp Reisner dev_err(DEV, "Disk broke down during resync!\n"); 57199920dc5SAndreas Gruenbacher return 0; 572b411b363SPhilipp Reisner } 573b411b363SPhilipp Reisner 5740cfdd247SPhilipp Reisner max_bio_size = queue_max_hw_sectors(mdev->rq_queue) << 9; 575e65f440dSLars Ellenberg number = drbd_rs_number_requests(mdev); 576e65f440dSLars Ellenberg if (number == 0) 5770f0601f4SLars Ellenberg goto requeue; 578b411b363SPhilipp Reisner 579b411b363SPhilipp Reisner for (i = 0; i < number; i++) { 580b411b363SPhilipp Reisner /* Stop generating RS requests, when half of the send buffer is filled */ 581e42325a5SPhilipp Reisner mutex_lock(&mdev->tconn->data.mutex); 582e42325a5SPhilipp Reisner if (mdev->tconn->data.socket) { 583e42325a5SPhilipp Reisner queued = mdev->tconn->data.socket->sk->sk_wmem_queued; 584e42325a5SPhilipp Reisner sndbuf = mdev->tconn->data.socket->sk->sk_sndbuf; 585b411b363SPhilipp Reisner } else { 586b411b363SPhilipp Reisner queued = 1; 587b411b363SPhilipp Reisner sndbuf = 0; 588b411b363SPhilipp Reisner } 589e42325a5SPhilipp Reisner mutex_unlock(&mdev->tconn->data.mutex); 590b411b363SPhilipp Reisner if (queued > sndbuf / 2) 591b411b363SPhilipp Reisner goto requeue; 592b411b363SPhilipp Reisner 593b411b363SPhilipp Reisner next_sector: 594b411b363SPhilipp Reisner size = BM_BLOCK_SIZE; 595b411b363SPhilipp Reisner bit = drbd_bm_find_next(mdev, mdev->bm_resync_fo); 596b411b363SPhilipp Reisner 5974b0715f0SLars Ellenberg if (bit == DRBD_END_OF_BITMAP) { 598b411b363SPhilipp Reisner mdev->bm_resync_fo = drbd_bm_bits(mdev); 599b411b363SPhilipp Reisner put_ldev(mdev); 60099920dc5SAndreas Gruenbacher return 0; 601b411b363SPhilipp Reisner } 602b411b363SPhilipp Reisner 603b411b363SPhilipp Reisner sector = BM_BIT_TO_SECT(bit); 604b411b363SPhilipp Reisner 605e3555d85SPhilipp Reisner if (drbd_rs_should_slow_down(mdev, sector) || 606e3555d85SPhilipp Reisner drbd_try_rs_begin_io(mdev, sector)) { 607b411b363SPhilipp Reisner mdev->bm_resync_fo = bit; 608b411b363SPhilipp Reisner goto requeue; 609b411b363SPhilipp Reisner } 610b411b363SPhilipp Reisner mdev->bm_resync_fo = bit + 1; 611b411b363SPhilipp Reisner 612b411b363SPhilipp Reisner if (unlikely(drbd_bm_test_bit(mdev, bit) == 0)) { 613b411b363SPhilipp Reisner drbd_rs_complete_io(mdev, sector); 614b411b363SPhilipp Reisner goto next_sector; 615b411b363SPhilipp Reisner } 616b411b363SPhilipp Reisner 6171816a2b4SLars Ellenberg #if DRBD_MAX_BIO_SIZE > BM_BLOCK_SIZE 618b411b363SPhilipp Reisner /* try to find some adjacent bits. 619b411b363SPhilipp Reisner * we stop if we have already the maximum req size. 620b411b363SPhilipp Reisner * 621b411b363SPhilipp Reisner * Additionally always align bigger requests, in order to 622b411b363SPhilipp Reisner * be prepared for all stripe sizes of software RAIDs. 623b411b363SPhilipp Reisner */ 624b411b363SPhilipp Reisner align = 1; 625d207450cSPhilipp Reisner rollback_i = i; 626b411b363SPhilipp Reisner for (;;) { 6271816a2b4SLars Ellenberg if (size + BM_BLOCK_SIZE > max_bio_size) 628b411b363SPhilipp Reisner break; 629b411b363SPhilipp Reisner 630b411b363SPhilipp Reisner /* Be always aligned */ 631b411b363SPhilipp Reisner if (sector & ((1<<(align+3))-1)) 632b411b363SPhilipp Reisner break; 633b411b363SPhilipp Reisner 634b411b363SPhilipp Reisner /* do not cross extent boundaries */ 635b411b363SPhilipp Reisner if (((bit+1) & BM_BLOCKS_PER_BM_EXT_MASK) == 0) 636b411b363SPhilipp Reisner break; 637b411b363SPhilipp Reisner /* now, is it actually dirty, after all? 638b411b363SPhilipp Reisner * caution, drbd_bm_test_bit is tri-state for some 639b411b363SPhilipp Reisner * obscure reason; ( b == 0 ) would get the out-of-band 640b411b363SPhilipp Reisner * only accidentally right because of the "oddly sized" 641b411b363SPhilipp Reisner * adjustment below */ 642b411b363SPhilipp Reisner if (drbd_bm_test_bit(mdev, bit+1) != 1) 643b411b363SPhilipp Reisner break; 644b411b363SPhilipp Reisner bit++; 645b411b363SPhilipp Reisner size += BM_BLOCK_SIZE; 646b411b363SPhilipp Reisner if ((BM_BLOCK_SIZE << align) <= size) 647b411b363SPhilipp Reisner align++; 648b411b363SPhilipp Reisner i++; 649b411b363SPhilipp Reisner } 650b411b363SPhilipp Reisner /* if we merged some, 651b411b363SPhilipp Reisner * reset the offset to start the next drbd_bm_find_next from */ 652b411b363SPhilipp Reisner if (size > BM_BLOCK_SIZE) 653b411b363SPhilipp Reisner mdev->bm_resync_fo = bit + 1; 654b411b363SPhilipp Reisner #endif 655b411b363SPhilipp Reisner 656b411b363SPhilipp Reisner /* adjust very last sectors, in case we are oddly sized */ 657b411b363SPhilipp Reisner if (sector + (size>>9) > capacity) 658b411b363SPhilipp Reisner size = (capacity-sector)<<9; 659f399002eSLars Ellenberg if (mdev->tconn->agreed_pro_version >= 89 && mdev->tconn->csums_tfm) { 660b411b363SPhilipp Reisner switch (read_for_csum(mdev, sector, size)) { 66180a40e43SLars Ellenberg case -EIO: /* Disk failure */ 662b411b363SPhilipp Reisner put_ldev(mdev); 66399920dc5SAndreas Gruenbacher return -EIO; 66480a40e43SLars Ellenberg case -EAGAIN: /* allocation failed, or ldev busy */ 665b411b363SPhilipp Reisner drbd_rs_complete_io(mdev, sector); 666b411b363SPhilipp Reisner mdev->bm_resync_fo = BM_SECT_TO_BIT(sector); 667d207450cSPhilipp Reisner i = rollback_i; 668b411b363SPhilipp Reisner goto requeue; 66980a40e43SLars Ellenberg case 0: 67080a40e43SLars Ellenberg /* everything ok */ 67180a40e43SLars Ellenberg break; 67280a40e43SLars Ellenberg default: 67380a40e43SLars Ellenberg BUG(); 674b411b363SPhilipp Reisner } 675b411b363SPhilipp Reisner } else { 67699920dc5SAndreas Gruenbacher int err; 67799920dc5SAndreas Gruenbacher 678b411b363SPhilipp Reisner inc_rs_pending(mdev); 67999920dc5SAndreas Gruenbacher err = drbd_send_drequest(mdev, P_RS_DATA_REQUEST, 68099920dc5SAndreas Gruenbacher sector, size, ID_SYNCER); 68199920dc5SAndreas Gruenbacher if (err) { 682b411b363SPhilipp Reisner dev_err(DEV, "drbd_send_drequest() failed, aborting...\n"); 683b411b363SPhilipp Reisner dec_rs_pending(mdev); 684b411b363SPhilipp Reisner put_ldev(mdev); 68599920dc5SAndreas Gruenbacher return err; 686b411b363SPhilipp Reisner } 687b411b363SPhilipp Reisner } 688b411b363SPhilipp Reisner } 689b411b363SPhilipp Reisner 690b411b363SPhilipp Reisner if (mdev->bm_resync_fo >= drbd_bm_bits(mdev)) { 691b411b363SPhilipp Reisner /* last syncer _request_ was sent, 692b411b363SPhilipp Reisner * but the P_RS_DATA_REPLY not yet received. sync will end (and 693b411b363SPhilipp Reisner * next sync group will resume), as soon as we receive the last 694b411b363SPhilipp Reisner * resync data block, and the last bit is cleared. 695b411b363SPhilipp Reisner * until then resync "work" is "inactive" ... 696b411b363SPhilipp Reisner */ 697b411b363SPhilipp Reisner put_ldev(mdev); 69899920dc5SAndreas Gruenbacher return 0; 699b411b363SPhilipp Reisner } 700b411b363SPhilipp Reisner 701b411b363SPhilipp Reisner requeue: 702778f271dSPhilipp Reisner mdev->rs_in_flight += (i << (BM_BLOCK_SHIFT - 9)); 703b411b363SPhilipp Reisner mod_timer(&mdev->resync_timer, jiffies + SLEEP_TIME); 704b411b363SPhilipp Reisner put_ldev(mdev); 70599920dc5SAndreas Gruenbacher return 0; 706b411b363SPhilipp Reisner } 707b411b363SPhilipp Reisner 70800d56944SPhilipp Reisner static int w_make_ov_request(struct drbd_work *w, int cancel) 709b411b363SPhilipp Reisner { 71000d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 711b411b363SPhilipp Reisner int number, i, size; 712b411b363SPhilipp Reisner sector_t sector; 713b411b363SPhilipp Reisner const sector_t capacity = drbd_get_capacity(mdev->this_bdev); 714b411b363SPhilipp Reisner 715b411b363SPhilipp Reisner if (unlikely(cancel)) 716b411b363SPhilipp Reisner return 1; 717b411b363SPhilipp Reisner 7182649f080SLars Ellenberg number = drbd_rs_number_requests(mdev); 719b411b363SPhilipp Reisner 720b411b363SPhilipp Reisner sector = mdev->ov_position; 721b411b363SPhilipp Reisner for (i = 0; i < number; i++) { 722b411b363SPhilipp Reisner if (sector >= capacity) { 723b411b363SPhilipp Reisner return 1; 724b411b363SPhilipp Reisner } 725b411b363SPhilipp Reisner 726b411b363SPhilipp Reisner size = BM_BLOCK_SIZE; 727b411b363SPhilipp Reisner 728e3555d85SPhilipp Reisner if (drbd_rs_should_slow_down(mdev, sector) || 729e3555d85SPhilipp Reisner drbd_try_rs_begin_io(mdev, sector)) { 730b411b363SPhilipp Reisner mdev->ov_position = sector; 731b411b363SPhilipp Reisner goto requeue; 732b411b363SPhilipp Reisner } 733b411b363SPhilipp Reisner 734b411b363SPhilipp Reisner if (sector + (size>>9) > capacity) 735b411b363SPhilipp Reisner size = (capacity-sector)<<9; 736b411b363SPhilipp Reisner 737b411b363SPhilipp Reisner inc_rs_pending(mdev); 7385b9f499cSAndreas Gruenbacher if (drbd_send_ov_request(mdev, sector, size)) { 739b411b363SPhilipp Reisner dec_rs_pending(mdev); 740b411b363SPhilipp Reisner return 0; 741b411b363SPhilipp Reisner } 742b411b363SPhilipp Reisner sector += BM_SECT_PER_BIT; 743b411b363SPhilipp Reisner } 744b411b363SPhilipp Reisner mdev->ov_position = sector; 745b411b363SPhilipp Reisner 746b411b363SPhilipp Reisner requeue: 7472649f080SLars Ellenberg mdev->rs_in_flight += (i << (BM_BLOCK_SHIFT - 9)); 748b411b363SPhilipp Reisner mod_timer(&mdev->resync_timer, jiffies + SLEEP_TIME); 749b411b363SPhilipp Reisner return 1; 750b411b363SPhilipp Reisner } 751b411b363SPhilipp Reisner 75299920dc5SAndreas Gruenbacher int w_ov_finished(struct drbd_work *w, int cancel) 753b411b363SPhilipp Reisner { 75400d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 755b411b363SPhilipp Reisner kfree(w); 7568f7bed77SAndreas Gruenbacher ov_out_of_sync_print(mdev); 757b411b363SPhilipp Reisner drbd_resync_finished(mdev); 758b411b363SPhilipp Reisner 75999920dc5SAndreas Gruenbacher return 0; 760b411b363SPhilipp Reisner } 761b411b363SPhilipp Reisner 76299920dc5SAndreas Gruenbacher static int w_resync_finished(struct drbd_work *w, int cancel) 763b411b363SPhilipp Reisner { 76400d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 765b411b363SPhilipp Reisner kfree(w); 766b411b363SPhilipp Reisner 767b411b363SPhilipp Reisner drbd_resync_finished(mdev); 768b411b363SPhilipp Reisner 76999920dc5SAndreas Gruenbacher return 0; 770b411b363SPhilipp Reisner } 771b411b363SPhilipp Reisner 772af85e8e8SLars Ellenberg static void ping_peer(struct drbd_conf *mdev) 773af85e8e8SLars Ellenberg { 7742a67d8b9SPhilipp Reisner struct drbd_tconn *tconn = mdev->tconn; 7752a67d8b9SPhilipp Reisner 7762a67d8b9SPhilipp Reisner clear_bit(GOT_PING_ACK, &tconn->flags); 7772a67d8b9SPhilipp Reisner request_ping(tconn); 7782a67d8b9SPhilipp Reisner wait_event(tconn->ping_wait, 7792a67d8b9SPhilipp Reisner test_bit(GOT_PING_ACK, &tconn->flags) || mdev->state.conn < C_CONNECTED); 780af85e8e8SLars Ellenberg } 781af85e8e8SLars Ellenberg 782b411b363SPhilipp Reisner int drbd_resync_finished(struct drbd_conf *mdev) 783b411b363SPhilipp Reisner { 784b411b363SPhilipp Reisner unsigned long db, dt, dbdt; 785b411b363SPhilipp Reisner unsigned long n_oos; 786b411b363SPhilipp Reisner union drbd_state os, ns; 787b411b363SPhilipp Reisner struct drbd_work *w; 788b411b363SPhilipp Reisner char *khelper_cmd = NULL; 78926525618SLars Ellenberg int verify_done = 0; 790b411b363SPhilipp Reisner 791b411b363SPhilipp Reisner /* Remove all elements from the resync LRU. Since future actions 792b411b363SPhilipp Reisner * might set bits in the (main) bitmap, then the entries in the 793b411b363SPhilipp Reisner * resync LRU would be wrong. */ 794b411b363SPhilipp Reisner if (drbd_rs_del_all(mdev)) { 795b411b363SPhilipp Reisner /* In case this is not possible now, most probably because 796b411b363SPhilipp Reisner * there are P_RS_DATA_REPLY Packets lingering on the worker's 797b411b363SPhilipp Reisner * queue (or even the read operations for those packets 798b411b363SPhilipp Reisner * is not finished by now). Retry in 100ms. */ 799b411b363SPhilipp Reisner 80020ee6390SPhilipp Reisner schedule_timeout_interruptible(HZ / 10); 801b411b363SPhilipp Reisner w = kmalloc(sizeof(struct drbd_work), GFP_ATOMIC); 802b411b363SPhilipp Reisner if (w) { 803b411b363SPhilipp Reisner w->cb = w_resync_finished; 8049b743da9SPhilipp Reisner w->mdev = mdev; 805e42325a5SPhilipp Reisner drbd_queue_work(&mdev->tconn->data.work, w); 806b411b363SPhilipp Reisner return 1; 807b411b363SPhilipp Reisner } 808b411b363SPhilipp Reisner dev_err(DEV, "Warn failed to drbd_rs_del_all() and to kmalloc(w).\n"); 809b411b363SPhilipp Reisner } 810b411b363SPhilipp Reisner 811b411b363SPhilipp Reisner dt = (jiffies - mdev->rs_start - mdev->rs_paused) / HZ; 812b411b363SPhilipp Reisner if (dt <= 0) 813b411b363SPhilipp Reisner dt = 1; 814b411b363SPhilipp Reisner db = mdev->rs_total; 815b411b363SPhilipp Reisner dbdt = Bit2KB(db/dt); 816b411b363SPhilipp Reisner mdev->rs_paused /= HZ; 817b411b363SPhilipp Reisner 818b411b363SPhilipp Reisner if (!get_ldev(mdev)) 819b411b363SPhilipp Reisner goto out; 820b411b363SPhilipp Reisner 821af85e8e8SLars Ellenberg ping_peer(mdev); 822af85e8e8SLars Ellenberg 82387eeee41SPhilipp Reisner spin_lock_irq(&mdev->tconn->req_lock); 82478bae59bSPhilipp Reisner os = drbd_read_state(mdev); 825b411b363SPhilipp Reisner 82626525618SLars Ellenberg verify_done = (os.conn == C_VERIFY_S || os.conn == C_VERIFY_T); 82726525618SLars Ellenberg 828b411b363SPhilipp Reisner /* This protects us against multiple calls (that can happen in the presence 829b411b363SPhilipp Reisner of application IO), and against connectivity loss just before we arrive here. */ 830b411b363SPhilipp Reisner if (os.conn <= C_CONNECTED) 831b411b363SPhilipp Reisner goto out_unlock; 832b411b363SPhilipp Reisner 833b411b363SPhilipp Reisner ns = os; 834b411b363SPhilipp Reisner ns.conn = C_CONNECTED; 835b411b363SPhilipp Reisner 836b411b363SPhilipp Reisner dev_info(DEV, "%s done (total %lu sec; paused %lu sec; %lu K/sec)\n", 83726525618SLars Ellenberg verify_done ? "Online verify " : "Resync", 838b411b363SPhilipp Reisner dt + mdev->rs_paused, mdev->rs_paused, dbdt); 839b411b363SPhilipp Reisner 840b411b363SPhilipp Reisner n_oos = drbd_bm_total_weight(mdev); 841b411b363SPhilipp Reisner 842b411b363SPhilipp Reisner if (os.conn == C_VERIFY_S || os.conn == C_VERIFY_T) { 843b411b363SPhilipp Reisner if (n_oos) { 844b411b363SPhilipp Reisner dev_alert(DEV, "Online verify found %lu %dk block out of sync!\n", 845b411b363SPhilipp Reisner n_oos, Bit2KB(1)); 846b411b363SPhilipp Reisner khelper_cmd = "out-of-sync"; 847b411b363SPhilipp Reisner } 848b411b363SPhilipp Reisner } else { 849b411b363SPhilipp Reisner D_ASSERT((n_oos - mdev->rs_failed) == 0); 850b411b363SPhilipp Reisner 851b411b363SPhilipp Reisner if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) 852b411b363SPhilipp Reisner khelper_cmd = "after-resync-target"; 853b411b363SPhilipp Reisner 854f399002eSLars Ellenberg if (mdev->tconn->csums_tfm && mdev->rs_total) { 855b411b363SPhilipp Reisner const unsigned long s = mdev->rs_same_csum; 856b411b363SPhilipp Reisner const unsigned long t = mdev->rs_total; 857b411b363SPhilipp Reisner const int ratio = 858b411b363SPhilipp Reisner (t == 0) ? 0 : 859b411b363SPhilipp Reisner (t < 100000) ? ((s*100)/t) : (s/(t/100)); 860b411b363SPhilipp Reisner dev_info(DEV, "%u %% had equal checksums, eliminated: %luK; " 861b411b363SPhilipp Reisner "transferred %luK total %luK\n", 862b411b363SPhilipp Reisner ratio, 863b411b363SPhilipp Reisner Bit2KB(mdev->rs_same_csum), 864b411b363SPhilipp Reisner Bit2KB(mdev->rs_total - mdev->rs_same_csum), 865b411b363SPhilipp Reisner Bit2KB(mdev->rs_total)); 866b411b363SPhilipp Reisner } 867b411b363SPhilipp Reisner } 868b411b363SPhilipp Reisner 869b411b363SPhilipp Reisner if (mdev->rs_failed) { 870b411b363SPhilipp Reisner dev_info(DEV, " %lu failed blocks\n", mdev->rs_failed); 871b411b363SPhilipp Reisner 872b411b363SPhilipp Reisner if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) { 873b411b363SPhilipp Reisner ns.disk = D_INCONSISTENT; 874b411b363SPhilipp Reisner ns.pdsk = D_UP_TO_DATE; 875b411b363SPhilipp Reisner } else { 876b411b363SPhilipp Reisner ns.disk = D_UP_TO_DATE; 877b411b363SPhilipp Reisner ns.pdsk = D_INCONSISTENT; 878b411b363SPhilipp Reisner } 879b411b363SPhilipp Reisner } else { 880b411b363SPhilipp Reisner ns.disk = D_UP_TO_DATE; 881b411b363SPhilipp Reisner ns.pdsk = D_UP_TO_DATE; 882b411b363SPhilipp Reisner 883b411b363SPhilipp Reisner if (os.conn == C_SYNC_TARGET || os.conn == C_PAUSED_SYNC_T) { 884b411b363SPhilipp Reisner if (mdev->p_uuid) { 885b411b363SPhilipp Reisner int i; 886b411b363SPhilipp Reisner for (i = UI_BITMAP ; i <= UI_HISTORY_END ; i++) 887b411b363SPhilipp Reisner _drbd_uuid_set(mdev, i, mdev->p_uuid[i]); 888b411b363SPhilipp Reisner drbd_uuid_set(mdev, UI_BITMAP, mdev->ldev->md.uuid[UI_CURRENT]); 889b411b363SPhilipp Reisner _drbd_uuid_set(mdev, UI_CURRENT, mdev->p_uuid[UI_CURRENT]); 890b411b363SPhilipp Reisner } else { 891b411b363SPhilipp Reisner dev_err(DEV, "mdev->p_uuid is NULL! BUG\n"); 892b411b363SPhilipp Reisner } 893b411b363SPhilipp Reisner } 894b411b363SPhilipp Reisner 89562b0da3aSLars Ellenberg if (!(os.conn == C_VERIFY_S || os.conn == C_VERIFY_T)) { 89662b0da3aSLars Ellenberg /* for verify runs, we don't update uuids here, 89762b0da3aSLars Ellenberg * so there would be nothing to report. */ 898b411b363SPhilipp Reisner drbd_uuid_set_bm(mdev, 0UL); 89962b0da3aSLars Ellenberg drbd_print_uuids(mdev, "updated UUIDs"); 900b411b363SPhilipp Reisner if (mdev->p_uuid) { 901b411b363SPhilipp Reisner /* Now the two UUID sets are equal, update what we 902b411b363SPhilipp Reisner * know of the peer. */ 903b411b363SPhilipp Reisner int i; 904b411b363SPhilipp Reisner for (i = UI_CURRENT ; i <= UI_HISTORY_END ; i++) 905b411b363SPhilipp Reisner mdev->p_uuid[i] = mdev->ldev->md.uuid[i]; 906b411b363SPhilipp Reisner } 907b411b363SPhilipp Reisner } 90862b0da3aSLars Ellenberg } 909b411b363SPhilipp Reisner 910b411b363SPhilipp Reisner _drbd_set_state(mdev, ns, CS_VERBOSE, NULL); 911b411b363SPhilipp Reisner out_unlock: 91287eeee41SPhilipp Reisner spin_unlock_irq(&mdev->tconn->req_lock); 913b411b363SPhilipp Reisner put_ldev(mdev); 914b411b363SPhilipp Reisner out: 915b411b363SPhilipp Reisner mdev->rs_total = 0; 916b411b363SPhilipp Reisner mdev->rs_failed = 0; 917b411b363SPhilipp Reisner mdev->rs_paused = 0; 91826525618SLars Ellenberg if (verify_done) 919b411b363SPhilipp Reisner mdev->ov_start_sector = 0; 920b411b363SPhilipp Reisner 92113d42685SLars Ellenberg drbd_md_sync(mdev); 92213d42685SLars Ellenberg 923b411b363SPhilipp Reisner if (khelper_cmd) 924b411b363SPhilipp Reisner drbd_khelper(mdev, khelper_cmd); 925b411b363SPhilipp Reisner 926b411b363SPhilipp Reisner return 1; 927b411b363SPhilipp Reisner } 928b411b363SPhilipp Reisner 929b411b363SPhilipp Reisner /* helper */ 930db830c46SAndreas Gruenbacher static void move_to_net_ee_or_free(struct drbd_conf *mdev, struct drbd_peer_request *peer_req) 931b411b363SPhilipp Reisner { 932045417f7SAndreas Gruenbacher if (drbd_peer_req_has_active_page(peer_req)) { 933b411b363SPhilipp Reisner /* This might happen if sendpage() has not finished */ 934db830c46SAndreas Gruenbacher int i = (peer_req->i.size + PAGE_SIZE -1) >> PAGE_SHIFT; 935435f0740SLars Ellenberg atomic_add(i, &mdev->pp_in_use_by_net); 936435f0740SLars Ellenberg atomic_sub(i, &mdev->pp_in_use); 93787eeee41SPhilipp Reisner spin_lock_irq(&mdev->tconn->req_lock); 938db830c46SAndreas Gruenbacher list_add_tail(&peer_req->w.list, &mdev->net_ee); 93987eeee41SPhilipp Reisner spin_unlock_irq(&mdev->tconn->req_lock); 940435f0740SLars Ellenberg wake_up(&drbd_pp_wait); 941b411b363SPhilipp Reisner } else 9423967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 943b411b363SPhilipp Reisner } 944b411b363SPhilipp Reisner 945b411b363SPhilipp Reisner /** 946b411b363SPhilipp Reisner * w_e_end_data_req() - Worker callback, to send a P_DATA_REPLY packet in response to a P_DATA_REQUEST 947b411b363SPhilipp Reisner * @mdev: DRBD device. 948b411b363SPhilipp Reisner * @w: work object. 949b411b363SPhilipp Reisner * @cancel: The connection will be closed anyways 950b411b363SPhilipp Reisner */ 95199920dc5SAndreas Gruenbacher int w_e_end_data_req(struct drbd_work *w, int cancel) 952b411b363SPhilipp Reisner { 953db830c46SAndreas Gruenbacher struct drbd_peer_request *peer_req = container_of(w, struct drbd_peer_request, w); 95400d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 95599920dc5SAndreas Gruenbacher int err; 956b411b363SPhilipp Reisner 957b411b363SPhilipp Reisner if (unlikely(cancel)) { 9583967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 959b411b363SPhilipp Reisner dec_unacked(mdev); 96099920dc5SAndreas Gruenbacher return 0; 961b411b363SPhilipp Reisner } 962b411b363SPhilipp Reisner 963db830c46SAndreas Gruenbacher if (likely((peer_req->flags & EE_WAS_ERROR) == 0)) { 96499920dc5SAndreas Gruenbacher err = drbd_send_block(mdev, P_DATA_REPLY, peer_req); 965b411b363SPhilipp Reisner } else { 966b411b363SPhilipp Reisner if (__ratelimit(&drbd_ratelimit_state)) 967b411b363SPhilipp Reisner dev_err(DEV, "Sending NegDReply. sector=%llus.\n", 968db830c46SAndreas Gruenbacher (unsigned long long)peer_req->i.sector); 969b411b363SPhilipp Reisner 97099920dc5SAndreas Gruenbacher err = drbd_send_ack(mdev, P_NEG_DREPLY, peer_req); 971b411b363SPhilipp Reisner } 972b411b363SPhilipp Reisner 973b411b363SPhilipp Reisner dec_unacked(mdev); 974b411b363SPhilipp Reisner 975db830c46SAndreas Gruenbacher move_to_net_ee_or_free(mdev, peer_req); 976b411b363SPhilipp Reisner 97799920dc5SAndreas Gruenbacher if (unlikely(err)) 978b411b363SPhilipp Reisner dev_err(DEV, "drbd_send_block() failed\n"); 97999920dc5SAndreas Gruenbacher return err; 980b411b363SPhilipp Reisner } 981b411b363SPhilipp Reisner 982b411b363SPhilipp Reisner /** 983a209b4aeSAndreas Gruenbacher * w_e_end_rsdata_req() - Worker callback to send a P_RS_DATA_REPLY packet in response to a P_RS_DATA_REQUEST 984b411b363SPhilipp Reisner * @mdev: DRBD device. 985b411b363SPhilipp Reisner * @w: work object. 986b411b363SPhilipp Reisner * @cancel: The connection will be closed anyways 987b411b363SPhilipp Reisner */ 98899920dc5SAndreas Gruenbacher int w_e_end_rsdata_req(struct drbd_work *w, int cancel) 989b411b363SPhilipp Reisner { 990db830c46SAndreas Gruenbacher struct drbd_peer_request *peer_req = container_of(w, struct drbd_peer_request, w); 99100d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 99299920dc5SAndreas Gruenbacher int err; 993b411b363SPhilipp Reisner 994b411b363SPhilipp Reisner if (unlikely(cancel)) { 9953967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 996b411b363SPhilipp Reisner dec_unacked(mdev); 99799920dc5SAndreas Gruenbacher return 0; 998b411b363SPhilipp Reisner } 999b411b363SPhilipp Reisner 1000b411b363SPhilipp Reisner if (get_ldev_if_state(mdev, D_FAILED)) { 1001db830c46SAndreas Gruenbacher drbd_rs_complete_io(mdev, peer_req->i.sector); 1002b411b363SPhilipp Reisner put_ldev(mdev); 1003b411b363SPhilipp Reisner } 1004b411b363SPhilipp Reisner 1005d612d309SPhilipp Reisner if (mdev->state.conn == C_AHEAD) { 100699920dc5SAndreas Gruenbacher err = drbd_send_ack(mdev, P_RS_CANCEL, peer_req); 1007db830c46SAndreas Gruenbacher } else if (likely((peer_req->flags & EE_WAS_ERROR) == 0)) { 1008b411b363SPhilipp Reisner if (likely(mdev->state.pdsk >= D_INCONSISTENT)) { 1009b411b363SPhilipp Reisner inc_rs_pending(mdev); 101099920dc5SAndreas Gruenbacher err = drbd_send_block(mdev, P_RS_DATA_REPLY, peer_req); 1011b411b363SPhilipp Reisner } else { 1012b411b363SPhilipp Reisner if (__ratelimit(&drbd_ratelimit_state)) 1013b411b363SPhilipp Reisner dev_err(DEV, "Not sending RSDataReply, " 1014b411b363SPhilipp Reisner "partner DISKLESS!\n"); 101599920dc5SAndreas Gruenbacher err = 0; 1016b411b363SPhilipp Reisner } 1017b411b363SPhilipp Reisner } else { 1018b411b363SPhilipp Reisner if (__ratelimit(&drbd_ratelimit_state)) 1019b411b363SPhilipp Reisner dev_err(DEV, "Sending NegRSDReply. sector %llus.\n", 1020db830c46SAndreas Gruenbacher (unsigned long long)peer_req->i.sector); 1021b411b363SPhilipp Reisner 102299920dc5SAndreas Gruenbacher err = drbd_send_ack(mdev, P_NEG_RS_DREPLY, peer_req); 1023b411b363SPhilipp Reisner 1024b411b363SPhilipp Reisner /* update resync data with failure */ 1025db830c46SAndreas Gruenbacher drbd_rs_failed_io(mdev, peer_req->i.sector, peer_req->i.size); 1026b411b363SPhilipp Reisner } 1027b411b363SPhilipp Reisner 1028b411b363SPhilipp Reisner dec_unacked(mdev); 1029b411b363SPhilipp Reisner 1030db830c46SAndreas Gruenbacher move_to_net_ee_or_free(mdev, peer_req); 1031b411b363SPhilipp Reisner 103299920dc5SAndreas Gruenbacher if (unlikely(err)) 1033b411b363SPhilipp Reisner dev_err(DEV, "drbd_send_block() failed\n"); 103499920dc5SAndreas Gruenbacher return err; 1035b411b363SPhilipp Reisner } 1036b411b363SPhilipp Reisner 103799920dc5SAndreas Gruenbacher int w_e_end_csum_rs_req(struct drbd_work *w, int cancel) 1038b411b363SPhilipp Reisner { 1039db830c46SAndreas Gruenbacher struct drbd_peer_request *peer_req = container_of(w, struct drbd_peer_request, w); 104000d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 1041b411b363SPhilipp Reisner struct digest_info *di; 1042b411b363SPhilipp Reisner int digest_size; 1043b411b363SPhilipp Reisner void *digest = NULL; 104499920dc5SAndreas Gruenbacher int err, eq = 0; 1045b411b363SPhilipp Reisner 1046b411b363SPhilipp Reisner if (unlikely(cancel)) { 10473967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 1048b411b363SPhilipp Reisner dec_unacked(mdev); 104999920dc5SAndreas Gruenbacher return 0; 1050b411b363SPhilipp Reisner } 1051b411b363SPhilipp Reisner 10521d53f09eSLars Ellenberg if (get_ldev(mdev)) { 1053db830c46SAndreas Gruenbacher drbd_rs_complete_io(mdev, peer_req->i.sector); 10541d53f09eSLars Ellenberg put_ldev(mdev); 10551d53f09eSLars Ellenberg } 1056b411b363SPhilipp Reisner 1057db830c46SAndreas Gruenbacher di = peer_req->digest; 1058b411b363SPhilipp Reisner 1059db830c46SAndreas Gruenbacher if (likely((peer_req->flags & EE_WAS_ERROR) == 0)) { 1060b411b363SPhilipp Reisner /* quick hack to try to avoid a race against reconfiguration. 1061b411b363SPhilipp Reisner * a real fix would be much more involved, 1062b411b363SPhilipp Reisner * introducing more locking mechanisms */ 1063f399002eSLars Ellenberg if (mdev->tconn->csums_tfm) { 1064f399002eSLars Ellenberg digest_size = crypto_hash_digestsize(mdev->tconn->csums_tfm); 1065b411b363SPhilipp Reisner D_ASSERT(digest_size == di->digest_size); 1066b411b363SPhilipp Reisner digest = kmalloc(digest_size, GFP_NOIO); 1067b411b363SPhilipp Reisner } 1068b411b363SPhilipp Reisner if (digest) { 1069f399002eSLars Ellenberg drbd_csum_ee(mdev, mdev->tconn->csums_tfm, peer_req, digest); 1070b411b363SPhilipp Reisner eq = !memcmp(digest, di->digest, digest_size); 1071b411b363SPhilipp Reisner kfree(digest); 1072b411b363SPhilipp Reisner } 1073b411b363SPhilipp Reisner 1074b411b363SPhilipp Reisner if (eq) { 1075db830c46SAndreas Gruenbacher drbd_set_in_sync(mdev, peer_req->i.sector, peer_req->i.size); 1076676396d5SLars Ellenberg /* rs_same_csums unit is BM_BLOCK_SIZE */ 1077db830c46SAndreas Gruenbacher mdev->rs_same_csum += peer_req->i.size >> BM_BLOCK_SHIFT; 107899920dc5SAndreas Gruenbacher err = drbd_send_ack(mdev, P_RS_IS_IN_SYNC, peer_req); 1079b411b363SPhilipp Reisner } else { 1080b411b363SPhilipp Reisner inc_rs_pending(mdev); 1081db830c46SAndreas Gruenbacher peer_req->block_id = ID_SYNCER; /* By setting block_id, digest pointer becomes invalid! */ 1082db830c46SAndreas Gruenbacher peer_req->flags &= ~EE_HAS_DIGEST; /* This peer request no longer has a digest pointer */ 1083204bba99SPhilipp Reisner kfree(di); 108499920dc5SAndreas Gruenbacher err = drbd_send_block(mdev, P_RS_DATA_REPLY, peer_req); 1085b411b363SPhilipp Reisner } 1086b411b363SPhilipp Reisner } else { 108799920dc5SAndreas Gruenbacher err = drbd_send_ack(mdev, P_NEG_RS_DREPLY, peer_req); 1088b411b363SPhilipp Reisner if (__ratelimit(&drbd_ratelimit_state)) 1089b411b363SPhilipp Reisner dev_err(DEV, "Sending NegDReply. I guess it gets messy.\n"); 1090b411b363SPhilipp Reisner } 1091b411b363SPhilipp Reisner 1092b411b363SPhilipp Reisner dec_unacked(mdev); 1093db830c46SAndreas Gruenbacher move_to_net_ee_or_free(mdev, peer_req); 1094b411b363SPhilipp Reisner 109599920dc5SAndreas Gruenbacher if (unlikely(err)) 1096b411b363SPhilipp Reisner dev_err(DEV, "drbd_send_block/ack() failed\n"); 109799920dc5SAndreas Gruenbacher return err; 1098b411b363SPhilipp Reisner } 1099b411b363SPhilipp Reisner 110099920dc5SAndreas Gruenbacher int w_e_end_ov_req(struct drbd_work *w, int cancel) 1101b411b363SPhilipp Reisner { 1102db830c46SAndreas Gruenbacher struct drbd_peer_request *peer_req = container_of(w, struct drbd_peer_request, w); 110300d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 1104db830c46SAndreas Gruenbacher sector_t sector = peer_req->i.sector; 1105db830c46SAndreas Gruenbacher unsigned int size = peer_req->i.size; 1106b411b363SPhilipp Reisner int digest_size; 1107b411b363SPhilipp Reisner void *digest; 110899920dc5SAndreas Gruenbacher int err = 0; 1109b411b363SPhilipp Reisner 1110b411b363SPhilipp Reisner if (unlikely(cancel)) 1111b411b363SPhilipp Reisner goto out; 1112b411b363SPhilipp Reisner 1113f399002eSLars Ellenberg digest_size = crypto_hash_digestsize(mdev->tconn->verify_tfm); 1114b411b363SPhilipp Reisner digest = kmalloc(digest_size, GFP_NOIO); 11158f21420eSPhilipp Reisner if (!digest) { 111699920dc5SAndreas Gruenbacher err = 1; /* terminate the connection in case the allocation failed */ 11178f21420eSPhilipp Reisner goto out; 11188f21420eSPhilipp Reisner } 11198f21420eSPhilipp Reisner 1120db830c46SAndreas Gruenbacher if (likely(!(peer_req->flags & EE_WAS_ERROR))) 1121f399002eSLars Ellenberg drbd_csum_ee(mdev, mdev->tconn->verify_tfm, peer_req, digest); 11228f21420eSPhilipp Reisner else 11238f21420eSPhilipp Reisner memset(digest, 0, digest_size); 11248f21420eSPhilipp Reisner 112553ea4331SLars Ellenberg /* Free e and pages before send. 112653ea4331SLars Ellenberg * In case we block on congestion, we could otherwise run into 112753ea4331SLars Ellenberg * some distributed deadlock, if the other side blocks on 112853ea4331SLars Ellenberg * congestion as well, because our receiver blocks in 1129c37c8ecfSAndreas Gruenbacher * drbd_alloc_pages due to pp_in_use > max_buffers. */ 11303967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 1131db830c46SAndreas Gruenbacher peer_req = NULL; 1132b411b363SPhilipp Reisner inc_rs_pending(mdev); 113399920dc5SAndreas Gruenbacher err = drbd_send_drequest_csum(mdev, sector, size, digest, digest_size, P_OV_REPLY); 113499920dc5SAndreas Gruenbacher if (err) 1135b411b363SPhilipp Reisner dec_rs_pending(mdev); 1136b411b363SPhilipp Reisner kfree(digest); 1137b411b363SPhilipp Reisner 1138b411b363SPhilipp Reisner out: 1139db830c46SAndreas Gruenbacher if (peer_req) 11403967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 1141b411b363SPhilipp Reisner dec_unacked(mdev); 114299920dc5SAndreas Gruenbacher return err; 1143b411b363SPhilipp Reisner } 1144b411b363SPhilipp Reisner 11458f7bed77SAndreas Gruenbacher void drbd_ov_out_of_sync_found(struct drbd_conf *mdev, sector_t sector, int size) 1146b411b363SPhilipp Reisner { 1147b411b363SPhilipp Reisner if (mdev->ov_last_oos_start + mdev->ov_last_oos_size == sector) { 1148b411b363SPhilipp Reisner mdev->ov_last_oos_size += size>>9; 1149b411b363SPhilipp Reisner } else { 1150b411b363SPhilipp Reisner mdev->ov_last_oos_start = sector; 1151b411b363SPhilipp Reisner mdev->ov_last_oos_size = size>>9; 1152b411b363SPhilipp Reisner } 1153b411b363SPhilipp Reisner drbd_set_out_of_sync(mdev, sector, size); 1154b411b363SPhilipp Reisner } 1155b411b363SPhilipp Reisner 115699920dc5SAndreas Gruenbacher int w_e_end_ov_reply(struct drbd_work *w, int cancel) 1157b411b363SPhilipp Reisner { 1158db830c46SAndreas Gruenbacher struct drbd_peer_request *peer_req = container_of(w, struct drbd_peer_request, w); 115900d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 1160b411b363SPhilipp Reisner struct digest_info *di; 1161b411b363SPhilipp Reisner void *digest; 1162db830c46SAndreas Gruenbacher sector_t sector = peer_req->i.sector; 1163db830c46SAndreas Gruenbacher unsigned int size = peer_req->i.size; 116453ea4331SLars Ellenberg int digest_size; 116599920dc5SAndreas Gruenbacher int err, eq = 0; 1166b411b363SPhilipp Reisner 1167b411b363SPhilipp Reisner if (unlikely(cancel)) { 11683967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 1169b411b363SPhilipp Reisner dec_unacked(mdev); 117099920dc5SAndreas Gruenbacher return 0; 1171b411b363SPhilipp Reisner } 1172b411b363SPhilipp Reisner 1173b411b363SPhilipp Reisner /* after "cancel", because after drbd_disconnect/drbd_rs_cancel_all 1174b411b363SPhilipp Reisner * the resync lru has been cleaned up already */ 11751d53f09eSLars Ellenberg if (get_ldev(mdev)) { 1176db830c46SAndreas Gruenbacher drbd_rs_complete_io(mdev, peer_req->i.sector); 11771d53f09eSLars Ellenberg put_ldev(mdev); 11781d53f09eSLars Ellenberg } 1179b411b363SPhilipp Reisner 1180db830c46SAndreas Gruenbacher di = peer_req->digest; 1181b411b363SPhilipp Reisner 1182db830c46SAndreas Gruenbacher if (likely((peer_req->flags & EE_WAS_ERROR) == 0)) { 1183f399002eSLars Ellenberg digest_size = crypto_hash_digestsize(mdev->tconn->verify_tfm); 1184b411b363SPhilipp Reisner digest = kmalloc(digest_size, GFP_NOIO); 1185b411b363SPhilipp Reisner if (digest) { 1186f399002eSLars Ellenberg drbd_csum_ee(mdev, mdev->tconn->verify_tfm, peer_req, digest); 1187b411b363SPhilipp Reisner 1188b411b363SPhilipp Reisner D_ASSERT(digest_size == di->digest_size); 1189b411b363SPhilipp Reisner eq = !memcmp(digest, di->digest, digest_size); 1190b411b363SPhilipp Reisner kfree(digest); 1191b411b363SPhilipp Reisner } 1192b411b363SPhilipp Reisner } 1193b411b363SPhilipp Reisner 11949676c760SLars Ellenberg /* Free peer_req and pages before send. 119553ea4331SLars Ellenberg * In case we block on congestion, we could otherwise run into 119653ea4331SLars Ellenberg * some distributed deadlock, if the other side blocks on 119753ea4331SLars Ellenberg * congestion as well, because our receiver blocks in 1198c37c8ecfSAndreas Gruenbacher * drbd_alloc_pages due to pp_in_use > max_buffers. */ 11993967deb1SAndreas Gruenbacher drbd_free_peer_req(mdev, peer_req); 1200b411b363SPhilipp Reisner if (!eq) 12018f7bed77SAndreas Gruenbacher drbd_ov_out_of_sync_found(mdev, sector, size); 1202b411b363SPhilipp Reisner else 12038f7bed77SAndreas Gruenbacher ov_out_of_sync_print(mdev); 1204b411b363SPhilipp Reisner 120599920dc5SAndreas Gruenbacher err = drbd_send_ack_ex(mdev, P_OV_RESULT, sector, size, 1206b411b363SPhilipp Reisner eq ? ID_IN_SYNC : ID_OUT_OF_SYNC); 1207b411b363SPhilipp Reisner 120853ea4331SLars Ellenberg dec_unacked(mdev); 1209b411b363SPhilipp Reisner 1210ea5442afSLars Ellenberg --mdev->ov_left; 1211ea5442afSLars Ellenberg 1212ea5442afSLars Ellenberg /* let's advance progress step marks only for every other megabyte */ 1213ea5442afSLars Ellenberg if ((mdev->ov_left & 0x200) == 0x200) 1214ea5442afSLars Ellenberg drbd_advance_rs_marks(mdev, mdev->ov_left); 1215ea5442afSLars Ellenberg 1216ea5442afSLars Ellenberg if (mdev->ov_left == 0) { 12178f7bed77SAndreas Gruenbacher ov_out_of_sync_print(mdev); 1218b411b363SPhilipp Reisner drbd_resync_finished(mdev); 1219b411b363SPhilipp Reisner } 1220b411b363SPhilipp Reisner 122199920dc5SAndreas Gruenbacher return err; 1222b411b363SPhilipp Reisner } 1223b411b363SPhilipp Reisner 122499920dc5SAndreas Gruenbacher int w_prev_work_done(struct drbd_work *w, int cancel) 1225b411b363SPhilipp Reisner { 1226b411b363SPhilipp Reisner struct drbd_wq_barrier *b = container_of(w, struct drbd_wq_barrier, w); 122700d56944SPhilipp Reisner 1228b411b363SPhilipp Reisner complete(&b->done); 122999920dc5SAndreas Gruenbacher return 0; 1230b411b363SPhilipp Reisner } 1231b411b363SPhilipp Reisner 123299920dc5SAndreas Gruenbacher int w_send_barrier(struct drbd_work *w, int cancel) 1233b411b363SPhilipp Reisner { 12349f5bdc33SAndreas Gruenbacher struct drbd_socket *sock; 1235b411b363SPhilipp Reisner struct drbd_tl_epoch *b = container_of(w, struct drbd_tl_epoch, w); 123600d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 12379f5bdc33SAndreas Gruenbacher struct p_barrier *p; 1238b411b363SPhilipp Reisner 1239b411b363SPhilipp Reisner /* really avoid racing with tl_clear. w.cb may have been referenced 1240b411b363SPhilipp Reisner * just before it was reassigned and re-queued, so double check that. 1241b411b363SPhilipp Reisner * actually, this race was harmless, since we only try to send the 1242b411b363SPhilipp Reisner * barrier packet here, and otherwise do nothing with the object. 1243b411b363SPhilipp Reisner * but compare with the head of w_clear_epoch */ 124487eeee41SPhilipp Reisner spin_lock_irq(&mdev->tconn->req_lock); 1245b411b363SPhilipp Reisner if (w->cb != w_send_barrier || mdev->state.conn < C_CONNECTED) 1246b411b363SPhilipp Reisner cancel = 1; 124787eeee41SPhilipp Reisner spin_unlock_irq(&mdev->tconn->req_lock); 1248b411b363SPhilipp Reisner if (cancel) 1249b411b363SPhilipp Reisner return 0; 125099920dc5SAndreas Gruenbacher 12519f5bdc33SAndreas Gruenbacher sock = &mdev->tconn->data; 12529f5bdc33SAndreas Gruenbacher p = drbd_prepare_command(mdev, sock); 12539f5bdc33SAndreas Gruenbacher if (!p) 12549f5bdc33SAndreas Gruenbacher return -EIO; 1255b411b363SPhilipp Reisner p->barrier = b->br_number; 1256b411b363SPhilipp Reisner /* inc_ap_pending was done where this was queued. 1257b411b363SPhilipp Reisner * dec_ap_pending will be done in got_BarrierAck 1258b411b363SPhilipp Reisner * or (on connection loss) in w_clear_epoch. */ 12599f5bdc33SAndreas Gruenbacher return drbd_send_command(mdev, sock, P_BARRIER, sizeof(*p), NULL, 0); 1260b411b363SPhilipp Reisner } 1261b411b363SPhilipp Reisner 126299920dc5SAndreas Gruenbacher int w_send_write_hint(struct drbd_work *w, int cancel) 1263b411b363SPhilipp Reisner { 126400d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 12659f5bdc33SAndreas Gruenbacher struct drbd_socket *sock; 12669f5bdc33SAndreas Gruenbacher 1267b411b363SPhilipp Reisner if (cancel) 126899920dc5SAndreas Gruenbacher return 0; 12699f5bdc33SAndreas Gruenbacher sock = &mdev->tconn->data; 12709f5bdc33SAndreas Gruenbacher if (!drbd_prepare_command(mdev, sock)) 12719f5bdc33SAndreas Gruenbacher return -EIO; 1272e658983aSAndreas Gruenbacher return drbd_send_command(mdev, sock, P_UNPLUG_REMOTE, 0, NULL, 0); 1273b411b363SPhilipp Reisner } 1274b411b363SPhilipp Reisner 12758f7bed77SAndreas Gruenbacher int w_send_out_of_sync(struct drbd_work *w, int cancel) 127673a01a18SPhilipp Reisner { 127773a01a18SPhilipp Reisner struct drbd_request *req = container_of(w, struct drbd_request, w); 127800d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 127999920dc5SAndreas Gruenbacher int err; 128073a01a18SPhilipp Reisner 128173a01a18SPhilipp Reisner if (unlikely(cancel)) { 12828554df1cSAndreas Gruenbacher req_mod(req, SEND_CANCELED); 128399920dc5SAndreas Gruenbacher return 0; 128473a01a18SPhilipp Reisner } 128573a01a18SPhilipp Reisner 12868f7bed77SAndreas Gruenbacher err = drbd_send_out_of_sync(mdev, req); 12878554df1cSAndreas Gruenbacher req_mod(req, OOS_HANDED_TO_NETWORK); 128873a01a18SPhilipp Reisner 128999920dc5SAndreas Gruenbacher return err; 129073a01a18SPhilipp Reisner } 129173a01a18SPhilipp Reisner 1292b411b363SPhilipp Reisner /** 1293b411b363SPhilipp Reisner * w_send_dblock() - Worker callback to send a P_DATA packet in order to mirror a write request 1294b411b363SPhilipp Reisner * @mdev: DRBD device. 1295b411b363SPhilipp Reisner * @w: work object. 1296b411b363SPhilipp Reisner * @cancel: The connection will be closed anyways 1297b411b363SPhilipp Reisner */ 129899920dc5SAndreas Gruenbacher int w_send_dblock(struct drbd_work *w, int cancel) 1299b411b363SPhilipp Reisner { 1300b411b363SPhilipp Reisner struct drbd_request *req = container_of(w, struct drbd_request, w); 130100d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 130299920dc5SAndreas Gruenbacher int err; 1303b411b363SPhilipp Reisner 1304b411b363SPhilipp Reisner if (unlikely(cancel)) { 13058554df1cSAndreas Gruenbacher req_mod(req, SEND_CANCELED); 130699920dc5SAndreas Gruenbacher return 0; 1307b411b363SPhilipp Reisner } 1308b411b363SPhilipp Reisner 130999920dc5SAndreas Gruenbacher err = drbd_send_dblock(mdev, req); 131099920dc5SAndreas Gruenbacher req_mod(req, err ? SEND_FAILED : HANDED_OVER_TO_NETWORK); 1311b411b363SPhilipp Reisner 131299920dc5SAndreas Gruenbacher return err; 1313b411b363SPhilipp Reisner } 1314b411b363SPhilipp Reisner 1315b411b363SPhilipp Reisner /** 1316b411b363SPhilipp Reisner * w_send_read_req() - Worker callback to send a read request (P_DATA_REQUEST) packet 1317b411b363SPhilipp Reisner * @mdev: DRBD device. 1318b411b363SPhilipp Reisner * @w: work object. 1319b411b363SPhilipp Reisner * @cancel: The connection will be closed anyways 1320b411b363SPhilipp Reisner */ 132199920dc5SAndreas Gruenbacher int w_send_read_req(struct drbd_work *w, int cancel) 1322b411b363SPhilipp Reisner { 1323b411b363SPhilipp Reisner struct drbd_request *req = container_of(w, struct drbd_request, w); 132400d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 132599920dc5SAndreas Gruenbacher int err; 1326b411b363SPhilipp Reisner 1327b411b363SPhilipp Reisner if (unlikely(cancel)) { 13288554df1cSAndreas Gruenbacher req_mod(req, SEND_CANCELED); 132999920dc5SAndreas Gruenbacher return 0; 1330b411b363SPhilipp Reisner } 1331b411b363SPhilipp Reisner 133299920dc5SAndreas Gruenbacher err = drbd_send_drequest(mdev, P_DATA_REQUEST, req->i.sector, req->i.size, 1333b411b363SPhilipp Reisner (unsigned long)req); 1334b411b363SPhilipp Reisner 133599920dc5SAndreas Gruenbacher req_mod(req, err ? SEND_FAILED : HANDED_OVER_TO_NETWORK); 1336b411b363SPhilipp Reisner 133799920dc5SAndreas Gruenbacher return err; 1338b411b363SPhilipp Reisner } 1339b411b363SPhilipp Reisner 134099920dc5SAndreas Gruenbacher int w_restart_disk_io(struct drbd_work *w, int cancel) 1341265be2d0SPhilipp Reisner { 1342265be2d0SPhilipp Reisner struct drbd_request *req = container_of(w, struct drbd_request, w); 134300d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 1344265be2d0SPhilipp Reisner 13450778286aSPhilipp Reisner if (bio_data_dir(req->master_bio) == WRITE && req->rq_state & RQ_IN_ACT_LOG) 1346181286adSLars Ellenberg drbd_al_begin_io(mdev, &req->i); 1347265be2d0SPhilipp Reisner 1348265be2d0SPhilipp Reisner drbd_req_make_private_bio(req, req->master_bio); 1349265be2d0SPhilipp Reisner req->private_bio->bi_bdev = mdev->ldev->backing_bdev; 1350265be2d0SPhilipp Reisner generic_make_request(req->private_bio); 1351265be2d0SPhilipp Reisner 135299920dc5SAndreas Gruenbacher return 0; 1353265be2d0SPhilipp Reisner } 1354265be2d0SPhilipp Reisner 1355b411b363SPhilipp Reisner static int _drbd_may_sync_now(struct drbd_conf *mdev) 1356b411b363SPhilipp Reisner { 1357b411b363SPhilipp Reisner struct drbd_conf *odev = mdev; 135895f8efd0SAndreas Gruenbacher int resync_after; 1359b411b363SPhilipp Reisner 1360b411b363SPhilipp Reisner while (1) { 1361438c8374SPhilipp Reisner if (!odev->ldev) 1362438c8374SPhilipp Reisner return 1; 1363daeda1ccSPhilipp Reisner rcu_read_lock(); 136495f8efd0SAndreas Gruenbacher resync_after = rcu_dereference(odev->ldev->disk_conf)->resync_after; 1365daeda1ccSPhilipp Reisner rcu_read_unlock(); 136695f8efd0SAndreas Gruenbacher if (resync_after == -1) 1367b411b363SPhilipp Reisner return 1; 136895f8efd0SAndreas Gruenbacher odev = minor_to_mdev(resync_after); 1369841ce241SAndreas Gruenbacher if (!expect(odev)) 1370841ce241SAndreas Gruenbacher return 1; 1371b411b363SPhilipp Reisner if ((odev->state.conn >= C_SYNC_SOURCE && 1372b411b363SPhilipp Reisner odev->state.conn <= C_PAUSED_SYNC_T) || 1373b411b363SPhilipp Reisner odev->state.aftr_isp || odev->state.peer_isp || 1374b411b363SPhilipp Reisner odev->state.user_isp) 1375b411b363SPhilipp Reisner return 0; 1376b411b363SPhilipp Reisner } 1377b411b363SPhilipp Reisner } 1378b411b363SPhilipp Reisner 1379b411b363SPhilipp Reisner /** 1380b411b363SPhilipp Reisner * _drbd_pause_after() - Pause resync on all devices that may not resync now 1381b411b363SPhilipp Reisner * @mdev: DRBD device. 1382b411b363SPhilipp Reisner * 1383b411b363SPhilipp Reisner * Called from process context only (admin command and after_state_ch). 1384b411b363SPhilipp Reisner */ 1385b411b363SPhilipp Reisner static int _drbd_pause_after(struct drbd_conf *mdev) 1386b411b363SPhilipp Reisner { 1387b411b363SPhilipp Reisner struct drbd_conf *odev; 1388b411b363SPhilipp Reisner int i, rv = 0; 1389b411b363SPhilipp Reisner 1390695d08faSPhilipp Reisner rcu_read_lock(); 139181a5d60eSPhilipp Reisner idr_for_each_entry(&minors, odev, i) { 1392b411b363SPhilipp Reisner if (odev->state.conn == C_STANDALONE && odev->state.disk == D_DISKLESS) 1393b411b363SPhilipp Reisner continue; 1394b411b363SPhilipp Reisner if (!_drbd_may_sync_now(odev)) 1395b411b363SPhilipp Reisner rv |= (__drbd_set_state(_NS(odev, aftr_isp, 1), CS_HARD, NULL) 1396b411b363SPhilipp Reisner != SS_NOTHING_TO_DO); 1397b411b363SPhilipp Reisner } 1398695d08faSPhilipp Reisner rcu_read_unlock(); 1399b411b363SPhilipp Reisner 1400b411b363SPhilipp Reisner return rv; 1401b411b363SPhilipp Reisner } 1402b411b363SPhilipp Reisner 1403b411b363SPhilipp Reisner /** 1404b411b363SPhilipp Reisner * _drbd_resume_next() - Resume resync on all devices that may resync now 1405b411b363SPhilipp Reisner * @mdev: DRBD device. 1406b411b363SPhilipp Reisner * 1407b411b363SPhilipp Reisner * Called from process context only (admin command and worker). 1408b411b363SPhilipp Reisner */ 1409b411b363SPhilipp Reisner static int _drbd_resume_next(struct drbd_conf *mdev) 1410b411b363SPhilipp Reisner { 1411b411b363SPhilipp Reisner struct drbd_conf *odev; 1412b411b363SPhilipp Reisner int i, rv = 0; 1413b411b363SPhilipp Reisner 1414695d08faSPhilipp Reisner rcu_read_lock(); 141581a5d60eSPhilipp Reisner idr_for_each_entry(&minors, odev, i) { 1416b411b363SPhilipp Reisner if (odev->state.conn == C_STANDALONE && odev->state.disk == D_DISKLESS) 1417b411b363SPhilipp Reisner continue; 1418b411b363SPhilipp Reisner if (odev->state.aftr_isp) { 1419b411b363SPhilipp Reisner if (_drbd_may_sync_now(odev)) 1420b411b363SPhilipp Reisner rv |= (__drbd_set_state(_NS(odev, aftr_isp, 0), 1421b411b363SPhilipp Reisner CS_HARD, NULL) 1422b411b363SPhilipp Reisner != SS_NOTHING_TO_DO) ; 1423b411b363SPhilipp Reisner } 1424b411b363SPhilipp Reisner } 1425695d08faSPhilipp Reisner rcu_read_unlock(); 1426b411b363SPhilipp Reisner return rv; 1427b411b363SPhilipp Reisner } 1428b411b363SPhilipp Reisner 1429b411b363SPhilipp Reisner void resume_next_sg(struct drbd_conf *mdev) 1430b411b363SPhilipp Reisner { 1431b411b363SPhilipp Reisner write_lock_irq(&global_state_lock); 1432b411b363SPhilipp Reisner _drbd_resume_next(mdev); 1433b411b363SPhilipp Reisner write_unlock_irq(&global_state_lock); 1434b411b363SPhilipp Reisner } 1435b411b363SPhilipp Reisner 1436b411b363SPhilipp Reisner void suspend_other_sg(struct drbd_conf *mdev) 1437b411b363SPhilipp Reisner { 1438b411b363SPhilipp Reisner write_lock_irq(&global_state_lock); 1439b411b363SPhilipp Reisner _drbd_pause_after(mdev); 1440b411b363SPhilipp Reisner write_unlock_irq(&global_state_lock); 1441b411b363SPhilipp Reisner } 1442b411b363SPhilipp Reisner 1443dc97b708SPhilipp Reisner /* caller must hold global_state_lock */ 144495f8efd0SAndreas Gruenbacher enum drbd_ret_code drbd_resync_after_valid(struct drbd_conf *mdev, int o_minor) 1445b411b363SPhilipp Reisner { 1446b411b363SPhilipp Reisner struct drbd_conf *odev; 144795f8efd0SAndreas Gruenbacher int resync_after; 1448b411b363SPhilipp Reisner 1449b411b363SPhilipp Reisner if (o_minor == -1) 1450b411b363SPhilipp Reisner return NO_ERROR; 1451b411b363SPhilipp Reisner if (o_minor < -1 || minor_to_mdev(o_minor) == NULL) 145295f8efd0SAndreas Gruenbacher return ERR_RESYNC_AFTER; 1453b411b363SPhilipp Reisner 1454b411b363SPhilipp Reisner /* check for loops */ 1455b411b363SPhilipp Reisner odev = minor_to_mdev(o_minor); 1456b411b363SPhilipp Reisner while (1) { 1457b411b363SPhilipp Reisner if (odev == mdev) 145895f8efd0SAndreas Gruenbacher return ERR_RESYNC_AFTER_CYCLE; 1459b411b363SPhilipp Reisner 1460daeda1ccSPhilipp Reisner rcu_read_lock(); 146195f8efd0SAndreas Gruenbacher resync_after = rcu_dereference(odev->ldev->disk_conf)->resync_after; 1462daeda1ccSPhilipp Reisner rcu_read_unlock(); 1463b411b363SPhilipp Reisner /* dependency chain ends here, no cycles. */ 146495f8efd0SAndreas Gruenbacher if (resync_after == -1) 1465b411b363SPhilipp Reisner return NO_ERROR; 1466b411b363SPhilipp Reisner 1467b411b363SPhilipp Reisner /* follow the dependency chain */ 146895f8efd0SAndreas Gruenbacher odev = minor_to_mdev(resync_after); 1469b411b363SPhilipp Reisner } 1470b411b363SPhilipp Reisner } 1471b411b363SPhilipp Reisner 1472dc97b708SPhilipp Reisner /* caller must hold global_state_lock */ 147395f8efd0SAndreas Gruenbacher void drbd_resync_after_changed(struct drbd_conf *mdev) 1474b411b363SPhilipp Reisner { 1475b411b363SPhilipp Reisner int changes; 1476b411b363SPhilipp Reisner 1477b411b363SPhilipp Reisner do { 1478b411b363SPhilipp Reisner changes = _drbd_pause_after(mdev); 1479b411b363SPhilipp Reisner changes |= _drbd_resume_next(mdev); 1480b411b363SPhilipp Reisner } while (changes); 1481b411b363SPhilipp Reisner } 1482b411b363SPhilipp Reisner 14839bd28d3cSLars Ellenberg void drbd_rs_controller_reset(struct drbd_conf *mdev) 14849bd28d3cSLars Ellenberg { 1485813472ceSPhilipp Reisner struct fifo_buffer *plan; 1486813472ceSPhilipp Reisner 14879bd28d3cSLars Ellenberg atomic_set(&mdev->rs_sect_in, 0); 14889bd28d3cSLars Ellenberg atomic_set(&mdev->rs_sect_ev, 0); 14899bd28d3cSLars Ellenberg mdev->rs_in_flight = 0; 1490813472ceSPhilipp Reisner 1491813472ceSPhilipp Reisner /* Updating the RCU protected object in place is necessary since 1492813472ceSPhilipp Reisner this function gets called from atomic context. 1493813472ceSPhilipp Reisner It is valid since all other updates also lead to an completely 1494813472ceSPhilipp Reisner empty fifo */ 1495813472ceSPhilipp Reisner rcu_read_lock(); 1496813472ceSPhilipp Reisner plan = rcu_dereference(mdev->rs_plan_s); 1497813472ceSPhilipp Reisner plan->total = 0; 1498813472ceSPhilipp Reisner fifo_set(plan, 0); 1499813472ceSPhilipp Reisner rcu_read_unlock(); 15009bd28d3cSLars Ellenberg } 15019bd28d3cSLars Ellenberg 15021f04af33SPhilipp Reisner void start_resync_timer_fn(unsigned long data) 15031f04af33SPhilipp Reisner { 15041f04af33SPhilipp Reisner struct drbd_conf *mdev = (struct drbd_conf *) data; 15051f04af33SPhilipp Reisner 15061f04af33SPhilipp Reisner drbd_queue_work(&mdev->tconn->data.work, &mdev->start_resync_work); 15071f04af33SPhilipp Reisner } 15081f04af33SPhilipp Reisner 150999920dc5SAndreas Gruenbacher int w_start_resync(struct drbd_work *w, int cancel) 15101f04af33SPhilipp Reisner { 151100d56944SPhilipp Reisner struct drbd_conf *mdev = w->mdev; 151200d56944SPhilipp Reisner 15131f04af33SPhilipp Reisner if (atomic_read(&mdev->unacked_cnt) || atomic_read(&mdev->rs_pending_cnt)) { 15141f04af33SPhilipp Reisner dev_warn(DEV, "w_start_resync later...\n"); 15151f04af33SPhilipp Reisner mdev->start_resync_timer.expires = jiffies + HZ/10; 15161f04af33SPhilipp Reisner add_timer(&mdev->start_resync_timer); 151799920dc5SAndreas Gruenbacher return 0; 15181f04af33SPhilipp Reisner } 15191f04af33SPhilipp Reisner 15201f04af33SPhilipp Reisner drbd_start_resync(mdev, C_SYNC_SOURCE); 15211f04af33SPhilipp Reisner clear_bit(AHEAD_TO_SYNC_SOURCE, &mdev->current_epoch->flags); 152299920dc5SAndreas Gruenbacher return 0; 15231f04af33SPhilipp Reisner } 15241f04af33SPhilipp Reisner 1525b411b363SPhilipp Reisner /** 1526b411b363SPhilipp Reisner * drbd_start_resync() - Start the resync process 1527b411b363SPhilipp Reisner * @mdev: DRBD device. 1528b411b363SPhilipp Reisner * @side: Either C_SYNC_SOURCE or C_SYNC_TARGET 1529b411b363SPhilipp Reisner * 1530b411b363SPhilipp Reisner * This function might bring you directly into one of the 1531b411b363SPhilipp Reisner * C_PAUSED_SYNC_* states. 1532b411b363SPhilipp Reisner */ 1533b411b363SPhilipp Reisner void drbd_start_resync(struct drbd_conf *mdev, enum drbd_conns side) 1534b411b363SPhilipp Reisner { 1535b411b363SPhilipp Reisner union drbd_state ns; 1536b411b363SPhilipp Reisner int r; 1537b411b363SPhilipp Reisner 1538c4752ef1SPhilipp Reisner if (mdev->state.conn >= C_SYNC_SOURCE && mdev->state.conn < C_AHEAD) { 1539b411b363SPhilipp Reisner dev_err(DEV, "Resync already running!\n"); 1540b411b363SPhilipp Reisner return; 1541b411b363SPhilipp Reisner } 1542b411b363SPhilipp Reisner 154359817f4fSPhilipp Reisner if (mdev->state.conn < C_AHEAD) { 1544b411b363SPhilipp Reisner /* In case a previous resync run was aborted by an IO error/detach on the peer. */ 1545b411b363SPhilipp Reisner drbd_rs_cancel_all(mdev); 154659817f4fSPhilipp Reisner /* This should be done when we abort the resync. We definitely do not 154759817f4fSPhilipp Reisner want to have this for connections going back and forth between 154859817f4fSPhilipp Reisner Ahead/Behind and SyncSource/SyncTarget */ 154959817f4fSPhilipp Reisner } 1550b411b363SPhilipp Reisner 1551e64a3294SPhilipp Reisner if (!test_bit(B_RS_H_DONE, &mdev->flags)) { 1552b411b363SPhilipp Reisner if (side == C_SYNC_TARGET) { 1553b411b363SPhilipp Reisner /* Since application IO was locked out during C_WF_BITMAP_T and 1554b411b363SPhilipp Reisner C_WF_SYNC_UUID we are still unmodified. Before going to C_SYNC_TARGET 1555b411b363SPhilipp Reisner we check that we might make the data inconsistent. */ 1556b411b363SPhilipp Reisner r = drbd_khelper(mdev, "before-resync-target"); 1557b411b363SPhilipp Reisner r = (r >> 8) & 0xff; 1558b411b363SPhilipp Reisner if (r > 0) { 1559b411b363SPhilipp Reisner dev_info(DEV, "before-resync-target handler returned %d, " 1560b411b363SPhilipp Reisner "dropping connection.\n", r); 156138fa9988SPhilipp Reisner conn_request_state(mdev->tconn, NS(conn, C_DISCONNECTING), CS_HARD); 1562b411b363SPhilipp Reisner return; 1563b411b363SPhilipp Reisner } 156409b9e797SPhilipp Reisner } else /* C_SYNC_SOURCE */ { 156509b9e797SPhilipp Reisner r = drbd_khelper(mdev, "before-resync-source"); 156609b9e797SPhilipp Reisner r = (r >> 8) & 0xff; 156709b9e797SPhilipp Reisner if (r > 0) { 156809b9e797SPhilipp Reisner if (r == 3) { 156909b9e797SPhilipp Reisner dev_info(DEV, "before-resync-source handler returned %d, " 157009b9e797SPhilipp Reisner "ignoring. Old userland tools?", r); 157109b9e797SPhilipp Reisner } else { 157209b9e797SPhilipp Reisner dev_info(DEV, "before-resync-source handler returned %d, " 157309b9e797SPhilipp Reisner "dropping connection.\n", r); 157438fa9988SPhilipp Reisner conn_request_state(mdev->tconn, NS(conn, C_DISCONNECTING), CS_HARD); 157509b9e797SPhilipp Reisner return; 157609b9e797SPhilipp Reisner } 157709b9e797SPhilipp Reisner } 1578b411b363SPhilipp Reisner } 1579e64a3294SPhilipp Reisner } 1580b411b363SPhilipp Reisner 1581e64a3294SPhilipp Reisner if (current == mdev->tconn->worker.task) { 1582dad20554SPhilipp Reisner /* The worker should not sleep waiting for state_mutex, 1583e64a3294SPhilipp Reisner that can take long */ 15848410da8fSPhilipp Reisner if (!mutex_trylock(mdev->state_mutex)) { 1585e64a3294SPhilipp Reisner set_bit(B_RS_H_DONE, &mdev->flags); 1586e64a3294SPhilipp Reisner mdev->start_resync_timer.expires = jiffies + HZ/5; 1587e64a3294SPhilipp Reisner add_timer(&mdev->start_resync_timer); 1588e64a3294SPhilipp Reisner return; 1589e64a3294SPhilipp Reisner } 1590e64a3294SPhilipp Reisner } else { 15918410da8fSPhilipp Reisner mutex_lock(mdev->state_mutex); 1592e64a3294SPhilipp Reisner } 1593e64a3294SPhilipp Reisner clear_bit(B_RS_H_DONE, &mdev->flags); 1594b411b363SPhilipp Reisner 15950cfac5ddSPhilipp Reisner write_lock_irq(&global_state_lock); 1596b411b363SPhilipp Reisner if (!get_ldev_if_state(mdev, D_NEGOTIATING)) { 15970cfac5ddSPhilipp Reisner write_unlock_irq(&global_state_lock); 15988410da8fSPhilipp Reisner mutex_unlock(mdev->state_mutex); 1599b411b363SPhilipp Reisner return; 1600b411b363SPhilipp Reisner } 1601b411b363SPhilipp Reisner 160278bae59bSPhilipp Reisner ns = drbd_read_state(mdev); 1603b411b363SPhilipp Reisner 1604b411b363SPhilipp Reisner ns.aftr_isp = !_drbd_may_sync_now(mdev); 1605b411b363SPhilipp Reisner 1606b411b363SPhilipp Reisner ns.conn = side; 1607b411b363SPhilipp Reisner 1608b411b363SPhilipp Reisner if (side == C_SYNC_TARGET) 1609b411b363SPhilipp Reisner ns.disk = D_INCONSISTENT; 1610b411b363SPhilipp Reisner else /* side == C_SYNC_SOURCE */ 1611b411b363SPhilipp Reisner ns.pdsk = D_INCONSISTENT; 1612b411b363SPhilipp Reisner 1613b411b363SPhilipp Reisner r = __drbd_set_state(mdev, ns, CS_VERBOSE, NULL); 161478bae59bSPhilipp Reisner ns = drbd_read_state(mdev); 1615b411b363SPhilipp Reisner 1616b411b363SPhilipp Reisner if (ns.conn < C_CONNECTED) 1617b411b363SPhilipp Reisner r = SS_UNKNOWN_ERROR; 1618b411b363SPhilipp Reisner 1619b411b363SPhilipp Reisner if (r == SS_SUCCESS) { 16201d7734a0SLars Ellenberg unsigned long tw = drbd_bm_total_weight(mdev); 16211d7734a0SLars Ellenberg unsigned long now = jiffies; 16221d7734a0SLars Ellenberg int i; 16231d7734a0SLars Ellenberg 1624b411b363SPhilipp Reisner mdev->rs_failed = 0; 1625b411b363SPhilipp Reisner mdev->rs_paused = 0; 1626b411b363SPhilipp Reisner mdev->rs_same_csum = 0; 16270f0601f4SLars Ellenberg mdev->rs_last_events = 0; 16280f0601f4SLars Ellenberg mdev->rs_last_sect_ev = 0; 16291d7734a0SLars Ellenberg mdev->rs_total = tw; 16301d7734a0SLars Ellenberg mdev->rs_start = now; 16311d7734a0SLars Ellenberg for (i = 0; i < DRBD_SYNC_MARKS; i++) { 16321d7734a0SLars Ellenberg mdev->rs_mark_left[i] = tw; 16331d7734a0SLars Ellenberg mdev->rs_mark_time[i] = now; 16341d7734a0SLars Ellenberg } 1635b411b363SPhilipp Reisner _drbd_pause_after(mdev); 1636b411b363SPhilipp Reisner } 1637b411b363SPhilipp Reisner write_unlock_irq(&global_state_lock); 16385a22db89SLars Ellenberg 16396c922ed5SLars Ellenberg if (r == SS_SUCCESS) { 16406c922ed5SLars Ellenberg dev_info(DEV, "Began resync as %s (will sync %lu KB [%lu bits set]).\n", 16416c922ed5SLars Ellenberg drbd_conn_str(ns.conn), 16426c922ed5SLars Ellenberg (unsigned long) mdev->rs_total << (BM_BLOCK_SHIFT-10), 16436c922ed5SLars Ellenberg (unsigned long) mdev->rs_total); 16445a22db89SLars Ellenberg if (side == C_SYNC_TARGET) 16455a22db89SLars Ellenberg mdev->bm_resync_fo = 0; 16465a22db89SLars Ellenberg 16475a22db89SLars Ellenberg /* Since protocol 96, we must serialize drbd_gen_and_send_sync_uuid 16485a22db89SLars Ellenberg * with w_send_oos, or the sync target will get confused as to 16495a22db89SLars Ellenberg * how much bits to resync. We cannot do that always, because for an 16505a22db89SLars Ellenberg * empty resync and protocol < 95, we need to do it here, as we call 16515a22db89SLars Ellenberg * drbd_resync_finished from here in that case. 16525a22db89SLars Ellenberg * We drbd_gen_and_send_sync_uuid here for protocol < 96, 16535a22db89SLars Ellenberg * and from after_state_ch otherwise. */ 165431890f4aSPhilipp Reisner if (side == C_SYNC_SOURCE && mdev->tconn->agreed_pro_version < 96) 16555a22db89SLars Ellenberg drbd_gen_and_send_sync_uuid(mdev); 1656b411b363SPhilipp Reisner 165731890f4aSPhilipp Reisner if (mdev->tconn->agreed_pro_version < 95 && mdev->rs_total == 0) { 1658af85e8e8SLars Ellenberg /* This still has a race (about when exactly the peers 1659af85e8e8SLars Ellenberg * detect connection loss) that can lead to a full sync 1660af85e8e8SLars Ellenberg * on next handshake. In 8.3.9 we fixed this with explicit 1661af85e8e8SLars Ellenberg * resync-finished notifications, but the fix 1662af85e8e8SLars Ellenberg * introduces a protocol change. Sleeping for some 1663af85e8e8SLars Ellenberg * time longer than the ping interval + timeout on the 1664af85e8e8SLars Ellenberg * SyncSource, to give the SyncTarget the chance to 1665af85e8e8SLars Ellenberg * detect connection loss, then waiting for a ping 1666af85e8e8SLars Ellenberg * response (implicit in drbd_resync_finished) reduces 1667af85e8e8SLars Ellenberg * the race considerably, but does not solve it. */ 166844ed167dSPhilipp Reisner if (side == C_SYNC_SOURCE) { 166944ed167dSPhilipp Reisner struct net_conf *nc; 167044ed167dSPhilipp Reisner int timeo; 167144ed167dSPhilipp Reisner 167244ed167dSPhilipp Reisner rcu_read_lock(); 167344ed167dSPhilipp Reisner nc = rcu_dereference(mdev->tconn->net_conf); 167444ed167dSPhilipp Reisner timeo = nc->ping_int * HZ + nc->ping_timeo * HZ / 9; 167544ed167dSPhilipp Reisner rcu_read_unlock(); 167644ed167dSPhilipp Reisner schedule_timeout_interruptible(timeo); 167744ed167dSPhilipp Reisner } 1678b411b363SPhilipp Reisner drbd_resync_finished(mdev); 1679b411b363SPhilipp Reisner } 1680b411b363SPhilipp Reisner 16819bd28d3cSLars Ellenberg drbd_rs_controller_reset(mdev); 1682b411b363SPhilipp Reisner /* ns.conn may already be != mdev->state.conn, 1683b411b363SPhilipp Reisner * we may have been paused in between, or become paused until 1684b411b363SPhilipp Reisner * the timer triggers. 1685b411b363SPhilipp Reisner * No matter, that is handled in resync_timer_fn() */ 1686b411b363SPhilipp Reisner if (ns.conn == C_SYNC_TARGET) 1687b411b363SPhilipp Reisner mod_timer(&mdev->resync_timer, jiffies); 1688b411b363SPhilipp Reisner 1689b411b363SPhilipp Reisner drbd_md_sync(mdev); 1690b411b363SPhilipp Reisner } 16915a22db89SLars Ellenberg put_ldev(mdev); 16928410da8fSPhilipp Reisner mutex_unlock(mdev->state_mutex); 1693b411b363SPhilipp Reisner } 1694b411b363SPhilipp Reisner 1695b411b363SPhilipp Reisner int drbd_worker(struct drbd_thread *thi) 1696b411b363SPhilipp Reisner { 1697392c8801SPhilipp Reisner struct drbd_tconn *tconn = thi->tconn; 1698b411b363SPhilipp Reisner struct drbd_work *w = NULL; 16990e29d163SPhilipp Reisner struct drbd_conf *mdev; 170044ed167dSPhilipp Reisner struct net_conf *nc; 1701b411b363SPhilipp Reisner LIST_HEAD(work_list); 1702f399002eSLars Ellenberg int vnr, intr = 0; 170344ed167dSPhilipp Reisner int cork; 1704b411b363SPhilipp Reisner 1705e77a0a5cSAndreas Gruenbacher while (get_t_state(thi) == RUNNING) { 170680822284SPhilipp Reisner drbd_thread_current_set_cpu(thi); 1707b411b363SPhilipp Reisner 170819393e10SPhilipp Reisner if (down_trylock(&tconn->data.work.s)) { 170919393e10SPhilipp Reisner mutex_lock(&tconn->data.mutex); 171044ed167dSPhilipp Reisner 171144ed167dSPhilipp Reisner rcu_read_lock(); 171244ed167dSPhilipp Reisner nc = rcu_dereference(tconn->net_conf); 1713bb77d34eSAndreas Gruenbacher cork = nc ? nc->tcp_cork : 0; 171444ed167dSPhilipp Reisner rcu_read_unlock(); 171544ed167dSPhilipp Reisner 171644ed167dSPhilipp Reisner if (tconn->data.socket && cork) 171719393e10SPhilipp Reisner drbd_tcp_uncork(tconn->data.socket); 171819393e10SPhilipp Reisner mutex_unlock(&tconn->data.mutex); 1719b411b363SPhilipp Reisner 172019393e10SPhilipp Reisner intr = down_interruptible(&tconn->data.work.s); 1721b411b363SPhilipp Reisner 172219393e10SPhilipp Reisner mutex_lock(&tconn->data.mutex); 172344ed167dSPhilipp Reisner if (tconn->data.socket && cork) 172419393e10SPhilipp Reisner drbd_tcp_cork(tconn->data.socket); 172519393e10SPhilipp Reisner mutex_unlock(&tconn->data.mutex); 1726b411b363SPhilipp Reisner } 1727b411b363SPhilipp Reisner 1728b411b363SPhilipp Reisner if (intr) { 1729b411b363SPhilipp Reisner flush_signals(current); 173019393e10SPhilipp Reisner if (get_t_state(thi) == RUNNING) { 173119393e10SPhilipp Reisner conn_warn(tconn, "Worker got an unexpected signal\n"); 1732b411b363SPhilipp Reisner continue; 173319393e10SPhilipp Reisner } 1734b411b363SPhilipp Reisner break; 1735b411b363SPhilipp Reisner } 1736b411b363SPhilipp Reisner 1737e77a0a5cSAndreas Gruenbacher if (get_t_state(thi) != RUNNING) 1738b411b363SPhilipp Reisner break; 1739b411b363SPhilipp Reisner /* With this break, we have done a down() but not consumed 1740b411b363SPhilipp Reisner the entry from the list. The cleanup code takes care of 1741b411b363SPhilipp Reisner this... */ 1742b411b363SPhilipp Reisner 1743b411b363SPhilipp Reisner w = NULL; 174419393e10SPhilipp Reisner spin_lock_irq(&tconn->data.work.q_lock); 174519393e10SPhilipp Reisner if (list_empty(&tconn->data.work.q)) { 1746b411b363SPhilipp Reisner /* something terribly wrong in our logic. 1747b411b363SPhilipp Reisner * we were able to down() the semaphore, 1748b411b363SPhilipp Reisner * but the list is empty... doh. 1749b411b363SPhilipp Reisner * 1750b411b363SPhilipp Reisner * what is the best thing to do now? 1751b411b363SPhilipp Reisner * try again from scratch, restarting the receiver, 1752b411b363SPhilipp Reisner * asender, whatnot? could break even more ugly, 1753b411b363SPhilipp Reisner * e.g. when we are primary, but no good local data. 1754b411b363SPhilipp Reisner * 1755b411b363SPhilipp Reisner * I'll try to get away just starting over this loop. 1756b411b363SPhilipp Reisner */ 175719393e10SPhilipp Reisner conn_warn(tconn, "Work list unexpectedly empty\n"); 175819393e10SPhilipp Reisner spin_unlock_irq(&tconn->data.work.q_lock); 1759b411b363SPhilipp Reisner continue; 1760b411b363SPhilipp Reisner } 176119393e10SPhilipp Reisner w = list_entry(tconn->data.work.q.next, struct drbd_work, list); 1762b411b363SPhilipp Reisner list_del_init(&w->list); 176319393e10SPhilipp Reisner spin_unlock_irq(&tconn->data.work.q_lock); 1764b411b363SPhilipp Reisner 176599920dc5SAndreas Gruenbacher if (w->cb(w, tconn->cstate < C_WF_REPORT_PARAMS)) { 1766b411b363SPhilipp Reisner /* dev_warn(DEV, "worker: a callback failed! \n"); */ 1767bbeb641cSPhilipp Reisner if (tconn->cstate >= C_WF_REPORT_PARAMS) 1768bbeb641cSPhilipp Reisner conn_request_state(tconn, NS(conn, C_NETWORK_FAILURE), CS_HARD); 1769b411b363SPhilipp Reisner } 1770b411b363SPhilipp Reisner } 1771b411b363SPhilipp Reisner 177219393e10SPhilipp Reisner spin_lock_irq(&tconn->data.work.q_lock); 177319393e10SPhilipp Reisner while (!list_empty(&tconn->data.work.q)) { 177419393e10SPhilipp Reisner list_splice_init(&tconn->data.work.q, &work_list); 177519393e10SPhilipp Reisner spin_unlock_irq(&tconn->data.work.q_lock); 1776b411b363SPhilipp Reisner 1777b411b363SPhilipp Reisner while (!list_empty(&work_list)) { 1778b411b363SPhilipp Reisner w = list_entry(work_list.next, struct drbd_work, list); 1779b411b363SPhilipp Reisner list_del_init(&w->list); 178000d56944SPhilipp Reisner w->cb(w, 1); 1781b411b363SPhilipp Reisner } 1782b411b363SPhilipp Reisner 178319393e10SPhilipp Reisner spin_lock_irq(&tconn->data.work.q_lock); 1784b411b363SPhilipp Reisner } 178519393e10SPhilipp Reisner sema_init(&tconn->data.work.s, 0); 1786b411b363SPhilipp Reisner /* DANGEROUS race: if someone did queue his work within the spinlock, 1787b411b363SPhilipp Reisner * but up() ed outside the spinlock, we could get an up() on the 1788b411b363SPhilipp Reisner * semaphore without corresponding list entry. 1789b411b363SPhilipp Reisner * So don't do that. 1790b411b363SPhilipp Reisner */ 179119393e10SPhilipp Reisner spin_unlock_irq(&tconn->data.work.q_lock); 1792b411b363SPhilipp Reisner 1793c141ebdaSPhilipp Reisner rcu_read_lock(); 1794f399002eSLars Ellenberg idr_for_each_entry(&tconn->volumes, mdev, vnr) { 17950e29d163SPhilipp Reisner D_ASSERT(mdev->state.disk == D_DISKLESS && mdev->state.conn == C_STANDALONE); 1796c141ebdaSPhilipp Reisner kref_get(&mdev->kref); 1797c141ebdaSPhilipp Reisner rcu_read_unlock(); 17980e29d163SPhilipp Reisner drbd_mdev_cleanup(mdev); 1799c141ebdaSPhilipp Reisner kref_put(&mdev->kref, &drbd_minor_destroy); 1800c141ebdaSPhilipp Reisner rcu_read_lock(); 18010e29d163SPhilipp Reisner } 1802c141ebdaSPhilipp Reisner rcu_read_unlock(); 1803b411b363SPhilipp Reisner 1804b411b363SPhilipp Reisner return 0; 1805b411b363SPhilipp Reisner } 1806