1d003e0aeSVladimir Sementsov-Ogievskiy /* 2d003e0aeSVladimir Sementsov-Ogievskiy * copy-before-write filter driver 3d003e0aeSVladimir Sementsov-Ogievskiy * 4d003e0aeSVladimir Sementsov-Ogievskiy * The driver performs Copy-Before-Write (CBW) operation: it is injected above 5d003e0aeSVladimir Sementsov-Ogievskiy * some node, and before each write it copies _old_ data to the target node. 6d003e0aeSVladimir Sementsov-Ogievskiy * 7d003e0aeSVladimir Sementsov-Ogievskiy * Copyright (c) 2018-2021 Virtuozzo International GmbH. 8d003e0aeSVladimir Sementsov-Ogievskiy * 9d003e0aeSVladimir Sementsov-Ogievskiy * Author: 10d003e0aeSVladimir Sementsov-Ogievskiy * Sementsov-Ogievskiy Vladimir <vsementsov@virtuozzo.com> 11d003e0aeSVladimir Sementsov-Ogievskiy * 12d003e0aeSVladimir Sementsov-Ogievskiy * This program is free software; you can redistribute it and/or modify 13d003e0aeSVladimir Sementsov-Ogievskiy * it under the terms of the GNU General Public License as published by 14d003e0aeSVladimir Sementsov-Ogievskiy * the Free Software Foundation; either version 2 of the License, or 15d003e0aeSVladimir Sementsov-Ogievskiy * (at your option) any later version. 16d003e0aeSVladimir Sementsov-Ogievskiy * 17d003e0aeSVladimir Sementsov-Ogievskiy * This program is distributed in the hope that it will be useful, 18d003e0aeSVladimir Sementsov-Ogievskiy * but WITHOUT ANY WARRANTY; without even the implied warranty of 19d003e0aeSVladimir Sementsov-Ogievskiy * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 20d003e0aeSVladimir Sementsov-Ogievskiy * GNU General Public License for more details. 21d003e0aeSVladimir Sementsov-Ogievskiy * 22d003e0aeSVladimir Sementsov-Ogievskiy * You should have received a copy of the GNU General Public License 23d003e0aeSVladimir Sementsov-Ogievskiy * along with this program. If not, see <http://www.gnu.org/licenses/>. 24d003e0aeSVladimir Sementsov-Ogievskiy */ 25d003e0aeSVladimir Sementsov-Ogievskiy 26d003e0aeSVladimir Sementsov-Ogievskiy #include "qemu/osdep.h" 27d003e0aeSVladimir Sementsov-Ogievskiy 28d003e0aeSVladimir Sementsov-Ogievskiy #include "sysemu/block-backend.h" 29d003e0aeSVladimir Sementsov-Ogievskiy #include "qemu/cutils.h" 30d003e0aeSVladimir Sementsov-Ogievskiy #include "qapi/error.h" 31d003e0aeSVladimir Sementsov-Ogievskiy #include "block/block_int.h" 32d003e0aeSVladimir Sementsov-Ogievskiy #include "block/qdict.h" 33d003e0aeSVladimir Sementsov-Ogievskiy #include "block/block-copy.h" 34d003e0aeSVladimir Sementsov-Ogievskiy 35d003e0aeSVladimir Sementsov-Ogievskiy #include "block/copy-before-write.h" 36d003e0aeSVladimir Sementsov-Ogievskiy 37d003e0aeSVladimir Sementsov-Ogievskiy typedef struct BDRVCopyBeforeWriteState { 38d003e0aeSVladimir Sementsov-Ogievskiy BlockCopyState *bcs; 39d003e0aeSVladimir Sementsov-Ogievskiy BdrvChild *target; 40d003e0aeSVladimir Sementsov-Ogievskiy } BDRVCopyBeforeWriteState; 41d003e0aeSVladimir Sementsov-Ogievskiy 42d003e0aeSVladimir Sementsov-Ogievskiy static coroutine_fn int cbw_co_preadv( 43f7ef38ddSVladimir Sementsov-Ogievskiy BlockDriverState *bs, int64_t offset, int64_t bytes, 44f7ef38ddSVladimir Sementsov-Ogievskiy QEMUIOVector *qiov, BdrvRequestFlags flags) 45d003e0aeSVladimir Sementsov-Ogievskiy { 463c1e6327SVladimir Sementsov-Ogievskiy return bdrv_co_preadv(bs->file, offset, bytes, qiov, flags); 47d003e0aeSVladimir Sementsov-Ogievskiy } 48d003e0aeSVladimir Sementsov-Ogievskiy 49d003e0aeSVladimir Sementsov-Ogievskiy static coroutine_fn int cbw_do_copy_before_write(BlockDriverState *bs, 50d003e0aeSVladimir Sementsov-Ogievskiy uint64_t offset, uint64_t bytes, BdrvRequestFlags flags) 51d003e0aeSVladimir Sementsov-Ogievskiy { 52d003e0aeSVladimir Sementsov-Ogievskiy BDRVCopyBeforeWriteState *s = bs->opaque; 53d003e0aeSVladimir Sementsov-Ogievskiy uint64_t off, end; 54b518e9e9SVladimir Sementsov-Ogievskiy int64_t cluster_size = block_copy_cluster_size(s->bcs); 55d003e0aeSVladimir Sementsov-Ogievskiy 56d003e0aeSVladimir Sementsov-Ogievskiy if (flags & BDRV_REQ_WRITE_UNCHANGED) { 57d003e0aeSVladimir Sementsov-Ogievskiy return 0; 58d003e0aeSVladimir Sementsov-Ogievskiy } 59d003e0aeSVladimir Sementsov-Ogievskiy 60b518e9e9SVladimir Sementsov-Ogievskiy off = QEMU_ALIGN_DOWN(offset, cluster_size); 61b518e9e9SVladimir Sementsov-Ogievskiy end = QEMU_ALIGN_UP(offset + bytes, cluster_size); 62d003e0aeSVladimir Sementsov-Ogievskiy 63d003e0aeSVladimir Sementsov-Ogievskiy return block_copy(s->bcs, off, end - off, true); 64d003e0aeSVladimir Sementsov-Ogievskiy } 65d003e0aeSVladimir Sementsov-Ogievskiy 66d003e0aeSVladimir Sementsov-Ogievskiy static int coroutine_fn cbw_co_pdiscard(BlockDriverState *bs, 670c802287SVladimir Sementsov-Ogievskiy int64_t offset, int64_t bytes) 68d003e0aeSVladimir Sementsov-Ogievskiy { 69d003e0aeSVladimir Sementsov-Ogievskiy int ret = cbw_do_copy_before_write(bs, offset, bytes, 0); 70d003e0aeSVladimir Sementsov-Ogievskiy if (ret < 0) { 71d003e0aeSVladimir Sementsov-Ogievskiy return ret; 72d003e0aeSVladimir Sementsov-Ogievskiy } 73d003e0aeSVladimir Sementsov-Ogievskiy 743c1e6327SVladimir Sementsov-Ogievskiy return bdrv_co_pdiscard(bs->file, offset, bytes); 75d003e0aeSVladimir Sementsov-Ogievskiy } 76d003e0aeSVladimir Sementsov-Ogievskiy 77d003e0aeSVladimir Sementsov-Ogievskiy static int coroutine_fn cbw_co_pwrite_zeroes(BlockDriverState *bs, 78f34b2bcfSVladimir Sementsov-Ogievskiy int64_t offset, int64_t bytes, BdrvRequestFlags flags) 79d003e0aeSVladimir Sementsov-Ogievskiy { 80d003e0aeSVladimir Sementsov-Ogievskiy int ret = cbw_do_copy_before_write(bs, offset, bytes, flags); 81d003e0aeSVladimir Sementsov-Ogievskiy if (ret < 0) { 82d003e0aeSVladimir Sementsov-Ogievskiy return ret; 83d003e0aeSVladimir Sementsov-Ogievskiy } 84d003e0aeSVladimir Sementsov-Ogievskiy 853c1e6327SVladimir Sementsov-Ogievskiy return bdrv_co_pwrite_zeroes(bs->file, offset, bytes, flags); 86d003e0aeSVladimir Sementsov-Ogievskiy } 87d003e0aeSVladimir Sementsov-Ogievskiy 88d003e0aeSVladimir Sementsov-Ogievskiy static coroutine_fn int cbw_co_pwritev(BlockDriverState *bs, 89e75abedaSVladimir Sementsov-Ogievskiy int64_t offset, 90e75abedaSVladimir Sementsov-Ogievskiy int64_t bytes, 91e75abedaSVladimir Sementsov-Ogievskiy QEMUIOVector *qiov, 92e75abedaSVladimir Sementsov-Ogievskiy BdrvRequestFlags flags) 93d003e0aeSVladimir Sementsov-Ogievskiy { 94d003e0aeSVladimir Sementsov-Ogievskiy int ret = cbw_do_copy_before_write(bs, offset, bytes, flags); 95d003e0aeSVladimir Sementsov-Ogievskiy if (ret < 0) { 96d003e0aeSVladimir Sementsov-Ogievskiy return ret; 97d003e0aeSVladimir Sementsov-Ogievskiy } 98d003e0aeSVladimir Sementsov-Ogievskiy 993c1e6327SVladimir Sementsov-Ogievskiy return bdrv_co_pwritev(bs->file, offset, bytes, qiov, flags); 100d003e0aeSVladimir Sementsov-Ogievskiy } 101d003e0aeSVladimir Sementsov-Ogievskiy 102d003e0aeSVladimir Sementsov-Ogievskiy static int coroutine_fn cbw_co_flush(BlockDriverState *bs) 103d003e0aeSVladimir Sementsov-Ogievskiy { 1043c1e6327SVladimir Sementsov-Ogievskiy if (!bs->file) { 105d003e0aeSVladimir Sementsov-Ogievskiy return 0; 106d003e0aeSVladimir Sementsov-Ogievskiy } 107d003e0aeSVladimir Sementsov-Ogievskiy 1083c1e6327SVladimir Sementsov-Ogievskiy return bdrv_co_flush(bs->file->bs); 109d003e0aeSVladimir Sementsov-Ogievskiy } 110d003e0aeSVladimir Sementsov-Ogievskiy 111d003e0aeSVladimir Sementsov-Ogievskiy static void cbw_refresh_filename(BlockDriverState *bs) 112d003e0aeSVladimir Sementsov-Ogievskiy { 113d003e0aeSVladimir Sementsov-Ogievskiy pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), 1143c1e6327SVladimir Sementsov-Ogievskiy bs->file->bs->filename); 115d003e0aeSVladimir Sementsov-Ogievskiy } 116d003e0aeSVladimir Sementsov-Ogievskiy 117d003e0aeSVladimir Sementsov-Ogievskiy static void cbw_child_perm(BlockDriverState *bs, BdrvChild *c, 118d003e0aeSVladimir Sementsov-Ogievskiy BdrvChildRole role, 119d003e0aeSVladimir Sementsov-Ogievskiy BlockReopenQueue *reopen_queue, 120d003e0aeSVladimir Sementsov-Ogievskiy uint64_t perm, uint64_t shared, 121d003e0aeSVladimir Sementsov-Ogievskiy uint64_t *nperm, uint64_t *nshared) 122d003e0aeSVladimir Sementsov-Ogievskiy { 123d003e0aeSVladimir Sementsov-Ogievskiy if (!(role & BDRV_CHILD_FILTERED)) { 124d003e0aeSVladimir Sementsov-Ogievskiy /* 125d003e0aeSVladimir Sementsov-Ogievskiy * Target child 126d003e0aeSVladimir Sementsov-Ogievskiy * 127d003e0aeSVladimir Sementsov-Ogievskiy * Share write to target (child_file), to not interfere 128d003e0aeSVladimir Sementsov-Ogievskiy * with guest writes to its disk which may be in target backing chain. 129d003e0aeSVladimir Sementsov-Ogievskiy * Can't resize during a backup block job because we check the size 130d003e0aeSVladimir Sementsov-Ogievskiy * only upfront. 131d003e0aeSVladimir Sementsov-Ogievskiy */ 132d003e0aeSVladimir Sementsov-Ogievskiy *nshared = BLK_PERM_ALL & ~BLK_PERM_RESIZE; 133d003e0aeSVladimir Sementsov-Ogievskiy *nperm = BLK_PERM_WRITE; 134d003e0aeSVladimir Sementsov-Ogievskiy } else { 135d003e0aeSVladimir Sementsov-Ogievskiy /* Source child */ 136d003e0aeSVladimir Sementsov-Ogievskiy bdrv_default_perms(bs, c, role, reopen_queue, 137d003e0aeSVladimir Sementsov-Ogievskiy perm, shared, nperm, nshared); 138d003e0aeSVladimir Sementsov-Ogievskiy 1393860c020SVladimir Sementsov-Ogievskiy if (!QLIST_EMPTY(&bs->parents)) { 140d003e0aeSVladimir Sementsov-Ogievskiy if (perm & BLK_PERM_WRITE) { 141d003e0aeSVladimir Sementsov-Ogievskiy *nperm = *nperm | BLK_PERM_CONSISTENT_READ; 142d003e0aeSVladimir Sementsov-Ogievskiy } 143d003e0aeSVladimir Sementsov-Ogievskiy *nshared &= ~(BLK_PERM_WRITE | BLK_PERM_RESIZE); 144d003e0aeSVladimir Sementsov-Ogievskiy } 145d003e0aeSVladimir Sementsov-Ogievskiy } 1463860c020SVladimir Sementsov-Ogievskiy } 147d003e0aeSVladimir Sementsov-Ogievskiy 148751cec7aSVladimir Sementsov-Ogievskiy static int cbw_open(BlockDriverState *bs, QDict *options, int flags, 149751cec7aSVladimir Sementsov-Ogievskiy Error **errp) 1501f0cacb9SVladimir Sementsov-Ogievskiy { 151fe7ea40cSVladimir Sementsov-Ogievskiy BDRVCopyBeforeWriteState *s = bs->opaque; 15206e0a9c1SVladimir Sementsov-Ogievskiy BdrvDirtyBitmap *copy_bitmap; 1531f0cacb9SVladimir Sementsov-Ogievskiy 154f44fd739SVladimir Sementsov-Ogievskiy bs->file = bdrv_open_child(NULL, options, "file", bs, &child_of_bds, 155f44fd739SVladimir Sementsov-Ogievskiy BDRV_CHILD_FILTERED | BDRV_CHILD_PRIMARY, 156f44fd739SVladimir Sementsov-Ogievskiy false, errp); 157f44fd739SVladimir Sementsov-Ogievskiy if (!bs->file) { 1581f0cacb9SVladimir Sementsov-Ogievskiy return -EINVAL; 1591f0cacb9SVladimir Sementsov-Ogievskiy } 1601f0cacb9SVladimir Sementsov-Ogievskiy 161f44fd739SVladimir Sementsov-Ogievskiy s->target = bdrv_open_child(NULL, options, "target", bs, &child_of_bds, 162f44fd739SVladimir Sementsov-Ogievskiy BDRV_CHILD_DATA, false, errp); 163f44fd739SVladimir Sementsov-Ogievskiy if (!s->target) { 1641f0cacb9SVladimir Sementsov-Ogievskiy return -EINVAL; 1651f0cacb9SVladimir Sementsov-Ogievskiy } 1661f0cacb9SVladimir Sementsov-Ogievskiy 1675a507426SVladimir Sementsov-Ogievskiy bs->total_sectors = bs->file->bs->total_sectors; 1685a507426SVladimir Sementsov-Ogievskiy bs->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED | 1695a507426SVladimir Sementsov-Ogievskiy (BDRV_REQ_FUA & bs->file->bs->supported_write_flags); 1705a507426SVladimir Sementsov-Ogievskiy bs->supported_zero_flags = BDRV_REQ_WRITE_UNCHANGED | 1715a507426SVladimir Sementsov-Ogievskiy ((BDRV_REQ_FUA | BDRV_REQ_MAY_UNMAP | BDRV_REQ_NO_FALLBACK) & 1725a507426SVladimir Sementsov-Ogievskiy bs->file->bs->supported_zero_flags); 1735a507426SVladimir Sementsov-Ogievskiy 174abde8ac2SVladimir Sementsov-Ogievskiy s->bcs = block_copy_state_new(bs->file, s->target, errp); 175fe7ea40cSVladimir Sementsov-Ogievskiy if (!s->bcs) { 1761f0cacb9SVladimir Sementsov-Ogievskiy error_prepend(errp, "Cannot create block-copy-state: "); 1771f0cacb9SVladimir Sementsov-Ogievskiy return -EINVAL; 1781f0cacb9SVladimir Sementsov-Ogievskiy } 1791f0cacb9SVladimir Sementsov-Ogievskiy 18006e0a9c1SVladimir Sementsov-Ogievskiy copy_bitmap = block_copy_dirty_bitmap(s->bcs); 18106e0a9c1SVladimir Sementsov-Ogievskiy bdrv_set_dirty_bitmap(copy_bitmap, 0, bdrv_dirty_bitmap_size(copy_bitmap)); 18206e0a9c1SVladimir Sementsov-Ogievskiy 1831f0cacb9SVladimir Sementsov-Ogievskiy return 0; 1841f0cacb9SVladimir Sementsov-Ogievskiy } 1851f0cacb9SVladimir Sementsov-Ogievskiy 186751cec7aSVladimir Sementsov-Ogievskiy static void cbw_close(BlockDriverState *bs) 187751cec7aSVladimir Sementsov-Ogievskiy { 188751cec7aSVladimir Sementsov-Ogievskiy BDRVCopyBeforeWriteState *s = bs->opaque; 189751cec7aSVladimir Sementsov-Ogievskiy 190751cec7aSVladimir Sementsov-Ogievskiy block_copy_state_free(s->bcs); 191751cec7aSVladimir Sementsov-Ogievskiy s->bcs = NULL; 192751cec7aSVladimir Sementsov-Ogievskiy } 193751cec7aSVladimir Sementsov-Ogievskiy 194d003e0aeSVladimir Sementsov-Ogievskiy BlockDriver bdrv_cbw_filter = { 195d003e0aeSVladimir Sementsov-Ogievskiy .format_name = "copy-before-write", 196d003e0aeSVladimir Sementsov-Ogievskiy .instance_size = sizeof(BDRVCopyBeforeWriteState), 197d003e0aeSVladimir Sementsov-Ogievskiy 198751cec7aSVladimir Sementsov-Ogievskiy .bdrv_open = cbw_open, 199751cec7aSVladimir Sementsov-Ogievskiy .bdrv_close = cbw_close, 200751cec7aSVladimir Sementsov-Ogievskiy 201d003e0aeSVladimir Sementsov-Ogievskiy .bdrv_co_preadv = cbw_co_preadv, 202d003e0aeSVladimir Sementsov-Ogievskiy .bdrv_co_pwritev = cbw_co_pwritev, 203d003e0aeSVladimir Sementsov-Ogievskiy .bdrv_co_pwrite_zeroes = cbw_co_pwrite_zeroes, 204d003e0aeSVladimir Sementsov-Ogievskiy .bdrv_co_pdiscard = cbw_co_pdiscard, 205d003e0aeSVladimir Sementsov-Ogievskiy .bdrv_co_flush = cbw_co_flush, 206d003e0aeSVladimir Sementsov-Ogievskiy 207d003e0aeSVladimir Sementsov-Ogievskiy .bdrv_refresh_filename = cbw_refresh_filename, 208d003e0aeSVladimir Sementsov-Ogievskiy 209d003e0aeSVladimir Sementsov-Ogievskiy .bdrv_child_perm = cbw_child_perm, 210d003e0aeSVladimir Sementsov-Ogievskiy 211d003e0aeSVladimir Sementsov-Ogievskiy .is_filter = true, 212d003e0aeSVladimir Sementsov-Ogievskiy }; 213d003e0aeSVladimir Sementsov-Ogievskiy 214d003e0aeSVladimir Sementsov-Ogievskiy BlockDriverState *bdrv_cbw_append(BlockDriverState *source, 215d003e0aeSVladimir Sementsov-Ogievskiy BlockDriverState *target, 216d003e0aeSVladimir Sementsov-Ogievskiy const char *filter_node_name, 217d003e0aeSVladimir Sementsov-Ogievskiy BlockCopyState **bcs, 218d003e0aeSVladimir Sementsov-Ogievskiy Error **errp) 219d003e0aeSVladimir Sementsov-Ogievskiy { 220d003e0aeSVladimir Sementsov-Ogievskiy ERRP_GUARD(); 221d003e0aeSVladimir Sementsov-Ogievskiy BDRVCopyBeforeWriteState *state; 222d003e0aeSVladimir Sementsov-Ogievskiy BlockDriverState *top; 223f44fd739SVladimir Sementsov-Ogievskiy QDict *opts; 224d003e0aeSVladimir Sementsov-Ogievskiy 225d003e0aeSVladimir Sementsov-Ogievskiy assert(source->total_sectors == target->total_sectors); 226*377cc15bSEmanuele Giuseppe Esposito GLOBAL_STATE_CODE(); 227d003e0aeSVladimir Sementsov-Ogievskiy 228f44fd739SVladimir Sementsov-Ogievskiy opts = qdict_new(); 229751cec7aSVladimir Sementsov-Ogievskiy qdict_put_str(opts, "driver", "copy-before-write"); 230751cec7aSVladimir Sementsov-Ogievskiy if (filter_node_name) { 231751cec7aSVladimir Sementsov-Ogievskiy qdict_put_str(opts, "node-name", filter_node_name); 232751cec7aSVladimir Sementsov-Ogievskiy } 233f44fd739SVladimir Sementsov-Ogievskiy qdict_put_str(opts, "file", bdrv_get_node_name(source)); 234f44fd739SVladimir Sementsov-Ogievskiy qdict_put_str(opts, "target", bdrv_get_node_name(target)); 235f44fd739SVladimir Sementsov-Ogievskiy 236751cec7aSVladimir Sementsov-Ogievskiy top = bdrv_insert_node(source, opts, BDRV_O_RDWR, errp); 237751cec7aSVladimir Sementsov-Ogievskiy if (!top) { 238751cec7aSVladimir Sementsov-Ogievskiy return NULL; 239d003e0aeSVladimir Sementsov-Ogievskiy } 240d003e0aeSVladimir Sementsov-Ogievskiy 241751cec7aSVladimir Sementsov-Ogievskiy state = top->opaque; 2427ddbce2dSVladimir Sementsov-Ogievskiy *bcs = state->bcs; 243d003e0aeSVladimir Sementsov-Ogievskiy 244d003e0aeSVladimir Sementsov-Ogievskiy return top; 245d003e0aeSVladimir Sementsov-Ogievskiy } 246d003e0aeSVladimir Sementsov-Ogievskiy 247d003e0aeSVladimir Sementsov-Ogievskiy void bdrv_cbw_drop(BlockDriverState *bs) 248d003e0aeSVladimir Sementsov-Ogievskiy { 249*377cc15bSEmanuele Giuseppe Esposito GLOBAL_STATE_CODE(); 250d003e0aeSVladimir Sementsov-Ogievskiy bdrv_drop_filter(bs, &error_abort); 251d003e0aeSVladimir Sementsov-Ogievskiy bdrv_unref(bs); 252d003e0aeSVladimir Sementsov-Ogievskiy } 253751cec7aSVladimir Sementsov-Ogievskiy 254751cec7aSVladimir Sementsov-Ogievskiy static void cbw_init(void) 255751cec7aSVladimir Sementsov-Ogievskiy { 256751cec7aSVladimir Sementsov-Ogievskiy bdrv_register(&bdrv_cbw_filter); 257751cec7aSVladimir Sementsov-Ogievskiy } 258751cec7aSVladimir Sementsov-Ogievskiy 259751cec7aSVladimir Sementsov-Ogievskiy block_init(cbw_init); 260