1 /* 2 * copy-before-write filter driver 3 * 4 * The driver performs Copy-Before-Write (CBW) operation: it is injected above 5 * some node, and before each write it copies _old_ data to the target node. 6 * 7 * Copyright (c) 2018-2021 Virtuozzo International GmbH. 8 * 9 * Author: 10 * Sementsov-Ogievskiy Vladimir <vsementsov@virtuozzo.com> 11 * 12 * This program is free software; you can redistribute it and/or modify 13 * it under the terms of the GNU General Public License as published by 14 * the Free Software Foundation; either version 2 of the License, or 15 * (at your option) any later version. 16 * 17 * This program is distributed in the hope that it will be useful, 18 * but WITHOUT ANY WARRANTY; without even the implied warranty of 19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 20 * GNU General Public License for more details. 21 * 22 * You should have received a copy of the GNU General Public License 23 * along with this program. If not, see <http://www.gnu.org/licenses/>. 24 */ 25 26 #include "qemu/osdep.h" 27 28 #include "sysemu/block-backend.h" 29 #include "qemu/cutils.h" 30 #include "qapi/error.h" 31 #include "block/block_int.h" 32 #include "block/qdict.h" 33 #include "block/block-copy.h" 34 35 #include "block/copy-before-write.h" 36 37 typedef struct BDRVCopyBeforeWriteState { 38 BlockCopyState *bcs; 39 BdrvChild *target; 40 int64_t cluster_size; 41 } BDRVCopyBeforeWriteState; 42 43 static coroutine_fn int cbw_co_preadv( 44 BlockDriverState *bs, uint64_t offset, uint64_t bytes, 45 QEMUIOVector *qiov, int flags) 46 { 47 return bdrv_co_preadv(bs->backing, offset, bytes, qiov, flags); 48 } 49 50 static coroutine_fn int cbw_do_copy_before_write(BlockDriverState *bs, 51 uint64_t offset, uint64_t bytes, BdrvRequestFlags flags) 52 { 53 BDRVCopyBeforeWriteState *s = bs->opaque; 54 uint64_t off, end; 55 56 if (flags & BDRV_REQ_WRITE_UNCHANGED) { 57 return 0; 58 } 59 60 off = QEMU_ALIGN_DOWN(offset, s->cluster_size); 61 end = QEMU_ALIGN_UP(offset + bytes, s->cluster_size); 62 63 return block_copy(s->bcs, off, end - off, true); 64 } 65 66 static int coroutine_fn cbw_co_pdiscard(BlockDriverState *bs, 67 int64_t offset, int bytes) 68 { 69 int ret = cbw_do_copy_before_write(bs, offset, bytes, 0); 70 if (ret < 0) { 71 return ret; 72 } 73 74 return bdrv_co_pdiscard(bs->backing, offset, bytes); 75 } 76 77 static int coroutine_fn cbw_co_pwrite_zeroes(BlockDriverState *bs, 78 int64_t offset, int bytes, BdrvRequestFlags flags) 79 { 80 int ret = cbw_do_copy_before_write(bs, offset, bytes, flags); 81 if (ret < 0) { 82 return ret; 83 } 84 85 return bdrv_co_pwrite_zeroes(bs->backing, offset, bytes, flags); 86 } 87 88 static coroutine_fn int cbw_co_pwritev(BlockDriverState *bs, 89 uint64_t offset, 90 uint64_t bytes, 91 QEMUIOVector *qiov, int flags) 92 { 93 int ret = cbw_do_copy_before_write(bs, offset, bytes, flags); 94 if (ret < 0) { 95 return ret; 96 } 97 98 return bdrv_co_pwritev(bs->backing, offset, bytes, qiov, flags); 99 } 100 101 static int coroutine_fn cbw_co_flush(BlockDriverState *bs) 102 { 103 if (!bs->backing) { 104 return 0; 105 } 106 107 return bdrv_co_flush(bs->backing->bs); 108 } 109 110 static void cbw_refresh_filename(BlockDriverState *bs) 111 { 112 if (bs->backing == NULL) { 113 /* 114 * we can be here after failed bdrv_attach_child in 115 * bdrv_set_backing_hd 116 */ 117 return; 118 } 119 pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), 120 bs->backing->bs->filename); 121 } 122 123 static void cbw_child_perm(BlockDriverState *bs, BdrvChild *c, 124 BdrvChildRole role, 125 BlockReopenQueue *reopen_queue, 126 uint64_t perm, uint64_t shared, 127 uint64_t *nperm, uint64_t *nshared) 128 { 129 if (!(role & BDRV_CHILD_FILTERED)) { 130 /* 131 * Target child 132 * 133 * Share write to target (child_file), to not interfere 134 * with guest writes to its disk which may be in target backing chain. 135 * Can't resize during a backup block job because we check the size 136 * only upfront. 137 */ 138 *nshared = BLK_PERM_ALL & ~BLK_PERM_RESIZE; 139 *nperm = BLK_PERM_WRITE; 140 } else { 141 /* Source child */ 142 bdrv_default_perms(bs, c, role, reopen_queue, 143 perm, shared, nperm, nshared); 144 145 if (perm & BLK_PERM_WRITE) { 146 *nperm = *nperm | BLK_PERM_CONSISTENT_READ; 147 } 148 *nshared &= ~(BLK_PERM_WRITE | BLK_PERM_RESIZE); 149 } 150 } 151 152 BlockDriver bdrv_cbw_filter = { 153 .format_name = "copy-before-write", 154 .instance_size = sizeof(BDRVCopyBeforeWriteState), 155 156 .bdrv_co_preadv = cbw_co_preadv, 157 .bdrv_co_pwritev = cbw_co_pwritev, 158 .bdrv_co_pwrite_zeroes = cbw_co_pwrite_zeroes, 159 .bdrv_co_pdiscard = cbw_co_pdiscard, 160 .bdrv_co_flush = cbw_co_flush, 161 162 .bdrv_refresh_filename = cbw_refresh_filename, 163 164 .bdrv_child_perm = cbw_child_perm, 165 166 .is_filter = true, 167 }; 168 169 BlockDriverState *bdrv_cbw_append(BlockDriverState *source, 170 BlockDriverState *target, 171 const char *filter_node_name, 172 uint64_t cluster_size, 173 BackupPerf *perf, 174 bool compress, 175 BlockCopyState **bcs, 176 Error **errp) 177 { 178 ERRP_GUARD(); 179 int ret; 180 BDRVCopyBeforeWriteState *state; 181 BlockDriverState *top; 182 bool appended = false; 183 184 assert(source->total_sectors == target->total_sectors); 185 186 top = bdrv_new_open_driver(&bdrv_cbw_filter, filter_node_name, 187 BDRV_O_RDWR, errp); 188 if (!top) { 189 return NULL; 190 } 191 192 state = top->opaque; 193 top->total_sectors = source->total_sectors; 194 top->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED | 195 (BDRV_REQ_FUA & source->supported_write_flags); 196 top->supported_zero_flags = BDRV_REQ_WRITE_UNCHANGED | 197 ((BDRV_REQ_FUA | BDRV_REQ_MAY_UNMAP | BDRV_REQ_NO_FALLBACK) & 198 source->supported_zero_flags); 199 200 bdrv_ref(target); 201 state->target = bdrv_attach_child(top, target, "target", &child_of_bds, 202 BDRV_CHILD_DATA, errp); 203 if (!state->target) { 204 bdrv_unref(target); 205 bdrv_unref(top); 206 return NULL; 207 } 208 209 bdrv_drained_begin(source); 210 211 ret = bdrv_append(top, source, errp); 212 if (ret < 0) { 213 error_prepend(errp, "Cannot append copy-before-write filter: "); 214 goto fail; 215 } 216 appended = true; 217 218 state->cluster_size = cluster_size; 219 state->bcs = block_copy_state_new(top->backing, state->target, 220 cluster_size, perf->use_copy_range, 221 compress, errp); 222 if (!state->bcs) { 223 error_prepend(errp, "Cannot create block-copy-state: "); 224 goto fail; 225 } 226 *bcs = state->bcs; 227 228 bdrv_drained_end(source); 229 230 return top; 231 232 fail: 233 if (appended) { 234 bdrv_cbw_drop(top); 235 } else { 236 bdrv_unref(top); 237 } 238 239 bdrv_drained_end(source); 240 241 return NULL; 242 } 243 244 void bdrv_cbw_drop(BlockDriverState *bs) 245 { 246 BDRVCopyBeforeWriteState *s = bs->opaque; 247 248 bdrv_drop_filter(bs, &error_abort); 249 250 block_copy_state_free(s->bcs); 251 252 bdrv_unref(bs); 253 } 254