xref: /openbmc/qemu/block/copy-before-write.c (revision 377cc15bf1994a176162a5f705ff32a38aa55e2c)
/*
 * copy-before-write filter driver
 *
 * The driver performs Copy-Before-Write (CBW) operation: it is injected above
 * some node, and before each write it copies _old_ data to the target node.
 *
 * Copyright (c) 2018-2021 Virtuozzo International GmbH.
 *
 * Author:
 *  Sementsov-Ogievskiy Vladimir <vsementsov@virtuozzo.com>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
25d003e0aeSVladimir Sementsov-Ogievskiy 
26d003e0aeSVladimir Sementsov-Ogievskiy #include "qemu/osdep.h"
27d003e0aeSVladimir Sementsov-Ogievskiy 
28d003e0aeSVladimir Sementsov-Ogievskiy #include "sysemu/block-backend.h"
29d003e0aeSVladimir Sementsov-Ogievskiy #include "qemu/cutils.h"
30d003e0aeSVladimir Sementsov-Ogievskiy #include "qapi/error.h"
31d003e0aeSVladimir Sementsov-Ogievskiy #include "block/block_int.h"
32d003e0aeSVladimir Sementsov-Ogievskiy #include "block/qdict.h"
33d003e0aeSVladimir Sementsov-Ogievskiy #include "block/block-copy.h"
34d003e0aeSVladimir Sementsov-Ogievskiy 
35d003e0aeSVladimir Sementsov-Ogievskiy #include "block/copy-before-write.h"
36d003e0aeSVladimir Sementsov-Ogievskiy 
37d003e0aeSVladimir Sementsov-Ogievskiy typedef struct BDRVCopyBeforeWriteState {
38d003e0aeSVladimir Sementsov-Ogievskiy     BlockCopyState *bcs;
39d003e0aeSVladimir Sementsov-Ogievskiy     BdrvChild *target;
40d003e0aeSVladimir Sementsov-Ogievskiy } BDRVCopyBeforeWriteState;
41d003e0aeSVladimir Sementsov-Ogievskiy 
42d003e0aeSVladimir Sementsov-Ogievskiy static coroutine_fn int cbw_co_preadv(
43f7ef38ddSVladimir Sementsov-Ogievskiy         BlockDriverState *bs, int64_t offset, int64_t bytes,
44f7ef38ddSVladimir Sementsov-Ogievskiy         QEMUIOVector *qiov, BdrvRequestFlags flags)
45d003e0aeSVladimir Sementsov-Ogievskiy {
463c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_preadv(bs->file, offset, bytes, qiov, flags);
47d003e0aeSVladimir Sementsov-Ogievskiy }
48d003e0aeSVladimir Sementsov-Ogievskiy 
49d003e0aeSVladimir Sementsov-Ogievskiy static coroutine_fn int cbw_do_copy_before_write(BlockDriverState *bs,
50d003e0aeSVladimir Sementsov-Ogievskiy         uint64_t offset, uint64_t bytes, BdrvRequestFlags flags)
51d003e0aeSVladimir Sementsov-Ogievskiy {
52d003e0aeSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
53d003e0aeSVladimir Sementsov-Ogievskiy     uint64_t off, end;
54b518e9e9SVladimir Sementsov-Ogievskiy     int64_t cluster_size = block_copy_cluster_size(s->bcs);
55d003e0aeSVladimir Sementsov-Ogievskiy 
56d003e0aeSVladimir Sementsov-Ogievskiy     if (flags & BDRV_REQ_WRITE_UNCHANGED) {
57d003e0aeSVladimir Sementsov-Ogievskiy         return 0;
58d003e0aeSVladimir Sementsov-Ogievskiy     }
59d003e0aeSVladimir Sementsov-Ogievskiy 
60b518e9e9SVladimir Sementsov-Ogievskiy     off = QEMU_ALIGN_DOWN(offset, cluster_size);
61b518e9e9SVladimir Sementsov-Ogievskiy     end = QEMU_ALIGN_UP(offset + bytes, cluster_size);
62d003e0aeSVladimir Sementsov-Ogievskiy 
63d003e0aeSVladimir Sementsov-Ogievskiy     return block_copy(s->bcs, off, end - off, true);
64d003e0aeSVladimir Sementsov-Ogievskiy }
65d003e0aeSVladimir Sementsov-Ogievskiy 
66d003e0aeSVladimir Sementsov-Ogievskiy static int coroutine_fn cbw_co_pdiscard(BlockDriverState *bs,
670c802287SVladimir Sementsov-Ogievskiy                                         int64_t offset, int64_t bytes)
68d003e0aeSVladimir Sementsov-Ogievskiy {
69d003e0aeSVladimir Sementsov-Ogievskiy     int ret = cbw_do_copy_before_write(bs, offset, bytes, 0);
70d003e0aeSVladimir Sementsov-Ogievskiy     if (ret < 0) {
71d003e0aeSVladimir Sementsov-Ogievskiy         return ret;
72d003e0aeSVladimir Sementsov-Ogievskiy     }
73d003e0aeSVladimir Sementsov-Ogievskiy 
743c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_pdiscard(bs->file, offset, bytes);
75d003e0aeSVladimir Sementsov-Ogievskiy }
76d003e0aeSVladimir Sementsov-Ogievskiy 
77d003e0aeSVladimir Sementsov-Ogievskiy static int coroutine_fn cbw_co_pwrite_zeroes(BlockDriverState *bs,
78f34b2bcfSVladimir Sementsov-Ogievskiy         int64_t offset, int64_t bytes, BdrvRequestFlags flags)
79d003e0aeSVladimir Sementsov-Ogievskiy {
80d003e0aeSVladimir Sementsov-Ogievskiy     int ret = cbw_do_copy_before_write(bs, offset, bytes, flags);
81d003e0aeSVladimir Sementsov-Ogievskiy     if (ret < 0) {
82d003e0aeSVladimir Sementsov-Ogievskiy         return ret;
83d003e0aeSVladimir Sementsov-Ogievskiy     }
84d003e0aeSVladimir Sementsov-Ogievskiy 
853c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_pwrite_zeroes(bs->file, offset, bytes, flags);
86d003e0aeSVladimir Sementsov-Ogievskiy }
87d003e0aeSVladimir Sementsov-Ogievskiy 
88d003e0aeSVladimir Sementsov-Ogievskiy static coroutine_fn int cbw_co_pwritev(BlockDriverState *bs,
89e75abedaSVladimir Sementsov-Ogievskiy                                        int64_t offset,
90e75abedaSVladimir Sementsov-Ogievskiy                                        int64_t bytes,
91e75abedaSVladimir Sementsov-Ogievskiy                                        QEMUIOVector *qiov,
92e75abedaSVladimir Sementsov-Ogievskiy                                        BdrvRequestFlags flags)
93d003e0aeSVladimir Sementsov-Ogievskiy {
94d003e0aeSVladimir Sementsov-Ogievskiy     int ret = cbw_do_copy_before_write(bs, offset, bytes, flags);
95d003e0aeSVladimir Sementsov-Ogievskiy     if (ret < 0) {
96d003e0aeSVladimir Sementsov-Ogievskiy         return ret;
97d003e0aeSVladimir Sementsov-Ogievskiy     }
98d003e0aeSVladimir Sementsov-Ogievskiy 
993c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_pwritev(bs->file, offset, bytes, qiov, flags);
100d003e0aeSVladimir Sementsov-Ogievskiy }
101d003e0aeSVladimir Sementsov-Ogievskiy 
102d003e0aeSVladimir Sementsov-Ogievskiy static int coroutine_fn cbw_co_flush(BlockDriverState *bs)
103d003e0aeSVladimir Sementsov-Ogievskiy {
1043c1e6327SVladimir Sementsov-Ogievskiy     if (!bs->file) {
105d003e0aeSVladimir Sementsov-Ogievskiy         return 0;
106d003e0aeSVladimir Sementsov-Ogievskiy     }
107d003e0aeSVladimir Sementsov-Ogievskiy 
1083c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_flush(bs->file->bs);
109d003e0aeSVladimir Sementsov-Ogievskiy }
110d003e0aeSVladimir Sementsov-Ogievskiy 
111d003e0aeSVladimir Sementsov-Ogievskiy static void cbw_refresh_filename(BlockDriverState *bs)
112d003e0aeSVladimir Sementsov-Ogievskiy {
113d003e0aeSVladimir Sementsov-Ogievskiy     pstrcpy(bs->exact_filename, sizeof(bs->exact_filename),
1143c1e6327SVladimir Sementsov-Ogievskiy             bs->file->bs->filename);
115d003e0aeSVladimir Sementsov-Ogievskiy }
116d003e0aeSVladimir Sementsov-Ogievskiy 
117d003e0aeSVladimir Sementsov-Ogievskiy static void cbw_child_perm(BlockDriverState *bs, BdrvChild *c,
118d003e0aeSVladimir Sementsov-Ogievskiy                            BdrvChildRole role,
119d003e0aeSVladimir Sementsov-Ogievskiy                            BlockReopenQueue *reopen_queue,
120d003e0aeSVladimir Sementsov-Ogievskiy                            uint64_t perm, uint64_t shared,
121d003e0aeSVladimir Sementsov-Ogievskiy                            uint64_t *nperm, uint64_t *nshared)
122d003e0aeSVladimir Sementsov-Ogievskiy {
123d003e0aeSVladimir Sementsov-Ogievskiy     if (!(role & BDRV_CHILD_FILTERED)) {
124d003e0aeSVladimir Sementsov-Ogievskiy         /*
125d003e0aeSVladimir Sementsov-Ogievskiy          * Target child
126d003e0aeSVladimir Sementsov-Ogievskiy          *
127d003e0aeSVladimir Sementsov-Ogievskiy          * Share write to target (child_file), to not interfere
128d003e0aeSVladimir Sementsov-Ogievskiy          * with guest writes to its disk which may be in target backing chain.
129d003e0aeSVladimir Sementsov-Ogievskiy          * Can't resize during a backup block job because we check the size
130d003e0aeSVladimir Sementsov-Ogievskiy          * only upfront.
131d003e0aeSVladimir Sementsov-Ogievskiy          */
132d003e0aeSVladimir Sementsov-Ogievskiy         *nshared = BLK_PERM_ALL & ~BLK_PERM_RESIZE;
133d003e0aeSVladimir Sementsov-Ogievskiy         *nperm = BLK_PERM_WRITE;
134d003e0aeSVladimir Sementsov-Ogievskiy     } else {
135d003e0aeSVladimir Sementsov-Ogievskiy         /* Source child */
136d003e0aeSVladimir Sementsov-Ogievskiy         bdrv_default_perms(bs, c, role, reopen_queue,
137d003e0aeSVladimir Sementsov-Ogievskiy                            perm, shared, nperm, nshared);
138d003e0aeSVladimir Sementsov-Ogievskiy 
1393860c020SVladimir Sementsov-Ogievskiy         if (!QLIST_EMPTY(&bs->parents)) {
140d003e0aeSVladimir Sementsov-Ogievskiy             if (perm & BLK_PERM_WRITE) {
141d003e0aeSVladimir Sementsov-Ogievskiy                 *nperm = *nperm | BLK_PERM_CONSISTENT_READ;
142d003e0aeSVladimir Sementsov-Ogievskiy             }
143d003e0aeSVladimir Sementsov-Ogievskiy             *nshared &= ~(BLK_PERM_WRITE | BLK_PERM_RESIZE);
144d003e0aeSVladimir Sementsov-Ogievskiy         }
145d003e0aeSVladimir Sementsov-Ogievskiy     }
1463860c020SVladimir Sementsov-Ogievskiy }
147d003e0aeSVladimir Sementsov-Ogievskiy 
148751cec7aSVladimir Sementsov-Ogievskiy static int cbw_open(BlockDriverState *bs, QDict *options, int flags,
149751cec7aSVladimir Sementsov-Ogievskiy                     Error **errp)
1501f0cacb9SVladimir Sementsov-Ogievskiy {
151fe7ea40cSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
15206e0a9c1SVladimir Sementsov-Ogievskiy     BdrvDirtyBitmap *copy_bitmap;
1531f0cacb9SVladimir Sementsov-Ogievskiy 
154f44fd739SVladimir Sementsov-Ogievskiy     bs->file = bdrv_open_child(NULL, options, "file", bs, &child_of_bds,
155f44fd739SVladimir Sementsov-Ogievskiy                                BDRV_CHILD_FILTERED | BDRV_CHILD_PRIMARY,
156f44fd739SVladimir Sementsov-Ogievskiy                                false, errp);
157f44fd739SVladimir Sementsov-Ogievskiy     if (!bs->file) {
1581f0cacb9SVladimir Sementsov-Ogievskiy         return -EINVAL;
1591f0cacb9SVladimir Sementsov-Ogievskiy     }
1601f0cacb9SVladimir Sementsov-Ogievskiy 
161f44fd739SVladimir Sementsov-Ogievskiy     s->target = bdrv_open_child(NULL, options, "target", bs, &child_of_bds,
162f44fd739SVladimir Sementsov-Ogievskiy                                 BDRV_CHILD_DATA, false, errp);
163f44fd739SVladimir Sementsov-Ogievskiy     if (!s->target) {
1641f0cacb9SVladimir Sementsov-Ogievskiy         return -EINVAL;
1651f0cacb9SVladimir Sementsov-Ogievskiy     }
1661f0cacb9SVladimir Sementsov-Ogievskiy 
1675a507426SVladimir Sementsov-Ogievskiy     bs->total_sectors = bs->file->bs->total_sectors;
1685a507426SVladimir Sementsov-Ogievskiy     bs->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED |
1695a507426SVladimir Sementsov-Ogievskiy             (BDRV_REQ_FUA & bs->file->bs->supported_write_flags);
1705a507426SVladimir Sementsov-Ogievskiy     bs->supported_zero_flags = BDRV_REQ_WRITE_UNCHANGED |
1715a507426SVladimir Sementsov-Ogievskiy             ((BDRV_REQ_FUA | BDRV_REQ_MAY_UNMAP | BDRV_REQ_NO_FALLBACK) &
1725a507426SVladimir Sementsov-Ogievskiy              bs->file->bs->supported_zero_flags);
1735a507426SVladimir Sementsov-Ogievskiy 
174abde8ac2SVladimir Sementsov-Ogievskiy     s->bcs = block_copy_state_new(bs->file, s->target, errp);
175fe7ea40cSVladimir Sementsov-Ogievskiy     if (!s->bcs) {
1761f0cacb9SVladimir Sementsov-Ogievskiy         error_prepend(errp, "Cannot create block-copy-state: ");
1771f0cacb9SVladimir Sementsov-Ogievskiy         return -EINVAL;
1781f0cacb9SVladimir Sementsov-Ogievskiy     }
1791f0cacb9SVladimir Sementsov-Ogievskiy 
18006e0a9c1SVladimir Sementsov-Ogievskiy     copy_bitmap = block_copy_dirty_bitmap(s->bcs);
18106e0a9c1SVladimir Sementsov-Ogievskiy     bdrv_set_dirty_bitmap(copy_bitmap, 0, bdrv_dirty_bitmap_size(copy_bitmap));
18206e0a9c1SVladimir Sementsov-Ogievskiy 
1831f0cacb9SVladimir Sementsov-Ogievskiy     return 0;
1841f0cacb9SVladimir Sementsov-Ogievskiy }
1851f0cacb9SVladimir Sementsov-Ogievskiy 
186751cec7aSVladimir Sementsov-Ogievskiy static void cbw_close(BlockDriverState *bs)
187751cec7aSVladimir Sementsov-Ogievskiy {
188751cec7aSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
189751cec7aSVladimir Sementsov-Ogievskiy 
190751cec7aSVladimir Sementsov-Ogievskiy     block_copy_state_free(s->bcs);
191751cec7aSVladimir Sementsov-Ogievskiy     s->bcs = NULL;
192751cec7aSVladimir Sementsov-Ogievskiy }
193751cec7aSVladimir Sementsov-Ogievskiy 
194d003e0aeSVladimir Sementsov-Ogievskiy BlockDriver bdrv_cbw_filter = {
195d003e0aeSVladimir Sementsov-Ogievskiy     .format_name = "copy-before-write",
196d003e0aeSVladimir Sementsov-Ogievskiy     .instance_size = sizeof(BDRVCopyBeforeWriteState),
197d003e0aeSVladimir Sementsov-Ogievskiy 
198751cec7aSVladimir Sementsov-Ogievskiy     .bdrv_open                  = cbw_open,
199751cec7aSVladimir Sementsov-Ogievskiy     .bdrv_close                 = cbw_close,
200751cec7aSVladimir Sementsov-Ogievskiy 
201d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_preadv             = cbw_co_preadv,
202d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_pwritev            = cbw_co_pwritev,
203d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_pwrite_zeroes      = cbw_co_pwrite_zeroes,
204d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_pdiscard           = cbw_co_pdiscard,
205d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_flush              = cbw_co_flush,
206d003e0aeSVladimir Sementsov-Ogievskiy 
207d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_refresh_filename      = cbw_refresh_filename,
208d003e0aeSVladimir Sementsov-Ogievskiy 
209d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_child_perm            = cbw_child_perm,
210d003e0aeSVladimir Sementsov-Ogievskiy 
211d003e0aeSVladimir Sementsov-Ogievskiy     .is_filter = true,
212d003e0aeSVladimir Sementsov-Ogievskiy };
213d003e0aeSVladimir Sementsov-Ogievskiy 
214d003e0aeSVladimir Sementsov-Ogievskiy BlockDriverState *bdrv_cbw_append(BlockDriverState *source,
215d003e0aeSVladimir Sementsov-Ogievskiy                                   BlockDriverState *target,
216d003e0aeSVladimir Sementsov-Ogievskiy                                   const char *filter_node_name,
217d003e0aeSVladimir Sementsov-Ogievskiy                                   BlockCopyState **bcs,
218d003e0aeSVladimir Sementsov-Ogievskiy                                   Error **errp)
219d003e0aeSVladimir Sementsov-Ogievskiy {
220d003e0aeSVladimir Sementsov-Ogievskiy     ERRP_GUARD();
221d003e0aeSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *state;
222d003e0aeSVladimir Sementsov-Ogievskiy     BlockDriverState *top;
223f44fd739SVladimir Sementsov-Ogievskiy     QDict *opts;
224d003e0aeSVladimir Sementsov-Ogievskiy 
225d003e0aeSVladimir Sementsov-Ogievskiy     assert(source->total_sectors == target->total_sectors);
226*377cc15bSEmanuele Giuseppe Esposito     GLOBAL_STATE_CODE();
227d003e0aeSVladimir Sementsov-Ogievskiy 
228f44fd739SVladimir Sementsov-Ogievskiy     opts = qdict_new();
229751cec7aSVladimir Sementsov-Ogievskiy     qdict_put_str(opts, "driver", "copy-before-write");
230751cec7aSVladimir Sementsov-Ogievskiy     if (filter_node_name) {
231751cec7aSVladimir Sementsov-Ogievskiy         qdict_put_str(opts, "node-name", filter_node_name);
232751cec7aSVladimir Sementsov-Ogievskiy     }
233f44fd739SVladimir Sementsov-Ogievskiy     qdict_put_str(opts, "file", bdrv_get_node_name(source));
234f44fd739SVladimir Sementsov-Ogievskiy     qdict_put_str(opts, "target", bdrv_get_node_name(target));
235f44fd739SVladimir Sementsov-Ogievskiy 
236751cec7aSVladimir Sementsov-Ogievskiy     top = bdrv_insert_node(source, opts, BDRV_O_RDWR, errp);
237751cec7aSVladimir Sementsov-Ogievskiy     if (!top) {
238751cec7aSVladimir Sementsov-Ogievskiy         return NULL;
239d003e0aeSVladimir Sementsov-Ogievskiy     }
240d003e0aeSVladimir Sementsov-Ogievskiy 
241751cec7aSVladimir Sementsov-Ogievskiy     state = top->opaque;
2427ddbce2dSVladimir Sementsov-Ogievskiy     *bcs = state->bcs;
243d003e0aeSVladimir Sementsov-Ogievskiy 
244d003e0aeSVladimir Sementsov-Ogievskiy     return top;
245d003e0aeSVladimir Sementsov-Ogievskiy }
246d003e0aeSVladimir Sementsov-Ogievskiy 
247d003e0aeSVladimir Sementsov-Ogievskiy void bdrv_cbw_drop(BlockDriverState *bs)
248d003e0aeSVladimir Sementsov-Ogievskiy {
249*377cc15bSEmanuele Giuseppe Esposito     GLOBAL_STATE_CODE();
250d003e0aeSVladimir Sementsov-Ogievskiy     bdrv_drop_filter(bs, &error_abort);
251d003e0aeSVladimir Sementsov-Ogievskiy     bdrv_unref(bs);
252d003e0aeSVladimir Sementsov-Ogievskiy }
253751cec7aSVladimir Sementsov-Ogievskiy 
254751cec7aSVladimir Sementsov-Ogievskiy static void cbw_init(void)
255751cec7aSVladimir Sementsov-Ogievskiy {
256751cec7aSVladimir Sementsov-Ogievskiy     bdrv_register(&bdrv_cbw_filter);
257751cec7aSVladimir Sementsov-Ogievskiy }
258751cec7aSVladimir Sementsov-Ogievskiy 
259751cec7aSVladimir Sementsov-Ogievskiy block_init(cbw_init);
260