xref: /openbmc/qemu/block/copy-before-write.c (revision 0fd05c8d807dc7cd25b2f9bf32dd4135c94acb7a)
1d003e0aeSVladimir Sementsov-Ogievskiy /*
2d003e0aeSVladimir Sementsov-Ogievskiy  * copy-before-write filter driver
3d003e0aeSVladimir Sementsov-Ogievskiy  *
4d003e0aeSVladimir Sementsov-Ogievskiy  * The driver performs Copy-Before-Write (CBW) operation: it is injected above
5d003e0aeSVladimir Sementsov-Ogievskiy  * some node, and before each write it copies _old_ data to the target node.
6d003e0aeSVladimir Sementsov-Ogievskiy  *
7d003e0aeSVladimir Sementsov-Ogievskiy  * Copyright (c) 2018-2021 Virtuozzo International GmbH.
8d003e0aeSVladimir Sementsov-Ogievskiy  *
9d003e0aeSVladimir Sementsov-Ogievskiy  * Author:
10d003e0aeSVladimir Sementsov-Ogievskiy  *  Sementsov-Ogievskiy Vladimir <vsementsov@virtuozzo.com>
11d003e0aeSVladimir Sementsov-Ogievskiy  *
12d003e0aeSVladimir Sementsov-Ogievskiy  * This program is free software; you can redistribute it and/or modify
13d003e0aeSVladimir Sementsov-Ogievskiy  * it under the terms of the GNU General Public License as published by
14d003e0aeSVladimir Sementsov-Ogievskiy  * the Free Software Foundation; either version 2 of the License, or
15d003e0aeSVladimir Sementsov-Ogievskiy  * (at your option) any later version.
16d003e0aeSVladimir Sementsov-Ogievskiy  *
17d003e0aeSVladimir Sementsov-Ogievskiy  * This program is distributed in the hope that it will be useful,
18d003e0aeSVladimir Sementsov-Ogievskiy  * but WITHOUT ANY WARRANTY; without even the implied warranty of
19d003e0aeSVladimir Sementsov-Ogievskiy  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
20d003e0aeSVladimir Sementsov-Ogievskiy  * GNU General Public License for more details.
21d003e0aeSVladimir Sementsov-Ogievskiy  *
22d003e0aeSVladimir Sementsov-Ogievskiy  * You should have received a copy of the GNU General Public License
23d003e0aeSVladimir Sementsov-Ogievskiy  * along with this program. If not, see <http://www.gnu.org/licenses/>.
24d003e0aeSVladimir Sementsov-Ogievskiy  */
25d003e0aeSVladimir Sementsov-Ogievskiy 
26d003e0aeSVladimir Sementsov-Ogievskiy #include "qemu/osdep.h"
2779ef0cebSVladimir Sementsov-Ogievskiy #include "qapi/qmp/qjson.h"
28d003e0aeSVladimir Sementsov-Ogievskiy 
29d003e0aeSVladimir Sementsov-Ogievskiy #include "sysemu/block-backend.h"
30d003e0aeSVladimir Sementsov-Ogievskiy #include "qemu/cutils.h"
31d003e0aeSVladimir Sementsov-Ogievskiy #include "qapi/error.h"
32d003e0aeSVladimir Sementsov-Ogievskiy #include "block/block_int.h"
33d003e0aeSVladimir Sementsov-Ogievskiy #include "block/qdict.h"
34d003e0aeSVladimir Sementsov-Ogievskiy #include "block/block-copy.h"
35e2c1c34fSMarkus Armbruster #include "block/dirty-bitmap.h"
36d003e0aeSVladimir Sementsov-Ogievskiy 
37d003e0aeSVladimir Sementsov-Ogievskiy #include "block/copy-before-write.h"
38af5bcd77SVladimir Sementsov-Ogievskiy #include "block/reqlist.h"
39d003e0aeSVladimir Sementsov-Ogievskiy 
405f3a3cd7SVladimir Sementsov-Ogievskiy #include "qapi/qapi-visit-block-core.h"
415f3a3cd7SVladimir Sementsov-Ogievskiy 
42d003e0aeSVladimir Sementsov-Ogievskiy typedef struct BDRVCopyBeforeWriteState {
43d003e0aeSVladimir Sementsov-Ogievskiy     BlockCopyState *bcs;
44d003e0aeSVladimir Sementsov-Ogievskiy     BdrvChild *target;
45f1bb39a8SVladimir Sementsov-Ogievskiy     OnCbwError on_cbw_error;
466db7fd1cSVladimir Sementsov-Ogievskiy     uint32_t cbw_timeout_ns;
47*0fd05c8dSVladimir Sementsov-Ogievskiy     bool discard_source;
48af5bcd77SVladimir Sementsov-Ogievskiy 
49af5bcd77SVladimir Sementsov-Ogievskiy     /*
50af5bcd77SVladimir Sementsov-Ogievskiy      * @lock: protects access to @access_bitmap, @done_bitmap and
51af5bcd77SVladimir Sementsov-Ogievskiy      * @frozen_read_reqs
52af5bcd77SVladimir Sementsov-Ogievskiy      */
53af5bcd77SVladimir Sementsov-Ogievskiy     CoMutex lock;
54af5bcd77SVladimir Sementsov-Ogievskiy 
55af5bcd77SVladimir Sementsov-Ogievskiy     /*
56af5bcd77SVladimir Sementsov-Ogievskiy      * @access_bitmap: represents areas allowed for reading by fleecing user.
57af5bcd77SVladimir Sementsov-Ogievskiy      * Reading from non-dirty areas leads to -EACCES.
58af5bcd77SVladimir Sementsov-Ogievskiy      */
59af5bcd77SVladimir Sementsov-Ogievskiy     BdrvDirtyBitmap *access_bitmap;
60af5bcd77SVladimir Sementsov-Ogievskiy 
61af5bcd77SVladimir Sementsov-Ogievskiy     /*
62af5bcd77SVladimir Sementsov-Ogievskiy      * @done_bitmap: represents areas that was successfully copied to @target by
63af5bcd77SVladimir Sementsov-Ogievskiy      * copy-before-write operations.
64af5bcd77SVladimir Sementsov-Ogievskiy      */
65af5bcd77SVladimir Sementsov-Ogievskiy     BdrvDirtyBitmap *done_bitmap;
66af5bcd77SVladimir Sementsov-Ogievskiy 
67af5bcd77SVladimir Sementsov-Ogievskiy     /*
68af5bcd77SVladimir Sementsov-Ogievskiy      * @frozen_read_reqs: current read requests for fleecing user in bs->file
69af5bcd77SVladimir Sementsov-Ogievskiy      * node. These areas must not be rewritten by guest.
70af5bcd77SVladimir Sementsov-Ogievskiy      */
71af5bcd77SVladimir Sementsov-Ogievskiy     BlockReqList frozen_read_reqs;
72f1bb39a8SVladimir Sementsov-Ogievskiy 
73f1bb39a8SVladimir Sementsov-Ogievskiy     /*
74f1bb39a8SVladimir Sementsov-Ogievskiy      * @snapshot_error is normally zero. But on first copy-before-write failure
75f1bb39a8SVladimir Sementsov-Ogievskiy      * when @on_cbw_error == ON_CBW_ERROR_BREAK_SNAPSHOT, @snapshot_error takes
76f1bb39a8SVladimir Sementsov-Ogievskiy      * value of this error (<0). After that all in-flight and further
77f1bb39a8SVladimir Sementsov-Ogievskiy      * snapshot-API requests will fail with that error.
78f1bb39a8SVladimir Sementsov-Ogievskiy      */
79f1bb39a8SVladimir Sementsov-Ogievskiy     int snapshot_error;
80d003e0aeSVladimir Sementsov-Ogievskiy } BDRVCopyBeforeWriteState;
81d003e0aeSVladimir Sementsov-Ogievskiy 
82b9b10c35SKevin Wolf static int coroutine_fn GRAPH_RDLOCK
83b9b10c35SKevin Wolf cbw_co_preadv(BlockDriverState *bs, int64_t offset, int64_t bytes,
84f7ef38ddSVladimir Sementsov-Ogievskiy               QEMUIOVector *qiov, BdrvRequestFlags flags)
85d003e0aeSVladimir Sementsov-Ogievskiy {
863c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_preadv(bs->file, offset, bytes, qiov, flags);
87d003e0aeSVladimir Sementsov-Ogievskiy }
88d003e0aeSVladimir Sementsov-Ogievskiy 
896db7fd1cSVladimir Sementsov-Ogievskiy static void block_copy_cb(void *opaque)
906db7fd1cSVladimir Sementsov-Ogievskiy {
916db7fd1cSVladimir Sementsov-Ogievskiy     BlockDriverState *bs = opaque;
926db7fd1cSVladimir Sementsov-Ogievskiy 
936db7fd1cSVladimir Sementsov-Ogievskiy     bdrv_dec_in_flight(bs);
946db7fd1cSVladimir Sementsov-Ogievskiy }
956db7fd1cSVladimir Sementsov-Ogievskiy 
96af5bcd77SVladimir Sementsov-Ogievskiy /*
97af5bcd77SVladimir Sementsov-Ogievskiy  * Do copy-before-write operation.
98af5bcd77SVladimir Sementsov-Ogievskiy  *
99af5bcd77SVladimir Sementsov-Ogievskiy  * On failure guest request must be failed too.
100af5bcd77SVladimir Sementsov-Ogievskiy  *
101af5bcd77SVladimir Sementsov-Ogievskiy  * On success, we also wait for all in-flight fleecing read requests in source
102af5bcd77SVladimir Sementsov-Ogievskiy  * node, and it's guaranteed that after cbw_do_copy_before_write() successful
103af5bcd77SVladimir Sementsov-Ogievskiy  * return there are no such requests and they will never appear.
104af5bcd77SVladimir Sementsov-Ogievskiy  */
105d003e0aeSVladimir Sementsov-Ogievskiy static coroutine_fn int cbw_do_copy_before_write(BlockDriverState *bs,
106d003e0aeSVladimir Sementsov-Ogievskiy         uint64_t offset, uint64_t bytes, BdrvRequestFlags flags)
107d003e0aeSVladimir Sementsov-Ogievskiy {
108d003e0aeSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
109af5bcd77SVladimir Sementsov-Ogievskiy     int ret;
110d003e0aeSVladimir Sementsov-Ogievskiy     uint64_t off, end;
111b518e9e9SVladimir Sementsov-Ogievskiy     int64_t cluster_size = block_copy_cluster_size(s->bcs);
112d003e0aeSVladimir Sementsov-Ogievskiy 
113d003e0aeSVladimir Sementsov-Ogievskiy     if (flags & BDRV_REQ_WRITE_UNCHANGED) {
114d003e0aeSVladimir Sementsov-Ogievskiy         return 0;
115d003e0aeSVladimir Sementsov-Ogievskiy     }
116d003e0aeSVladimir Sementsov-Ogievskiy 
117f1bb39a8SVladimir Sementsov-Ogievskiy     if (s->snapshot_error) {
118f1bb39a8SVladimir Sementsov-Ogievskiy         return 0;
119f1bb39a8SVladimir Sementsov-Ogievskiy     }
120f1bb39a8SVladimir Sementsov-Ogievskiy 
121b518e9e9SVladimir Sementsov-Ogievskiy     off = QEMU_ALIGN_DOWN(offset, cluster_size);
122b518e9e9SVladimir Sementsov-Ogievskiy     end = QEMU_ALIGN_UP(offset + bytes, cluster_size);
123d003e0aeSVladimir Sementsov-Ogievskiy 
1246db7fd1cSVladimir Sementsov-Ogievskiy     /*
1256db7fd1cSVladimir Sementsov-Ogievskiy      * Increase in_flight, so that in case of timed-out block-copy, the
1266db7fd1cSVladimir Sementsov-Ogievskiy      * remaining background block_copy() request (which can't be immediately
1276db7fd1cSVladimir Sementsov-Ogievskiy      * cancelled by timeout) is presented in bs->in_flight. This way we are
1286db7fd1cSVladimir Sementsov-Ogievskiy      * sure that on bs close() we'll previously wait for all timed-out but yet
1296db7fd1cSVladimir Sementsov-Ogievskiy      * running block_copy calls.
1306db7fd1cSVladimir Sementsov-Ogievskiy      */
1316db7fd1cSVladimir Sementsov-Ogievskiy     bdrv_inc_in_flight(bs);
1326db7fd1cSVladimir Sementsov-Ogievskiy     ret = block_copy(s->bcs, off, end - off, true, s->cbw_timeout_ns,
1336db7fd1cSVladimir Sementsov-Ogievskiy                      block_copy_cb, bs);
134f1bb39a8SVladimir Sementsov-Ogievskiy     if (ret < 0 && s->on_cbw_error == ON_CBW_ERROR_BREAK_GUEST_WRITE) {
135af5bcd77SVladimir Sementsov-Ogievskiy         return ret;
136af5bcd77SVladimir Sementsov-Ogievskiy     }
137af5bcd77SVladimir Sementsov-Ogievskiy 
138af5bcd77SVladimir Sementsov-Ogievskiy     WITH_QEMU_LOCK_GUARD(&s->lock) {
139f1bb39a8SVladimir Sementsov-Ogievskiy         if (ret < 0) {
140f1bb39a8SVladimir Sementsov-Ogievskiy             assert(s->on_cbw_error == ON_CBW_ERROR_BREAK_SNAPSHOT);
141f1bb39a8SVladimir Sementsov-Ogievskiy             if (!s->snapshot_error) {
142f1bb39a8SVladimir Sementsov-Ogievskiy                 s->snapshot_error = ret;
143f1bb39a8SVladimir Sementsov-Ogievskiy             }
144f1bb39a8SVladimir Sementsov-Ogievskiy         } else {
145af5bcd77SVladimir Sementsov-Ogievskiy             bdrv_set_dirty_bitmap(s->done_bitmap, off, end - off);
146f1bb39a8SVladimir Sementsov-Ogievskiy         }
147af5bcd77SVladimir Sementsov-Ogievskiy         reqlist_wait_all(&s->frozen_read_reqs, off, end - off, &s->lock);
148af5bcd77SVladimir Sementsov-Ogievskiy     }
149af5bcd77SVladimir Sementsov-Ogievskiy 
150af5bcd77SVladimir Sementsov-Ogievskiy     return 0;
151d003e0aeSVladimir Sementsov-Ogievskiy }
152d003e0aeSVladimir Sementsov-Ogievskiy 
1539a5a1c62SEmanuele Giuseppe Esposito static int coroutine_fn GRAPH_RDLOCK
1549a5a1c62SEmanuele Giuseppe Esposito cbw_co_pdiscard(BlockDriverState *bs, int64_t offset, int64_t bytes)
155d003e0aeSVladimir Sementsov-Ogievskiy {
156d003e0aeSVladimir Sementsov-Ogievskiy     int ret = cbw_do_copy_before_write(bs, offset, bytes, 0);
157d003e0aeSVladimir Sementsov-Ogievskiy     if (ret < 0) {
158d003e0aeSVladimir Sementsov-Ogievskiy         return ret;
159d003e0aeSVladimir Sementsov-Ogievskiy     }
160d003e0aeSVladimir Sementsov-Ogievskiy 
1613c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_pdiscard(bs->file, offset, bytes);
162d003e0aeSVladimir Sementsov-Ogievskiy }
163d003e0aeSVladimir Sementsov-Ogievskiy 
164abaf8b75SKevin Wolf static int coroutine_fn GRAPH_RDLOCK
165abaf8b75SKevin Wolf cbw_co_pwrite_zeroes(BlockDriverState *bs, int64_t offset, int64_t bytes,
166abaf8b75SKevin Wolf                      BdrvRequestFlags flags)
167d003e0aeSVladimir Sementsov-Ogievskiy {
168d003e0aeSVladimir Sementsov-Ogievskiy     int ret = cbw_do_copy_before_write(bs, offset, bytes, flags);
169d003e0aeSVladimir Sementsov-Ogievskiy     if (ret < 0) {
170d003e0aeSVladimir Sementsov-Ogievskiy         return ret;
171d003e0aeSVladimir Sementsov-Ogievskiy     }
172d003e0aeSVladimir Sementsov-Ogievskiy 
1733c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_pwrite_zeroes(bs->file, offset, bytes, flags);
174d003e0aeSVladimir Sementsov-Ogievskiy }
175d003e0aeSVladimir Sementsov-Ogievskiy 
176b9b10c35SKevin Wolf static coroutine_fn GRAPH_RDLOCK
177b9b10c35SKevin Wolf int cbw_co_pwritev(BlockDriverState *bs, int64_t offset, int64_t bytes,
178b9b10c35SKevin Wolf                    QEMUIOVector *qiov, BdrvRequestFlags flags)
179d003e0aeSVladimir Sementsov-Ogievskiy {
180d003e0aeSVladimir Sementsov-Ogievskiy     int ret = cbw_do_copy_before_write(bs, offset, bytes, flags);
181d003e0aeSVladimir Sementsov-Ogievskiy     if (ret < 0) {
182d003e0aeSVladimir Sementsov-Ogievskiy         return ret;
183d003e0aeSVladimir Sementsov-Ogievskiy     }
184d003e0aeSVladimir Sementsov-Ogievskiy 
1853c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_pwritev(bs->file, offset, bytes, qiov, flags);
186d003e0aeSVladimir Sementsov-Ogievskiy }
187d003e0aeSVladimir Sementsov-Ogievskiy 
18888095349SEmanuele Giuseppe Esposito static int coroutine_fn GRAPH_RDLOCK cbw_co_flush(BlockDriverState *bs)
189d003e0aeSVladimir Sementsov-Ogievskiy {
1903c1e6327SVladimir Sementsov-Ogievskiy     if (!bs->file) {
191d003e0aeSVladimir Sementsov-Ogievskiy         return 0;
192d003e0aeSVladimir Sementsov-Ogievskiy     }
193d003e0aeSVladimir Sementsov-Ogievskiy 
1943c1e6327SVladimir Sementsov-Ogievskiy     return bdrv_co_flush(bs->file->bs);
195d003e0aeSVladimir Sementsov-Ogievskiy }
196d003e0aeSVladimir Sementsov-Ogievskiy 
197af5bcd77SVladimir Sementsov-Ogievskiy /*
198af5bcd77SVladimir Sementsov-Ogievskiy  * If @offset not accessible - return NULL.
199af5bcd77SVladimir Sementsov-Ogievskiy  *
200af5bcd77SVladimir Sementsov-Ogievskiy  * Otherwise, set @pnum to some bytes that accessible from @file (@file is set
201af5bcd77SVladimir Sementsov-Ogievskiy  * to bs->file or to s->target). Return newly allocated BlockReq object that
202af5bcd77SVladimir Sementsov-Ogievskiy  * should be than passed to cbw_snapshot_read_unlock().
203af5bcd77SVladimir Sementsov-Ogievskiy  *
204af5bcd77SVladimir Sementsov-Ogievskiy  * It's guaranteed that guest writes will not interact in the region until
205af5bcd77SVladimir Sementsov-Ogievskiy  * cbw_snapshot_read_unlock() called.
206af5bcd77SVladimir Sementsov-Ogievskiy  */
2071f051dcbSKevin Wolf static BlockReq * coroutine_fn GRAPH_RDLOCK
2083e614042SPaolo Bonzini cbw_snapshot_read_lock(BlockDriverState *bs, int64_t offset, int64_t bytes,
209af5bcd77SVladimir Sementsov-Ogievskiy                        int64_t *pnum, BdrvChild **file)
210af5bcd77SVladimir Sementsov-Ogievskiy {
211af5bcd77SVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
212af5bcd77SVladimir Sementsov-Ogievskiy     BlockReq *req = g_new(BlockReq, 1);
213af5bcd77SVladimir Sementsov-Ogievskiy     bool done;
214af5bcd77SVladimir Sementsov-Ogievskiy 
215af5bcd77SVladimir Sementsov-Ogievskiy     QEMU_LOCK_GUARD(&s->lock);
216af5bcd77SVladimir Sementsov-Ogievskiy 
217f1bb39a8SVladimir Sementsov-Ogievskiy     if (s->snapshot_error) {
218f1bb39a8SVladimir Sementsov-Ogievskiy         g_free(req);
219f1bb39a8SVladimir Sementsov-Ogievskiy         return NULL;
220f1bb39a8SVladimir Sementsov-Ogievskiy     }
221f1bb39a8SVladimir Sementsov-Ogievskiy 
222af5bcd77SVladimir Sementsov-Ogievskiy     if (bdrv_dirty_bitmap_next_zero(s->access_bitmap, offset, bytes) != -1) {
223af5bcd77SVladimir Sementsov-Ogievskiy         g_free(req);
224af5bcd77SVladimir Sementsov-Ogievskiy         return NULL;
225af5bcd77SVladimir Sementsov-Ogievskiy     }
226af5bcd77SVladimir Sementsov-Ogievskiy 
227af5bcd77SVladimir Sementsov-Ogievskiy     done = bdrv_dirty_bitmap_status(s->done_bitmap, offset, bytes, pnum);
228af5bcd77SVladimir Sementsov-Ogievskiy     if (done) {
229af5bcd77SVladimir Sementsov-Ogievskiy         /*
230af5bcd77SVladimir Sementsov-Ogievskiy          * Special invalid BlockReq, that is handled in
231af5bcd77SVladimir Sementsov-Ogievskiy          * cbw_snapshot_read_unlock(). We don't need to lock something to read
232af5bcd77SVladimir Sementsov-Ogievskiy          * from s->target.
233af5bcd77SVladimir Sementsov-Ogievskiy          */
234af5bcd77SVladimir Sementsov-Ogievskiy         *req = (BlockReq) {.offset = -1, .bytes = -1};
235af5bcd77SVladimir Sementsov-Ogievskiy         *file = s->target;
236af5bcd77SVladimir Sementsov-Ogievskiy     } else {
237af5bcd77SVladimir Sementsov-Ogievskiy         reqlist_init_req(&s->frozen_read_reqs, req, offset, bytes);
238af5bcd77SVladimir Sementsov-Ogievskiy         *file = bs->file;
239af5bcd77SVladimir Sementsov-Ogievskiy     }
240af5bcd77SVladimir Sementsov-Ogievskiy 
241af5bcd77SVladimir Sementsov-Ogievskiy     return req;
242af5bcd77SVladimir Sementsov-Ogievskiy }
243af5bcd77SVladimir Sementsov-Ogievskiy 
2443e614042SPaolo Bonzini static coroutine_fn void
2453e614042SPaolo Bonzini cbw_snapshot_read_unlock(BlockDriverState *bs, BlockReq *req)
246af5bcd77SVladimir Sementsov-Ogievskiy {
247af5bcd77SVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
248af5bcd77SVladimir Sementsov-Ogievskiy 
249af5bcd77SVladimir Sementsov-Ogievskiy     if (req->offset == -1 && req->bytes == -1) {
250af5bcd77SVladimir Sementsov-Ogievskiy         g_free(req);
251af5bcd77SVladimir Sementsov-Ogievskiy         return;
252af5bcd77SVladimir Sementsov-Ogievskiy     }
253af5bcd77SVladimir Sementsov-Ogievskiy 
254af5bcd77SVladimir Sementsov-Ogievskiy     QEMU_LOCK_GUARD(&s->lock);
255af5bcd77SVladimir Sementsov-Ogievskiy 
256af5bcd77SVladimir Sementsov-Ogievskiy     reqlist_remove_req(req);
257af5bcd77SVladimir Sementsov-Ogievskiy     g_free(req);
258af5bcd77SVladimir Sementsov-Ogievskiy }
259af5bcd77SVladimir Sementsov-Ogievskiy 
2607b9e8b22SKevin Wolf static int coroutine_fn GRAPH_RDLOCK
261af5bcd77SVladimir Sementsov-Ogievskiy cbw_co_preadv_snapshot(BlockDriverState *bs, int64_t offset, int64_t bytes,
262af5bcd77SVladimir Sementsov-Ogievskiy                        QEMUIOVector *qiov, size_t qiov_offset)
263af5bcd77SVladimir Sementsov-Ogievskiy {
264af5bcd77SVladimir Sementsov-Ogievskiy     BlockReq *req;
265af5bcd77SVladimir Sementsov-Ogievskiy     BdrvChild *file;
266af5bcd77SVladimir Sementsov-Ogievskiy     int ret;
267af5bcd77SVladimir Sementsov-Ogievskiy 
268af5bcd77SVladimir Sementsov-Ogievskiy     /* TODO: upgrade to async loop using AioTask */
269af5bcd77SVladimir Sementsov-Ogievskiy     while (bytes) {
270af5bcd77SVladimir Sementsov-Ogievskiy         int64_t cur_bytes;
271af5bcd77SVladimir Sementsov-Ogievskiy 
272af5bcd77SVladimir Sementsov-Ogievskiy         req = cbw_snapshot_read_lock(bs, offset, bytes, &cur_bytes, &file);
273af5bcd77SVladimir Sementsov-Ogievskiy         if (!req) {
274af5bcd77SVladimir Sementsov-Ogievskiy             return -EACCES;
275af5bcd77SVladimir Sementsov-Ogievskiy         }
276af5bcd77SVladimir Sementsov-Ogievskiy 
277af5bcd77SVladimir Sementsov-Ogievskiy         ret = bdrv_co_preadv_part(file, offset, cur_bytes,
278af5bcd77SVladimir Sementsov-Ogievskiy                                   qiov, qiov_offset, 0);
279af5bcd77SVladimir Sementsov-Ogievskiy         cbw_snapshot_read_unlock(bs, req);
280af5bcd77SVladimir Sementsov-Ogievskiy         if (ret < 0) {
281af5bcd77SVladimir Sementsov-Ogievskiy             return ret;
282af5bcd77SVladimir Sementsov-Ogievskiy         }
283af5bcd77SVladimir Sementsov-Ogievskiy 
284af5bcd77SVladimir Sementsov-Ogievskiy         bytes -= cur_bytes;
285af5bcd77SVladimir Sementsov-Ogievskiy         offset += cur_bytes;
286af5bcd77SVladimir Sementsov-Ogievskiy         qiov_offset += cur_bytes;
287af5bcd77SVladimir Sementsov-Ogievskiy     }
288af5bcd77SVladimir Sementsov-Ogievskiy 
289af5bcd77SVladimir Sementsov-Ogievskiy     return 0;
290af5bcd77SVladimir Sementsov-Ogievskiy }
291af5bcd77SVladimir Sementsov-Ogievskiy 
2927b9e8b22SKevin Wolf static int coroutine_fn GRAPH_RDLOCK
293af5bcd77SVladimir Sementsov-Ogievskiy cbw_co_snapshot_block_status(BlockDriverState *bs,
294af5bcd77SVladimir Sementsov-Ogievskiy                              bool want_zero, int64_t offset, int64_t bytes,
295af5bcd77SVladimir Sementsov-Ogievskiy                              int64_t *pnum, int64_t *map,
296af5bcd77SVladimir Sementsov-Ogievskiy                              BlockDriverState **file)
297af5bcd77SVladimir Sementsov-Ogievskiy {
298af5bcd77SVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
299af5bcd77SVladimir Sementsov-Ogievskiy     BlockReq *req;
300af5bcd77SVladimir Sementsov-Ogievskiy     int ret;
301af5bcd77SVladimir Sementsov-Ogievskiy     int64_t cur_bytes;
302af5bcd77SVladimir Sementsov-Ogievskiy     BdrvChild *child;
303af5bcd77SVladimir Sementsov-Ogievskiy 
304af5bcd77SVladimir Sementsov-Ogievskiy     req = cbw_snapshot_read_lock(bs, offset, bytes, &cur_bytes, &child);
305af5bcd77SVladimir Sementsov-Ogievskiy     if (!req) {
306af5bcd77SVladimir Sementsov-Ogievskiy         return -EACCES;
307af5bcd77SVladimir Sementsov-Ogievskiy     }
308af5bcd77SVladimir Sementsov-Ogievskiy 
309cc323997SPaolo Bonzini     ret = bdrv_co_block_status(child->bs, offset, cur_bytes, pnum, map, file);
310af5bcd77SVladimir Sementsov-Ogievskiy     if (child == s->target) {
311af5bcd77SVladimir Sementsov-Ogievskiy         /*
312af5bcd77SVladimir Sementsov-Ogievskiy          * We refer to s->target only for areas that we've written to it.
313af5bcd77SVladimir Sementsov-Ogievskiy          * And we can not report unallocated blocks in s->target: this will
314af5bcd77SVladimir Sementsov-Ogievskiy          * break generic block-status-above logic, that will go to
315af5bcd77SVladimir Sementsov-Ogievskiy          * copy-before-write filtered child in this case.
316af5bcd77SVladimir Sementsov-Ogievskiy          */
317af5bcd77SVladimir Sementsov-Ogievskiy         assert(ret & BDRV_BLOCK_ALLOCATED);
318af5bcd77SVladimir Sementsov-Ogievskiy     }
319af5bcd77SVladimir Sementsov-Ogievskiy 
320af5bcd77SVladimir Sementsov-Ogievskiy     cbw_snapshot_read_unlock(bs, req);
321af5bcd77SVladimir Sementsov-Ogievskiy 
322af5bcd77SVladimir Sementsov-Ogievskiy     return ret;
323af5bcd77SVladimir Sementsov-Ogievskiy }
324af5bcd77SVladimir Sementsov-Ogievskiy 
3259a5a1c62SEmanuele Giuseppe Esposito static int coroutine_fn GRAPH_RDLOCK
3269a5a1c62SEmanuele Giuseppe Esposito cbw_co_pdiscard_snapshot(BlockDriverState *bs, int64_t offset, int64_t bytes)
327af5bcd77SVladimir Sementsov-Ogievskiy {
328af5bcd77SVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
32950717519SVladimir Sementsov-Ogievskiy     uint32_t cluster_size = block_copy_cluster_size(s->bcs);
33050717519SVladimir Sementsov-Ogievskiy     int64_t aligned_offset = QEMU_ALIGN_UP(offset, cluster_size);
33150717519SVladimir Sementsov-Ogievskiy     int64_t aligned_end = QEMU_ALIGN_DOWN(offset + bytes, cluster_size);
33250717519SVladimir Sementsov-Ogievskiy     int64_t aligned_bytes;
33350717519SVladimir Sementsov-Ogievskiy 
33450717519SVladimir Sementsov-Ogievskiy     if (aligned_end <= aligned_offset) {
33550717519SVladimir Sementsov-Ogievskiy         return 0;
33650717519SVladimir Sementsov-Ogievskiy     }
33750717519SVladimir Sementsov-Ogievskiy     aligned_bytes = aligned_end - aligned_offset;
338af5bcd77SVladimir Sementsov-Ogievskiy 
339af5bcd77SVladimir Sementsov-Ogievskiy     WITH_QEMU_LOCK_GUARD(&s->lock) {
34050717519SVladimir Sementsov-Ogievskiy         bdrv_reset_dirty_bitmap(s->access_bitmap, aligned_offset,
34150717519SVladimir Sementsov-Ogievskiy                                 aligned_bytes);
342af5bcd77SVladimir Sementsov-Ogievskiy     }
343af5bcd77SVladimir Sementsov-Ogievskiy 
34450717519SVladimir Sementsov-Ogievskiy     block_copy_reset(s->bcs, aligned_offset, aligned_bytes);
345af5bcd77SVladimir Sementsov-Ogievskiy 
34650717519SVladimir Sementsov-Ogievskiy     return bdrv_co_pdiscard(s->target, aligned_offset, aligned_bytes);
347af5bcd77SVladimir Sementsov-Ogievskiy }
348af5bcd77SVladimir Sementsov-Ogievskiy 
34979a55866SKevin Wolf static void GRAPH_RDLOCK cbw_refresh_filename(BlockDriverState *bs)
350d003e0aeSVladimir Sementsov-Ogievskiy {
351d003e0aeSVladimir Sementsov-Ogievskiy     pstrcpy(bs->exact_filename, sizeof(bs->exact_filename),
3523c1e6327SVladimir Sementsov-Ogievskiy             bs->file->bs->filename);
353d003e0aeSVladimir Sementsov-Ogievskiy }
354d003e0aeSVladimir Sementsov-Ogievskiy 
355c629b6d2SKevin Wolf static void GRAPH_RDLOCK
356c629b6d2SKevin Wolf cbw_child_perm(BlockDriverState *bs, BdrvChild *c, BdrvChildRole role,
357d003e0aeSVladimir Sementsov-Ogievskiy                BlockReopenQueue *reopen_queue,
358d003e0aeSVladimir Sementsov-Ogievskiy                uint64_t perm, uint64_t shared,
359d003e0aeSVladimir Sementsov-Ogievskiy                uint64_t *nperm, uint64_t *nshared)
360d003e0aeSVladimir Sementsov-Ogievskiy {
361*0fd05c8dSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
362*0fd05c8dSVladimir Sementsov-Ogievskiy 
363d003e0aeSVladimir Sementsov-Ogievskiy     if (!(role & BDRV_CHILD_FILTERED)) {
364d003e0aeSVladimir Sementsov-Ogievskiy         /*
365d003e0aeSVladimir Sementsov-Ogievskiy          * Target child
366d003e0aeSVladimir Sementsov-Ogievskiy          *
367d003e0aeSVladimir Sementsov-Ogievskiy          * Share write to target (child_file), to not interfere
368d003e0aeSVladimir Sementsov-Ogievskiy          * with guest writes to its disk which may be in target backing chain.
369d003e0aeSVladimir Sementsov-Ogievskiy          * Can't resize during a backup block job because we check the size
370d003e0aeSVladimir Sementsov-Ogievskiy          * only upfront.
371d003e0aeSVladimir Sementsov-Ogievskiy          */
372d003e0aeSVladimir Sementsov-Ogievskiy         *nshared = BLK_PERM_ALL & ~BLK_PERM_RESIZE;
373d003e0aeSVladimir Sementsov-Ogievskiy         *nperm = BLK_PERM_WRITE;
374d003e0aeSVladimir Sementsov-Ogievskiy     } else {
375d003e0aeSVladimir Sementsov-Ogievskiy         /* Source child */
376d003e0aeSVladimir Sementsov-Ogievskiy         bdrv_default_perms(bs, c, role, reopen_queue,
377d003e0aeSVladimir Sementsov-Ogievskiy                            perm, shared, nperm, nshared);
378d003e0aeSVladimir Sementsov-Ogievskiy 
3793860c020SVladimir Sementsov-Ogievskiy         if (!QLIST_EMPTY(&bs->parents)) {
380137b4d4bSVladimir Sementsov-Ogievskiy             /*
381137b4d4bSVladimir Sementsov-Ogievskiy              * Note, that source child may be shared with backup job. Backup job
382137b4d4bSVladimir Sementsov-Ogievskiy              * does create own blk parent on copy-before-write node, so this
383137b4d4bSVladimir Sementsov-Ogievskiy              * works even if source node does not have any parents before backup
384137b4d4bSVladimir Sementsov-Ogievskiy              * start
385137b4d4bSVladimir Sementsov-Ogievskiy              */
386d003e0aeSVladimir Sementsov-Ogievskiy             *nperm = *nperm | BLK_PERM_CONSISTENT_READ;
387*0fd05c8dSVladimir Sementsov-Ogievskiy             if (s->discard_source) {
388*0fd05c8dSVladimir Sementsov-Ogievskiy                 *nperm = *nperm | BLK_PERM_WRITE;
389*0fd05c8dSVladimir Sementsov-Ogievskiy             }
390*0fd05c8dSVladimir Sementsov-Ogievskiy 
391d003e0aeSVladimir Sementsov-Ogievskiy             *nshared &= ~(BLK_PERM_WRITE | BLK_PERM_RESIZE);
392d003e0aeSVladimir Sementsov-Ogievskiy         }
393d003e0aeSVladimir Sementsov-Ogievskiy     }
3943860c020SVladimir Sementsov-Ogievskiy }
395d003e0aeSVladimir Sementsov-Ogievskiy 
39679ef0cebSVladimir Sementsov-Ogievskiy static BlockdevOptions *cbw_parse_options(QDict *options, Error **errp)
3975f3a3cd7SVladimir Sementsov-Ogievskiy {
39879ef0cebSVladimir Sementsov-Ogievskiy     BlockdevOptions *opts = NULL;
3995f3a3cd7SVladimir Sementsov-Ogievskiy     Visitor *v = NULL;
4005f3a3cd7SVladimir Sementsov-Ogievskiy 
40179ef0cebSVladimir Sementsov-Ogievskiy     qdict_put_str(options, "driver", "copy-before-write");
4025f3a3cd7SVladimir Sementsov-Ogievskiy 
40379ef0cebSVladimir Sementsov-Ogievskiy     v = qobject_input_visitor_new_flat_confused(options, errp);
4045f3a3cd7SVladimir Sementsov-Ogievskiy     if (!v) {
4055f3a3cd7SVladimir Sementsov-Ogievskiy         goto out;
4065f3a3cd7SVladimir Sementsov-Ogievskiy     }
4075f3a3cd7SVladimir Sementsov-Ogievskiy 
40879ef0cebSVladimir Sementsov-Ogievskiy     visit_type_BlockdevOptions(v, NULL, &opts, errp);
40979ef0cebSVladimir Sementsov-Ogievskiy     if (!opts) {
4105f3a3cd7SVladimir Sementsov-Ogievskiy         goto out;
4115f3a3cd7SVladimir Sementsov-Ogievskiy     }
4125f3a3cd7SVladimir Sementsov-Ogievskiy 
41379ef0cebSVladimir Sementsov-Ogievskiy     /*
41479ef0cebSVladimir Sementsov-Ogievskiy      * Delete options which we are going to parse through BlockdevOptions
41579ef0cebSVladimir Sementsov-Ogievskiy      * object for original options.
41679ef0cebSVladimir Sementsov-Ogievskiy      */
41779ef0cebSVladimir Sementsov-Ogievskiy     qdict_extract_subqdict(options, NULL, "bitmap");
418f1bb39a8SVladimir Sementsov-Ogievskiy     qdict_del(options, "on-cbw-error");
4196db7fd1cSVladimir Sementsov-Ogievskiy     qdict_del(options, "cbw-timeout");
4205f3a3cd7SVladimir Sementsov-Ogievskiy 
4215f3a3cd7SVladimir Sementsov-Ogievskiy out:
4225f3a3cd7SVladimir Sementsov-Ogievskiy     visit_free(v);
42379ef0cebSVladimir Sementsov-Ogievskiy     qdict_del(options, "driver");
4245f3a3cd7SVladimir Sementsov-Ogievskiy 
42579ef0cebSVladimir Sementsov-Ogievskiy     return opts;
4265f3a3cd7SVladimir Sementsov-Ogievskiy }
4275f3a3cd7SVladimir Sementsov-Ogievskiy 
428751cec7aSVladimir Sementsov-Ogievskiy static int cbw_open(BlockDriverState *bs, QDict *options, int flags,
429751cec7aSVladimir Sementsov-Ogievskiy                     Error **errp)
4301f0cacb9SVladimir Sementsov-Ogievskiy {
431c79eabc5SZhao Liu     ERRP_GUARD();
432fe7ea40cSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
4335f3a3cd7SVladimir Sementsov-Ogievskiy     BdrvDirtyBitmap *bitmap = NULL;
434af5bcd77SVladimir Sementsov-Ogievskiy     int64_t cluster_size;
43579ef0cebSVladimir Sementsov-Ogievskiy     g_autoptr(BlockdevOptions) full_opts = NULL;
43679ef0cebSVladimir Sementsov-Ogievskiy     BlockdevOptionsCbw *opts;
43783930780SVladimir Sementsov-Ogievskiy     int ret;
43879ef0cebSVladimir Sementsov-Ogievskiy 
43979ef0cebSVladimir Sementsov-Ogievskiy     full_opts = cbw_parse_options(options, errp);
44079ef0cebSVladimir Sementsov-Ogievskiy     if (!full_opts) {
44179ef0cebSVladimir Sementsov-Ogievskiy         return -EINVAL;
44279ef0cebSVladimir Sementsov-Ogievskiy     }
44379ef0cebSVladimir Sementsov-Ogievskiy     assert(full_opts->driver == BLOCKDEV_DRIVER_COPY_BEFORE_WRITE);
44479ef0cebSVladimir Sementsov-Ogievskiy     opts = &full_opts->u.copy_before_write;
4451f0cacb9SVladimir Sementsov-Ogievskiy 
44683930780SVladimir Sementsov-Ogievskiy     ret = bdrv_open_file_child(NULL, options, "file", bs, errp);
44783930780SVladimir Sementsov-Ogievskiy     if (ret < 0) {
44883930780SVladimir Sementsov-Ogievskiy         return ret;
4491f0cacb9SVladimir Sementsov-Ogievskiy     }
4501f0cacb9SVladimir Sementsov-Ogievskiy 
451f44fd739SVladimir Sementsov-Ogievskiy     s->target = bdrv_open_child(NULL, options, "target", bs, &child_of_bds,
452f44fd739SVladimir Sementsov-Ogievskiy                                 BDRV_CHILD_DATA, false, errp);
453f44fd739SVladimir Sementsov-Ogievskiy     if (!s->target) {
4541f0cacb9SVladimir Sementsov-Ogievskiy         return -EINVAL;
4551f0cacb9SVladimir Sementsov-Ogievskiy     }
4561f0cacb9SVladimir Sementsov-Ogievskiy 
457a4b740dbSKevin Wolf     GRAPH_RDLOCK_GUARD_MAINLOOP();
458a4b740dbSKevin Wolf 
45954fde4ffSMarkus Armbruster     if (opts->bitmap) {
46079ef0cebSVladimir Sementsov-Ogievskiy         bitmap = block_dirty_bitmap_lookup(opts->bitmap->node,
46179ef0cebSVladimir Sementsov-Ogievskiy                                            opts->bitmap->name, NULL, errp);
46279ef0cebSVladimir Sementsov-Ogievskiy         if (!bitmap) {
463b49f4755SStefan Hajnoczi             return -EINVAL;
4645f3a3cd7SVladimir Sementsov-Ogievskiy         }
46579ef0cebSVladimir Sementsov-Ogievskiy     }
466f1bb39a8SVladimir Sementsov-Ogievskiy     s->on_cbw_error = opts->has_on_cbw_error ? opts->on_cbw_error :
467f1bb39a8SVladimir Sementsov-Ogievskiy             ON_CBW_ERROR_BREAK_GUEST_WRITE;
4686db7fd1cSVladimir Sementsov-Ogievskiy     s->cbw_timeout_ns = opts->has_cbw_timeout ?
4696db7fd1cSVladimir Sementsov-Ogievskiy         opts->cbw_timeout * NANOSECONDS_PER_SECOND : 0;
4705f3a3cd7SVladimir Sementsov-Ogievskiy 
4715a507426SVladimir Sementsov-Ogievskiy     bs->total_sectors = bs->file->bs->total_sectors;
4725a507426SVladimir Sementsov-Ogievskiy     bs->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED |
4735a507426SVladimir Sementsov-Ogievskiy             (BDRV_REQ_FUA & bs->file->bs->supported_write_flags);
4745a507426SVladimir Sementsov-Ogievskiy     bs->supported_zero_flags = BDRV_REQ_WRITE_UNCHANGED |
4755a507426SVladimir Sementsov-Ogievskiy             ((BDRV_REQ_FUA | BDRV_REQ_MAY_UNMAP | BDRV_REQ_NO_FALLBACK) &
4765a507426SVladimir Sementsov-Ogievskiy              bs->file->bs->supported_zero_flags);
4775a507426SVladimir Sementsov-Ogievskiy 
478*0fd05c8dSVladimir Sementsov-Ogievskiy     s->discard_source = flags & BDRV_O_CBW_DISCARD_SOURCE;
479*0fd05c8dSVladimir Sementsov-Ogievskiy     s->bcs = block_copy_state_new(bs->file, s->target, bs, bitmap,
480*0fd05c8dSVladimir Sementsov-Ogievskiy                                   flags & BDRV_O_CBW_DISCARD_SOURCE, errp);
481fe7ea40cSVladimir Sementsov-Ogievskiy     if (!s->bcs) {
4821f0cacb9SVladimir Sementsov-Ogievskiy         error_prepend(errp, "Cannot create block-copy-state: ");
483b49f4755SStefan Hajnoczi         return -EINVAL;
4841f0cacb9SVladimir Sementsov-Ogievskiy     }
4851f0cacb9SVladimir Sementsov-Ogievskiy 
486af5bcd77SVladimir Sementsov-Ogievskiy     cluster_size = block_copy_cluster_size(s->bcs);
487af5bcd77SVladimir Sementsov-Ogievskiy 
488af5bcd77SVladimir Sementsov-Ogievskiy     s->done_bitmap = bdrv_create_dirty_bitmap(bs, cluster_size, NULL, errp);
489af5bcd77SVladimir Sementsov-Ogievskiy     if (!s->done_bitmap) {
490b49f4755SStefan Hajnoczi         return -EINVAL;
491af5bcd77SVladimir Sementsov-Ogievskiy     }
492af5bcd77SVladimir Sementsov-Ogievskiy     bdrv_disable_dirty_bitmap(s->done_bitmap);
493af5bcd77SVladimir Sementsov-Ogievskiy 
494af5bcd77SVladimir Sementsov-Ogievskiy     /* s->access_bitmap starts equal to bcs bitmap */
495af5bcd77SVladimir Sementsov-Ogievskiy     s->access_bitmap = bdrv_create_dirty_bitmap(bs, cluster_size, NULL, errp);
496af5bcd77SVladimir Sementsov-Ogievskiy     if (!s->access_bitmap) {
497b49f4755SStefan Hajnoczi         return -EINVAL;
498af5bcd77SVladimir Sementsov-Ogievskiy     }
499af5bcd77SVladimir Sementsov-Ogievskiy     bdrv_disable_dirty_bitmap(s->access_bitmap);
500af5bcd77SVladimir Sementsov-Ogievskiy     bdrv_dirty_bitmap_merge_internal(s->access_bitmap,
501af5bcd77SVladimir Sementsov-Ogievskiy                                      block_copy_dirty_bitmap(s->bcs), NULL,
502af5bcd77SVladimir Sementsov-Ogievskiy                                      true);
503af5bcd77SVladimir Sementsov-Ogievskiy 
504af5bcd77SVladimir Sementsov-Ogievskiy     qemu_co_mutex_init(&s->lock);
505af5bcd77SVladimir Sementsov-Ogievskiy     QLIST_INIT(&s->frozen_read_reqs);
506b49f4755SStefan Hajnoczi     return 0;
5071f0cacb9SVladimir Sementsov-Ogievskiy }
5081f0cacb9SVladimir Sementsov-Ogievskiy 
509751cec7aSVladimir Sementsov-Ogievskiy static void cbw_close(BlockDriverState *bs)
510751cec7aSVladimir Sementsov-Ogievskiy {
511751cec7aSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *s = bs->opaque;
512751cec7aSVladimir Sementsov-Ogievskiy 
513af5bcd77SVladimir Sementsov-Ogievskiy     bdrv_release_dirty_bitmap(s->access_bitmap);
514af5bcd77SVladimir Sementsov-Ogievskiy     bdrv_release_dirty_bitmap(s->done_bitmap);
515af5bcd77SVladimir Sementsov-Ogievskiy 
516751cec7aSVladimir Sementsov-Ogievskiy     block_copy_state_free(s->bcs);
517751cec7aSVladimir Sementsov-Ogievskiy     s->bcs = NULL;
518751cec7aSVladimir Sementsov-Ogievskiy }
519751cec7aSVladimir Sementsov-Ogievskiy 
5209ea473fbSKevin Wolf static BlockDriver bdrv_cbw_filter = {
521d003e0aeSVladimir Sementsov-Ogievskiy     .format_name = "copy-before-write",
522d003e0aeSVladimir Sementsov-Ogievskiy     .instance_size = sizeof(BDRVCopyBeforeWriteState),
523d003e0aeSVladimir Sementsov-Ogievskiy 
524751cec7aSVladimir Sementsov-Ogievskiy     .bdrv_open                  = cbw_open,
525751cec7aSVladimir Sementsov-Ogievskiy     .bdrv_close                 = cbw_close,
526751cec7aSVladimir Sementsov-Ogievskiy 
527d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_preadv             = cbw_co_preadv,
528d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_pwritev            = cbw_co_pwritev,
529d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_pwrite_zeroes      = cbw_co_pwrite_zeroes,
530d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_pdiscard           = cbw_co_pdiscard,
531d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_co_flush              = cbw_co_flush,
532d003e0aeSVladimir Sementsov-Ogievskiy 
533af5bcd77SVladimir Sementsov-Ogievskiy     .bdrv_co_preadv_snapshot       = cbw_co_preadv_snapshot,
534af5bcd77SVladimir Sementsov-Ogievskiy     .bdrv_co_pdiscard_snapshot     = cbw_co_pdiscard_snapshot,
535af5bcd77SVladimir Sementsov-Ogievskiy     .bdrv_co_snapshot_block_status = cbw_co_snapshot_block_status,
536af5bcd77SVladimir Sementsov-Ogievskiy 
537d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_refresh_filename      = cbw_refresh_filename,
538d003e0aeSVladimir Sementsov-Ogievskiy 
539d003e0aeSVladimir Sementsov-Ogievskiy     .bdrv_child_perm            = cbw_child_perm,
540d003e0aeSVladimir Sementsov-Ogievskiy 
541d003e0aeSVladimir Sementsov-Ogievskiy     .is_filter = true,
542d003e0aeSVladimir Sementsov-Ogievskiy };
543d003e0aeSVladimir Sementsov-Ogievskiy 
544d003e0aeSVladimir Sementsov-Ogievskiy BlockDriverState *bdrv_cbw_append(BlockDriverState *source,
545d003e0aeSVladimir Sementsov-Ogievskiy                                   BlockDriverState *target,
546d003e0aeSVladimir Sementsov-Ogievskiy                                   const char *filter_node_name,
547*0fd05c8dSVladimir Sementsov-Ogievskiy                                   bool discard_source,
548d003e0aeSVladimir Sementsov-Ogievskiy                                   BlockCopyState **bcs,
549d003e0aeSVladimir Sementsov-Ogievskiy                                   Error **errp)
550d003e0aeSVladimir Sementsov-Ogievskiy {
551d003e0aeSVladimir Sementsov-Ogievskiy     BDRVCopyBeforeWriteState *state;
552d003e0aeSVladimir Sementsov-Ogievskiy     BlockDriverState *top;
553f44fd739SVladimir Sementsov-Ogievskiy     QDict *opts;
554*0fd05c8dSVladimir Sementsov-Ogievskiy     int flags = BDRV_O_RDWR | (discard_source ? BDRV_O_CBW_DISCARD_SOURCE : 0);
555d003e0aeSVladimir Sementsov-Ogievskiy 
556d003e0aeSVladimir Sementsov-Ogievskiy     assert(source->total_sectors == target->total_sectors);
557377cc15bSEmanuele Giuseppe Esposito     GLOBAL_STATE_CODE();
558d003e0aeSVladimir Sementsov-Ogievskiy 
559f44fd739SVladimir Sementsov-Ogievskiy     opts = qdict_new();
560751cec7aSVladimir Sementsov-Ogievskiy     qdict_put_str(opts, "driver", "copy-before-write");
561751cec7aSVladimir Sementsov-Ogievskiy     if (filter_node_name) {
562751cec7aSVladimir Sementsov-Ogievskiy         qdict_put_str(opts, "node-name", filter_node_name);
563751cec7aSVladimir Sementsov-Ogievskiy     }
564f44fd739SVladimir Sementsov-Ogievskiy     qdict_put_str(opts, "file", bdrv_get_node_name(source));
565f44fd739SVladimir Sementsov-Ogievskiy     qdict_put_str(opts, "target", bdrv_get_node_name(target));
566f44fd739SVladimir Sementsov-Ogievskiy 
567*0fd05c8dSVladimir Sementsov-Ogievskiy     top = bdrv_insert_node(source, opts, flags, errp);
568751cec7aSVladimir Sementsov-Ogievskiy     if (!top) {
569751cec7aSVladimir Sementsov-Ogievskiy         return NULL;
570d003e0aeSVladimir Sementsov-Ogievskiy     }
571d003e0aeSVladimir Sementsov-Ogievskiy 
572751cec7aSVladimir Sementsov-Ogievskiy     state = top->opaque;
5737ddbce2dSVladimir Sementsov-Ogievskiy     *bcs = state->bcs;
574d003e0aeSVladimir Sementsov-Ogievskiy 
575d003e0aeSVladimir Sementsov-Ogievskiy     return top;
576d003e0aeSVladimir Sementsov-Ogievskiy }
577d003e0aeSVladimir Sementsov-Ogievskiy 
578d003e0aeSVladimir Sementsov-Ogievskiy void bdrv_cbw_drop(BlockDriverState *bs)
579d003e0aeSVladimir Sementsov-Ogievskiy {
580377cc15bSEmanuele Giuseppe Esposito     GLOBAL_STATE_CODE();
581d003e0aeSVladimir Sementsov-Ogievskiy     bdrv_drop_filter(bs, &error_abort);
582d003e0aeSVladimir Sementsov-Ogievskiy     bdrv_unref(bs);
583d003e0aeSVladimir Sementsov-Ogievskiy }
584751cec7aSVladimir Sementsov-Ogievskiy 
585751cec7aSVladimir Sementsov-Ogievskiy static void cbw_init(void)
586751cec7aSVladimir Sementsov-Ogievskiy {
587751cec7aSVladimir Sementsov-Ogievskiy     bdrv_register(&bdrv_cbw_filter);
588751cec7aSVladimir Sementsov-Ogievskiy }
589751cec7aSVladimir Sementsov-Ogievskiy 
590751cec7aSVladimir Sementsov-Ogievskiy block_init(cbw_init);
591