xref: /openbmc/qemu/block.c (revision 76b223200ef4fb09dd87f0e213159795eb68e7a5)
1fc01f7e7Sbellard /*
2fc01f7e7Sbellard  * QEMU System Emulator block driver
3fc01f7e7Sbellard  *
4fc01f7e7Sbellard  * Copyright (c) 2003 Fabrice Bellard
5fc01f7e7Sbellard  *
6fc01f7e7Sbellard  * Permission is hereby granted, free of charge, to any person obtaining a copy
7fc01f7e7Sbellard  * of this software and associated documentation files (the "Software"), to deal
8fc01f7e7Sbellard  * in the Software without restriction, including without limitation the rights
9fc01f7e7Sbellard  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10fc01f7e7Sbellard  * copies of the Software, and to permit persons to whom the Software is
11fc01f7e7Sbellard  * furnished to do so, subject to the following conditions:
12fc01f7e7Sbellard  *
13fc01f7e7Sbellard  * The above copyright notice and this permission notice shall be included in
14fc01f7e7Sbellard  * all copies or substantial portions of the Software.
15fc01f7e7Sbellard  *
16fc01f7e7Sbellard  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17fc01f7e7Sbellard  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18fc01f7e7Sbellard  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19fc01f7e7Sbellard  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20fc01f7e7Sbellard  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21fc01f7e7Sbellard  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22fc01f7e7Sbellard  * THE SOFTWARE.
23fc01f7e7Sbellard  */
24d38ea87aSPeter Maydell #include "qemu/osdep.h"
256d519a5fSStefan Hajnoczi #include "trace.h"
26737e150eSPaolo Bonzini #include "block/block_int.h"
27737e150eSPaolo Bonzini #include "block/blockjob.h"
28d49b6836SMarkus Armbruster #include "qemu/error-report.h"
291de7afc9SPaolo Bonzini #include "qemu/module.h"
30cc7a8ea7SMarkus Armbruster #include "qapi/qmp/qerror.h"
3191a097e7SKevin Wolf #include "qapi/qmp/qbool.h"
327b1b5d19SPaolo Bonzini #include "qapi/qmp/qjson.h"
33bfb197e0SMarkus Armbruster #include "sysemu/block-backend.h"
349c17d615SPaolo Bonzini #include "sysemu/sysemu.h"
351de7afc9SPaolo Bonzini #include "qemu/notify.h"
3610817bf0SDaniel P. Berrange #include "qemu/coroutine.h"
37c13163fbSBenoît Canet #include "block/qapi.h"
38b2023818SLuiz Capitulino #include "qmp-commands.h"
391de7afc9SPaolo Bonzini #include "qemu/timer.h"
40a5ee7bd4SWenchao Xia #include "qapi-event.h"
41db628338SAlberto Garcia #include "block/throttle-groups.h"
42f348b6d1SVeronia Bahaa #include "qemu/cutils.h"
43f348b6d1SVeronia Bahaa #include "qemu/id.h"
44fc01f7e7Sbellard 
4571e72a19SJuan Quintela #ifdef CONFIG_BSD
467674e7bfSbellard #include <sys/ioctl.h>
4772cf2d4fSBlue Swirl #include <sys/queue.h>
48c5e97233Sblueswir1 #ifndef __DragonFly__
497674e7bfSbellard #include <sys/disk.h>
507674e7bfSbellard #endif
51c5e97233Sblueswir1 #endif
527674e7bfSbellard 
5349dc768dSaliguori #ifdef _WIN32
5449dc768dSaliguori #include <windows.h>
5549dc768dSaliguori #endif
5649dc768dSaliguori 
571c9805a3SStefan Hajnoczi #define NOT_DONE 0x7fffffff /* used while emulated sync operation in progress */
581c9805a3SStefan Hajnoczi 
59dc364f4cSBenoît Canet static QTAILQ_HEAD(, BlockDriverState) graph_bdrv_states =
60dc364f4cSBenoît Canet     QTAILQ_HEAD_INITIALIZER(graph_bdrv_states);
61dc364f4cSBenoît Canet 
622c1d04e0SMax Reitz static QTAILQ_HEAD(, BlockDriverState) all_bdrv_states =
632c1d04e0SMax Reitz     QTAILQ_HEAD_INITIALIZER(all_bdrv_states);
642c1d04e0SMax Reitz 
658a22f02aSStefan Hajnoczi static QLIST_HEAD(, BlockDriver) bdrv_drivers =
668a22f02aSStefan Hajnoczi     QLIST_HEAD_INITIALIZER(bdrv_drivers);
67ea2384d3Sbellard 
68f3930ed0SKevin Wolf static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
69f3930ed0SKevin Wolf                              const char *reference, QDict *options, int flags,
70f3930ed0SKevin Wolf                              BlockDriverState *parent,
71ce343771SMax Reitz                              const BdrvChildRole *child_role, Error **errp);
72f3930ed0SKevin Wolf 
73eb852011SMarkus Armbruster /* If non-zero, use only whitelisted block drivers */
74eb852011SMarkus Armbruster static int use_bdrv_whitelist;
75eb852011SMarkus Armbruster 
7664dff520SMax Reitz static void bdrv_close(BlockDriverState *bs);
7764dff520SMax Reitz 
789e0b22f4SStefan Hajnoczi #ifdef _WIN32
/*
 * Return 1 if @filename starts with an ASCII letter immediately followed
 * by ':' (for example "c:"), 0 otherwise.
 */
static int is_windows_drive_prefix(const char *filename)
{
    const char first = filename[0];
    const int is_letter = (first >= 'a' && first <= 'z') ||
                          (first >= 'A' && first <= 'Z');

    /* Only look at the second character once the first one matched, so an
     * empty string is never read past its terminator */
    if (!is_letter) {
        return 0;
    }
    return filename[1] == ':';
}
859e0b22f4SStefan Hajnoczi 
869e0b22f4SStefan Hajnoczi int is_windows_drive(const char *filename)
879e0b22f4SStefan Hajnoczi {
889e0b22f4SStefan Hajnoczi     if (is_windows_drive_prefix(filename) &&
899e0b22f4SStefan Hajnoczi         filename[2] == '\0')
909e0b22f4SStefan Hajnoczi         return 1;
919e0b22f4SStefan Hajnoczi     if (strstart(filename, "\\\\.\\", NULL) ||
929e0b22f4SStefan Hajnoczi         strstart(filename, "//./", NULL))
939e0b22f4SStefan Hajnoczi         return 1;
949e0b22f4SStefan Hajnoczi     return 0;
959e0b22f4SStefan Hajnoczi }
969e0b22f4SStefan Hajnoczi #endif
979e0b22f4SStefan Hajnoczi 
98339064d5SKevin Wolf size_t bdrv_opt_mem_align(BlockDriverState *bs)
99339064d5SKevin Wolf {
100339064d5SKevin Wolf     if (!bs || !bs->drv) {
101459b4e66SDenis V. Lunev         /* page size or 4k (hdd sector size) should be on the safe side */
102459b4e66SDenis V. Lunev         return MAX(4096, getpagesize());
103339064d5SKevin Wolf     }
104339064d5SKevin Wolf 
105339064d5SKevin Wolf     return bs->bl.opt_mem_alignment;
106339064d5SKevin Wolf }
107339064d5SKevin Wolf 
1084196d2f0SDenis V. Lunev size_t bdrv_min_mem_align(BlockDriverState *bs)
1094196d2f0SDenis V. Lunev {
1104196d2f0SDenis V. Lunev     if (!bs || !bs->drv) {
111459b4e66SDenis V. Lunev         /* page size or 4k (hdd sector size) should be on the safe side */
112459b4e66SDenis V. Lunev         return MAX(4096, getpagesize());
1134196d2f0SDenis V. Lunev     }
1144196d2f0SDenis V. Lunev 
1154196d2f0SDenis V. Lunev     return bs->bl.min_mem_alignment;
1164196d2f0SDenis V. Lunev }
1174196d2f0SDenis V. Lunev 
/*
 * Check whether @path starts with "<protocol>:".
 *
 * The path counts as having a protocol when the first separator character
 * found in it is ':' (rather than '/', or also '\' on Windows).  On
 * Windows, drive specifications are never treated as protocols.
 *
 * Returns 1 if a protocol prefix is present, 0 otherwise.
 */
int path_has_protocol(const char *path)
{
#ifdef _WIN32
    static const char separators[] = ":/\\";

    if (is_windows_drive(path) ||
        is_windows_drive_prefix(path)) {
        return 0;
    }
#else
    static const char separators[] = ":/";
#endif

    /* Index of the first separator, or of the terminating NUL if none */
    return path[strcspn(path, separators)] == ':';
}
1359e0b22f4SStefan Hajnoczi 
/*
 * Return 1 if @path is absolute, 0 otherwise.
 *
 * A path is absolute when it starts with '/'.  On Windows a leading '\',
 * a drive prefix ("X:") or anything accepted by is_windows_drive() also
 * counts as absolute.
 */
int path_is_absolute(const char *path)
{
    const char lead = path[0];

#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 1;
    }
    return (lead == '/' || lead == '\\');
#else
    return (lead == '/');
#endif
}
14883f64091Sbellard 
/*
 * Build the path of @filename relative to @base_path in @dest.
 *
 * If @filename is absolute it is copied to @dest unchanged.  Otherwise the
 * directory part of @base_path (everything up to and including the last
 * path separator, or the "<protocol>:" prefix if there is no separator
 * after it) is copied and @filename is appended.  URLs are supported.
 *
 * @dest       output buffer; always NUL-terminated when @dest_size > 0
 * @dest_size  size of @dest in bytes; nothing is written if it is <= 0
 * @base_path  path the relative @filename is resolved against
 * @filename   absolute or relative file name
 *
 * The result is silently truncated to fit @dest_size.
 */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *prefix_end, *dir_end;
    int len;

    if (dest_size <= 0) {
        return;
    }
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    /*
     * Only skip past a ':' when it really terminates a protocol prefix.
     * A ':' that merely appears inside a file name (e.g. "dir/a:b") must
     * not be kept as part of the directory.
     */
    prefix_end = base_path;
    if (path_has_protocol(base_path)) {
        /* path_has_protocol() guarantees that a ':' is present */
        prefix_end = strchr(base_path, ':') + 1;
    }
#ifdef _WIN32
    else if (is_windows_drive_prefix(base_path)) {
        /* keep the "X:" of a drive-relative base path */
        prefix_end = base_path + 2;
    }
#endif

    /* Find the character following the last path separator, if any */
    dir_end = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *backslash = strrchr(base_path, '\\');

        if (backslash && (!dir_end || backslash > dir_end)) {
            dir_end = backslash;
        }
    }
#endif
    if (dir_end) {
        dir_end++;
    } else {
        dir_end = base_path;
    }

    /* Keep whichever of the two prefixes reaches further into base_path */
    if (dir_end < prefix_end) {
        dir_end = prefix_end;
    }

    len = dir_end - base_path;
    if (len > dest_size - 1) {
        len = dest_size - 1;
    }
    memcpy(dest, base_path, len);
    dest[len] = '\0';
    pstrcat(dest, dest_size, filename);
}
19283f64091Sbellard 
1930a82855aSMax Reitz void bdrv_get_full_backing_filename_from_filename(const char *backed,
1940a82855aSMax Reitz                                                   const char *backing,
1959f07429eSMax Reitz                                                   char *dest, size_t sz,
1969f07429eSMax Reitz                                                   Error **errp)
1970a82855aSMax Reitz {
1989f07429eSMax Reitz     if (backing[0] == '\0' || path_has_protocol(backing) ||
1999f07429eSMax Reitz         path_is_absolute(backing))
2009f07429eSMax Reitz     {
2010a82855aSMax Reitz         pstrcpy(dest, sz, backing);
2029f07429eSMax Reitz     } else if (backed[0] == '\0' || strstart(backed, "json:", NULL)) {
2039f07429eSMax Reitz         error_setg(errp, "Cannot use relative backing file names for '%s'",
2049f07429eSMax Reitz                    backed);
2050a82855aSMax Reitz     } else {
2060a82855aSMax Reitz         path_combine(dest, sz, backed, backing);
2070a82855aSMax Reitz     }
2080a82855aSMax Reitz }
2090a82855aSMax Reitz 
2109f07429eSMax Reitz void bdrv_get_full_backing_filename(BlockDriverState *bs, char *dest, size_t sz,
2119f07429eSMax Reitz                                     Error **errp)
212dc5a1371SPaolo Bonzini {
2139f07429eSMax Reitz     char *backed = bs->exact_filename[0] ? bs->exact_filename : bs->filename;
2149f07429eSMax Reitz 
2159f07429eSMax Reitz     bdrv_get_full_backing_filename_from_filename(backed, bs->backing_file,
2169f07429eSMax Reitz                                                  dest, sz, errp);
217dc5a1371SPaolo Bonzini }
218dc5a1371SPaolo Bonzini 
2190eb7217eSStefan Hajnoczi void bdrv_register(BlockDriver *bdrv)
2200eb7217eSStefan Hajnoczi {
2210eb7217eSStefan Hajnoczi     bdrv_setup_io_funcs(bdrv);
222b2e12bc6SChristoph Hellwig 
2238a22f02aSStefan Hajnoczi     QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list);
224ea2384d3Sbellard }
225b338082bSbellard 
2267f06d47eSMarkus Armbruster BlockDriverState *bdrv_new_root(void)
227fc01f7e7Sbellard {
2289aaf28c6SMax Reitz     return bdrv_new();
229e4e9986bSMarkus Armbruster }
230e4e9986bSMarkus Armbruster 
231e4e9986bSMarkus Armbruster BlockDriverState *bdrv_new(void)
232e4e9986bSMarkus Armbruster {
233e4e9986bSMarkus Armbruster     BlockDriverState *bs;
234e4e9986bSMarkus Armbruster     int i;
235e4e9986bSMarkus Armbruster 
2365839e53bSMarkus Armbruster     bs = g_new0(BlockDriverState, 1);
237e4654d2dSFam Zheng     QLIST_INIT(&bs->dirty_bitmaps);
238fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
239fbe40ff7SFam Zheng         QLIST_INIT(&bs->op_blockers[i]);
240fbe40ff7SFam Zheng     }
241d616b224SStefan Hajnoczi     notifier_with_return_list_init(&bs->before_write_notifiers);
242cc0681c4SBenoît Canet     qemu_co_queue_init(&bs->throttled_reqs[0]);
243cc0681c4SBenoît Canet     qemu_co_queue_init(&bs->throttled_reqs[1]);
2449fcb0251SFam Zheng     bs->refcnt = 1;
245dcd04228SStefan Hajnoczi     bs->aio_context = qemu_get_aio_context();
246d7d512f6SPaolo Bonzini 
2472c1d04e0SMax Reitz     QTAILQ_INSERT_TAIL(&all_bdrv_states, bs, bs_list);
2482c1d04e0SMax Reitz 
249b338082bSbellard     return bs;
250b338082bSbellard }
251b338082bSbellard 
252ea2384d3Sbellard BlockDriver *bdrv_find_format(const char *format_name)
253ea2384d3Sbellard {
254ea2384d3Sbellard     BlockDriver *drv1;
2558a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
2568a22f02aSStefan Hajnoczi         if (!strcmp(drv1->format_name, format_name)) {
257ea2384d3Sbellard             return drv1;
258ea2384d3Sbellard         }
2598a22f02aSStefan Hajnoczi     }
260ea2384d3Sbellard     return NULL;
261ea2384d3Sbellard }
262ea2384d3Sbellard 
263b64ec4e4SFam Zheng static int bdrv_is_whitelisted(BlockDriver *drv, bool read_only)
264eb852011SMarkus Armbruster {
265b64ec4e4SFam Zheng     static const char *whitelist_rw[] = {
266b64ec4e4SFam Zheng         CONFIG_BDRV_RW_WHITELIST
267b64ec4e4SFam Zheng     };
268b64ec4e4SFam Zheng     static const char *whitelist_ro[] = {
269b64ec4e4SFam Zheng         CONFIG_BDRV_RO_WHITELIST
270eb852011SMarkus Armbruster     };
271eb852011SMarkus Armbruster     const char **p;
272eb852011SMarkus Armbruster 
273b64ec4e4SFam Zheng     if (!whitelist_rw[0] && !whitelist_ro[0]) {
274eb852011SMarkus Armbruster         return 1;               /* no whitelist, anything goes */
275b64ec4e4SFam Zheng     }
276eb852011SMarkus Armbruster 
277b64ec4e4SFam Zheng     for (p = whitelist_rw; *p; p++) {
278eb852011SMarkus Armbruster         if (!strcmp(drv->format_name, *p)) {
279eb852011SMarkus Armbruster             return 1;
280eb852011SMarkus Armbruster         }
281eb852011SMarkus Armbruster     }
282b64ec4e4SFam Zheng     if (read_only) {
283b64ec4e4SFam Zheng         for (p = whitelist_ro; *p; p++) {
284b64ec4e4SFam Zheng             if (!strcmp(drv->format_name, *p)) {
285b64ec4e4SFam Zheng                 return 1;
286b64ec4e4SFam Zheng             }
287b64ec4e4SFam Zheng         }
288b64ec4e4SFam Zheng     }
289eb852011SMarkus Armbruster     return 0;
290eb852011SMarkus Armbruster }
291eb852011SMarkus Armbruster 
292e6ff69bfSDaniel P. Berrange bool bdrv_uses_whitelist(void)
293e6ff69bfSDaniel P. Berrange {
294e6ff69bfSDaniel P. Berrange     return use_bdrv_whitelist;
295e6ff69bfSDaniel P. Berrange }
296e6ff69bfSDaniel P. Berrange 
2975b7e1542SZhi Yong Wu typedef struct CreateCo {
2985b7e1542SZhi Yong Wu     BlockDriver *drv;
2995b7e1542SZhi Yong Wu     char *filename;
30083d0521aSChunyan Liu     QemuOpts *opts;
3015b7e1542SZhi Yong Wu     int ret;
302cc84d90fSMax Reitz     Error *err;
3035b7e1542SZhi Yong Wu } CreateCo;
3045b7e1542SZhi Yong Wu 
3055b7e1542SZhi Yong Wu static void coroutine_fn bdrv_create_co_entry(void *opaque)
3065b7e1542SZhi Yong Wu {
307cc84d90fSMax Reitz     Error *local_err = NULL;
308cc84d90fSMax Reitz     int ret;
309cc84d90fSMax Reitz 
3105b7e1542SZhi Yong Wu     CreateCo *cco = opaque;
3115b7e1542SZhi Yong Wu     assert(cco->drv);
3125b7e1542SZhi Yong Wu 
313c282e1fdSChunyan Liu     ret = cco->drv->bdrv_create(cco->filename, cco->opts, &local_err);
31484d18f06SMarkus Armbruster     if (local_err) {
315cc84d90fSMax Reitz         error_propagate(&cco->err, local_err);
316cc84d90fSMax Reitz     }
317cc84d90fSMax Reitz     cco->ret = ret;
3185b7e1542SZhi Yong Wu }
3195b7e1542SZhi Yong Wu 
3200e7e1989SKevin Wolf int bdrv_create(BlockDriver *drv, const char* filename,
32183d0521aSChunyan Liu                 QemuOpts *opts, Error **errp)
322ea2384d3Sbellard {
3235b7e1542SZhi Yong Wu     int ret;
3240e7e1989SKevin Wolf 
3255b7e1542SZhi Yong Wu     Coroutine *co;
3265b7e1542SZhi Yong Wu     CreateCo cco = {
3275b7e1542SZhi Yong Wu         .drv = drv,
3285b7e1542SZhi Yong Wu         .filename = g_strdup(filename),
32983d0521aSChunyan Liu         .opts = opts,
3305b7e1542SZhi Yong Wu         .ret = NOT_DONE,
331cc84d90fSMax Reitz         .err = NULL,
3325b7e1542SZhi Yong Wu     };
3335b7e1542SZhi Yong Wu 
334c282e1fdSChunyan Liu     if (!drv->bdrv_create) {
335cc84d90fSMax Reitz         error_setg(errp, "Driver '%s' does not support image creation", drv->format_name);
33680168bffSLuiz Capitulino         ret = -ENOTSUP;
33780168bffSLuiz Capitulino         goto out;
3385b7e1542SZhi Yong Wu     }
3395b7e1542SZhi Yong Wu 
3405b7e1542SZhi Yong Wu     if (qemu_in_coroutine()) {
3415b7e1542SZhi Yong Wu         /* Fast-path if already in coroutine context */
3425b7e1542SZhi Yong Wu         bdrv_create_co_entry(&cco);
3435b7e1542SZhi Yong Wu     } else {
3445b7e1542SZhi Yong Wu         co = qemu_coroutine_create(bdrv_create_co_entry);
3455b7e1542SZhi Yong Wu         qemu_coroutine_enter(co, &cco);
3465b7e1542SZhi Yong Wu         while (cco.ret == NOT_DONE) {
347b47ec2c4SPaolo Bonzini             aio_poll(qemu_get_aio_context(), true);
3485b7e1542SZhi Yong Wu         }
3495b7e1542SZhi Yong Wu     }
3505b7e1542SZhi Yong Wu 
3515b7e1542SZhi Yong Wu     ret = cco.ret;
352cc84d90fSMax Reitz     if (ret < 0) {
35384d18f06SMarkus Armbruster         if (cco.err) {
354cc84d90fSMax Reitz             error_propagate(errp, cco.err);
355cc84d90fSMax Reitz         } else {
356cc84d90fSMax Reitz             error_setg_errno(errp, -ret, "Could not create image");
357cc84d90fSMax Reitz         }
358cc84d90fSMax Reitz     }
3595b7e1542SZhi Yong Wu 
36080168bffSLuiz Capitulino out:
36180168bffSLuiz Capitulino     g_free(cco.filename);
3625b7e1542SZhi Yong Wu     return ret;
363ea2384d3Sbellard }
364ea2384d3Sbellard 
365c282e1fdSChunyan Liu int bdrv_create_file(const char *filename, QemuOpts *opts, Error **errp)
36684a12e66SChristoph Hellwig {
36784a12e66SChristoph Hellwig     BlockDriver *drv;
368cc84d90fSMax Reitz     Error *local_err = NULL;
369cc84d90fSMax Reitz     int ret;
37084a12e66SChristoph Hellwig 
371b65a5e12SMax Reitz     drv = bdrv_find_protocol(filename, true, errp);
37284a12e66SChristoph Hellwig     if (drv == NULL) {
37316905d71SStefan Hajnoczi         return -ENOENT;
37484a12e66SChristoph Hellwig     }
37584a12e66SChristoph Hellwig 
376c282e1fdSChunyan Liu     ret = bdrv_create(drv, filename, opts, &local_err);
37784d18f06SMarkus Armbruster     if (local_err) {
378cc84d90fSMax Reitz         error_propagate(errp, local_err);
379cc84d90fSMax Reitz     }
380cc84d90fSMax Reitz     return ret;
38184a12e66SChristoph Hellwig }
38284a12e66SChristoph Hellwig 
383892b7de8SEkaterina Tumanova /**
384892b7de8SEkaterina Tumanova  * Try to get @bs's logical and physical block size.
385892b7de8SEkaterina Tumanova  * On success, store them in @bsz struct and return 0.
386892b7de8SEkaterina Tumanova  * On failure return -errno.
387892b7de8SEkaterina Tumanova  * @bs must not be empty.
388892b7de8SEkaterina Tumanova  */
389892b7de8SEkaterina Tumanova int bdrv_probe_blocksizes(BlockDriverState *bs, BlockSizes *bsz)
390892b7de8SEkaterina Tumanova {
391892b7de8SEkaterina Tumanova     BlockDriver *drv = bs->drv;
392892b7de8SEkaterina Tumanova 
393892b7de8SEkaterina Tumanova     if (drv && drv->bdrv_probe_blocksizes) {
394892b7de8SEkaterina Tumanova         return drv->bdrv_probe_blocksizes(bs, bsz);
395892b7de8SEkaterina Tumanova     }
396892b7de8SEkaterina Tumanova 
397892b7de8SEkaterina Tumanova     return -ENOTSUP;
398892b7de8SEkaterina Tumanova }
399892b7de8SEkaterina Tumanova 
400892b7de8SEkaterina Tumanova /**
401892b7de8SEkaterina Tumanova  * Try to get @bs's geometry (cyls, heads, sectors).
402892b7de8SEkaterina Tumanova  * On success, store them in @geo struct and return 0.
403892b7de8SEkaterina Tumanova  * On failure return -errno.
404892b7de8SEkaterina Tumanova  * @bs must not be empty.
405892b7de8SEkaterina Tumanova  */
406892b7de8SEkaterina Tumanova int bdrv_probe_geometry(BlockDriverState *bs, HDGeometry *geo)
407892b7de8SEkaterina Tumanova {
408892b7de8SEkaterina Tumanova     BlockDriver *drv = bs->drv;
409892b7de8SEkaterina Tumanova 
410892b7de8SEkaterina Tumanova     if (drv && drv->bdrv_probe_geometry) {
411892b7de8SEkaterina Tumanova         return drv->bdrv_probe_geometry(bs, geo);
412892b7de8SEkaterina Tumanova     }
413892b7de8SEkaterina Tumanova 
414892b7de8SEkaterina Tumanova     return -ENOTSUP;
415892b7de8SEkaterina Tumanova }
416892b7de8SEkaterina Tumanova 
/*
 * Create a uniquely-named empty temporary file.
 *
 * @filename  buffer that receives the name of the created file
 * @size      size of @filename in bytes
 *
 * On POSIX hosts the file is created in $TMPDIR, or in /var/tmp when
 * TMPDIR is not set.  On Windows @size must be at least MAX_PATH.
 *
 * Return 0 upon success, otherwise a negative errno value (on Windows the
 * negated GetLastError() code).  -EOVERFLOW is returned when the file name
 * template does not fit into @filename.
 */
int get_tmp_filename(char *filename, int size)
{
#ifdef _WIN32
    char temp_dir[MAX_PATH];
    /* GetTempFileName requires that its output buffer (4th param)
       have length MAX_PATH or greater.  */
    assert(size >= MAX_PATH);
    return (GetTempPath(MAX_PATH, temp_dir)
            && GetTempFileName(temp_dir, "qem", 0, filename)
            ? 0 : -GetLastError());
#else
    int fd;
    int len;
    const char *tmpdir;

    tmpdir = getenv("TMPDIR");
    if (!tmpdir) {
        tmpdir = "/var/tmp";
    }

    /* Reject both truncation and an snprintf() failure: either way
     * @filename does not hold a usable mkstemp() template */
    len = snprintf(filename, size, "%s/vl.XXXXXX", tmpdir);
    if (len < 0 || len >= size) {
        return -EOVERFLOW;
    }

    fd = mkstemp(filename);
    if (fd < 0) {
        return -errno;
    }
    if (close(fd) != 0) {
        /* unlink() may overwrite errno, so remember close()'s error first */
        int saved_errno = errno;

        unlink(filename);
        return -saved_errno;
    }
    return 0;
#endif
}
452ea2384d3Sbellard 
453f3a5d3f8SChristoph Hellwig /*
454f3a5d3f8SChristoph Hellwig  * Detect host devices. By convention, /dev/cdrom[N] is always
455f3a5d3f8SChristoph Hellwig  * recognized as a host CDROM.
456f3a5d3f8SChristoph Hellwig  */
457f3a5d3f8SChristoph Hellwig static BlockDriver *find_hdev_driver(const char *filename)
458f3a5d3f8SChristoph Hellwig {
459508c7cb3SChristoph Hellwig     int score_max = 0, score;
460508c7cb3SChristoph Hellwig     BlockDriver *drv = NULL, *d;
461f3a5d3f8SChristoph Hellwig 
4628a22f02aSStefan Hajnoczi     QLIST_FOREACH(d, &bdrv_drivers, list) {
463508c7cb3SChristoph Hellwig         if (d->bdrv_probe_device) {
464508c7cb3SChristoph Hellwig             score = d->bdrv_probe_device(filename);
465508c7cb3SChristoph Hellwig             if (score > score_max) {
466508c7cb3SChristoph Hellwig                 score_max = score;
467508c7cb3SChristoph Hellwig                 drv = d;
468f3a5d3f8SChristoph Hellwig             }
469508c7cb3SChristoph Hellwig         }
470f3a5d3f8SChristoph Hellwig     }
471f3a5d3f8SChristoph Hellwig 
472508c7cb3SChristoph Hellwig     return drv;
473f3a5d3f8SChristoph Hellwig }
474f3a5d3f8SChristoph Hellwig 
47598289620SKevin Wolf BlockDriver *bdrv_find_protocol(const char *filename,
476b65a5e12SMax Reitz                                 bool allow_protocol_prefix,
477b65a5e12SMax Reitz                                 Error **errp)
47884a12e66SChristoph Hellwig {
47984a12e66SChristoph Hellwig     BlockDriver *drv1;
48084a12e66SChristoph Hellwig     char protocol[128];
48184a12e66SChristoph Hellwig     int len;
48284a12e66SChristoph Hellwig     const char *p;
48384a12e66SChristoph Hellwig 
48466f82ceeSKevin Wolf     /* TODO Drivers without bdrv_file_open must be specified explicitly */
48566f82ceeSKevin Wolf 
48639508e7aSChristoph Hellwig     /*
48739508e7aSChristoph Hellwig      * XXX(hch): we really should not let host device detection
48839508e7aSChristoph Hellwig      * override an explicit protocol specification, but moving this
48939508e7aSChristoph Hellwig      * later breaks access to device names with colons in them.
49039508e7aSChristoph Hellwig      * Thanks to the brain-dead persistent naming schemes on udev-
49139508e7aSChristoph Hellwig      * based Linux systems those actually are quite common.
49239508e7aSChristoph Hellwig      */
49384a12e66SChristoph Hellwig     drv1 = find_hdev_driver(filename);
49439508e7aSChristoph Hellwig     if (drv1) {
49584a12e66SChristoph Hellwig         return drv1;
49684a12e66SChristoph Hellwig     }
49739508e7aSChristoph Hellwig 
49898289620SKevin Wolf     if (!path_has_protocol(filename) || !allow_protocol_prefix) {
499ef810437SMax Reitz         return &bdrv_file;
50039508e7aSChristoph Hellwig     }
50198289620SKevin Wolf 
5029e0b22f4SStefan Hajnoczi     p = strchr(filename, ':');
5039e0b22f4SStefan Hajnoczi     assert(p != NULL);
50484a12e66SChristoph Hellwig     len = p - filename;
50584a12e66SChristoph Hellwig     if (len > sizeof(protocol) - 1)
50684a12e66SChristoph Hellwig         len = sizeof(protocol) - 1;
50784a12e66SChristoph Hellwig     memcpy(protocol, filename, len);
50884a12e66SChristoph Hellwig     protocol[len] = '\0';
50984a12e66SChristoph Hellwig     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
51084a12e66SChristoph Hellwig         if (drv1->protocol_name &&
51184a12e66SChristoph Hellwig             !strcmp(drv1->protocol_name, protocol)) {
51284a12e66SChristoph Hellwig             return drv1;
51384a12e66SChristoph Hellwig         }
51484a12e66SChristoph Hellwig     }
515b65a5e12SMax Reitz 
516b65a5e12SMax Reitz     error_setg(errp, "Unknown protocol '%s'", protocol);
51784a12e66SChristoph Hellwig     return NULL;
51884a12e66SChristoph Hellwig }
51984a12e66SChristoph Hellwig 
520c6684249SMarkus Armbruster /*
521c6684249SMarkus Armbruster  * Guess image format by probing its contents.
522c6684249SMarkus Armbruster  * This is not a good idea when your image is raw (CVE-2008-2004), but
523c6684249SMarkus Armbruster  * we do it anyway for backward compatibility.
524c6684249SMarkus Armbruster  *
525c6684249SMarkus Armbruster  * @buf         contains the image's first @buf_size bytes.
5267cddd372SKevin Wolf  * @buf_size    is the buffer size in bytes (generally BLOCK_PROBE_BUF_SIZE,
5277cddd372SKevin Wolf  *              but can be smaller if the image file is smaller)
528c6684249SMarkus Armbruster  * @filename    is its filename.
529c6684249SMarkus Armbruster  *
530c6684249SMarkus Armbruster  * For all block drivers, call the bdrv_probe() method to get its
531c6684249SMarkus Armbruster  * probing score.
532c6684249SMarkus Armbruster  * Return the first block driver with the highest probing score.
533c6684249SMarkus Armbruster  */
53438f3ef57SKevin Wolf BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
535c6684249SMarkus Armbruster                             const char *filename)
536c6684249SMarkus Armbruster {
537c6684249SMarkus Armbruster     int score_max = 0, score;
538c6684249SMarkus Armbruster     BlockDriver *drv = NULL, *d;
539c6684249SMarkus Armbruster 
540c6684249SMarkus Armbruster     QLIST_FOREACH(d, &bdrv_drivers, list) {
541c6684249SMarkus Armbruster         if (d->bdrv_probe) {
542c6684249SMarkus Armbruster             score = d->bdrv_probe(buf, buf_size, filename);
543c6684249SMarkus Armbruster             if (score > score_max) {
544c6684249SMarkus Armbruster                 score_max = score;
545c6684249SMarkus Armbruster                 drv = d;
546c6684249SMarkus Armbruster             }
547c6684249SMarkus Armbruster         }
548c6684249SMarkus Armbruster     }
549c6684249SMarkus Armbruster 
550c6684249SMarkus Armbruster     return drv;
551c6684249SMarkus Armbruster }
552c6684249SMarkus Armbruster 
553f500a6d3SKevin Wolf static int find_image_format(BlockDriverState *bs, const char *filename,
55434b5d2c6SMax Reitz                              BlockDriver **pdrv, Error **errp)
555ea2384d3Sbellard {
556c6684249SMarkus Armbruster     BlockDriver *drv;
5577cddd372SKevin Wolf     uint8_t buf[BLOCK_PROBE_BUF_SIZE];
558f500a6d3SKevin Wolf     int ret = 0;
559f8ea0b00SNicholas Bellinger 
56008a00559SKevin Wolf     /* Return the raw BlockDriver * to scsi-generic devices or empty drives */
561b192af8aSDimitris Aragiorgis     if (bdrv_is_sg(bs) || !bdrv_is_inserted(bs) || bdrv_getlength(bs) == 0) {
562ef810437SMax Reitz         *pdrv = &bdrv_raw;
563c98ac35dSStefan Weil         return ret;
5641a396859SNicholas A. Bellinger     }
565f8ea0b00SNicholas Bellinger 
56683f64091Sbellard     ret = bdrv_pread(bs, 0, buf, sizeof(buf));
567ea2384d3Sbellard     if (ret < 0) {
56834b5d2c6SMax Reitz         error_setg_errno(errp, -ret, "Could not read image for determining its "
56934b5d2c6SMax Reitz                          "format");
570c98ac35dSStefan Weil         *pdrv = NULL;
571c98ac35dSStefan Weil         return ret;
572ea2384d3Sbellard     }
573ea2384d3Sbellard 
574c6684249SMarkus Armbruster     drv = bdrv_probe_all(buf, ret, filename);
575c98ac35dSStefan Weil     if (!drv) {
57634b5d2c6SMax Reitz         error_setg(errp, "Could not determine image format: No compatible "
57734b5d2c6SMax Reitz                    "driver found");
578c98ac35dSStefan Weil         ret = -ENOENT;
579c98ac35dSStefan Weil     }
580c98ac35dSStefan Weil     *pdrv = drv;
581c98ac35dSStefan Weil     return ret;
582ea2384d3Sbellard }
583ea2384d3Sbellard 
58451762288SStefan Hajnoczi /**
58551762288SStefan Hajnoczi  * Set the current 'total_sectors' value
58665a9bb25SMarkus Armbruster  * Return 0 on success, -errno on error.
58751762288SStefan Hajnoczi  */
58851762288SStefan Hajnoczi static int refresh_total_sectors(BlockDriverState *bs, int64_t hint)
58951762288SStefan Hajnoczi {
59051762288SStefan Hajnoczi     BlockDriver *drv = bs->drv;
59151762288SStefan Hajnoczi 
592396759adSNicholas Bellinger     /* Do not attempt drv->bdrv_getlength() on scsi-generic devices */
593b192af8aSDimitris Aragiorgis     if (bdrv_is_sg(bs))
594396759adSNicholas Bellinger         return 0;
595396759adSNicholas Bellinger 
59651762288SStefan Hajnoczi     /* query actual device if possible, otherwise just trust the hint */
59751762288SStefan Hajnoczi     if (drv->bdrv_getlength) {
59851762288SStefan Hajnoczi         int64_t length = drv->bdrv_getlength(bs);
59951762288SStefan Hajnoczi         if (length < 0) {
60051762288SStefan Hajnoczi             return length;
60151762288SStefan Hajnoczi         }
6027e382003SFam Zheng         hint = DIV_ROUND_UP(length, BDRV_SECTOR_SIZE);
60351762288SStefan Hajnoczi     }
60451762288SStefan Hajnoczi 
60551762288SStefan Hajnoczi     bs->total_sectors = hint;
60651762288SStefan Hajnoczi     return 0;
60751762288SStefan Hajnoczi }
60851762288SStefan Hajnoczi 
609c3993cdcSStefan Hajnoczi /**
610cddff5baSKevin Wolf  * Combines a QDict of new block driver @options with any missing options taken
611cddff5baSKevin Wolf  * from @old_options, so that leaving out an option defaults to its old value.
612cddff5baSKevin Wolf  */
613cddff5baSKevin Wolf static void bdrv_join_options(BlockDriverState *bs, QDict *options,
614cddff5baSKevin Wolf                               QDict *old_options)
615cddff5baSKevin Wolf {
616cddff5baSKevin Wolf     if (bs->drv && bs->drv->bdrv_join_options) {
617cddff5baSKevin Wolf         bs->drv->bdrv_join_options(options, old_options);
618cddff5baSKevin Wolf     } else {
619cddff5baSKevin Wolf         qdict_join(options, old_options, false);
620cddff5baSKevin Wolf     }
621cddff5baSKevin Wolf }
622cddff5baSKevin Wolf 
623cddff5baSKevin Wolf /**
6249e8f1835SPaolo Bonzini  * Set open flags for a given discard mode
6259e8f1835SPaolo Bonzini  *
6269e8f1835SPaolo Bonzini  * Return 0 on success, -1 if the discard mode was invalid.
6279e8f1835SPaolo Bonzini  */
6289e8f1835SPaolo Bonzini int bdrv_parse_discard_flags(const char *mode, int *flags)
6299e8f1835SPaolo Bonzini {
6309e8f1835SPaolo Bonzini     *flags &= ~BDRV_O_UNMAP;
6319e8f1835SPaolo Bonzini 
6329e8f1835SPaolo Bonzini     if (!strcmp(mode, "off") || !strcmp(mode, "ignore")) {
6339e8f1835SPaolo Bonzini         /* do nothing */
6349e8f1835SPaolo Bonzini     } else if (!strcmp(mode, "on") || !strcmp(mode, "unmap")) {
6359e8f1835SPaolo Bonzini         *flags |= BDRV_O_UNMAP;
6369e8f1835SPaolo Bonzini     } else {
6379e8f1835SPaolo Bonzini         return -1;
6389e8f1835SPaolo Bonzini     }
6399e8f1835SPaolo Bonzini 
6409e8f1835SPaolo Bonzini     return 0;
6419e8f1835SPaolo Bonzini }
6429e8f1835SPaolo Bonzini 
6439e8f1835SPaolo Bonzini /**
644c3993cdcSStefan Hajnoczi  * Set open flags for a given cache mode
645c3993cdcSStefan Hajnoczi  *
646c3993cdcSStefan Hajnoczi  * Return 0 on success, -1 if the cache mode was invalid.
647c3993cdcSStefan Hajnoczi  */
64853e8ae01SKevin Wolf int bdrv_parse_cache_mode(const char *mode, int *flags, bool *writethrough)
649c3993cdcSStefan Hajnoczi {
650c3993cdcSStefan Hajnoczi     *flags &= ~BDRV_O_CACHE_MASK;
651c3993cdcSStefan Hajnoczi 
652c3993cdcSStefan Hajnoczi     if (!strcmp(mode, "off") || !strcmp(mode, "none")) {
65353e8ae01SKevin Wolf         *writethrough = false;
65453e8ae01SKevin Wolf         *flags |= BDRV_O_NOCACHE;
65592196b2fSStefan Hajnoczi     } else if (!strcmp(mode, "directsync")) {
65653e8ae01SKevin Wolf         *writethrough = true;
65792196b2fSStefan Hajnoczi         *flags |= BDRV_O_NOCACHE;
658c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "writeback")) {
65953e8ae01SKevin Wolf         *writethrough = false;
660c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "unsafe")) {
66153e8ae01SKevin Wolf         *writethrough = false;
662c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_NO_FLUSH;
663c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "writethrough")) {
66453e8ae01SKevin Wolf         *writethrough = true;
665c3993cdcSStefan Hajnoczi     } else {
666c3993cdcSStefan Hajnoczi         return -1;
667c3993cdcSStefan Hajnoczi     }
668c3993cdcSStefan Hajnoczi 
669c3993cdcSStefan Hajnoczi     return 0;
670c3993cdcSStefan Hajnoczi }
671c3993cdcSStefan Hajnoczi 
6720b50cc88SKevin Wolf /*
67373176beeSKevin Wolf  * Returns the options and flags that a temporary snapshot should get, based on
67473176beeSKevin Wolf  * the originally requested flags (the originally requested image will have
67573176beeSKevin Wolf  * flags like a backing file)
676b1e6fc08SKevin Wolf  */
67773176beeSKevin Wolf static void bdrv_temp_snapshot_options(int *child_flags, QDict *child_options,
67873176beeSKevin Wolf                                        int parent_flags, QDict *parent_options)
679b1e6fc08SKevin Wolf {
68073176beeSKevin Wolf     *child_flags = (parent_flags & ~BDRV_O_SNAPSHOT) | BDRV_O_TEMPORARY;
68173176beeSKevin Wolf 
68273176beeSKevin Wolf     /* For temporary files, unconditional cache=unsafe is fine */
68373176beeSKevin Wolf     qdict_set_default_str(child_options, BDRV_OPT_CACHE_DIRECT, "off");
68473176beeSKevin Wolf     qdict_set_default_str(child_options, BDRV_OPT_CACHE_NO_FLUSH, "on");
685b1e6fc08SKevin Wolf }
686b1e6fc08SKevin Wolf 
687b1e6fc08SKevin Wolf /*
6888e2160e2SKevin Wolf  * Returns the options and flags that bs->file should get if a protocol driver
6898e2160e2SKevin Wolf  * is expected, based on the given options and flags for the parent BDS
6900b50cc88SKevin Wolf  */
6918e2160e2SKevin Wolf static void bdrv_inherited_options(int *child_flags, QDict *child_options,
6928e2160e2SKevin Wolf                                    int parent_flags, QDict *parent_options)
6930b50cc88SKevin Wolf {
6948e2160e2SKevin Wolf     int flags = parent_flags;
6958e2160e2SKevin Wolf 
6960b50cc88SKevin Wolf     /* Enable protocol handling, disable format probing for bs->file */
6970b50cc88SKevin Wolf     flags |= BDRV_O_PROTOCOL;
6980b50cc88SKevin Wolf 
69991a097e7SKevin Wolf     /* If the cache mode isn't explicitly set, inherit direct and no-flush from
70091a097e7SKevin Wolf      * the parent. */
70191a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_DIRECT);
70291a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_NO_FLUSH);
70391a097e7SKevin Wolf 
7040b50cc88SKevin Wolf     /* Our block drivers take care to send flushes and respect unmap policy,
70591a097e7SKevin Wolf      * so we can default to enable both on lower layers regardless of the
70691a097e7SKevin Wolf      * corresponding parent options. */
70791a097e7SKevin Wolf     flags |= BDRV_O_UNMAP;
7080b50cc88SKevin Wolf 
7090b50cc88SKevin Wolf     /* Clear flags that only apply to the top layer */
710abb06c5aSDaniel P. Berrange     flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_COPY_ON_READ |
711abb06c5aSDaniel P. Berrange                BDRV_O_NO_IO);
7120b50cc88SKevin Wolf 
7138e2160e2SKevin Wolf     *child_flags = flags;
7140b50cc88SKevin Wolf }
7150b50cc88SKevin Wolf 
716f3930ed0SKevin Wolf const BdrvChildRole child_file = {
7178e2160e2SKevin Wolf     .inherit_options = bdrv_inherited_options,
718f3930ed0SKevin Wolf };
719f3930ed0SKevin Wolf 
720f3930ed0SKevin Wolf /*
7218e2160e2SKevin Wolf  * Returns the options and flags that bs->file should get if the use of formats
7228e2160e2SKevin Wolf  * (and not only protocols) is permitted for it, based on the given options and
7238e2160e2SKevin Wolf  * flags for the parent BDS
724f3930ed0SKevin Wolf  */
7258e2160e2SKevin Wolf static void bdrv_inherited_fmt_options(int *child_flags, QDict *child_options,
7268e2160e2SKevin Wolf                                        int parent_flags, QDict *parent_options)
727f3930ed0SKevin Wolf {
7288e2160e2SKevin Wolf     child_file.inherit_options(child_flags, child_options,
7298e2160e2SKevin Wolf                                parent_flags, parent_options);
7308e2160e2SKevin Wolf 
731abb06c5aSDaniel P. Berrange     *child_flags &= ~(BDRV_O_PROTOCOL | BDRV_O_NO_IO);
732f3930ed0SKevin Wolf }
733f3930ed0SKevin Wolf 
734f3930ed0SKevin Wolf const BdrvChildRole child_format = {
7358e2160e2SKevin Wolf     .inherit_options = bdrv_inherited_fmt_options,
736f3930ed0SKevin Wolf };
737f3930ed0SKevin Wolf 
738317fc44eSKevin Wolf /*
7398e2160e2SKevin Wolf  * Returns the options and flags that bs->backing should get, based on the
7408e2160e2SKevin Wolf  * given options and flags for the parent BDS
741317fc44eSKevin Wolf  */
7428e2160e2SKevin Wolf static void bdrv_backing_options(int *child_flags, QDict *child_options,
7438e2160e2SKevin Wolf                                  int parent_flags, QDict *parent_options)
744317fc44eSKevin Wolf {
7458e2160e2SKevin Wolf     int flags = parent_flags;
7468e2160e2SKevin Wolf 
747b8816a43SKevin Wolf     /* The cache mode is inherited unmodified for backing files; except WCE,
748b8816a43SKevin Wolf      * which is only applied on the top level (BlockBackend) */
74991a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_DIRECT);
75091a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_NO_FLUSH);
75191a097e7SKevin Wolf 
752317fc44eSKevin Wolf     /* backing files always opened read-only */
753317fc44eSKevin Wolf     flags &= ~(BDRV_O_RDWR | BDRV_O_COPY_ON_READ);
754317fc44eSKevin Wolf 
755317fc44eSKevin Wolf     /* snapshot=on is handled on the top layer */
7568bfea15dSKevin Wolf     flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_TEMPORARY);
757317fc44eSKevin Wolf 
7588e2160e2SKevin Wolf     *child_flags = flags;
759317fc44eSKevin Wolf }
760317fc44eSKevin Wolf 
761f3930ed0SKevin Wolf static const BdrvChildRole child_backing = {
7628e2160e2SKevin Wolf     .inherit_options = bdrv_backing_options,
763f3930ed0SKevin Wolf };
764f3930ed0SKevin Wolf 
7657b272452SKevin Wolf static int bdrv_open_flags(BlockDriverState *bs, int flags)
7667b272452SKevin Wolf {
76761de4c68SKevin Wolf     int open_flags = flags;
7687b272452SKevin Wolf 
7697b272452SKevin Wolf     /*
7707b272452SKevin Wolf      * Clear flags that are internal to the block layer before opening the
7717b272452SKevin Wolf      * image.
7727b272452SKevin Wolf      */
77320cca275SKevin Wolf     open_flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_PROTOCOL);
7747b272452SKevin Wolf 
7757b272452SKevin Wolf     /*
7767b272452SKevin Wolf      * Snapshots should be writable.
7777b272452SKevin Wolf      */
7788bfea15dSKevin Wolf     if (flags & BDRV_O_TEMPORARY) {
7797b272452SKevin Wolf         open_flags |= BDRV_O_RDWR;
7807b272452SKevin Wolf     }
7817b272452SKevin Wolf 
7827b272452SKevin Wolf     return open_flags;
7837b272452SKevin Wolf }
7847b272452SKevin Wolf 
78591a097e7SKevin Wolf static void update_flags_from_options(int *flags, QemuOpts *opts)
78691a097e7SKevin Wolf {
78791a097e7SKevin Wolf     *flags &= ~BDRV_O_CACHE_MASK;
78891a097e7SKevin Wolf 
78991a097e7SKevin Wolf     assert(qemu_opt_find(opts, BDRV_OPT_CACHE_NO_FLUSH));
79091a097e7SKevin Wolf     if (qemu_opt_get_bool(opts, BDRV_OPT_CACHE_NO_FLUSH, false)) {
79191a097e7SKevin Wolf         *flags |= BDRV_O_NO_FLUSH;
79291a097e7SKevin Wolf     }
79391a097e7SKevin Wolf 
79491a097e7SKevin Wolf     assert(qemu_opt_find(opts, BDRV_OPT_CACHE_DIRECT));
79591a097e7SKevin Wolf     if (qemu_opt_get_bool(opts, BDRV_OPT_CACHE_DIRECT, false)) {
79691a097e7SKevin Wolf         *flags |= BDRV_O_NOCACHE;
79791a097e7SKevin Wolf     }
79891a097e7SKevin Wolf }
79991a097e7SKevin Wolf 
80091a097e7SKevin Wolf static void update_options_from_flags(QDict *options, int flags)
80191a097e7SKevin Wolf {
80291a097e7SKevin Wolf     if (!qdict_haskey(options, BDRV_OPT_CACHE_DIRECT)) {
80391a097e7SKevin Wolf         qdict_put(options, BDRV_OPT_CACHE_DIRECT,
80491a097e7SKevin Wolf                   qbool_from_bool(flags & BDRV_O_NOCACHE));
80591a097e7SKevin Wolf     }
80691a097e7SKevin Wolf     if (!qdict_haskey(options, BDRV_OPT_CACHE_NO_FLUSH)) {
80791a097e7SKevin Wolf         qdict_put(options, BDRV_OPT_CACHE_NO_FLUSH,
80891a097e7SKevin Wolf                   qbool_from_bool(flags & BDRV_O_NO_FLUSH));
80991a097e7SKevin Wolf     }
81091a097e7SKevin Wolf }
81191a097e7SKevin Wolf 
812636ea370SKevin Wolf static void bdrv_assign_node_name(BlockDriverState *bs,
8136913c0c2SBenoît Canet                                   const char *node_name,
8146913c0c2SBenoît Canet                                   Error **errp)
8156913c0c2SBenoît Canet {
81615489c76SJeff Cody     char *gen_node_name = NULL;
8176913c0c2SBenoît Canet 
81815489c76SJeff Cody     if (!node_name) {
81915489c76SJeff Cody         node_name = gen_node_name = id_generate(ID_BLOCK);
82015489c76SJeff Cody     } else if (!id_wellformed(node_name)) {
82115489c76SJeff Cody         /*
82215489c76SJeff Cody          * Check for empty string or invalid characters, but not if it is
82315489c76SJeff Cody          * generated (generated names use characters not available to the user)
82415489c76SJeff Cody          */
8259aebf3b8SKevin Wolf         error_setg(errp, "Invalid node name");
826636ea370SKevin Wolf         return;
8276913c0c2SBenoît Canet     }
8286913c0c2SBenoît Canet 
8290c5e94eeSBenoît Canet     /* takes care of avoiding namespaces collisions */
8307f06d47eSMarkus Armbruster     if (blk_by_name(node_name)) {
8310c5e94eeSBenoît Canet         error_setg(errp, "node-name=%s is conflicting with a device id",
8320c5e94eeSBenoît Canet                    node_name);
83315489c76SJeff Cody         goto out;
8340c5e94eeSBenoît Canet     }
8350c5e94eeSBenoît Canet 
8366913c0c2SBenoît Canet     /* takes care of avoiding duplicates node names */
8376913c0c2SBenoît Canet     if (bdrv_find_node(node_name)) {
8386913c0c2SBenoît Canet         error_setg(errp, "Duplicate node name");
83915489c76SJeff Cody         goto out;
8406913c0c2SBenoît Canet     }
8416913c0c2SBenoît Canet 
8426913c0c2SBenoît Canet     /* copy node name into the bs and insert it into the graph list */
8436913c0c2SBenoît Canet     pstrcpy(bs->node_name, sizeof(bs->node_name), node_name);
8446913c0c2SBenoît Canet     QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs, node_list);
84515489c76SJeff Cody out:
84615489c76SJeff Cody     g_free(gen_node_name);
8476913c0c2SBenoît Canet }
8486913c0c2SBenoît Canet 
84918edf289SKevin Wolf static QemuOptsList bdrv_runtime_opts = {
85018edf289SKevin Wolf     .name = "bdrv_common",
85118edf289SKevin Wolf     .head = QTAILQ_HEAD_INITIALIZER(bdrv_runtime_opts.head),
85218edf289SKevin Wolf     .desc = {
85318edf289SKevin Wolf         {
85418edf289SKevin Wolf             .name = "node-name",
85518edf289SKevin Wolf             .type = QEMU_OPT_STRING,
85618edf289SKevin Wolf             .help = "Node name of the block device node",
85718edf289SKevin Wolf         },
85862392ebbSKevin Wolf         {
85962392ebbSKevin Wolf             .name = "driver",
86062392ebbSKevin Wolf             .type = QEMU_OPT_STRING,
86162392ebbSKevin Wolf             .help = "Block driver to use for the node",
86262392ebbSKevin Wolf         },
86391a097e7SKevin Wolf         {
86491a097e7SKevin Wolf             .name = BDRV_OPT_CACHE_DIRECT,
86591a097e7SKevin Wolf             .type = QEMU_OPT_BOOL,
86691a097e7SKevin Wolf             .help = "Bypass software writeback cache on the host",
86791a097e7SKevin Wolf         },
86891a097e7SKevin Wolf         {
86991a097e7SKevin Wolf             .name = BDRV_OPT_CACHE_NO_FLUSH,
87091a097e7SKevin Wolf             .type = QEMU_OPT_BOOL,
87191a097e7SKevin Wolf             .help = "Ignore flush requests",
87291a097e7SKevin Wolf         },
87318edf289SKevin Wolf         { /* end of list */ }
87418edf289SKevin Wolf     },
87518edf289SKevin Wolf };
87618edf289SKevin Wolf 
877b6ce07aaSKevin Wolf /*
87857915332SKevin Wolf  * Common part for opening disk images and files
879b6ad491aSKevin Wolf  *
880b6ad491aSKevin Wolf  * Removes all processed options from *options.
88157915332SKevin Wolf  */
8829a4f4c31SKevin Wolf static int bdrv_open_common(BlockDriverState *bs, BdrvChild *file,
88382dc8b41SKevin Wolf                             QDict *options, Error **errp)
88457915332SKevin Wolf {
88557915332SKevin Wolf     int ret, open_flags;
886035fccdfSKevin Wolf     const char *filename;
88762392ebbSKevin Wolf     const char *driver_name = NULL;
8886913c0c2SBenoît Canet     const char *node_name = NULL;
88918edf289SKevin Wolf     QemuOpts *opts;
89062392ebbSKevin Wolf     BlockDriver *drv;
89134b5d2c6SMax Reitz     Error *local_err = NULL;
89257915332SKevin Wolf 
8936405875cSPaolo Bonzini     assert(bs->file == NULL);
894707ff828SKevin Wolf     assert(options != NULL && bs->options != options);
89557915332SKevin Wolf 
89662392ebbSKevin Wolf     opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
89762392ebbSKevin Wolf     qemu_opts_absorb_qdict(opts, options, &local_err);
89862392ebbSKevin Wolf     if (local_err) {
89962392ebbSKevin Wolf         error_propagate(errp, local_err);
90062392ebbSKevin Wolf         ret = -EINVAL;
90162392ebbSKevin Wolf         goto fail_opts;
90262392ebbSKevin Wolf     }
90362392ebbSKevin Wolf 
90462392ebbSKevin Wolf     driver_name = qemu_opt_get(opts, "driver");
90562392ebbSKevin Wolf     drv = bdrv_find_format(driver_name);
90662392ebbSKevin Wolf     assert(drv != NULL);
90762392ebbSKevin Wolf 
90845673671SKevin Wolf     if (file != NULL) {
9099a4f4c31SKevin Wolf         filename = file->bs->filename;
91045673671SKevin Wolf     } else {
91145673671SKevin Wolf         filename = qdict_get_try_str(options, "filename");
91245673671SKevin Wolf     }
91345673671SKevin Wolf 
914765003dbSKevin Wolf     if (drv->bdrv_needs_filename && !filename) {
915765003dbSKevin Wolf         error_setg(errp, "The '%s' block driver requires a file name",
916765003dbSKevin Wolf                    drv->format_name);
91718edf289SKevin Wolf         ret = -EINVAL;
91818edf289SKevin Wolf         goto fail_opts;
91918edf289SKevin Wolf     }
92018edf289SKevin Wolf 
92182dc8b41SKevin Wolf     trace_bdrv_open_common(bs, filename ?: "", bs->open_flags,
92282dc8b41SKevin Wolf                            drv->format_name);
92362392ebbSKevin Wolf 
92418edf289SKevin Wolf     node_name = qemu_opt_get(opts, "node-name");
925636ea370SKevin Wolf     bdrv_assign_node_name(bs, node_name, &local_err);
9260fb6395cSMarkus Armbruster     if (local_err) {
927636ea370SKevin Wolf         error_propagate(errp, local_err);
92818edf289SKevin Wolf         ret = -EINVAL;
92918edf289SKevin Wolf         goto fail_opts;
9305d186eb0SKevin Wolf     }
9315d186eb0SKevin Wolf 
932c25f53b0SPaolo Bonzini     bs->request_alignment = 512;
9330d51b4deSAsias He     bs->zero_beyond_eof = true;
93482dc8b41SKevin Wolf     bs->read_only = !(bs->open_flags & BDRV_O_RDWR);
935b64ec4e4SFam Zheng 
936b64ec4e4SFam Zheng     if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv, bs->read_only)) {
9378f94a6e4SKevin Wolf         error_setg(errp,
9388f94a6e4SKevin Wolf                    !bs->read_only && bdrv_is_whitelisted(drv, true)
9398f94a6e4SKevin Wolf                         ? "Driver '%s' can only be used for read-only devices"
9408f94a6e4SKevin Wolf                         : "Driver '%s' is not whitelisted",
9418f94a6e4SKevin Wolf                    drv->format_name);
94218edf289SKevin Wolf         ret = -ENOTSUP;
94318edf289SKevin Wolf         goto fail_opts;
944b64ec4e4SFam Zheng     }
94557915332SKevin Wolf 
94653fec9d3SStefan Hajnoczi     assert(bs->copy_on_read == 0); /* bdrv_new() and bdrv_close() make it so */
94782dc8b41SKevin Wolf     if (bs->open_flags & BDRV_O_COPY_ON_READ) {
9480ebd24e0SKevin Wolf         if (!bs->read_only) {
94953fec9d3SStefan Hajnoczi             bdrv_enable_copy_on_read(bs);
9500ebd24e0SKevin Wolf         } else {
9510ebd24e0SKevin Wolf             error_setg(errp, "Can't use copy-on-read on read-only device");
95218edf289SKevin Wolf             ret = -EINVAL;
95318edf289SKevin Wolf             goto fail_opts;
9540ebd24e0SKevin Wolf         }
95553fec9d3SStefan Hajnoczi     }
95653fec9d3SStefan Hajnoczi 
957c2ad1b0cSKevin Wolf     if (filename != NULL) {
95857915332SKevin Wolf         pstrcpy(bs->filename, sizeof(bs->filename), filename);
959c2ad1b0cSKevin Wolf     } else {
960c2ad1b0cSKevin Wolf         bs->filename[0] = '\0';
961c2ad1b0cSKevin Wolf     }
96291af7014SMax Reitz     pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), bs->filename);
96357915332SKevin Wolf 
96457915332SKevin Wolf     bs->drv = drv;
9657267c094SAnthony Liguori     bs->opaque = g_malloc0(drv->instance_size);
96657915332SKevin Wolf 
96791a097e7SKevin Wolf     /* Apply cache mode options */
96891a097e7SKevin Wolf     update_flags_from_options(&bs->open_flags, opts);
96973ac451fSKevin Wolf 
97066f82ceeSKevin Wolf     /* Open the image, either directly or using a protocol */
97182dc8b41SKevin Wolf     open_flags = bdrv_open_flags(bs, bs->open_flags);
97266f82ceeSKevin Wolf     if (drv->bdrv_file_open) {
9735d186eb0SKevin Wolf         assert(file == NULL);
974030be321SBenoît Canet         assert(!drv->bdrv_needs_filename || filename != NULL);
97534b5d2c6SMax Reitz         ret = drv->bdrv_file_open(bs, options, open_flags, &local_err);
976f500a6d3SKevin Wolf     } else {
9772af5ef70SKevin Wolf         if (file == NULL) {
97834b5d2c6SMax Reitz             error_setg(errp, "Can't use '%s' as a block driver for the "
97934b5d2c6SMax Reitz                        "protocol level", drv->format_name);
9802af5ef70SKevin Wolf             ret = -EINVAL;
9812af5ef70SKevin Wolf             goto free_and_fail;
9822af5ef70SKevin Wolf         }
983f500a6d3SKevin Wolf         bs->file = file;
98434b5d2c6SMax Reitz         ret = drv->bdrv_open(bs, options, open_flags, &local_err);
98566f82ceeSKevin Wolf     }
98666f82ceeSKevin Wolf 
98757915332SKevin Wolf     if (ret < 0) {
98884d18f06SMarkus Armbruster         if (local_err) {
98934b5d2c6SMax Reitz             error_propagate(errp, local_err);
9902fa9aa59SDunrong Huang         } else if (bs->filename[0]) {
9912fa9aa59SDunrong Huang             error_setg_errno(errp, -ret, "Could not open '%s'", bs->filename);
99234b5d2c6SMax Reitz         } else {
99334b5d2c6SMax Reitz             error_setg_errno(errp, -ret, "Could not open image");
99434b5d2c6SMax Reitz         }
99557915332SKevin Wolf         goto free_and_fail;
99657915332SKevin Wolf     }
99757915332SKevin Wolf 
99851762288SStefan Hajnoczi     ret = refresh_total_sectors(bs, bs->total_sectors);
99951762288SStefan Hajnoczi     if (ret < 0) {
100034b5d2c6SMax Reitz         error_setg_errno(errp, -ret, "Could not refresh total sector count");
100151762288SStefan Hajnoczi         goto free_and_fail;
100257915332SKevin Wolf     }
100351762288SStefan Hajnoczi 
10043baca891SKevin Wolf     bdrv_refresh_limits(bs, &local_err);
10053baca891SKevin Wolf     if (local_err) {
10063baca891SKevin Wolf         error_propagate(errp, local_err);
10073baca891SKevin Wolf         ret = -EINVAL;
10083baca891SKevin Wolf         goto free_and_fail;
10093baca891SKevin Wolf     }
10103baca891SKevin Wolf 
1011c25f53b0SPaolo Bonzini     assert(bdrv_opt_mem_align(bs) != 0);
10124196d2f0SDenis V. Lunev     assert(bdrv_min_mem_align(bs) != 0);
1013b192af8aSDimitris Aragiorgis     assert((bs->request_alignment != 0) || bdrv_is_sg(bs));
101418edf289SKevin Wolf 
101518edf289SKevin Wolf     qemu_opts_del(opts);
101657915332SKevin Wolf     return 0;
101757915332SKevin Wolf 
101857915332SKevin Wolf free_and_fail:
101966f82ceeSKevin Wolf     bs->file = NULL;
10207267c094SAnthony Liguori     g_free(bs->opaque);
102157915332SKevin Wolf     bs->opaque = NULL;
102257915332SKevin Wolf     bs->drv = NULL;
102318edf289SKevin Wolf fail_opts:
102418edf289SKevin Wolf     qemu_opts_del(opts);
102557915332SKevin Wolf     return ret;
102657915332SKevin Wolf }
102757915332SKevin Wolf 
10285e5c4f63SKevin Wolf static QDict *parse_json_filename(const char *filename, Error **errp)
10295e5c4f63SKevin Wolf {
10305e5c4f63SKevin Wolf     QObject *options_obj;
10315e5c4f63SKevin Wolf     QDict *options;
10325e5c4f63SKevin Wolf     int ret;
10335e5c4f63SKevin Wolf 
10345e5c4f63SKevin Wolf     ret = strstart(filename, "json:", &filename);
10355e5c4f63SKevin Wolf     assert(ret);
10365e5c4f63SKevin Wolf 
10375e5c4f63SKevin Wolf     options_obj = qobject_from_json(filename);
10385e5c4f63SKevin Wolf     if (!options_obj) {
10395e5c4f63SKevin Wolf         error_setg(errp, "Could not parse the JSON options");
10405e5c4f63SKevin Wolf         return NULL;
10415e5c4f63SKevin Wolf     }
10425e5c4f63SKevin Wolf 
10435e5c4f63SKevin Wolf     if (qobject_type(options_obj) != QTYPE_QDICT) {
10445e5c4f63SKevin Wolf         qobject_decref(options_obj);
10455e5c4f63SKevin Wolf         error_setg(errp, "Invalid JSON object given");
10465e5c4f63SKevin Wolf         return NULL;
10475e5c4f63SKevin Wolf     }
10485e5c4f63SKevin Wolf 
10495e5c4f63SKevin Wolf     options = qobject_to_qdict(options_obj);
10505e5c4f63SKevin Wolf     qdict_flatten(options);
10515e5c4f63SKevin Wolf 
10525e5c4f63SKevin Wolf     return options;
10535e5c4f63SKevin Wolf }
10545e5c4f63SKevin Wolf 
1055de3b53f0SKevin Wolf static void parse_json_protocol(QDict *options, const char **pfilename,
1056de3b53f0SKevin Wolf                                 Error **errp)
1057de3b53f0SKevin Wolf {
1058de3b53f0SKevin Wolf     QDict *json_options;
1059de3b53f0SKevin Wolf     Error *local_err = NULL;
1060de3b53f0SKevin Wolf 
1061de3b53f0SKevin Wolf     /* Parse json: pseudo-protocol */
1062de3b53f0SKevin Wolf     if (!*pfilename || !g_str_has_prefix(*pfilename, "json:")) {
1063de3b53f0SKevin Wolf         return;
1064de3b53f0SKevin Wolf     }
1065de3b53f0SKevin Wolf 
1066de3b53f0SKevin Wolf     json_options = parse_json_filename(*pfilename, &local_err);
1067de3b53f0SKevin Wolf     if (local_err) {
1068de3b53f0SKevin Wolf         error_propagate(errp, local_err);
1069de3b53f0SKevin Wolf         return;
1070de3b53f0SKevin Wolf     }
1071de3b53f0SKevin Wolf 
1072de3b53f0SKevin Wolf     /* Options given in the filename have lower priority than options
1073de3b53f0SKevin Wolf      * specified directly */
1074de3b53f0SKevin Wolf     qdict_join(options, json_options, false);
1075de3b53f0SKevin Wolf     QDECREF(json_options);
1076de3b53f0SKevin Wolf     *pfilename = NULL;
1077de3b53f0SKevin Wolf }
1078de3b53f0SKevin Wolf 
107957915332SKevin Wolf /*
1080f54120ffSKevin Wolf  * Fills in default options for opening images and converts the legacy
1081f54120ffSKevin Wolf  * filename/flags pair to option QDict entries.
108253a29513SMax Reitz  * The BDRV_O_PROTOCOL flag in *flags will be set or cleared accordingly if a
108353a29513SMax Reitz  * block driver has been specified explicitly.
1084f54120ffSKevin Wolf  */
1085de3b53f0SKevin Wolf static int bdrv_fill_options(QDict **options, const char *filename,
1086053e1578SMax Reitz                              int *flags, Error **errp)
1087f54120ffSKevin Wolf {
1088f54120ffSKevin Wolf     const char *drvname;
108953a29513SMax Reitz     bool protocol = *flags & BDRV_O_PROTOCOL;
1090f54120ffSKevin Wolf     bool parse_filename = false;
1091053e1578SMax Reitz     BlockDriver *drv = NULL;
1092f54120ffSKevin Wolf     Error *local_err = NULL;
1093f54120ffSKevin Wolf 
109453a29513SMax Reitz     drvname = qdict_get_try_str(*options, "driver");
1095053e1578SMax Reitz     if (drvname) {
1096053e1578SMax Reitz         drv = bdrv_find_format(drvname);
1097053e1578SMax Reitz         if (!drv) {
1098053e1578SMax Reitz             error_setg(errp, "Unknown driver '%s'", drvname);
1099053e1578SMax Reitz             return -ENOENT;
1100053e1578SMax Reitz         }
110153a29513SMax Reitz         /* If the user has explicitly specified the driver, this choice should
110253a29513SMax Reitz          * override the BDRV_O_PROTOCOL flag */
1103053e1578SMax Reitz         protocol = drv->bdrv_file_open;
110453a29513SMax Reitz     }
110553a29513SMax Reitz 
110653a29513SMax Reitz     if (protocol) {
110753a29513SMax Reitz         *flags |= BDRV_O_PROTOCOL;
110853a29513SMax Reitz     } else {
110953a29513SMax Reitz         *flags &= ~BDRV_O_PROTOCOL;
111053a29513SMax Reitz     }
111153a29513SMax Reitz 
111291a097e7SKevin Wolf     /* Translate cache options from flags into options */
111391a097e7SKevin Wolf     update_options_from_flags(*options, *flags);
111491a097e7SKevin Wolf 
1115f54120ffSKevin Wolf     /* Fetch the file name from the options QDict if necessary */
111617b005f1SKevin Wolf     if (protocol && filename) {
1117f54120ffSKevin Wolf         if (!qdict_haskey(*options, "filename")) {
1118f54120ffSKevin Wolf             qdict_put(*options, "filename", qstring_from_str(filename));
1119f54120ffSKevin Wolf             parse_filename = true;
1120f54120ffSKevin Wolf         } else {
1121f54120ffSKevin Wolf             error_setg(errp, "Can't specify 'file' and 'filename' options at "
1122f54120ffSKevin Wolf                              "the same time");
1123f54120ffSKevin Wolf             return -EINVAL;
1124f54120ffSKevin Wolf         }
1125f54120ffSKevin Wolf     }
1126f54120ffSKevin Wolf 
1127f54120ffSKevin Wolf     /* Find the right block driver */
1128f54120ffSKevin Wolf     filename = qdict_get_try_str(*options, "filename");
1129f54120ffSKevin Wolf 
113017b005f1SKevin Wolf     if (!drvname && protocol) {
1131f54120ffSKevin Wolf         if (filename) {
1132b65a5e12SMax Reitz             drv = bdrv_find_protocol(filename, parse_filename, errp);
1133f54120ffSKevin Wolf             if (!drv) {
1134f54120ffSKevin Wolf                 return -EINVAL;
1135f54120ffSKevin Wolf             }
1136f54120ffSKevin Wolf 
1137f54120ffSKevin Wolf             drvname = drv->format_name;
1138f54120ffSKevin Wolf             qdict_put(*options, "driver", qstring_from_str(drvname));
1139f54120ffSKevin Wolf         } else {
1140f54120ffSKevin Wolf             error_setg(errp, "Must specify either driver or file");
1141f54120ffSKevin Wolf             return -EINVAL;
1142f54120ffSKevin Wolf         }
114317b005f1SKevin Wolf     }
114417b005f1SKevin Wolf 
114517b005f1SKevin Wolf     assert(drv || !protocol);
1146f54120ffSKevin Wolf 
1147f54120ffSKevin Wolf     /* Driver-specific filename parsing */
114817b005f1SKevin Wolf     if (drv && drv->bdrv_parse_filename && parse_filename) {
1149f54120ffSKevin Wolf         drv->bdrv_parse_filename(filename, *options, &local_err);
1150f54120ffSKevin Wolf         if (local_err) {
1151f54120ffSKevin Wolf             error_propagate(errp, local_err);
1152f54120ffSKevin Wolf             return -EINVAL;
1153f54120ffSKevin Wolf         }
1154f54120ffSKevin Wolf 
1155f54120ffSKevin Wolf         if (!drv->bdrv_needs_filename) {
1156f54120ffSKevin Wolf             qdict_del(*options, "filename");
1157f54120ffSKevin Wolf         }
1158f54120ffSKevin Wolf     }
1159f54120ffSKevin Wolf 
1160f54120ffSKevin Wolf     return 0;
1161f54120ffSKevin Wolf }
1162f54120ffSKevin Wolf 
1163f21d96d0SKevin Wolf BdrvChild *bdrv_root_attach_child(BlockDriverState *child_bs,
1164260fecf1SKevin Wolf                                   const char *child_name,
1165df581792SKevin Wolf                                   const BdrvChildRole *child_role)
1166df581792SKevin Wolf {
1167df581792SKevin Wolf     BdrvChild *child = g_new(BdrvChild, 1);
1168df581792SKevin Wolf     *child = (BdrvChild) {
1169df581792SKevin Wolf         .bs     = child_bs,
1170260fecf1SKevin Wolf         .name   = g_strdup(child_name),
1171df581792SKevin Wolf         .role   = child_role,
1172df581792SKevin Wolf     };
1173df581792SKevin Wolf 
1174d42a8a93SKevin Wolf     QLIST_INSERT_HEAD(&child_bs->parents, child, next_parent);
1175b4b059f6SKevin Wolf 
1176b4b059f6SKevin Wolf     return child;
1177df581792SKevin Wolf }
1178df581792SKevin Wolf 
1179f21d96d0SKevin Wolf static BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
1180f21d96d0SKevin Wolf                                     BlockDriverState *child_bs,
1181f21d96d0SKevin Wolf                                     const char *child_name,
1182f21d96d0SKevin Wolf                                     const BdrvChildRole *child_role)
1183f21d96d0SKevin Wolf {
1184f21d96d0SKevin Wolf     BdrvChild *child = bdrv_root_attach_child(child_bs, child_name, child_role);
1185f21d96d0SKevin Wolf     QLIST_INSERT_HEAD(&parent_bs->children, child, next);
1186f21d96d0SKevin Wolf     return child;
1187f21d96d0SKevin Wolf }
1188f21d96d0SKevin Wolf 
11893f09bfbcSKevin Wolf static void bdrv_detach_child(BdrvChild *child)
119033a60407SKevin Wolf {
1191f21d96d0SKevin Wolf     if (child->next.le_prev) {
119233a60407SKevin Wolf         QLIST_REMOVE(child, next);
1193f21d96d0SKevin Wolf         child->next.le_prev = NULL;
1194f21d96d0SKevin Wolf     }
1195d42a8a93SKevin Wolf     QLIST_REMOVE(child, next_parent);
1196260fecf1SKevin Wolf     g_free(child->name);
119733a60407SKevin Wolf     g_free(child);
119833a60407SKevin Wolf }
119933a60407SKevin Wolf 
1200f21d96d0SKevin Wolf void bdrv_root_unref_child(BdrvChild *child)
120133a60407SKevin Wolf {
1202779020cbSKevin Wolf     BlockDriverState *child_bs;
1203779020cbSKevin Wolf 
1204f21d96d0SKevin Wolf     child_bs = child->bs;
1205f21d96d0SKevin Wolf     bdrv_detach_child(child);
1206f21d96d0SKevin Wolf     bdrv_unref(child_bs);
1207f21d96d0SKevin Wolf }
1208f21d96d0SKevin Wolf 
1209f21d96d0SKevin Wolf void bdrv_unref_child(BlockDriverState *parent, BdrvChild *child)
1210f21d96d0SKevin Wolf {
1211779020cbSKevin Wolf     if (child == NULL) {
1212779020cbSKevin Wolf         return;
1213779020cbSKevin Wolf     }
121433a60407SKevin Wolf 
121533a60407SKevin Wolf     if (child->bs->inherits_from == parent) {
121633a60407SKevin Wolf         child->bs->inherits_from = NULL;
121733a60407SKevin Wolf     }
121833a60407SKevin Wolf 
1219f21d96d0SKevin Wolf     bdrv_root_unref_child(child);
122033a60407SKevin Wolf }
122133a60407SKevin Wolf 
12225db15a57SKevin Wolf /*
12235db15a57SKevin Wolf  * Sets the backing file link of a BDS. A new reference is created; callers
12245db15a57SKevin Wolf  * which don't need their own reference any more must call bdrv_unref().
12255db15a57SKevin Wolf  */
12268d24cce1SFam Zheng void bdrv_set_backing_hd(BlockDriverState *bs, BlockDriverState *backing_hd)
12278d24cce1SFam Zheng {
12285db15a57SKevin Wolf     if (backing_hd) {
12295db15a57SKevin Wolf         bdrv_ref(backing_hd);
12305db15a57SKevin Wolf     }
12318d24cce1SFam Zheng 
1232760e0063SKevin Wolf     if (bs->backing) {
1233826b6ca0SFam Zheng         assert(bs->backing_blocker);
1234760e0063SKevin Wolf         bdrv_op_unblock_all(bs->backing->bs, bs->backing_blocker);
12355db15a57SKevin Wolf         bdrv_unref_child(bs, bs->backing);
1236826b6ca0SFam Zheng     } else if (backing_hd) {
1237826b6ca0SFam Zheng         error_setg(&bs->backing_blocker,
123881e5f78aSAlberto Garcia                    "node is used as backing hd of '%s'",
123981e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(bs));
1240826b6ca0SFam Zheng     }
1241826b6ca0SFam Zheng 
12428d24cce1SFam Zheng     if (!backing_hd) {
1243826b6ca0SFam Zheng         error_free(bs->backing_blocker);
1244826b6ca0SFam Zheng         bs->backing_blocker = NULL;
1245760e0063SKevin Wolf         bs->backing = NULL;
12468d24cce1SFam Zheng         goto out;
12478d24cce1SFam Zheng     }
1248260fecf1SKevin Wolf     bs->backing = bdrv_attach_child(bs, backing_hd, "backing", &child_backing);
12498d24cce1SFam Zheng     bs->open_flags &= ~BDRV_O_NO_BACKING;
12508d24cce1SFam Zheng     pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_hd->filename);
12518d24cce1SFam Zheng     pstrcpy(bs->backing_format, sizeof(bs->backing_format),
12528d24cce1SFam Zheng             backing_hd->drv ? backing_hd->drv->format_name : "");
1253826b6ca0SFam Zheng 
1254760e0063SKevin Wolf     bdrv_op_block_all(backing_hd, bs->backing_blocker);
1255826b6ca0SFam Zheng     /* Otherwise we won't be able to commit due to check in bdrv_commit */
1256760e0063SKevin Wolf     bdrv_op_unblock(backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET,
1257826b6ca0SFam Zheng                     bs->backing_blocker);
12588d24cce1SFam Zheng out:
12593baca891SKevin Wolf     bdrv_refresh_limits(bs, NULL);
12608d24cce1SFam Zheng }
12618d24cce1SFam Zheng 
126231ca6d07SKevin Wolf /*
126331ca6d07SKevin Wolf  * Opens the backing file for a BlockDriverState if not yet open
126431ca6d07SKevin Wolf  *
1265d9b7b057SKevin Wolf  * bdref_key specifies the key for the image's BlockdevRef in the options QDict.
1266d9b7b057SKevin Wolf  * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1267d9b7b057SKevin Wolf  * itself, all options starting with "${bdref_key}." are considered part of the
1268d9b7b057SKevin Wolf  * BlockdevRef.
1269d9b7b057SKevin Wolf  *
1270d9b7b057SKevin Wolf  * TODO Can this be unified with bdrv_open_image()?
127131ca6d07SKevin Wolf  */
1272d9b7b057SKevin Wolf int bdrv_open_backing_file(BlockDriverState *bs, QDict *parent_options,
1273d9b7b057SKevin Wolf                            const char *bdref_key, Error **errp)
12749156df12SPaolo Bonzini {
12751ba4b6a5SBenoît Canet     char *backing_filename = g_malloc0(PATH_MAX);
1276d9b7b057SKevin Wolf     char *bdref_key_dot;
1277d9b7b057SKevin Wolf     const char *reference = NULL;
1278317fc44eSKevin Wolf     int ret = 0;
12798d24cce1SFam Zheng     BlockDriverState *backing_hd;
1280d9b7b057SKevin Wolf     QDict *options;
1281d9b7b057SKevin Wolf     QDict *tmp_parent_options = NULL;
128234b5d2c6SMax Reitz     Error *local_err = NULL;
12839156df12SPaolo Bonzini 
1284760e0063SKevin Wolf     if (bs->backing != NULL) {
12851ba4b6a5SBenoît Canet         goto free_exit;
12869156df12SPaolo Bonzini     }
12879156df12SPaolo Bonzini 
128831ca6d07SKevin Wolf     /* NULL means an empty set of options */
1289d9b7b057SKevin Wolf     if (parent_options == NULL) {
1290d9b7b057SKevin Wolf         tmp_parent_options = qdict_new();
1291d9b7b057SKevin Wolf         parent_options = tmp_parent_options;
129231ca6d07SKevin Wolf     }
129331ca6d07SKevin Wolf 
12949156df12SPaolo Bonzini     bs->open_flags &= ~BDRV_O_NO_BACKING;
1295d9b7b057SKevin Wolf 
1296d9b7b057SKevin Wolf     bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1297d9b7b057SKevin Wolf     qdict_extract_subqdict(parent_options, &options, bdref_key_dot);
1298d9b7b057SKevin Wolf     g_free(bdref_key_dot);
1299d9b7b057SKevin Wolf 
1300d9b7b057SKevin Wolf     reference = qdict_get_try_str(parent_options, bdref_key);
1301d9b7b057SKevin Wolf     if (reference || qdict_haskey(options, "file.filename")) {
13021cb6f506SKevin Wolf         backing_filename[0] = '\0';
13031cb6f506SKevin Wolf     } else if (bs->backing_file[0] == '\0' && qdict_size(options) == 0) {
130431ca6d07SKevin Wolf         QDECREF(options);
13051ba4b6a5SBenoît Canet         goto free_exit;
1306dbecebddSFam Zheng     } else {
13079f07429eSMax Reitz         bdrv_get_full_backing_filename(bs, backing_filename, PATH_MAX,
13089f07429eSMax Reitz                                        &local_err);
13099f07429eSMax Reitz         if (local_err) {
13109f07429eSMax Reitz             ret = -EINVAL;
13119f07429eSMax Reitz             error_propagate(errp, local_err);
13129f07429eSMax Reitz             QDECREF(options);
13139f07429eSMax Reitz             goto free_exit;
13149f07429eSMax Reitz         }
13159156df12SPaolo Bonzini     }
13169156df12SPaolo Bonzini 
13178ee79e70SKevin Wolf     if (!bs->drv || !bs->drv->supports_backing) {
13188ee79e70SKevin Wolf         ret = -EINVAL;
13198ee79e70SKevin Wolf         error_setg(errp, "Driver doesn't support backing files");
13208ee79e70SKevin Wolf         QDECREF(options);
13218ee79e70SKevin Wolf         goto free_exit;
13228ee79e70SKevin Wolf     }
13238ee79e70SKevin Wolf 
1324c5f6e493SKevin Wolf     if (bs->backing_format[0] != '\0' && !qdict_haskey(options, "driver")) {
1325c5f6e493SKevin Wolf         qdict_put(options, "driver", qstring_from_str(bs->backing_format));
13269156df12SPaolo Bonzini     }
13279156df12SPaolo Bonzini 
1328d9b7b057SKevin Wolf     backing_hd = NULL;
1329f3930ed0SKevin Wolf     ret = bdrv_open_inherit(&backing_hd,
1330f3930ed0SKevin Wolf                             *backing_filename ? backing_filename : NULL,
1331d9b7b057SKevin Wolf                             reference, options, 0, bs, &child_backing,
1332e43bfd9cSMarkus Armbruster                             errp);
13339156df12SPaolo Bonzini     if (ret < 0) {
13349156df12SPaolo Bonzini         bs->open_flags |= BDRV_O_NO_BACKING;
1335e43bfd9cSMarkus Armbruster         error_prepend(errp, "Could not open backing file: ");
13361ba4b6a5SBenoît Canet         goto free_exit;
13379156df12SPaolo Bonzini     }
1338df581792SKevin Wolf 
13395db15a57SKevin Wolf     /* Hook up the backing file link; drop our reference, bs owns the
13405db15a57SKevin Wolf      * backing_hd reference now */
13418d24cce1SFam Zheng     bdrv_set_backing_hd(bs, backing_hd);
13425db15a57SKevin Wolf     bdrv_unref(backing_hd);
1343d80ac658SPeter Feiner 
1344d9b7b057SKevin Wolf     qdict_del(parent_options, bdref_key);
1345d9b7b057SKevin Wolf 
13461ba4b6a5SBenoît Canet free_exit:
13471ba4b6a5SBenoît Canet     g_free(backing_filename);
1348d9b7b057SKevin Wolf     QDECREF(tmp_parent_options);
13491ba4b6a5SBenoît Canet     return ret;
13509156df12SPaolo Bonzini }
13519156df12SPaolo Bonzini 
1352b6ce07aaSKevin Wolf /*
1353da557aacSMax Reitz  * Opens a disk image whose options are given as BlockdevRef in another block
1354da557aacSMax Reitz  * device's options.
1355da557aacSMax Reitz  *
1356da557aacSMax Reitz  * If allow_none is true, no image will be opened if filename is false and no
1357b4b059f6SKevin Wolf  * BlockdevRef is given. NULL will be returned, but errp remains unset.
1358da557aacSMax Reitz  *
1359da557aacSMax Reitz  * bdrev_key specifies the key for the image's BlockdevRef in the options QDict.
1360da557aacSMax Reitz  * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1361da557aacSMax Reitz  * itself, all options starting with "${bdref_key}." are considered part of the
1362da557aacSMax Reitz  * BlockdevRef.
1363da557aacSMax Reitz  *
1364da557aacSMax Reitz  * The BlockdevRef will be removed from the options QDict.
1365da557aacSMax Reitz  */
1366b4b059f6SKevin Wolf BdrvChild *bdrv_open_child(const char *filename,
1367f3930ed0SKevin Wolf                            QDict *options, const char *bdref_key,
1368b4b059f6SKevin Wolf                            BlockDriverState* parent,
1369b4b059f6SKevin Wolf                            const BdrvChildRole *child_role,
1370f7d9fd8cSMax Reitz                            bool allow_none, Error **errp)
1371da557aacSMax Reitz {
1372b4b059f6SKevin Wolf     BdrvChild *c = NULL;
1373b4b059f6SKevin Wolf     BlockDriverState *bs;
1374da557aacSMax Reitz     QDict *image_options;
1375da557aacSMax Reitz     int ret;
1376da557aacSMax Reitz     char *bdref_key_dot;
1377da557aacSMax Reitz     const char *reference;
1378da557aacSMax Reitz 
1379df581792SKevin Wolf     assert(child_role != NULL);
1380f67503e5SMax Reitz 
1381da557aacSMax Reitz     bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1382da557aacSMax Reitz     qdict_extract_subqdict(options, &image_options, bdref_key_dot);
1383da557aacSMax Reitz     g_free(bdref_key_dot);
1384da557aacSMax Reitz 
1385da557aacSMax Reitz     reference = qdict_get_try_str(options, bdref_key);
1386da557aacSMax Reitz     if (!filename && !reference && !qdict_size(image_options)) {
1387b4b059f6SKevin Wolf         if (!allow_none) {
1388da557aacSMax Reitz             error_setg(errp, "A block device must be specified for \"%s\"",
1389da557aacSMax Reitz                        bdref_key);
1390da557aacSMax Reitz         }
1391b20e61e0SMarkus Armbruster         QDECREF(image_options);
1392da557aacSMax Reitz         goto done;
1393da557aacSMax Reitz     }
1394da557aacSMax Reitz 
1395b4b059f6SKevin Wolf     bs = NULL;
1396b4b059f6SKevin Wolf     ret = bdrv_open_inherit(&bs, filename, reference, image_options, 0,
1397ce343771SMax Reitz                             parent, child_role, errp);
1398df581792SKevin Wolf     if (ret < 0) {
1399df581792SKevin Wolf         goto done;
1400df581792SKevin Wolf     }
1401df581792SKevin Wolf 
1402260fecf1SKevin Wolf     c = bdrv_attach_child(parent, bs, bdref_key, child_role);
1403da557aacSMax Reitz 
1404da557aacSMax Reitz done:
1405da557aacSMax Reitz     qdict_del(options, bdref_key);
1406b4b059f6SKevin Wolf     return c;
1407b4b059f6SKevin Wolf }
1408b4b059f6SKevin Wolf 
140973176beeSKevin Wolf static int bdrv_append_temp_snapshot(BlockDriverState *bs, int flags,
141073176beeSKevin Wolf                                      QDict *snapshot_options, Error **errp)
1411b998875dSKevin Wolf {
1412b998875dSKevin Wolf     /* TODO: extra byte is a hack to ensure MAX_PATH space on Windows. */
14131ba4b6a5SBenoît Canet     char *tmp_filename = g_malloc0(PATH_MAX + 1);
1414b998875dSKevin Wolf     int64_t total_size;
141583d0521aSChunyan Liu     QemuOpts *opts = NULL;
1416b998875dSKevin Wolf     BlockDriverState *bs_snapshot;
1417c2e0dbbfSFam Zheng     Error *local_err = NULL;
1418b998875dSKevin Wolf     int ret;
1419b998875dSKevin Wolf 
1420b998875dSKevin Wolf     /* if snapshot, we create a temporary backing file and open it
1421b998875dSKevin Wolf        instead of opening 'filename' directly */
1422b998875dSKevin Wolf 
1423b998875dSKevin Wolf     /* Get the required size from the image */
1424f187743aSKevin Wolf     total_size = bdrv_getlength(bs);
1425f187743aSKevin Wolf     if (total_size < 0) {
14266b8aeca5SChen Gang         ret = total_size;
1427f187743aSKevin Wolf         error_setg_errno(errp, -total_size, "Could not get image size");
14281ba4b6a5SBenoît Canet         goto out;
1429f187743aSKevin Wolf     }
1430b998875dSKevin Wolf 
1431b998875dSKevin Wolf     /* Create the temporary image */
14321ba4b6a5SBenoît Canet     ret = get_tmp_filename(tmp_filename, PATH_MAX + 1);
1433b998875dSKevin Wolf     if (ret < 0) {
1434b998875dSKevin Wolf         error_setg_errno(errp, -ret, "Could not get temporary filename");
14351ba4b6a5SBenoît Canet         goto out;
1436b998875dSKevin Wolf     }
1437b998875dSKevin Wolf 
1438ef810437SMax Reitz     opts = qemu_opts_create(bdrv_qcow2.create_opts, NULL, 0,
1439c282e1fdSChunyan Liu                             &error_abort);
144039101f25SMarkus Armbruster     qemu_opt_set_number(opts, BLOCK_OPT_SIZE, total_size, &error_abort);
1441e43bfd9cSMarkus Armbruster     ret = bdrv_create(&bdrv_qcow2, tmp_filename, opts, errp);
144283d0521aSChunyan Liu     qemu_opts_del(opts);
1443b998875dSKevin Wolf     if (ret < 0) {
1444e43bfd9cSMarkus Armbruster         error_prepend(errp, "Could not create temporary overlay '%s': ",
1445e43bfd9cSMarkus Armbruster                       tmp_filename);
14461ba4b6a5SBenoît Canet         goto out;
1447b998875dSKevin Wolf     }
1448b998875dSKevin Wolf 
144973176beeSKevin Wolf     /* Prepare options QDict for the temporary file */
1450b998875dSKevin Wolf     qdict_put(snapshot_options, "file.driver",
1451b998875dSKevin Wolf               qstring_from_str("file"));
1452b998875dSKevin Wolf     qdict_put(snapshot_options, "file.filename",
1453b998875dSKevin Wolf               qstring_from_str(tmp_filename));
1454e6641719SMax Reitz     qdict_put(snapshot_options, "driver",
1455e6641719SMax Reitz               qstring_from_str("qcow2"));
1456b998875dSKevin Wolf 
1457e4e9986bSMarkus Armbruster     bs_snapshot = bdrv_new();
1458b998875dSKevin Wolf 
1459b998875dSKevin Wolf     ret = bdrv_open(&bs_snapshot, NULL, NULL, snapshot_options,
14606ebf9aa2SMax Reitz                     flags, &local_err);
146173176beeSKevin Wolf     snapshot_options = NULL;
1462b998875dSKevin Wolf     if (ret < 0) {
1463b998875dSKevin Wolf         error_propagate(errp, local_err);
14641ba4b6a5SBenoît Canet         goto out;
1465b998875dSKevin Wolf     }
1466b998875dSKevin Wolf 
1467b998875dSKevin Wolf     bdrv_append(bs_snapshot, bs);
14681ba4b6a5SBenoît Canet 
14691ba4b6a5SBenoît Canet out:
147073176beeSKevin Wolf     QDECREF(snapshot_options);
14711ba4b6a5SBenoît Canet     g_free(tmp_filename);
14726b8aeca5SChen Gang     return ret;
1473b998875dSKevin Wolf }
1474b998875dSKevin Wolf 
1475da557aacSMax Reitz /*
1476b6ce07aaSKevin Wolf  * Opens a disk image (raw, qcow2, vmdk, ...)
1477de9c0cecSKevin Wolf  *
1478de9c0cecSKevin Wolf  * options is a QDict of options to pass to the block drivers, or NULL for an
1479de9c0cecSKevin Wolf  * empty set of options. The reference to the QDict belongs to the block layer
1480de9c0cecSKevin Wolf  * after the call (even on failure), so if the caller intends to reuse the
1481de9c0cecSKevin Wolf  * dictionary, it needs to use QINCREF() before calling bdrv_open.
1482f67503e5SMax Reitz  *
1483f67503e5SMax Reitz  * If *pbs is NULL, a new BDS will be created with a pointer to it stored there.
1484f67503e5SMax Reitz  * If it is not NULL, the referenced BDS will be reused.
1485ddf5636dSMax Reitz  *
1486ddf5636dSMax Reitz  * The reference parameter may be used to specify an existing block device which
1487ddf5636dSMax Reitz  * should be opened. If specified, neither options nor a filename may be given,
1488ddf5636dSMax Reitz  * nor can an existing BDS be reused (that is, *pbs has to be NULL).
1489b6ce07aaSKevin Wolf  */
1490f3930ed0SKevin Wolf static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
1491ddf5636dSMax Reitz                              const char *reference, QDict *options, int flags,
1492f3930ed0SKevin Wolf                              BlockDriverState *parent,
1493ce343771SMax Reitz                              const BdrvChildRole *child_role, Error **errp)
1494ea2384d3Sbellard {
1495b6ce07aaSKevin Wolf     int ret;
14969a4f4c31SKevin Wolf     BdrvChild *file = NULL;
14979a4f4c31SKevin Wolf     BlockDriverState *bs;
1498ce343771SMax Reitz     BlockDriver *drv = NULL;
149974fe54f2SKevin Wolf     const char *drvname;
15003e8c2e57SAlberto Garcia     const char *backing;
150134b5d2c6SMax Reitz     Error *local_err = NULL;
150273176beeSKevin Wolf     QDict *snapshot_options = NULL;
1503b1e6fc08SKevin Wolf     int snapshot_flags = 0;
150433e3963eSbellard 
1505f67503e5SMax Reitz     assert(pbs);
1506f3930ed0SKevin Wolf     assert(!child_role || !flags);
1507f3930ed0SKevin Wolf     assert(!child_role == !parent);
1508f67503e5SMax Reitz 
1509ddf5636dSMax Reitz     if (reference) {
1510ddf5636dSMax Reitz         bool options_non_empty = options ? qdict_size(options) : false;
1511ddf5636dSMax Reitz         QDECREF(options);
1512ddf5636dSMax Reitz 
1513ddf5636dSMax Reitz         if (*pbs) {
1514ddf5636dSMax Reitz             error_setg(errp, "Cannot reuse an existing BDS when referencing "
1515ddf5636dSMax Reitz                        "another block device");
1516ddf5636dSMax Reitz             return -EINVAL;
1517ddf5636dSMax Reitz         }
1518ddf5636dSMax Reitz 
1519ddf5636dSMax Reitz         if (filename || options_non_empty) {
1520ddf5636dSMax Reitz             error_setg(errp, "Cannot reference an existing block device with "
1521ddf5636dSMax Reitz                        "additional options or a new filename");
1522ddf5636dSMax Reitz             return -EINVAL;
1523ddf5636dSMax Reitz         }
1524ddf5636dSMax Reitz 
1525ddf5636dSMax Reitz         bs = bdrv_lookup_bs(reference, reference, errp);
1526ddf5636dSMax Reitz         if (!bs) {
1527ddf5636dSMax Reitz             return -ENODEV;
1528ddf5636dSMax Reitz         }
1529*76b22320SKevin Wolf 
1530*76b22320SKevin Wolf         if (bs->throttle_state) {
1531*76b22320SKevin Wolf             error_setg(errp, "Cannot reference an existing block device for "
1532*76b22320SKevin Wolf                        "which I/O throttling is enabled");
1533*76b22320SKevin Wolf             return -EINVAL;
1534*76b22320SKevin Wolf         }
1535*76b22320SKevin Wolf 
1536ddf5636dSMax Reitz         bdrv_ref(bs);
1537ddf5636dSMax Reitz         *pbs = bs;
1538ddf5636dSMax Reitz         return 0;
1539ddf5636dSMax Reitz     }
1540ddf5636dSMax Reitz 
1541f67503e5SMax Reitz     if (*pbs) {
1542f67503e5SMax Reitz         bs = *pbs;
1543f67503e5SMax Reitz     } else {
1544e4e9986bSMarkus Armbruster         bs = bdrv_new();
1545f67503e5SMax Reitz     }
1546f67503e5SMax Reitz 
1547de9c0cecSKevin Wolf     /* NULL means an empty set of options */
1548de9c0cecSKevin Wolf     if (options == NULL) {
1549de9c0cecSKevin Wolf         options = qdict_new();
1550de9c0cecSKevin Wolf     }
1551de9c0cecSKevin Wolf 
1552145f598eSKevin Wolf     /* json: syntax counts as explicit options, as if in the QDict */
1553de3b53f0SKevin Wolf     parse_json_protocol(options, &filename, &local_err);
1554de3b53f0SKevin Wolf     if (local_err) {
1555de3b53f0SKevin Wolf         ret = -EINVAL;
1556de3b53f0SKevin Wolf         goto fail;
1557de3b53f0SKevin Wolf     }
1558de3b53f0SKevin Wolf 
1559145f598eSKevin Wolf     bs->explicit_options = qdict_clone_shallow(options);
1560145f598eSKevin Wolf 
1561f3930ed0SKevin Wolf     if (child_role) {
1562bddcec37SKevin Wolf         bs->inherits_from = parent;
15638e2160e2SKevin Wolf         child_role->inherit_options(&flags, options,
15648e2160e2SKevin Wolf                                     parent->open_flags, parent->options);
1565f3930ed0SKevin Wolf     }
1566f3930ed0SKevin Wolf 
1567de3b53f0SKevin Wolf     ret = bdrv_fill_options(&options, filename, &flags, &local_err);
1568462f5bcfSKevin Wolf     if (local_err) {
1569462f5bcfSKevin Wolf         goto fail;
1570462f5bcfSKevin Wolf     }
1571462f5bcfSKevin Wolf 
157262392ebbSKevin Wolf     bs->open_flags = flags;
157362392ebbSKevin Wolf     bs->options = options;
157462392ebbSKevin Wolf     options = qdict_clone_shallow(options);
157562392ebbSKevin Wolf 
157676c591b0SKevin Wolf     /* Find the right image format driver */
157776c591b0SKevin Wolf     drvname = qdict_get_try_str(options, "driver");
157876c591b0SKevin Wolf     if (drvname) {
157976c591b0SKevin Wolf         drv = bdrv_find_format(drvname);
158076c591b0SKevin Wolf         if (!drv) {
158176c591b0SKevin Wolf             error_setg(errp, "Unknown driver: '%s'", drvname);
158276c591b0SKevin Wolf             ret = -EINVAL;
158376c591b0SKevin Wolf             goto fail;
158476c591b0SKevin Wolf         }
158576c591b0SKevin Wolf     }
158676c591b0SKevin Wolf 
158776c591b0SKevin Wolf     assert(drvname || !(flags & BDRV_O_PROTOCOL));
158876c591b0SKevin Wolf 
15893e8c2e57SAlberto Garcia     backing = qdict_get_try_str(options, "backing");
15903e8c2e57SAlberto Garcia     if (backing && *backing == '\0') {
15913e8c2e57SAlberto Garcia         flags |= BDRV_O_NO_BACKING;
15923e8c2e57SAlberto Garcia         qdict_del(options, "backing");
15933e8c2e57SAlberto Garcia     }
15943e8c2e57SAlberto Garcia 
1595f500a6d3SKevin Wolf     /* Open image file without format layer */
1596f4788adcSKevin Wolf     if ((flags & BDRV_O_PROTOCOL) == 0) {
1597be028adcSJeff Cody         if (flags & BDRV_O_RDWR) {
1598be028adcSJeff Cody             flags |= BDRV_O_ALLOW_RDWR;
1599be028adcSJeff Cody         }
1600b1e6fc08SKevin Wolf         if (flags & BDRV_O_SNAPSHOT) {
160173176beeSKevin Wolf             snapshot_options = qdict_new();
160273176beeSKevin Wolf             bdrv_temp_snapshot_options(&snapshot_flags, snapshot_options,
160373176beeSKevin Wolf                                        flags, options);
16048e2160e2SKevin Wolf             bdrv_backing_options(&flags, options, flags, options);
1605b1e6fc08SKevin Wolf         }
1606be028adcSJeff Cody 
1607f3930ed0SKevin Wolf         bs->open_flags = flags;
16081fdd6933SKevin Wolf 
16099a4f4c31SKevin Wolf         file = bdrv_open_child(filename, options, "file", bs,
16101fdd6933SKevin Wolf                                &child_file, true, &local_err);
16111fdd6933SKevin Wolf         if (local_err) {
16121fdd6933SKevin Wolf             ret = -EINVAL;
16138bfea15dSKevin Wolf             goto fail;
1614f500a6d3SKevin Wolf         }
1615f4788adcSKevin Wolf     }
1616f500a6d3SKevin Wolf 
161776c591b0SKevin Wolf     /* Image format probing */
161838f3ef57SKevin Wolf     bs->probed = !drv;
161976c591b0SKevin Wolf     if (!drv && file) {
16209a4f4c31SKevin Wolf         ret = find_image_format(file->bs, filename, &drv, &local_err);
162117b005f1SKevin Wolf         if (ret < 0) {
162217b005f1SKevin Wolf             goto fail;
162317b005f1SKevin Wolf         }
162462392ebbSKevin Wolf         /*
162562392ebbSKevin Wolf          * This option update would logically belong in bdrv_fill_options(),
162662392ebbSKevin Wolf          * but we first need to open bs->file for the probing to work, while
162762392ebbSKevin Wolf          * opening bs->file already requires the (mostly) final set of options
162862392ebbSKevin Wolf          * so that cache mode etc. can be inherited.
162962392ebbSKevin Wolf          *
163062392ebbSKevin Wolf          * Adding the driver later is somewhat ugly, but it's not an option
163162392ebbSKevin Wolf          * that would ever be inherited, so it's correct. We just need to make
163262392ebbSKevin Wolf          * sure to update both bs->options (which has the full effective
163362392ebbSKevin Wolf          * options for bs) and options (which has file.* already removed).
163462392ebbSKevin Wolf          */
163562392ebbSKevin Wolf         qdict_put(bs->options, "driver", qstring_from_str(drv->format_name));
163662392ebbSKevin Wolf         qdict_put(options, "driver", qstring_from_str(drv->format_name));
163776c591b0SKevin Wolf     } else if (!drv) {
16382a05cbe4SMax Reitz         error_setg(errp, "Must specify either driver or file");
16392a05cbe4SMax Reitz         ret = -EINVAL;
16408bfea15dSKevin Wolf         goto fail;
16412a05cbe4SMax Reitz     }
1642f500a6d3SKevin Wolf 
164353a29513SMax Reitz     /* BDRV_O_PROTOCOL must be set iff a protocol BDS is about to be created */
164453a29513SMax Reitz     assert(!!(flags & BDRV_O_PROTOCOL) == !!drv->bdrv_file_open);
164553a29513SMax Reitz     /* file must be NULL if a protocol BDS is about to be created
164653a29513SMax Reitz      * (the inverse results in an error message from bdrv_open_common()) */
164753a29513SMax Reitz     assert(!(flags & BDRV_O_PROTOCOL) || !file);
164853a29513SMax Reitz 
1649b6ce07aaSKevin Wolf     /* Open the image */
165082dc8b41SKevin Wolf     ret = bdrv_open_common(bs, file, options, &local_err);
1651b6ce07aaSKevin Wolf     if (ret < 0) {
16528bfea15dSKevin Wolf         goto fail;
16536987307cSChristoph Hellwig     }
16546987307cSChristoph Hellwig 
16552a05cbe4SMax Reitz     if (file && (bs->file != file)) {
16569a4f4c31SKevin Wolf         bdrv_unref_child(bs, file);
1657f500a6d3SKevin Wolf         file = NULL;
1658f500a6d3SKevin Wolf     }
1659f500a6d3SKevin Wolf 
1660b6ce07aaSKevin Wolf     /* If there is a backing file, use it */
16619156df12SPaolo Bonzini     if ((flags & BDRV_O_NO_BACKING) == 0) {
1662d9b7b057SKevin Wolf         ret = bdrv_open_backing_file(bs, options, "backing", &local_err);
1663b6ce07aaSKevin Wolf         if (ret < 0) {
1664b6ad491aSKevin Wolf             goto close_and_fail;
1665b6ce07aaSKevin Wolf         }
1666b6ce07aaSKevin Wolf     }
1667b6ce07aaSKevin Wolf 
166891af7014SMax Reitz     bdrv_refresh_filename(bs);
166991af7014SMax Reitz 
1670b6ad491aSKevin Wolf     /* Check if any unknown options were used */
16715acd9d81SMax Reitz     if (options && (qdict_size(options) != 0)) {
1672b6ad491aSKevin Wolf         const QDictEntry *entry = qdict_first(options);
16735acd9d81SMax Reitz         if (flags & BDRV_O_PROTOCOL) {
16745acd9d81SMax Reitz             error_setg(errp, "Block protocol '%s' doesn't support the option "
16755acd9d81SMax Reitz                        "'%s'", drv->format_name, entry->key);
16765acd9d81SMax Reitz         } else {
1677d0e46a55SMax Reitz             error_setg(errp,
1678d0e46a55SMax Reitz                        "Block format '%s' does not support the option '%s'",
1679d0e46a55SMax Reitz                        drv->format_name, entry->key);
16805acd9d81SMax Reitz         }
1681b6ad491aSKevin Wolf 
1682b6ad491aSKevin Wolf         ret = -EINVAL;
1683b6ad491aSKevin Wolf         goto close_and_fail;
1684b6ad491aSKevin Wolf     }
1685b6ad491aSKevin Wolf 
1686b6ce07aaSKevin Wolf     if (!bdrv_key_required(bs)) {
1687a7f53e26SMarkus Armbruster         if (bs->blk) {
1688a7f53e26SMarkus Armbruster             blk_dev_change_media_cb(bs->blk, true);
1689a7f53e26SMarkus Armbruster         }
1690c3adb58fSMarkus Armbruster     } else if (!runstate_check(RUN_STATE_PRELAUNCH)
1691c3adb58fSMarkus Armbruster                && !runstate_check(RUN_STATE_INMIGRATE)
1692c3adb58fSMarkus Armbruster                && !runstate_check(RUN_STATE_PAUSED)) { /* HACK */
1693c3adb58fSMarkus Armbruster         error_setg(errp,
1694c3adb58fSMarkus Armbruster                    "Guest must be stopped for opening of encrypted image");
1695c3adb58fSMarkus Armbruster         ret = -EBUSY;
1696c3adb58fSMarkus Armbruster         goto close_and_fail;
1697b6ce07aaSKevin Wolf     }
1698b6ce07aaSKevin Wolf 
1699c3adb58fSMarkus Armbruster     QDECREF(options);
1700f67503e5SMax Reitz     *pbs = bs;
1701dd62f1caSKevin Wolf 
1702dd62f1caSKevin Wolf     /* For snapshot=on, create a temporary qcow2 overlay. bs points to the
1703dd62f1caSKevin Wolf      * temporary snapshot afterwards. */
1704dd62f1caSKevin Wolf     if (snapshot_flags) {
170573176beeSKevin Wolf         ret = bdrv_append_temp_snapshot(bs, snapshot_flags, snapshot_options,
170673176beeSKevin Wolf                                         &local_err);
170773176beeSKevin Wolf         snapshot_options = NULL;
1708dd62f1caSKevin Wolf         if (local_err) {
1709dd62f1caSKevin Wolf             goto close_and_fail;
1710dd62f1caSKevin Wolf         }
1711dd62f1caSKevin Wolf     }
1712dd62f1caSKevin Wolf 
1713b6ce07aaSKevin Wolf     return 0;
1714b6ce07aaSKevin Wolf 
17158bfea15dSKevin Wolf fail:
1716f500a6d3SKevin Wolf     if (file != NULL) {
17179a4f4c31SKevin Wolf         bdrv_unref_child(bs, file);
1718f500a6d3SKevin Wolf     }
171973176beeSKevin Wolf     QDECREF(snapshot_options);
1720145f598eSKevin Wolf     QDECREF(bs->explicit_options);
1721de9c0cecSKevin Wolf     QDECREF(bs->options);
1722b6ad491aSKevin Wolf     QDECREF(options);
1723de9c0cecSKevin Wolf     bs->options = NULL;
1724f67503e5SMax Reitz     if (!*pbs) {
1725f67503e5SMax Reitz         /* If *pbs is NULL, a new BDS has been created in this function and
1726f67503e5SMax Reitz            needs to be freed now. Otherwise, it does not need to be closed,
1727f67503e5SMax Reitz            since it has not really been opened yet. */
1728f67503e5SMax Reitz         bdrv_unref(bs);
1729f67503e5SMax Reitz     }
173084d18f06SMarkus Armbruster     if (local_err) {
173134b5d2c6SMax Reitz         error_propagate(errp, local_err);
173234b5d2c6SMax Reitz     }
1733b6ad491aSKevin Wolf     return ret;
1734de9c0cecSKevin Wolf 
1735b6ad491aSKevin Wolf close_and_fail:
1736f67503e5SMax Reitz     /* See fail path, but now the BDS has to be always closed */
1737f67503e5SMax Reitz     if (*pbs) {
1738b6ad491aSKevin Wolf         bdrv_close(bs);
1739f67503e5SMax Reitz     } else {
1740f67503e5SMax Reitz         bdrv_unref(bs);
1741f67503e5SMax Reitz     }
174273176beeSKevin Wolf     QDECREF(snapshot_options);
1743b6ad491aSKevin Wolf     QDECREF(options);
174484d18f06SMarkus Armbruster     if (local_err) {
174534b5d2c6SMax Reitz         error_propagate(errp, local_err);
174634b5d2c6SMax Reitz     }
1747b6ce07aaSKevin Wolf     return ret;
1748b6ce07aaSKevin Wolf }
1749b6ce07aaSKevin Wolf 
1750f3930ed0SKevin Wolf int bdrv_open(BlockDriverState **pbs, const char *filename,
17516ebf9aa2SMax Reitz               const char *reference, QDict *options, int flags, Error **errp)
1752f3930ed0SKevin Wolf {
1753f3930ed0SKevin Wolf     return bdrv_open_inherit(pbs, filename, reference, options, flags, NULL,
1754ce343771SMax Reitz                              NULL, errp);
1755f3930ed0SKevin Wolf }
1756f3930ed0SKevin Wolf 
1757e971aa12SJeff Cody typedef struct BlockReopenQueueEntry {
1758e971aa12SJeff Cody      bool prepared;
1759e971aa12SJeff Cody      BDRVReopenState state;
1760e971aa12SJeff Cody      QSIMPLEQ_ENTRY(BlockReopenQueueEntry) entry;
1761e971aa12SJeff Cody } BlockReopenQueueEntry;
1762e971aa12SJeff Cody 
1763e971aa12SJeff Cody /*
1764e971aa12SJeff Cody  * Adds a BlockDriverState to a simple queue for an atomic, transactional
1765e971aa12SJeff Cody  * reopen of multiple devices.
1766e971aa12SJeff Cody  *
 * bs_queue can either be an existing BlockReopenQueue that has had
 * QSIMPLEQ_INIT already performed, or alternatively may be NULL, in which
 * case a new BlockReopenQueue will be created and initialized. This newly
 * created BlockReopenQueue should be passed back in for subsequent calls
 * that are intended to be of the same atomic 'set'.
1772e971aa12SJeff Cody  *
1773e971aa12SJeff Cody  * bs is the BlockDriverState to add to the reopen queue.
1774e971aa12SJeff Cody  *
17754d2cb092SKevin Wolf  * options contains the changed options for the associated bs
17764d2cb092SKevin Wolf  * (the BlockReopenQueue takes ownership)
17774d2cb092SKevin Wolf  *
1778e971aa12SJeff Cody  * flags contains the open flags for the associated bs
1779e971aa12SJeff Cody  *
1780e971aa12SJeff Cody  * returns a pointer to bs_queue, which is either the newly allocated
1781e971aa12SJeff Cody  * bs_queue, or the existing bs_queue being used.
1782e971aa12SJeff Cody  *
1783e971aa12SJeff Cody  */
178428518102SKevin Wolf static BlockReopenQueue *bdrv_reopen_queue_child(BlockReopenQueue *bs_queue,
17854d2cb092SKevin Wolf                                                  BlockDriverState *bs,
178628518102SKevin Wolf                                                  QDict *options,
178728518102SKevin Wolf                                                  int flags,
178828518102SKevin Wolf                                                  const BdrvChildRole *role,
178928518102SKevin Wolf                                                  QDict *parent_options,
179028518102SKevin Wolf                                                  int parent_flags)
1791e971aa12SJeff Cody {
1792e971aa12SJeff Cody     assert(bs != NULL);
1793e971aa12SJeff Cody 
1794e971aa12SJeff Cody     BlockReopenQueueEntry *bs_entry;
179567251a31SKevin Wolf     BdrvChild *child;
1796145f598eSKevin Wolf     QDict *old_options, *explicit_options;
179767251a31SKevin Wolf 
1798e971aa12SJeff Cody     if (bs_queue == NULL) {
1799e971aa12SJeff Cody         bs_queue = g_new0(BlockReopenQueue, 1);
1800e971aa12SJeff Cody         QSIMPLEQ_INIT(bs_queue);
1801e971aa12SJeff Cody     }
1802e971aa12SJeff Cody 
18034d2cb092SKevin Wolf     if (!options) {
18044d2cb092SKevin Wolf         options = qdict_new();
18054d2cb092SKevin Wolf     }
18064d2cb092SKevin Wolf 
180728518102SKevin Wolf     /*
180828518102SKevin Wolf      * Precedence of options:
180928518102SKevin Wolf      * 1. Explicitly passed in options (highest)
181091a097e7SKevin Wolf      * 2. Set in flags (only for top level)
1811145f598eSKevin Wolf      * 3. Retained from explicitly set options of bs
18128e2160e2SKevin Wolf      * 4. Inherited from parent node
181328518102SKevin Wolf      * 5. Retained from effective options of bs
181428518102SKevin Wolf      */
181528518102SKevin Wolf 
181691a097e7SKevin Wolf     if (!parent_options) {
181791a097e7SKevin Wolf         /*
181891a097e7SKevin Wolf          * Any setting represented by flags is always updated. If the
181991a097e7SKevin Wolf          * corresponding QDict option is set, it takes precedence. Otherwise
182091a097e7SKevin Wolf          * the flag is translated into a QDict option. The old setting of bs is
182191a097e7SKevin Wolf          * not considered.
182291a097e7SKevin Wolf          */
182391a097e7SKevin Wolf         update_options_from_flags(options, flags);
182491a097e7SKevin Wolf     }
182591a097e7SKevin Wolf 
1826145f598eSKevin Wolf     /* Old explicitly set values (don't overwrite by inherited value) */
1827145f598eSKevin Wolf     old_options = qdict_clone_shallow(bs->explicit_options);
1828145f598eSKevin Wolf     bdrv_join_options(bs, options, old_options);
1829145f598eSKevin Wolf     QDECREF(old_options);
1830145f598eSKevin Wolf 
1831145f598eSKevin Wolf     explicit_options = qdict_clone_shallow(options);
1832145f598eSKevin Wolf 
183328518102SKevin Wolf     /* Inherit from parent node */
183428518102SKevin Wolf     if (parent_options) {
183528518102SKevin Wolf         assert(!flags);
18368e2160e2SKevin Wolf         role->inherit_options(&flags, options, parent_flags, parent_options);
183728518102SKevin Wolf     }
183828518102SKevin Wolf 
183928518102SKevin Wolf     /* Old values are used for options that aren't set yet */
18404d2cb092SKevin Wolf     old_options = qdict_clone_shallow(bs->options);
1841cddff5baSKevin Wolf     bdrv_join_options(bs, options, old_options);
18424d2cb092SKevin Wolf     QDECREF(old_options);
18434d2cb092SKevin Wolf 
1844f1f25a2eSKevin Wolf     /* bdrv_open() masks this flag out */
1845f1f25a2eSKevin Wolf     flags &= ~BDRV_O_PROTOCOL;
1846f1f25a2eSKevin Wolf 
184767251a31SKevin Wolf     QLIST_FOREACH(child, &bs->children, next) {
18484c9dfe5dSKevin Wolf         QDict *new_child_options;
18494c9dfe5dSKevin Wolf         char *child_key_dot;
185067251a31SKevin Wolf 
18514c9dfe5dSKevin Wolf         /* reopen can only change the options of block devices that were
18524c9dfe5dSKevin Wolf          * implicitly created and inherited options. For other (referenced)
18534c9dfe5dSKevin Wolf          * block devices, a syntax like "backing.foo" results in an error. */
185467251a31SKevin Wolf         if (child->bs->inherits_from != bs) {
185567251a31SKevin Wolf             continue;
185667251a31SKevin Wolf         }
185767251a31SKevin Wolf 
18584c9dfe5dSKevin Wolf         child_key_dot = g_strdup_printf("%s.", child->name);
18594c9dfe5dSKevin Wolf         qdict_extract_subqdict(options, &new_child_options, child_key_dot);
18604c9dfe5dSKevin Wolf         g_free(child_key_dot);
18614c9dfe5dSKevin Wolf 
186228518102SKevin Wolf         bdrv_reopen_queue_child(bs_queue, child->bs, new_child_options, 0,
186328518102SKevin Wolf                                 child->role, options, flags);
1864e971aa12SJeff Cody     }
1865e971aa12SJeff Cody 
1866e971aa12SJeff Cody     bs_entry = g_new0(BlockReopenQueueEntry, 1);
1867e971aa12SJeff Cody     QSIMPLEQ_INSERT_TAIL(bs_queue, bs_entry, entry);
1868e971aa12SJeff Cody 
1869e971aa12SJeff Cody     bs_entry->state.bs = bs;
18704d2cb092SKevin Wolf     bs_entry->state.options = options;
1871145f598eSKevin Wolf     bs_entry->state.explicit_options = explicit_options;
1872e971aa12SJeff Cody     bs_entry->state.flags = flags;
1873e971aa12SJeff Cody 
1874e971aa12SJeff Cody     return bs_queue;
1875e971aa12SJeff Cody }
1876e971aa12SJeff Cody 
187728518102SKevin Wolf BlockReopenQueue *bdrv_reopen_queue(BlockReopenQueue *bs_queue,
187828518102SKevin Wolf                                     BlockDriverState *bs,
187928518102SKevin Wolf                                     QDict *options, int flags)
188028518102SKevin Wolf {
188128518102SKevin Wolf     return bdrv_reopen_queue_child(bs_queue, bs, options, flags,
188228518102SKevin Wolf                                    NULL, NULL, 0);
188328518102SKevin Wolf }
188428518102SKevin Wolf 
1885e971aa12SJeff Cody /*
1886e971aa12SJeff Cody  * Reopen multiple BlockDriverStates atomically & transactionally.
1887e971aa12SJeff Cody  *
1888e971aa12SJeff Cody  * The queue passed in (bs_queue) must have been built up previous
1889e971aa12SJeff Cody  * via bdrv_reopen_queue().
1890e971aa12SJeff Cody  *
1891e971aa12SJeff Cody  * Reopens all BDS specified in the queue, with the appropriate
1892e971aa12SJeff Cody  * flags.  All devices are prepared for reopen, and failure of any
1893e971aa12SJeff Cody  * device will cause all device changes to be abandonded, and intermediate
1894e971aa12SJeff Cody  * data cleaned up.
1895e971aa12SJeff Cody  *
1896e971aa12SJeff Cody  * If all devices prepare successfully, then the changes are committed
1897e971aa12SJeff Cody  * to all devices.
1898e971aa12SJeff Cody  *
1899e971aa12SJeff Cody  */
1900e971aa12SJeff Cody int bdrv_reopen_multiple(BlockReopenQueue *bs_queue, Error **errp)
1901e971aa12SJeff Cody {
1902e971aa12SJeff Cody     int ret = -1;
1903e971aa12SJeff Cody     BlockReopenQueueEntry *bs_entry, *next;
1904e971aa12SJeff Cody     Error *local_err = NULL;
1905e971aa12SJeff Cody 
1906e971aa12SJeff Cody     assert(bs_queue != NULL);
1907e971aa12SJeff Cody 
1908e971aa12SJeff Cody     bdrv_drain_all();
1909e971aa12SJeff Cody 
1910e971aa12SJeff Cody     QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1911e971aa12SJeff Cody         if (bdrv_reopen_prepare(&bs_entry->state, bs_queue, &local_err)) {
1912e971aa12SJeff Cody             error_propagate(errp, local_err);
1913e971aa12SJeff Cody             goto cleanup;
1914e971aa12SJeff Cody         }
1915e971aa12SJeff Cody         bs_entry->prepared = true;
1916e971aa12SJeff Cody     }
1917e971aa12SJeff Cody 
1918e971aa12SJeff Cody     /* If we reach this point, we have success and just need to apply the
1919e971aa12SJeff Cody      * changes
1920e971aa12SJeff Cody      */
1921e971aa12SJeff Cody     QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1922e971aa12SJeff Cody         bdrv_reopen_commit(&bs_entry->state);
1923e971aa12SJeff Cody     }
1924e971aa12SJeff Cody 
1925e971aa12SJeff Cody     ret = 0;
1926e971aa12SJeff Cody 
1927e971aa12SJeff Cody cleanup:
1928e971aa12SJeff Cody     QSIMPLEQ_FOREACH_SAFE(bs_entry, bs_queue, entry, next) {
1929e971aa12SJeff Cody         if (ret && bs_entry->prepared) {
1930e971aa12SJeff Cody             bdrv_reopen_abort(&bs_entry->state);
1931145f598eSKevin Wolf         } else if (ret) {
1932145f598eSKevin Wolf             QDECREF(bs_entry->state.explicit_options);
1933e971aa12SJeff Cody         }
19344d2cb092SKevin Wolf         QDECREF(bs_entry->state.options);
1935e971aa12SJeff Cody         g_free(bs_entry);
1936e971aa12SJeff Cody     }
1937e971aa12SJeff Cody     g_free(bs_queue);
1938e971aa12SJeff Cody     return ret;
1939e971aa12SJeff Cody }
1940e971aa12SJeff Cody 
1941e971aa12SJeff Cody 
1942e971aa12SJeff Cody /* Reopen a single BlockDriverState with the specified flags. */
1943e971aa12SJeff Cody int bdrv_reopen(BlockDriverState *bs, int bdrv_flags, Error **errp)
1944e971aa12SJeff Cody {
1945e971aa12SJeff Cody     int ret = -1;
1946e971aa12SJeff Cody     Error *local_err = NULL;
19474d2cb092SKevin Wolf     BlockReopenQueue *queue = bdrv_reopen_queue(NULL, bs, NULL, bdrv_flags);
1948e971aa12SJeff Cody 
1949e971aa12SJeff Cody     ret = bdrv_reopen_multiple(queue, &local_err);
1950e971aa12SJeff Cody     if (local_err != NULL) {
1951e971aa12SJeff Cody         error_propagate(errp, local_err);
1952e971aa12SJeff Cody     }
1953e971aa12SJeff Cody     return ret;
1954e971aa12SJeff Cody }
1955e971aa12SJeff Cody 
1956e971aa12SJeff Cody 
1957e971aa12SJeff Cody /*
1958e971aa12SJeff Cody  * Prepares a BlockDriverState for reopen. All changes are staged in the
1959e971aa12SJeff Cody  * 'opaque' field of the BDRVReopenState, which is used and allocated by
1960e971aa12SJeff Cody  * the block driver layer .bdrv_reopen_prepare()
1961e971aa12SJeff Cody  *
1962e971aa12SJeff Cody  * bs is the BlockDriverState to reopen
1963e971aa12SJeff Cody  * flags are the new open flags
1964e971aa12SJeff Cody  * queue is the reopen queue
1965e971aa12SJeff Cody  *
1966e971aa12SJeff Cody  * Returns 0 on success, non-zero on error.  On error errp will be set
1967e971aa12SJeff Cody  * as well.
1968e971aa12SJeff Cody  *
1969e971aa12SJeff Cody  * On failure, bdrv_reopen_abort() will be called to clean up any data.
1970e971aa12SJeff Cody  * It is the responsibility of the caller to then call the abort() or
1971e971aa12SJeff Cody  * commit() for any other BDS that have been left in a prepare() state
1972e971aa12SJeff Cody  *
1973e971aa12SJeff Cody  */
1974e971aa12SJeff Cody int bdrv_reopen_prepare(BDRVReopenState *reopen_state, BlockReopenQueue *queue,
1975e971aa12SJeff Cody                         Error **errp)
1976e971aa12SJeff Cody {
1977e971aa12SJeff Cody     int ret = -1;
1978e971aa12SJeff Cody     Error *local_err = NULL;
1979e971aa12SJeff Cody     BlockDriver *drv;
1980ccf9dc07SKevin Wolf     QemuOpts *opts;
1981ccf9dc07SKevin Wolf     const char *value;
1982e971aa12SJeff Cody 
1983e971aa12SJeff Cody     assert(reopen_state != NULL);
1984e971aa12SJeff Cody     assert(reopen_state->bs->drv != NULL);
1985e971aa12SJeff Cody     drv = reopen_state->bs->drv;
1986e971aa12SJeff Cody 
1987ccf9dc07SKevin Wolf     /* Process generic block layer options */
1988ccf9dc07SKevin Wolf     opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
1989ccf9dc07SKevin Wolf     qemu_opts_absorb_qdict(opts, reopen_state->options, &local_err);
1990ccf9dc07SKevin Wolf     if (local_err) {
1991ccf9dc07SKevin Wolf         error_propagate(errp, local_err);
1992ccf9dc07SKevin Wolf         ret = -EINVAL;
1993ccf9dc07SKevin Wolf         goto error;
1994ccf9dc07SKevin Wolf     }
1995ccf9dc07SKevin Wolf 
199691a097e7SKevin Wolf     update_flags_from_options(&reopen_state->flags, opts);
199791a097e7SKevin Wolf 
1998ccf9dc07SKevin Wolf     /* node-name and driver must be unchanged. Put them back into the QDict, so
1999ccf9dc07SKevin Wolf      * that they are checked at the end of this function. */
2000ccf9dc07SKevin Wolf     value = qemu_opt_get(opts, "node-name");
2001ccf9dc07SKevin Wolf     if (value) {
2002ccf9dc07SKevin Wolf         qdict_put(reopen_state->options, "node-name", qstring_from_str(value));
2003ccf9dc07SKevin Wolf     }
2004ccf9dc07SKevin Wolf 
2005ccf9dc07SKevin Wolf     value = qemu_opt_get(opts, "driver");
2006ccf9dc07SKevin Wolf     if (value) {
2007ccf9dc07SKevin Wolf         qdict_put(reopen_state->options, "driver", qstring_from_str(value));
2008ccf9dc07SKevin Wolf     }
2009ccf9dc07SKevin Wolf 
2010e971aa12SJeff Cody     /* if we are to stay read-only, do not allow permission change
2011e971aa12SJeff Cody      * to r/w */
2012e971aa12SJeff Cody     if (!(reopen_state->bs->open_flags & BDRV_O_ALLOW_RDWR) &&
2013e971aa12SJeff Cody         reopen_state->flags & BDRV_O_RDWR) {
201481e5f78aSAlberto Garcia         error_setg(errp, "Node '%s' is read only",
201581e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(reopen_state->bs));
2016e971aa12SJeff Cody         goto error;
2017e971aa12SJeff Cody     }
2018e971aa12SJeff Cody 
2019e971aa12SJeff Cody 
2020e971aa12SJeff Cody     ret = bdrv_flush(reopen_state->bs);
2021e971aa12SJeff Cody     if (ret) {
2022455b0fdeSEric Blake         error_setg_errno(errp, -ret, "Error flushing drive");
2023e971aa12SJeff Cody         goto error;
2024e971aa12SJeff Cody     }
2025e971aa12SJeff Cody 
2026e971aa12SJeff Cody     if (drv->bdrv_reopen_prepare) {
2027e971aa12SJeff Cody         ret = drv->bdrv_reopen_prepare(reopen_state, queue, &local_err);
2028e971aa12SJeff Cody         if (ret) {
2029e971aa12SJeff Cody             if (local_err != NULL) {
2030e971aa12SJeff Cody                 error_propagate(errp, local_err);
2031e971aa12SJeff Cody             } else {
2032d8b6895fSLuiz Capitulino                 error_setg(errp, "failed while preparing to reopen image '%s'",
2033e971aa12SJeff Cody                            reopen_state->bs->filename);
2034e971aa12SJeff Cody             }
2035e971aa12SJeff Cody             goto error;
2036e971aa12SJeff Cody         }
2037e971aa12SJeff Cody     } else {
2038e971aa12SJeff Cody         /* It is currently mandatory to have a bdrv_reopen_prepare()
2039e971aa12SJeff Cody          * handler for each supported drv. */
204081e5f78aSAlberto Garcia         error_setg(errp, "Block format '%s' used by node '%s' "
204181e5f78aSAlberto Garcia                    "does not support reopening files", drv->format_name,
204281e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(reopen_state->bs));
2043e971aa12SJeff Cody         ret = -1;
2044e971aa12SJeff Cody         goto error;
2045e971aa12SJeff Cody     }
2046e971aa12SJeff Cody 
20474d2cb092SKevin Wolf     /* Options that are not handled are only okay if they are unchanged
20484d2cb092SKevin Wolf      * compared to the old state. It is expected that some options are only
20494d2cb092SKevin Wolf      * used for the initial open, but not reopen (e.g. filename) */
20504d2cb092SKevin Wolf     if (qdict_size(reopen_state->options)) {
20514d2cb092SKevin Wolf         const QDictEntry *entry = qdict_first(reopen_state->options);
20524d2cb092SKevin Wolf 
20534d2cb092SKevin Wolf         do {
20544d2cb092SKevin Wolf             QString *new_obj = qobject_to_qstring(entry->value);
20554d2cb092SKevin Wolf             const char *new = qstring_get_str(new_obj);
20564d2cb092SKevin Wolf             const char *old = qdict_get_try_str(reopen_state->bs->options,
20574d2cb092SKevin Wolf                                                 entry->key);
20584d2cb092SKevin Wolf 
20594d2cb092SKevin Wolf             if (!old || strcmp(new, old)) {
20604d2cb092SKevin Wolf                 error_setg(errp, "Cannot change the option '%s'", entry->key);
20614d2cb092SKevin Wolf                 ret = -EINVAL;
20624d2cb092SKevin Wolf                 goto error;
20634d2cb092SKevin Wolf             }
20644d2cb092SKevin Wolf         } while ((entry = qdict_next(reopen_state->options, entry)));
20654d2cb092SKevin Wolf     }
20664d2cb092SKevin Wolf 
2067e971aa12SJeff Cody     ret = 0;
2068e971aa12SJeff Cody 
2069e971aa12SJeff Cody error:
2070ccf9dc07SKevin Wolf     qemu_opts_del(opts);
2071e971aa12SJeff Cody     return ret;
2072e971aa12SJeff Cody }
2073e971aa12SJeff Cody 
2074e971aa12SJeff Cody /*
2075e971aa12SJeff Cody  * Takes the staged changes for the reopen from bdrv_reopen_prepare(), and
2076e971aa12SJeff Cody  * makes them final by swapping the staging BlockDriverState contents into
2077e971aa12SJeff Cody  * the active BlockDriverState contents.
2078e971aa12SJeff Cody  */
2079e971aa12SJeff Cody void bdrv_reopen_commit(BDRVReopenState *reopen_state)
2080e971aa12SJeff Cody {
2081e971aa12SJeff Cody     BlockDriver *drv;
2082e971aa12SJeff Cody 
2083e971aa12SJeff Cody     assert(reopen_state != NULL);
2084e971aa12SJeff Cody     drv = reopen_state->bs->drv;
2085e971aa12SJeff Cody     assert(drv != NULL);
2086e971aa12SJeff Cody 
2087e971aa12SJeff Cody     /* If there are any driver level actions to take */
2088e971aa12SJeff Cody     if (drv->bdrv_reopen_commit) {
2089e971aa12SJeff Cody         drv->bdrv_reopen_commit(reopen_state);
2090e971aa12SJeff Cody     }
2091e971aa12SJeff Cody 
2092e971aa12SJeff Cody     /* set BDS specific flags now */
2093145f598eSKevin Wolf     QDECREF(reopen_state->bs->explicit_options);
2094145f598eSKevin Wolf 
2095145f598eSKevin Wolf     reopen_state->bs->explicit_options   = reopen_state->explicit_options;
2096e971aa12SJeff Cody     reopen_state->bs->open_flags         = reopen_state->flags;
2097e971aa12SJeff Cody     reopen_state->bs->read_only = !(reopen_state->flags & BDRV_O_RDWR);
2098355ef4acSKevin Wolf 
20993baca891SKevin Wolf     bdrv_refresh_limits(reopen_state->bs, NULL);
2100e971aa12SJeff Cody }
2101e971aa12SJeff Cody 
2102e971aa12SJeff Cody /*
2103e971aa12SJeff Cody  * Abort the reopen, and delete and free the staged changes in
2104e971aa12SJeff Cody  * reopen_state
2105e971aa12SJeff Cody  */
2106e971aa12SJeff Cody void bdrv_reopen_abort(BDRVReopenState *reopen_state)
2107e971aa12SJeff Cody {
2108e971aa12SJeff Cody     BlockDriver *drv;
2109e971aa12SJeff Cody 
2110e971aa12SJeff Cody     assert(reopen_state != NULL);
2111e971aa12SJeff Cody     drv = reopen_state->bs->drv;
2112e971aa12SJeff Cody     assert(drv != NULL);
2113e971aa12SJeff Cody 
2114e971aa12SJeff Cody     if (drv->bdrv_reopen_abort) {
2115e971aa12SJeff Cody         drv->bdrv_reopen_abort(reopen_state);
2116e971aa12SJeff Cody     }
2117145f598eSKevin Wolf 
2118145f598eSKevin Wolf     QDECREF(reopen_state->explicit_options);
2119e971aa12SJeff Cody }
2120e971aa12SJeff Cody 
2121e971aa12SJeff Cody 
212264dff520SMax Reitz static void bdrv_close(BlockDriverState *bs)
2123fc01f7e7Sbellard {
212433384421SMax Reitz     BdrvAioNotifier *ban, *ban_next;
212533384421SMax Reitz 
2126ca9bd24cSMax Reitz     assert(!bs->job);
212799b7e775SAlberto Garcia 
212899b7e775SAlberto Garcia     /* Disable I/O limits and drain all pending throttled requests */
2129a0d64a61SAlberto Garcia     if (bs->throttle_state) {
213099b7e775SAlberto Garcia         bdrv_io_limits_disable(bs);
213199b7e775SAlberto Garcia     }
213299b7e775SAlberto Garcia 
2133fc27291dSPaolo Bonzini     bdrv_drained_begin(bs); /* complete I/O */
213458fda173SStefan Hajnoczi     bdrv_flush(bs);
213553ec73e2SFam Zheng     bdrv_drain(bs); /* in case flush left pending I/O */
2136fc27291dSPaolo Bonzini 
2137c5acdc9aSMax Reitz     bdrv_release_named_dirty_bitmaps(bs);
2138c5acdc9aSMax Reitz     assert(QLIST_EMPTY(&bs->dirty_bitmaps));
2139c5acdc9aSMax Reitz 
2140b4d02820SMax Reitz     if (bs->blk) {
2141b4d02820SMax Reitz         blk_dev_change_media_cb(bs->blk, false);
2142b4d02820SMax Reitz     }
2143b4d02820SMax Reitz 
21443cbc002cSPaolo Bonzini     if (bs->drv) {
21456e93e7c4SKevin Wolf         BdrvChild *child, *next;
21466e93e7c4SKevin Wolf 
21479a7dedbcSKevin Wolf         bs->drv->bdrv_close(bs);
21489a4f4c31SKevin Wolf         bs->drv = NULL;
21499a7dedbcSKevin Wolf 
21509a7dedbcSKevin Wolf         bdrv_set_backing_hd(bs, NULL);
21519a7dedbcSKevin Wolf 
21529a4f4c31SKevin Wolf         if (bs->file != NULL) {
21539a4f4c31SKevin Wolf             bdrv_unref_child(bs, bs->file);
21549a4f4c31SKevin Wolf             bs->file = NULL;
21559a4f4c31SKevin Wolf         }
21569a4f4c31SKevin Wolf 
21576e93e7c4SKevin Wolf         QLIST_FOREACH_SAFE(child, &bs->children, next, next) {
215833a60407SKevin Wolf             /* TODO Remove bdrv_unref() from drivers' close function and use
215933a60407SKevin Wolf              * bdrv_unref_child() here */
2160bddcec37SKevin Wolf             if (child->bs->inherits_from == bs) {
2161bddcec37SKevin Wolf                 child->bs->inherits_from = NULL;
2162bddcec37SKevin Wolf             }
216333a60407SKevin Wolf             bdrv_detach_child(child);
21646e93e7c4SKevin Wolf         }
21656e93e7c4SKevin Wolf 
21667267c094SAnthony Liguori         g_free(bs->opaque);
2167ea2384d3Sbellard         bs->opaque = NULL;
216853fec9d3SStefan Hajnoczi         bs->copy_on_read = 0;
2169a275fa42SPaolo Bonzini         bs->backing_file[0] = '\0';
2170a275fa42SPaolo Bonzini         bs->backing_format[0] = '\0';
21716405875cSPaolo Bonzini         bs->total_sectors = 0;
21726405875cSPaolo Bonzini         bs->encrypted = 0;
21736405875cSPaolo Bonzini         bs->valid_key = 0;
21746405875cSPaolo Bonzini         bs->sg = 0;
21750d51b4deSAsias He         bs->zero_beyond_eof = false;
2176de9c0cecSKevin Wolf         QDECREF(bs->options);
2177145f598eSKevin Wolf         QDECREF(bs->explicit_options);
2178de9c0cecSKevin Wolf         bs->options = NULL;
217991af7014SMax Reitz         QDECREF(bs->full_open_options);
218091af7014SMax Reitz         bs->full_open_options = NULL;
21819ca11154SPavel Hrdina     }
218266f82ceeSKevin Wolf 
218333384421SMax Reitz     QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
218433384421SMax Reitz         g_free(ban);
218533384421SMax Reitz     }
218633384421SMax Reitz     QLIST_INIT(&bs->aio_notifiers);
2187fc27291dSPaolo Bonzini     bdrv_drained_end(bs);
2188b338082bSbellard }
2189b338082bSbellard 
21902bc93fedSMORITA Kazutaka void bdrv_close_all(void)
21912bc93fedSMORITA Kazutaka {
21922bc93fedSMORITA Kazutaka     BlockDriverState *bs;
2193ca9bd24cSMax Reitz     AioContext *aio_context;
21942bc93fedSMORITA Kazutaka 
2195ca9bd24cSMax Reitz     /* Drop references from requests still in flight, such as canceled block
2196ca9bd24cSMax Reitz      * jobs whose AIO context has not been polled yet */
2197ca9bd24cSMax Reitz     bdrv_drain_all();
2198ca9bd24cSMax Reitz 
2199ca9bd24cSMax Reitz     blk_remove_all_bs();
2200ca9bd24cSMax Reitz     blockdev_close_all_bdrv_states();
2201ca9bd24cSMax Reitz 
2202ca9bd24cSMax Reitz     /* Cancel all block jobs */
2203ca9bd24cSMax Reitz     while (!QTAILQ_EMPTY(&all_bdrv_states)) {
2204ca9bd24cSMax Reitz         QTAILQ_FOREACH(bs, &all_bdrv_states, bs_list) {
2205ca9bd24cSMax Reitz             aio_context = bdrv_get_aio_context(bs);
2206ed78cda3SStefan Hajnoczi 
2207ed78cda3SStefan Hajnoczi             aio_context_acquire(aio_context);
2208ca9bd24cSMax Reitz             if (bs->job) {
2209ca9bd24cSMax Reitz                 block_job_cancel_sync(bs->job);
2210ed78cda3SStefan Hajnoczi                 aio_context_release(aio_context);
2211ca9bd24cSMax Reitz                 break;
2212ca9bd24cSMax Reitz             }
2213ca9bd24cSMax Reitz             aio_context_release(aio_context);
2214ca9bd24cSMax Reitz         }
2215ca9bd24cSMax Reitz 
2216ca9bd24cSMax Reitz         /* All the remaining BlockDriverStates are referenced directly or
2217ca9bd24cSMax Reitz          * indirectly from block jobs, so there needs to be at least one BDS
2218ca9bd24cSMax Reitz          * directly used by a block job */
2219ca9bd24cSMax Reitz         assert(bs);
22202bc93fedSMORITA Kazutaka     }
22212bc93fedSMORITA Kazutaka }
22222bc93fedSMORITA Kazutaka 
22238e419aefSKevin Wolf /* Fields that need to stay with the top-level BDS */
22244ddc07caSPaolo Bonzini static void bdrv_move_feature_fields(BlockDriverState *bs_dest,
22254ddc07caSPaolo Bonzini                                      BlockDriverState *bs_src)
22264ddc07caSPaolo Bonzini {
22274ddc07caSPaolo Bonzini     /* move some fields that need to stay attached to the device */
2228dd62f1caSKevin Wolf }
2229dd62f1caSKevin Wolf 
2230dd62f1caSKevin Wolf static void change_parent_backing_link(BlockDriverState *from,
2231dd62f1caSKevin Wolf                                        BlockDriverState *to)
2232dd62f1caSKevin Wolf {
2233dd62f1caSKevin Wolf     BdrvChild *c, *next;
2234dd62f1caSKevin Wolf 
2235f21d96d0SKevin Wolf     if (from->blk) {
2236f21d96d0SKevin Wolf         /* FIXME We bypass blk_set_bs(), so we need to make these updates
2237f21d96d0SKevin Wolf          * manually. The root problem is not in this change function, but the
2238f21d96d0SKevin Wolf          * existence of BlockDriverState.blk. */
2239f21d96d0SKevin Wolf         to->blk = from->blk;
2240f21d96d0SKevin Wolf         from->blk = NULL;
2241f21d96d0SKevin Wolf     }
2242f21d96d0SKevin Wolf 
2243dd62f1caSKevin Wolf     QLIST_FOREACH_SAFE(c, &from->parents, next_parent, next) {
2244dd62f1caSKevin Wolf         assert(c->role != &child_backing);
2245dd62f1caSKevin Wolf         c->bs = to;
2246dd62f1caSKevin Wolf         QLIST_REMOVE(c, next_parent);
2247dd62f1caSKevin Wolf         QLIST_INSERT_HEAD(&to->parents, c, next_parent);
2248dd62f1caSKevin Wolf         bdrv_ref(to);
2249dd62f1caSKevin Wolf         bdrv_unref(from);
2250dd62f1caSKevin Wolf     }
2251dd62f1caSKevin Wolf }
2252dd62f1caSKevin Wolf 
2253dd62f1caSKevin Wolf static void swap_feature_fields(BlockDriverState *bs_top,
2254dd62f1caSKevin Wolf                                 BlockDriverState *bs_new)
2255dd62f1caSKevin Wolf {
2256dd62f1caSKevin Wolf     BlockDriverState tmp;
2257dd62f1caSKevin Wolf 
2258dd62f1caSKevin Wolf     bdrv_move_feature_fields(&tmp, bs_top);
2259dd62f1caSKevin Wolf     bdrv_move_feature_fields(bs_top, bs_new);
2260dd62f1caSKevin Wolf     bdrv_move_feature_fields(bs_new, &tmp);
2261dd62f1caSKevin Wolf 
2262dd62f1caSKevin Wolf     assert(!bs_new->throttle_state);
2263dd62f1caSKevin Wolf     if (bs_top->throttle_state) {
2264dd62f1caSKevin Wolf         assert(bs_top->io_limits_enabled);
2265dd62f1caSKevin Wolf         bdrv_io_limits_enable(bs_new, throttle_group_get_name(bs_top));
2266dd62f1caSKevin Wolf         bdrv_io_limits_disable(bs_top);
2267dd62f1caSKevin Wolf     }
2268dd62f1caSKevin Wolf }
2269dd62f1caSKevin Wolf 
22708802d1fdSJeff Cody /*
22718802d1fdSJeff Cody  * Add new bs contents at the top of an image chain while the chain is
22728802d1fdSJeff Cody  * live, while keeping required fields on the top layer.
22738802d1fdSJeff Cody  *
22748802d1fdSJeff Cody  * This will modify the BlockDriverState fields, and swap contents
22758802d1fdSJeff Cody  * between bs_new and bs_top. Both bs_new and bs_top are modified.
22768802d1fdSJeff Cody  *
2277bfb197e0SMarkus Armbruster  * bs_new must not be attached to a BlockBackend.
2278f6801b83SJeff Cody  *
22798802d1fdSJeff Cody  * This function does not create any image files.
2280dd62f1caSKevin Wolf  *
2281dd62f1caSKevin Wolf  * bdrv_append() takes ownership of a bs_new reference and unrefs it because
2282dd62f1caSKevin Wolf  * that's what the callers commonly need. bs_new will be referenced by the old
2283dd62f1caSKevin Wolf  * parents of bs_top after bdrv_append() returns. If the caller needs to keep a
2284dd62f1caSKevin Wolf  * reference of its own, it must call bdrv_ref().
22858802d1fdSJeff Cody  */
22868802d1fdSJeff Cody void bdrv_append(BlockDriverState *bs_new, BlockDriverState *bs_top)
22878802d1fdSJeff Cody {
2288dd62f1caSKevin Wolf     assert(!bdrv_requests_pending(bs_top));
2289dd62f1caSKevin Wolf     assert(!bdrv_requests_pending(bs_new));
22908802d1fdSJeff Cody 
2291dd62f1caSKevin Wolf     bdrv_ref(bs_top);
2292dd62f1caSKevin Wolf     change_parent_backing_link(bs_top, bs_new);
2293dd62f1caSKevin Wolf 
2294dd62f1caSKevin Wolf     /* Some fields always stay on top of the backing file chain */
2295dd62f1caSKevin Wolf     swap_feature_fields(bs_top, bs_new);
2296dd62f1caSKevin Wolf 
2297dd62f1caSKevin Wolf     bdrv_set_backing_hd(bs_new, bs_top);
2298dd62f1caSKevin Wolf     bdrv_unref(bs_top);
2299dd62f1caSKevin Wolf 
2300dd62f1caSKevin Wolf     /* bs_new is now referenced by its new parents, we don't need the
2301dd62f1caSKevin Wolf      * additional reference any more. */
2302dd62f1caSKevin Wolf     bdrv_unref(bs_new);
23038802d1fdSJeff Cody }
23048802d1fdSJeff Cody 
23053f09bfbcSKevin Wolf void bdrv_replace_in_backing_chain(BlockDriverState *old, BlockDriverState *new)
23063f09bfbcSKevin Wolf {
23073f09bfbcSKevin Wolf     assert(!bdrv_requests_pending(old));
23083f09bfbcSKevin Wolf     assert(!bdrv_requests_pending(new));
23093f09bfbcSKevin Wolf 
23103f09bfbcSKevin Wolf     bdrv_ref(old);
23113f09bfbcSKevin Wolf 
23123f09bfbcSKevin Wolf     if (old->blk) {
23133f09bfbcSKevin Wolf         /* As long as these fields aren't in BlockBackend, but in the top-level
23143f09bfbcSKevin Wolf          * BlockDriverState, it's not possible for a BDS to have two BBs.
23153f09bfbcSKevin Wolf          *
23163f09bfbcSKevin Wolf          * We really want to copy the fields from old to new, but we go for a
23173f09bfbcSKevin Wolf          * swap instead so that pointers aren't duplicated and cause trouble.
23183f09bfbcSKevin Wolf          * (Also, bdrv_swap() used to do the same.) */
23193f09bfbcSKevin Wolf         assert(!new->blk);
23203f09bfbcSKevin Wolf         swap_feature_fields(old, new);
23213f09bfbcSKevin Wolf     }
23223f09bfbcSKevin Wolf     change_parent_backing_link(old, new);
23233f09bfbcSKevin Wolf 
23243f09bfbcSKevin Wolf     /* Change backing files if a previously independent node is added to the
23253f09bfbcSKevin Wolf      * chain. For active commit, we replace top by its own (indirect) backing
23263f09bfbcSKevin Wolf      * file and don't do anything here so we don't build a loop. */
23273f09bfbcSKevin Wolf     if (new->backing == NULL && !bdrv_chain_contains(backing_bs(old), new)) {
23283f09bfbcSKevin Wolf         bdrv_set_backing_hd(new, backing_bs(old));
23293f09bfbcSKevin Wolf         bdrv_set_backing_hd(old, NULL);
23303f09bfbcSKevin Wolf     }
23313f09bfbcSKevin Wolf 
23323f09bfbcSKevin Wolf     bdrv_unref(old);
23333f09bfbcSKevin Wolf }
23343f09bfbcSKevin Wolf 
23354f6fd349SFam Zheng static void bdrv_delete(BlockDriverState *bs)
2336b338082bSbellard {
23373e914655SPaolo Bonzini     assert(!bs->job);
23383718d8abSFam Zheng     assert(bdrv_op_blocker_is_empty(bs));
23394f6fd349SFam Zheng     assert(!bs->refcnt);
234018846deeSMarkus Armbruster 
2341e1b5c52eSStefan Hajnoczi     bdrv_close(bs);
2342e1b5c52eSStefan Hajnoczi 
23431b7bdbc1SStefan Hajnoczi     /* remove from list, if necessary */
234463eaaae0SKevin Wolf     if (bs->node_name[0] != '\0') {
234563eaaae0SKevin Wolf         QTAILQ_REMOVE(&graph_bdrv_states, bs, node_list);
234663eaaae0SKevin Wolf     }
23472c1d04e0SMax Reitz     QTAILQ_REMOVE(&all_bdrv_states, bs, bs_list);
23482c1d04e0SMax Reitz 
23497267c094SAnthony Liguori     g_free(bs);
2350fc01f7e7Sbellard }
2351fc01f7e7Sbellard 
2352e97fc193Saliguori /*
2353e97fc193Saliguori  * Run consistency checks on an image
2354e97fc193Saliguori  *
2355e076f338SKevin Wolf  * Returns 0 if the check could be completed (it doesn't mean that the image is
2356a1c7273bSStefan Weil  * free of errors) or -errno when an internal error occurred. The results of the
2357e076f338SKevin Wolf  * check are stored in res.
2358e97fc193Saliguori  */
23594534ff54SKevin Wolf int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res, BdrvCheckMode fix)
2360e97fc193Saliguori {
2361908bcd54SMax Reitz     if (bs->drv == NULL) {
2362908bcd54SMax Reitz         return -ENOMEDIUM;
2363908bcd54SMax Reitz     }
2364e97fc193Saliguori     if (bs->drv->bdrv_check == NULL) {
2365e97fc193Saliguori         return -ENOTSUP;
2366e97fc193Saliguori     }
2367e97fc193Saliguori 
2368e076f338SKevin Wolf     memset(res, 0, sizeof(*res));
23694534ff54SKevin Wolf     return bs->drv->bdrv_check(bs, res, fix);
2370e97fc193Saliguori }
2371e97fc193Saliguori 
/* Size, in sectors, of a commit buffer - presumably the copy buffer used by
 * bdrv_commit() below; TODO confirm against its body */
#define COMMIT_BUF_SECTORS 2048
23738a426614SKevin Wolf 
237433e3963eSbellard /* commit COW file into the raw image */
237533e3963eSbellard int bdrv_commit(BlockDriverState *bs)
237633e3963eSbellard {
237719cb3738Sbellard     BlockDriver *drv = bs->drv;
237872706ea4SJeff Cody     int64_t sector, total_sectors, length, backing_length;
23798a426614SKevin Wolf     int n, ro, open_flags;
23800bce597dSJeff Cody     int ret = 0;
238172706ea4SJeff Cody     uint8_t *buf = NULL;
238233e3963eSbellard 
238319cb3738Sbellard     if (!drv)
238419cb3738Sbellard         return -ENOMEDIUM;
238533e3963eSbellard 
2386760e0063SKevin Wolf     if (!bs->backing) {
23874dca4b63SNaphtali Sprei         return -ENOTSUP;
23884dca4b63SNaphtali Sprei     }
23894dca4b63SNaphtali Sprei 
2390bb00021dSFam Zheng     if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, NULL) ||
2391760e0063SKevin Wolf         bdrv_op_is_blocked(bs->backing->bs, BLOCK_OP_TYPE_COMMIT_TARGET, NULL)) {
23922d3735d3SStefan Hajnoczi         return -EBUSY;
23932d3735d3SStefan Hajnoczi     }
23942d3735d3SStefan Hajnoczi 
2395760e0063SKevin Wolf     ro = bs->backing->bs->read_only;
2396760e0063SKevin Wolf     open_flags =  bs->backing->bs->open_flags;
23974dca4b63SNaphtali Sprei 
23984dca4b63SNaphtali Sprei     if (ro) {
2399760e0063SKevin Wolf         if (bdrv_reopen(bs->backing->bs, open_flags | BDRV_O_RDWR, NULL)) {
24000bce597dSJeff Cody             return -EACCES;
24014dca4b63SNaphtali Sprei         }
2402ea2384d3Sbellard     }
2403ea2384d3Sbellard 
240472706ea4SJeff Cody     length = bdrv_getlength(bs);
240572706ea4SJeff Cody     if (length < 0) {
240672706ea4SJeff Cody         ret = length;
240772706ea4SJeff Cody         goto ro_cleanup;
240872706ea4SJeff Cody     }
240972706ea4SJeff Cody 
2410760e0063SKevin Wolf     backing_length = bdrv_getlength(bs->backing->bs);
241172706ea4SJeff Cody     if (backing_length < 0) {
241272706ea4SJeff Cody         ret = backing_length;
241372706ea4SJeff Cody         goto ro_cleanup;
241472706ea4SJeff Cody     }
241572706ea4SJeff Cody 
241672706ea4SJeff Cody     /* If our top snapshot is larger than the backing file image,
241772706ea4SJeff Cody      * grow the backing file image if possible.  If not possible,
241872706ea4SJeff Cody      * we must return an error */
241972706ea4SJeff Cody     if (length > backing_length) {
2420760e0063SKevin Wolf         ret = bdrv_truncate(bs->backing->bs, length);
242172706ea4SJeff Cody         if (ret < 0) {
242272706ea4SJeff Cody             goto ro_cleanup;
242372706ea4SJeff Cody         }
242472706ea4SJeff Cody     }
242572706ea4SJeff Cody 
242672706ea4SJeff Cody     total_sectors = length >> BDRV_SECTOR_BITS;
2427857d4f46SKevin Wolf 
2428857d4f46SKevin Wolf     /* qemu_try_blockalign() for bs will choose an alignment that works for
2429760e0063SKevin Wolf      * bs->backing->bs as well, so no need to compare the alignment manually. */
2430857d4f46SKevin Wolf     buf = qemu_try_blockalign(bs, COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE);
2431857d4f46SKevin Wolf     if (buf == NULL) {
2432857d4f46SKevin Wolf         ret = -ENOMEM;
2433857d4f46SKevin Wolf         goto ro_cleanup;
2434857d4f46SKevin Wolf     }
24358a426614SKevin Wolf 
24368a426614SKevin Wolf     for (sector = 0; sector < total_sectors; sector += n) {
2437d663640cSPaolo Bonzini         ret = bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n);
2438d663640cSPaolo Bonzini         if (ret < 0) {
2439d663640cSPaolo Bonzini             goto ro_cleanup;
2440d663640cSPaolo Bonzini         }
2441d663640cSPaolo Bonzini         if (ret) {
2442dabfa6ccSKevin Wolf             ret = bdrv_read(bs, sector, buf, n);
2443dabfa6ccSKevin Wolf             if (ret < 0) {
24444dca4b63SNaphtali Sprei                 goto ro_cleanup;
244533e3963eSbellard             }
244633e3963eSbellard 
2447760e0063SKevin Wolf             ret = bdrv_write(bs->backing->bs, sector, buf, n);
2448dabfa6ccSKevin Wolf             if (ret < 0) {
24494dca4b63SNaphtali Sprei                 goto ro_cleanup;
245033e3963eSbellard             }
245133e3963eSbellard         }
245233e3963eSbellard     }
245395389c86Sbellard 
24541d44952fSChristoph Hellwig     if (drv->bdrv_make_empty) {
24551d44952fSChristoph Hellwig         ret = drv->bdrv_make_empty(bs);
2456dabfa6ccSKevin Wolf         if (ret < 0) {
2457dabfa6ccSKevin Wolf             goto ro_cleanup;
2458dabfa6ccSKevin Wolf         }
24591d44952fSChristoph Hellwig         bdrv_flush(bs);
24601d44952fSChristoph Hellwig     }
246195389c86Sbellard 
24623f5075aeSChristoph Hellwig     /*
24633f5075aeSChristoph Hellwig      * Make sure all data we wrote to the backing device is actually
24643f5075aeSChristoph Hellwig      * stable on disk.
24653f5075aeSChristoph Hellwig      */
2466760e0063SKevin Wolf     if (bs->backing) {
2467760e0063SKevin Wolf         bdrv_flush(bs->backing->bs);
2468dabfa6ccSKevin Wolf     }
24694dca4b63SNaphtali Sprei 
2470dabfa6ccSKevin Wolf     ret = 0;
24714dca4b63SNaphtali Sprei ro_cleanup:
2472857d4f46SKevin Wolf     qemu_vfree(buf);
24734dca4b63SNaphtali Sprei 
24744dca4b63SNaphtali Sprei     if (ro) {
24750bce597dSJeff Cody         /* ignoring error return here */
2476760e0063SKevin Wolf         bdrv_reopen(bs->backing->bs, open_flags & ~BDRV_O_RDWR, NULL);
24774dca4b63SNaphtali Sprei     }
24784dca4b63SNaphtali Sprei 
24791d44952fSChristoph Hellwig     return ret;
248033e3963eSbellard }
248133e3963eSbellard 
2482756e6736SKevin Wolf /*
2483756e6736SKevin Wolf  * Return values:
2484756e6736SKevin Wolf  * 0        - success
2485756e6736SKevin Wolf  * -EINVAL  - backing format specified, but no file
2486756e6736SKevin Wolf  * -ENOSPC  - can't update the backing file because no space is left in the
2487756e6736SKevin Wolf  *            image file header
2488756e6736SKevin Wolf  * -ENOTSUP - format driver doesn't support changing the backing file
2489756e6736SKevin Wolf  */
2490756e6736SKevin Wolf int bdrv_change_backing_file(BlockDriverState *bs,
2491756e6736SKevin Wolf     const char *backing_file, const char *backing_fmt)
2492756e6736SKevin Wolf {
2493756e6736SKevin Wolf     BlockDriver *drv = bs->drv;
2494469ef350SPaolo Bonzini     int ret;
2495756e6736SKevin Wolf 
24965f377794SPaolo Bonzini     /* Backing file format doesn't make sense without a backing file */
24975f377794SPaolo Bonzini     if (backing_fmt && !backing_file) {
24985f377794SPaolo Bonzini         return -EINVAL;
24995f377794SPaolo Bonzini     }
25005f377794SPaolo Bonzini 
2501756e6736SKevin Wolf     if (drv->bdrv_change_backing_file != NULL) {
2502469ef350SPaolo Bonzini         ret = drv->bdrv_change_backing_file(bs, backing_file, backing_fmt);
2503756e6736SKevin Wolf     } else {
2504469ef350SPaolo Bonzini         ret = -ENOTSUP;
2505756e6736SKevin Wolf     }
2506469ef350SPaolo Bonzini 
2507469ef350SPaolo Bonzini     if (ret == 0) {
2508469ef350SPaolo Bonzini         pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_file ?: "");
2509469ef350SPaolo Bonzini         pstrcpy(bs->backing_format, sizeof(bs->backing_format), backing_fmt ?: "");
2510469ef350SPaolo Bonzini     }
2511469ef350SPaolo Bonzini     return ret;
2512756e6736SKevin Wolf }
2513756e6736SKevin Wolf 
25146ebdcee2SJeff Cody /*
25156ebdcee2SJeff Cody  * Finds the image layer in the chain that has 'bs' as its backing file.
25166ebdcee2SJeff Cody  *
25176ebdcee2SJeff Cody  * active is the current topmost image.
25186ebdcee2SJeff Cody  *
25196ebdcee2SJeff Cody  * Returns NULL if bs is not found in active's image chain,
25206ebdcee2SJeff Cody  * or if active == bs.
25214caf0fcdSJeff Cody  *
25224caf0fcdSJeff Cody  * Returns the bottommost base image if bs == NULL.
25236ebdcee2SJeff Cody  */
25246ebdcee2SJeff Cody BlockDriverState *bdrv_find_overlay(BlockDriverState *active,
25256ebdcee2SJeff Cody                                     BlockDriverState *bs)
25266ebdcee2SJeff Cody {
2527760e0063SKevin Wolf     while (active && bs != backing_bs(active)) {
2528760e0063SKevin Wolf         active = backing_bs(active);
25296ebdcee2SJeff Cody     }
25306ebdcee2SJeff Cody 
25314caf0fcdSJeff Cody     return active;
25326ebdcee2SJeff Cody }
25336ebdcee2SJeff Cody 
25344caf0fcdSJeff Cody /* Given a BDS, searches for the base layer. */
25354caf0fcdSJeff Cody BlockDriverState *bdrv_find_base(BlockDriverState *bs)
25364caf0fcdSJeff Cody {
25374caf0fcdSJeff Cody     return bdrv_find_overlay(bs, NULL);
25386ebdcee2SJeff Cody }
25396ebdcee2SJeff Cody 
25406ebdcee2SJeff Cody /*
25416ebdcee2SJeff Cody  * Drops images above 'base' up to and including 'top', and sets the image
25426ebdcee2SJeff Cody  * above 'top' to have base as its backing file.
25436ebdcee2SJeff Cody  *
25446ebdcee2SJeff Cody  * Requires that the overlay to 'top' is opened r/w, so that the backing file
25456ebdcee2SJeff Cody  * information in 'bs' can be properly updated.
25466ebdcee2SJeff Cody  *
25476ebdcee2SJeff Cody  * E.g., this will convert the following chain:
25486ebdcee2SJeff Cody  * bottom <- base <- intermediate <- top <- active
25496ebdcee2SJeff Cody  *
25506ebdcee2SJeff Cody  * to
25516ebdcee2SJeff Cody  *
25526ebdcee2SJeff Cody  * bottom <- base <- active
25536ebdcee2SJeff Cody  *
25546ebdcee2SJeff Cody  * It is allowed for bottom==base, in which case it converts:
25556ebdcee2SJeff Cody  *
25566ebdcee2SJeff Cody  * base <- intermediate <- top <- active
25576ebdcee2SJeff Cody  *
25586ebdcee2SJeff Cody  * to
25596ebdcee2SJeff Cody  *
25606ebdcee2SJeff Cody  * base <- active
25616ebdcee2SJeff Cody  *
256254e26900SJeff Cody  * If backing_file_str is non-NULL, it will be used when modifying top's
256354e26900SJeff Cody  * overlay image metadata.
256454e26900SJeff Cody  *
25656ebdcee2SJeff Cody  * Error conditions:
25666ebdcee2SJeff Cody  *  if active == top, that is considered an error
25676ebdcee2SJeff Cody  *
25686ebdcee2SJeff Cody  */
25696ebdcee2SJeff Cody int bdrv_drop_intermediate(BlockDriverState *active, BlockDriverState *top,
257054e26900SJeff Cody                            BlockDriverState *base, const char *backing_file_str)
25716ebdcee2SJeff Cody {
25726ebdcee2SJeff Cody     BlockDriverState *new_top_bs = NULL;
25736ebdcee2SJeff Cody     int ret = -EIO;
25746ebdcee2SJeff Cody 
25756ebdcee2SJeff Cody     if (!top->drv || !base->drv) {
25766ebdcee2SJeff Cody         goto exit;
25776ebdcee2SJeff Cody     }
25786ebdcee2SJeff Cody 
25796ebdcee2SJeff Cody     new_top_bs = bdrv_find_overlay(active, top);
25806ebdcee2SJeff Cody 
25816ebdcee2SJeff Cody     if (new_top_bs == NULL) {
25826ebdcee2SJeff Cody         /* we could not find the image above 'top', this is an error */
25836ebdcee2SJeff Cody         goto exit;
25846ebdcee2SJeff Cody     }
25856ebdcee2SJeff Cody 
2586760e0063SKevin Wolf     /* special case of new_top_bs->backing->bs already pointing to base - nothing
25876ebdcee2SJeff Cody      * to do, no intermediate images */
2588760e0063SKevin Wolf     if (backing_bs(new_top_bs) == base) {
25896ebdcee2SJeff Cody         ret = 0;
25906ebdcee2SJeff Cody         goto exit;
25916ebdcee2SJeff Cody     }
25926ebdcee2SJeff Cody 
25935db15a57SKevin Wolf     /* Make sure that base is in the backing chain of top */
25945db15a57SKevin Wolf     if (!bdrv_chain_contains(top, base)) {
25956ebdcee2SJeff Cody         goto exit;
25966ebdcee2SJeff Cody     }
25976ebdcee2SJeff Cody 
25986ebdcee2SJeff Cody     /* success - we can delete the intermediate states, and link top->base */
25995db15a57SKevin Wolf     backing_file_str = backing_file_str ? backing_file_str : base->filename;
260054e26900SJeff Cody     ret = bdrv_change_backing_file(new_top_bs, backing_file_str,
26015db15a57SKevin Wolf                                    base->drv ? base->drv->format_name : "");
26026ebdcee2SJeff Cody     if (ret) {
26036ebdcee2SJeff Cody         goto exit;
26046ebdcee2SJeff Cody     }
26055db15a57SKevin Wolf     bdrv_set_backing_hd(new_top_bs, base);
26066ebdcee2SJeff Cody 
26076ebdcee2SJeff Cody     ret = 0;
26086ebdcee2SJeff Cody exit:
26096ebdcee2SJeff Cody     return ret;
26106ebdcee2SJeff Cody }
26116ebdcee2SJeff Cody 
261283f64091Sbellard /**
261383f64091Sbellard  * Truncate file to 'offset' bytes (needed only for file protocols)
261483f64091Sbellard  */
261583f64091Sbellard int bdrv_truncate(BlockDriverState *bs, int64_t offset)
261683f64091Sbellard {
261783f64091Sbellard     BlockDriver *drv = bs->drv;
261851762288SStefan Hajnoczi     int ret;
261983f64091Sbellard     if (!drv)
262019cb3738Sbellard         return -ENOMEDIUM;
262183f64091Sbellard     if (!drv->bdrv_truncate)
262283f64091Sbellard         return -ENOTSUP;
262359f2689dSNaphtali Sprei     if (bs->read_only)
262459f2689dSNaphtali Sprei         return -EACCES;
26259c75e168SJeff Cody 
262651762288SStefan Hajnoczi     ret = drv->bdrv_truncate(bs, offset);
262751762288SStefan Hajnoczi     if (ret == 0) {
262851762288SStefan Hajnoczi         ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS);
2629ce1ffea8SJohn Snow         bdrv_dirty_bitmap_truncate(bs);
2630a7f53e26SMarkus Armbruster         if (bs->blk) {
2631a7f53e26SMarkus Armbruster             blk_dev_resize_cb(bs->blk);
2632a7f53e26SMarkus Armbruster         }
263351762288SStefan Hajnoczi     }
263451762288SStefan Hajnoczi     return ret;
263583f64091Sbellard }
263683f64091Sbellard 
263783f64091Sbellard /**
26384a1d5e1fSFam Zheng  * Length of a allocated file in bytes. Sparse files are counted by actual
26394a1d5e1fSFam Zheng  * allocated space. Return < 0 if error or unknown.
26404a1d5e1fSFam Zheng  */
26414a1d5e1fSFam Zheng int64_t bdrv_get_allocated_file_size(BlockDriverState *bs)
26424a1d5e1fSFam Zheng {
26434a1d5e1fSFam Zheng     BlockDriver *drv = bs->drv;
26444a1d5e1fSFam Zheng     if (!drv) {
26454a1d5e1fSFam Zheng         return -ENOMEDIUM;
26464a1d5e1fSFam Zheng     }
26474a1d5e1fSFam Zheng     if (drv->bdrv_get_allocated_file_size) {
26484a1d5e1fSFam Zheng         return drv->bdrv_get_allocated_file_size(bs);
26494a1d5e1fSFam Zheng     }
26504a1d5e1fSFam Zheng     if (bs->file) {
26519a4f4c31SKevin Wolf         return bdrv_get_allocated_file_size(bs->file->bs);
26524a1d5e1fSFam Zheng     }
26534a1d5e1fSFam Zheng     return -ENOTSUP;
26544a1d5e1fSFam Zheng }
26554a1d5e1fSFam Zheng 
26564a1d5e1fSFam Zheng /**
265765a9bb25SMarkus Armbruster  * Return number of sectors on success, -errno on error.
265883f64091Sbellard  */
265965a9bb25SMarkus Armbruster int64_t bdrv_nb_sectors(BlockDriverState *bs)
266083f64091Sbellard {
266183f64091Sbellard     BlockDriver *drv = bs->drv;
266265a9bb25SMarkus Armbruster 
266383f64091Sbellard     if (!drv)
266419cb3738Sbellard         return -ENOMEDIUM;
266551762288SStefan Hajnoczi 
2666b94a2610SKevin Wolf     if (drv->has_variable_length) {
2667b94a2610SKevin Wolf         int ret = refresh_total_sectors(bs, bs->total_sectors);
2668b94a2610SKevin Wolf         if (ret < 0) {
2669b94a2610SKevin Wolf             return ret;
2670fc01f7e7Sbellard         }
267146a4e4e6SStefan Hajnoczi     }
267265a9bb25SMarkus Armbruster     return bs->total_sectors;
267365a9bb25SMarkus Armbruster }
267465a9bb25SMarkus Armbruster 
267565a9bb25SMarkus Armbruster /**
267665a9bb25SMarkus Armbruster  * Return length in bytes on success, -errno on error.
267765a9bb25SMarkus Armbruster  * The length is always a multiple of BDRV_SECTOR_SIZE.
267865a9bb25SMarkus Armbruster  */
267965a9bb25SMarkus Armbruster int64_t bdrv_getlength(BlockDriverState *bs)
268065a9bb25SMarkus Armbruster {
268165a9bb25SMarkus Armbruster     int64_t ret = bdrv_nb_sectors(bs);
268265a9bb25SMarkus Armbruster 
26834a9c9ea0SFam Zheng     ret = ret > INT64_MAX / BDRV_SECTOR_SIZE ? -EFBIG : ret;
268465a9bb25SMarkus Armbruster     return ret < 0 ? ret : ret * BDRV_SECTOR_SIZE;
268546a4e4e6SStefan Hajnoczi }
2686fc01f7e7Sbellard 
268719cb3738Sbellard /* return 0 as number of sectors if no device present or error */
268896b8f136Sths void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
2689fc01f7e7Sbellard {
269065a9bb25SMarkus Armbruster     int64_t nb_sectors = bdrv_nb_sectors(bs);
269165a9bb25SMarkus Armbruster 
269265a9bb25SMarkus Armbruster     *nb_sectors_ptr = nb_sectors < 0 ? 0 : nb_sectors;
2693fc01f7e7Sbellard }
2694cf98951bSbellard 
2695b338082bSbellard int bdrv_is_read_only(BlockDriverState *bs)
2696b338082bSbellard {
2697b338082bSbellard     return bs->read_only;
2698b338082bSbellard }
2699b338082bSbellard 
2700985a03b0Sths int bdrv_is_sg(BlockDriverState *bs)
2701985a03b0Sths {
2702985a03b0Sths     return bs->sg;
2703985a03b0Sths }
2704985a03b0Sths 
2705ea2384d3Sbellard int bdrv_is_encrypted(BlockDriverState *bs)
2706ea2384d3Sbellard {
2707760e0063SKevin Wolf     if (bs->backing && bs->backing->bs->encrypted) {
2708ea2384d3Sbellard         return 1;
2709760e0063SKevin Wolf     }
2710ea2384d3Sbellard     return bs->encrypted;
2711ea2384d3Sbellard }
2712ea2384d3Sbellard 
2713c0f4ce77Saliguori int bdrv_key_required(BlockDriverState *bs)
2714c0f4ce77Saliguori {
2715760e0063SKevin Wolf     BdrvChild *backing = bs->backing;
2716c0f4ce77Saliguori 
2717760e0063SKevin Wolf     if (backing && backing->bs->encrypted && !backing->bs->valid_key) {
2718c0f4ce77Saliguori         return 1;
2719760e0063SKevin Wolf     }
2720c0f4ce77Saliguori     return (bs->encrypted && !bs->valid_key);
2721c0f4ce77Saliguori }
2722c0f4ce77Saliguori 
2723ea2384d3Sbellard int bdrv_set_key(BlockDriverState *bs, const char *key)
2724ea2384d3Sbellard {
2725ea2384d3Sbellard     int ret;
2726760e0063SKevin Wolf     if (bs->backing && bs->backing->bs->encrypted) {
2727760e0063SKevin Wolf         ret = bdrv_set_key(bs->backing->bs, key);
2728ea2384d3Sbellard         if (ret < 0)
2729ea2384d3Sbellard             return ret;
2730ea2384d3Sbellard         if (!bs->encrypted)
2731ea2384d3Sbellard             return 0;
2732ea2384d3Sbellard     }
2733fd04a2aeSShahar Havivi     if (!bs->encrypted) {
2734fd04a2aeSShahar Havivi         return -EINVAL;
2735fd04a2aeSShahar Havivi     } else if (!bs->drv || !bs->drv->bdrv_set_key) {
2736fd04a2aeSShahar Havivi         return -ENOMEDIUM;
2737fd04a2aeSShahar Havivi     }
2738c0f4ce77Saliguori     ret = bs->drv->bdrv_set_key(bs, key);
2739bb5fc20fSaliguori     if (ret < 0) {
2740bb5fc20fSaliguori         bs->valid_key = 0;
2741bb5fc20fSaliguori     } else if (!bs->valid_key) {
2742bb5fc20fSaliguori         bs->valid_key = 1;
2743a7f53e26SMarkus Armbruster         if (bs->blk) {
2744bb5fc20fSaliguori             /* call the change callback now, we skipped it on open */
2745a7f53e26SMarkus Armbruster             blk_dev_change_media_cb(bs->blk, true);
2746a7f53e26SMarkus Armbruster         }
2747bb5fc20fSaliguori     }
2748c0f4ce77Saliguori     return ret;
2749ea2384d3Sbellard }
2750ea2384d3Sbellard 
27514d2855a3SMarkus Armbruster /*
27524d2855a3SMarkus Armbruster  * Provide an encryption key for @bs.
27534d2855a3SMarkus Armbruster  * If @key is non-null:
27544d2855a3SMarkus Armbruster  *     If @bs is not encrypted, fail.
27554d2855a3SMarkus Armbruster  *     Else if the key is invalid, fail.
27564d2855a3SMarkus Armbruster  *     Else set @bs's key to @key, replacing the existing key, if any.
27574d2855a3SMarkus Armbruster  * If @key is null:
27584d2855a3SMarkus Armbruster  *     If @bs is encrypted and still lacks a key, fail.
27594d2855a3SMarkus Armbruster  *     Else do nothing.
27604d2855a3SMarkus Armbruster  * On failure, store an error object through @errp if non-null.
27614d2855a3SMarkus Armbruster  */
27624d2855a3SMarkus Armbruster void bdrv_add_key(BlockDriverState *bs, const char *key, Error **errp)
27634d2855a3SMarkus Armbruster {
27644d2855a3SMarkus Armbruster     if (key) {
27654d2855a3SMarkus Armbruster         if (!bdrv_is_encrypted(bs)) {
276681e5f78aSAlberto Garcia             error_setg(errp, "Node '%s' is not encrypted",
276781e5f78aSAlberto Garcia                       bdrv_get_device_or_node_name(bs));
27684d2855a3SMarkus Armbruster         } else if (bdrv_set_key(bs, key) < 0) {
2769c6bd8c70SMarkus Armbruster             error_setg(errp, QERR_INVALID_PASSWORD);
27704d2855a3SMarkus Armbruster         }
27714d2855a3SMarkus Armbruster     } else {
27724d2855a3SMarkus Armbruster         if (bdrv_key_required(bs)) {
2773b1ca6391SMarkus Armbruster             error_set(errp, ERROR_CLASS_DEVICE_ENCRYPTED,
2774b1ca6391SMarkus Armbruster                       "'%s' (%s) is encrypted",
277581e5f78aSAlberto Garcia                       bdrv_get_device_or_node_name(bs),
27764d2855a3SMarkus Armbruster                       bdrv_get_encrypted_filename(bs));
27774d2855a3SMarkus Armbruster         }
27784d2855a3SMarkus Armbruster     }
27794d2855a3SMarkus Armbruster }
27804d2855a3SMarkus Armbruster 
2781f8d6bba1SMarkus Armbruster const char *bdrv_get_format_name(BlockDriverState *bs)
2782ea2384d3Sbellard {
2783f8d6bba1SMarkus Armbruster     return bs->drv ? bs->drv->format_name : NULL;
2784ea2384d3Sbellard }
2785ea2384d3Sbellard 
/*
 * qsort() comparator for an array of C strings.
 *
 * qsort() hands the comparator pointers to the array elements, so @a and @b
 * each point to a 'const char *'.  They have to be dereferenced once before
 * the strings themselves can be compared.
 */
static int qsort_strcmp(const void *a, const void *b)
{
    const char *const *lhs = a;
    const char *const *rhs = b;

    return strcmp(*lhs, *rhs);
}
2790ada42401SStefan Hajnoczi 
2791ea2384d3Sbellard void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
2792ea2384d3Sbellard                          void *opaque)
2793ea2384d3Sbellard {
2794ea2384d3Sbellard     BlockDriver *drv;
2795e855e4fbSJeff Cody     int count = 0;
2796ada42401SStefan Hajnoczi     int i;
2797e855e4fbSJeff Cody     const char **formats = NULL;
2798ea2384d3Sbellard 
27998a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv, &bdrv_drivers, list) {
2800e855e4fbSJeff Cody         if (drv->format_name) {
2801e855e4fbSJeff Cody             bool found = false;
2802e855e4fbSJeff Cody             int i = count;
2803e855e4fbSJeff Cody             while (formats && i && !found) {
2804e855e4fbSJeff Cody                 found = !strcmp(formats[--i], drv->format_name);
2805e855e4fbSJeff Cody             }
2806e855e4fbSJeff Cody 
2807e855e4fbSJeff Cody             if (!found) {
28085839e53bSMarkus Armbruster                 formats = g_renew(const char *, formats, count + 1);
2809e855e4fbSJeff Cody                 formats[count++] = drv->format_name;
2810ea2384d3Sbellard             }
2811ea2384d3Sbellard         }
2812e855e4fbSJeff Cody     }
2813ada42401SStefan Hajnoczi 
2814ada42401SStefan Hajnoczi     qsort(formats, count, sizeof(formats[0]), qsort_strcmp);
2815ada42401SStefan Hajnoczi 
2816ada42401SStefan Hajnoczi     for (i = 0; i < count; i++) {
2817ada42401SStefan Hajnoczi         it(opaque, formats[i]);
2818ada42401SStefan Hajnoczi     }
2819ada42401SStefan Hajnoczi 
2820e855e4fbSJeff Cody     g_free(formats);
2821e855e4fbSJeff Cody }
2822ea2384d3Sbellard 
2823dc364f4cSBenoît Canet /* This function is to find a node in the bs graph */
2824dc364f4cSBenoît Canet BlockDriverState *bdrv_find_node(const char *node_name)
2825dc364f4cSBenoît Canet {
2826dc364f4cSBenoît Canet     BlockDriverState *bs;
2827dc364f4cSBenoît Canet 
2828dc364f4cSBenoît Canet     assert(node_name);
2829dc364f4cSBenoît Canet 
2830dc364f4cSBenoît Canet     QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2831dc364f4cSBenoît Canet         if (!strcmp(node_name, bs->node_name)) {
2832dc364f4cSBenoît Canet             return bs;
2833dc364f4cSBenoît Canet         }
2834dc364f4cSBenoît Canet     }
2835dc364f4cSBenoît Canet     return NULL;
2836dc364f4cSBenoît Canet }
2837dc364f4cSBenoît Canet 
2838c13163fbSBenoît Canet /* Put this QMP function here so it can access the static graph_bdrv_states. */
2839d5a8ee60SAlberto Garcia BlockDeviceInfoList *bdrv_named_nodes_list(Error **errp)
2840c13163fbSBenoît Canet {
2841c13163fbSBenoît Canet     BlockDeviceInfoList *list, *entry;
2842c13163fbSBenoît Canet     BlockDriverState *bs;
2843c13163fbSBenoît Canet 
2844c13163fbSBenoît Canet     list = NULL;
2845c13163fbSBenoît Canet     QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2846c83f9fbaSKevin Wolf         BlockDeviceInfo *info = bdrv_block_device_info(NULL, bs, errp);
2847d5a8ee60SAlberto Garcia         if (!info) {
2848d5a8ee60SAlberto Garcia             qapi_free_BlockDeviceInfoList(list);
2849d5a8ee60SAlberto Garcia             return NULL;
2850d5a8ee60SAlberto Garcia         }
2851c13163fbSBenoît Canet         entry = g_malloc0(sizeof(*entry));
2852d5a8ee60SAlberto Garcia         entry->value = info;
2853c13163fbSBenoît Canet         entry->next = list;
2854c13163fbSBenoît Canet         list = entry;
2855c13163fbSBenoît Canet     }
2856c13163fbSBenoît Canet 
2857c13163fbSBenoît Canet     return list;
2858c13163fbSBenoît Canet }
2859c13163fbSBenoît Canet 
286012d3ba82SBenoît Canet BlockDriverState *bdrv_lookup_bs(const char *device,
286112d3ba82SBenoît Canet                                  const char *node_name,
286212d3ba82SBenoît Canet                                  Error **errp)
286312d3ba82SBenoît Canet {
28647f06d47eSMarkus Armbruster     BlockBackend *blk;
28657f06d47eSMarkus Armbruster     BlockDriverState *bs;
286612d3ba82SBenoît Canet 
286712d3ba82SBenoît Canet     if (device) {
28687f06d47eSMarkus Armbruster         blk = blk_by_name(device);
286912d3ba82SBenoît Canet 
28707f06d47eSMarkus Armbruster         if (blk) {
28719f4ed6fbSAlberto Garcia             bs = blk_bs(blk);
28729f4ed6fbSAlberto Garcia             if (!bs) {
28735433c24fSMax Reitz                 error_setg(errp, "Device '%s' has no medium", device);
28745433c24fSMax Reitz             }
28755433c24fSMax Reitz 
28769f4ed6fbSAlberto Garcia             return bs;
287712d3ba82SBenoît Canet         }
2878dd67fa50SBenoît Canet     }
287912d3ba82SBenoît Canet 
2880dd67fa50SBenoît Canet     if (node_name) {
288112d3ba82SBenoît Canet         bs = bdrv_find_node(node_name);
288212d3ba82SBenoît Canet 
2883dd67fa50SBenoît Canet         if (bs) {
2884dd67fa50SBenoît Canet             return bs;
2885dd67fa50SBenoît Canet         }
288612d3ba82SBenoît Canet     }
288712d3ba82SBenoît Canet 
2888dd67fa50SBenoît Canet     error_setg(errp, "Cannot find device=%s nor node_name=%s",
2889dd67fa50SBenoît Canet                      device ? device : "",
2890dd67fa50SBenoît Canet                      node_name ? node_name : "");
2891dd67fa50SBenoît Canet     return NULL;
289212d3ba82SBenoît Canet }
289312d3ba82SBenoît Canet 
28945a6684d2SJeff Cody /* If 'base' is in the same chain as 'top', return true. Otherwise,
28955a6684d2SJeff Cody  * return false.  If either argument is NULL, return false. */
28965a6684d2SJeff Cody bool bdrv_chain_contains(BlockDriverState *top, BlockDriverState *base)
28975a6684d2SJeff Cody {
28985a6684d2SJeff Cody     while (top && top != base) {
2899760e0063SKevin Wolf         top = backing_bs(top);
29005a6684d2SJeff Cody     }
29015a6684d2SJeff Cody 
29025a6684d2SJeff Cody     return top != NULL;
29035a6684d2SJeff Cody }
29045a6684d2SJeff Cody 
290504df765aSFam Zheng BlockDriverState *bdrv_next_node(BlockDriverState *bs)
290604df765aSFam Zheng {
290704df765aSFam Zheng     if (!bs) {
290804df765aSFam Zheng         return QTAILQ_FIRST(&graph_bdrv_states);
290904df765aSFam Zheng     }
291004df765aSFam Zheng     return QTAILQ_NEXT(bs, node_list);
291104df765aSFam Zheng }
291204df765aSFam Zheng 
291326260580SMax Reitz /* Iterates over all top-level BlockDriverStates, i.e. BDSs that are owned by
291426260580SMax Reitz  * the monitor or attached to a BlockBackend */
29152f399b0aSMarkus Armbruster BlockDriverState *bdrv_next(BlockDriverState *bs)
29162f399b0aSMarkus Armbruster {
291726260580SMax Reitz     if (!bs || bs->blk) {
291826260580SMax Reitz         bs = blk_next_root_bs(bs);
291926260580SMax Reitz         if (bs) {
292026260580SMax Reitz             return bs;
29212f399b0aSMarkus Armbruster         }
292226260580SMax Reitz     }
292326260580SMax Reitz 
292426260580SMax Reitz     /* Ignore all BDSs that are attached to a BlockBackend here; they have been
292526260580SMax Reitz      * handled by the above block already */
292626260580SMax Reitz     do {
292726260580SMax Reitz         bs = bdrv_next_monitor_owned(bs);
292826260580SMax Reitz     } while (bs && bs->blk);
292926260580SMax Reitz     return bs;
29302f399b0aSMarkus Armbruster }
29312f399b0aSMarkus Armbruster 
293220a9e77dSFam Zheng const char *bdrv_get_node_name(const BlockDriverState *bs)
293320a9e77dSFam Zheng {
293420a9e77dSFam Zheng     return bs->node_name;
293520a9e77dSFam Zheng }
293620a9e77dSFam Zheng 
29377f06d47eSMarkus Armbruster /* TODO check what callers really want: bs->node_name or blk_name() */
2938bfb197e0SMarkus Armbruster const char *bdrv_get_device_name(const BlockDriverState *bs)
2939ea2384d3Sbellard {
2940bfb197e0SMarkus Armbruster     return bs->blk ? blk_name(bs->blk) : "";
2941ea2384d3Sbellard }
2942ea2384d3Sbellard 
29439b2aa84fSAlberto Garcia /* This can be used to identify nodes that might not have a device
29449b2aa84fSAlberto Garcia  * name associated. Since node and device names live in the same
29459b2aa84fSAlberto Garcia  * namespace, the result is unambiguous. The exception is if both are
29469b2aa84fSAlberto Garcia  * absent, then this returns an empty (non-null) string. */
29479b2aa84fSAlberto Garcia const char *bdrv_get_device_or_node_name(const BlockDriverState *bs)
29489b2aa84fSAlberto Garcia {
29499b2aa84fSAlberto Garcia     return bs->blk ? blk_name(bs->blk) : bs->node_name;
29509b2aa84fSAlberto Garcia }
29519b2aa84fSAlberto Garcia 
2952c8433287SMarkus Armbruster int bdrv_get_flags(BlockDriverState *bs)
2953c8433287SMarkus Armbruster {
2954c8433287SMarkus Armbruster     return bs->open_flags;
2955c8433287SMarkus Armbruster }
2956c8433287SMarkus Armbruster 
29573ac21627SPeter Lieven int bdrv_has_zero_init_1(BlockDriverState *bs)
29583ac21627SPeter Lieven {
29593ac21627SPeter Lieven     return 1;
29603ac21627SPeter Lieven }
29613ac21627SPeter Lieven 
2962f2feebbdSKevin Wolf int bdrv_has_zero_init(BlockDriverState *bs)
2963f2feebbdSKevin Wolf {
2964f2feebbdSKevin Wolf     assert(bs->drv);
2965f2feebbdSKevin Wolf 
296611212d8fSPaolo Bonzini     /* If BS is a copy on write image, it is initialized to
296711212d8fSPaolo Bonzini        the contents of the base image, which may not be zeroes.  */
2968760e0063SKevin Wolf     if (bs->backing) {
296911212d8fSPaolo Bonzini         return 0;
297011212d8fSPaolo Bonzini     }
2971336c1c12SKevin Wolf     if (bs->drv->bdrv_has_zero_init) {
2972336c1c12SKevin Wolf         return bs->drv->bdrv_has_zero_init(bs);
2973f2feebbdSKevin Wolf     }
2974f2feebbdSKevin Wolf 
29753ac21627SPeter Lieven     /* safe default */
29763ac21627SPeter Lieven     return 0;
2977f2feebbdSKevin Wolf }
2978f2feebbdSKevin Wolf 
29794ce78691SPeter Lieven bool bdrv_unallocated_blocks_are_zero(BlockDriverState *bs)
29804ce78691SPeter Lieven {
29814ce78691SPeter Lieven     BlockDriverInfo bdi;
29824ce78691SPeter Lieven 
2983760e0063SKevin Wolf     if (bs->backing) {
29844ce78691SPeter Lieven         return false;
29854ce78691SPeter Lieven     }
29864ce78691SPeter Lieven 
29874ce78691SPeter Lieven     if (bdrv_get_info(bs, &bdi) == 0) {
29884ce78691SPeter Lieven         return bdi.unallocated_blocks_are_zero;
29894ce78691SPeter Lieven     }
29904ce78691SPeter Lieven 
29914ce78691SPeter Lieven     return false;
29924ce78691SPeter Lieven }
29934ce78691SPeter Lieven 
29944ce78691SPeter Lieven bool bdrv_can_write_zeroes_with_unmap(BlockDriverState *bs)
29954ce78691SPeter Lieven {
29964ce78691SPeter Lieven     BlockDriverInfo bdi;
29974ce78691SPeter Lieven 
2998760e0063SKevin Wolf     if (bs->backing || !(bs->open_flags & BDRV_O_UNMAP)) {
29994ce78691SPeter Lieven         return false;
30004ce78691SPeter Lieven     }
30014ce78691SPeter Lieven 
30024ce78691SPeter Lieven     if (bdrv_get_info(bs, &bdi) == 0) {
30034ce78691SPeter Lieven         return bdi.can_write_zeroes_with_unmap;
30044ce78691SPeter Lieven     }
30054ce78691SPeter Lieven 
30064ce78691SPeter Lieven     return false;
30074ce78691SPeter Lieven }
30084ce78691SPeter Lieven 
3009045df330Saliguori const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
3010045df330Saliguori {
3011760e0063SKevin Wolf     if (bs->backing && bs->backing->bs->encrypted)
3012045df330Saliguori         return bs->backing_file;
3013045df330Saliguori     else if (bs->encrypted)
3014045df330Saliguori         return bs->filename;
3015045df330Saliguori     else
3016045df330Saliguori         return NULL;
3017045df330Saliguori }
3018045df330Saliguori 
301983f64091Sbellard void bdrv_get_backing_filename(BlockDriverState *bs,
302083f64091Sbellard                                char *filename, int filename_size)
302183f64091Sbellard {
302283f64091Sbellard     pstrcpy(filename, filename_size, bs->backing_file);
302383f64091Sbellard }
302483f64091Sbellard 
3025faea38e7Sbellard int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
3026faea38e7Sbellard {
3027faea38e7Sbellard     BlockDriver *drv = bs->drv;
3028faea38e7Sbellard     if (!drv)
302919cb3738Sbellard         return -ENOMEDIUM;
3030faea38e7Sbellard     if (!drv->bdrv_get_info)
3031faea38e7Sbellard         return -ENOTSUP;
3032faea38e7Sbellard     memset(bdi, 0, sizeof(*bdi));
3033faea38e7Sbellard     return drv->bdrv_get_info(bs, bdi);
3034faea38e7Sbellard }
3035faea38e7Sbellard 
3036eae041feSMax Reitz ImageInfoSpecific *bdrv_get_specific_info(BlockDriverState *bs)
3037eae041feSMax Reitz {
3038eae041feSMax Reitz     BlockDriver *drv = bs->drv;
3039eae041feSMax Reitz     if (drv && drv->bdrv_get_specific_info) {
3040eae041feSMax Reitz         return drv->bdrv_get_specific_info(bs);
3041eae041feSMax Reitz     }
3042eae041feSMax Reitz     return NULL;
3043eae041feSMax Reitz }
3044eae041feSMax Reitz 
3045a31939e6SEric Blake void bdrv_debug_event(BlockDriverState *bs, BlkdebugEvent event)
30468b9b0cc2SKevin Wolf {
3047bf736fe3SKevin Wolf     if (!bs || !bs->drv || !bs->drv->bdrv_debug_event) {
30488b9b0cc2SKevin Wolf         return;
30498b9b0cc2SKevin Wolf     }
30508b9b0cc2SKevin Wolf 
3051bf736fe3SKevin Wolf     bs->drv->bdrv_debug_event(bs, event);
305241c695c7SKevin Wolf }
30538b9b0cc2SKevin Wolf 
305441c695c7SKevin Wolf int bdrv_debug_breakpoint(BlockDriverState *bs, const char *event,
305541c695c7SKevin Wolf                           const char *tag)
305641c695c7SKevin Wolf {
305741c695c7SKevin Wolf     while (bs && bs->drv && !bs->drv->bdrv_debug_breakpoint) {
30589a4f4c31SKevin Wolf         bs = bs->file ? bs->file->bs : NULL;
305941c695c7SKevin Wolf     }
306041c695c7SKevin Wolf 
306141c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_breakpoint) {
306241c695c7SKevin Wolf         return bs->drv->bdrv_debug_breakpoint(bs, event, tag);
306341c695c7SKevin Wolf     }
306441c695c7SKevin Wolf 
306541c695c7SKevin Wolf     return -ENOTSUP;
306641c695c7SKevin Wolf }
306741c695c7SKevin Wolf 
30684cc70e93SFam Zheng int bdrv_debug_remove_breakpoint(BlockDriverState *bs, const char *tag)
30694cc70e93SFam Zheng {
30704cc70e93SFam Zheng     while (bs && bs->drv && !bs->drv->bdrv_debug_remove_breakpoint) {
30719a4f4c31SKevin Wolf         bs = bs->file ? bs->file->bs : NULL;
30724cc70e93SFam Zheng     }
30734cc70e93SFam Zheng 
30744cc70e93SFam Zheng     if (bs && bs->drv && bs->drv->bdrv_debug_remove_breakpoint) {
30754cc70e93SFam Zheng         return bs->drv->bdrv_debug_remove_breakpoint(bs, tag);
30764cc70e93SFam Zheng     }
30774cc70e93SFam Zheng 
30784cc70e93SFam Zheng     return -ENOTSUP;
30794cc70e93SFam Zheng }
30804cc70e93SFam Zheng 
308141c695c7SKevin Wolf int bdrv_debug_resume(BlockDriverState *bs, const char *tag)
308241c695c7SKevin Wolf {
3083938789eaSMax Reitz     while (bs && (!bs->drv || !bs->drv->bdrv_debug_resume)) {
30849a4f4c31SKevin Wolf         bs = bs->file ? bs->file->bs : NULL;
308541c695c7SKevin Wolf     }
308641c695c7SKevin Wolf 
308741c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_resume) {
308841c695c7SKevin Wolf         return bs->drv->bdrv_debug_resume(bs, tag);
308941c695c7SKevin Wolf     }
309041c695c7SKevin Wolf 
309141c695c7SKevin Wolf     return -ENOTSUP;
309241c695c7SKevin Wolf }
309341c695c7SKevin Wolf 
309441c695c7SKevin Wolf bool bdrv_debug_is_suspended(BlockDriverState *bs, const char *tag)
309541c695c7SKevin Wolf {
309641c695c7SKevin Wolf     while (bs && bs->drv && !bs->drv->bdrv_debug_is_suspended) {
30979a4f4c31SKevin Wolf         bs = bs->file ? bs->file->bs : NULL;
309841c695c7SKevin Wolf     }
309941c695c7SKevin Wolf 
310041c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_is_suspended) {
310141c695c7SKevin Wolf         return bs->drv->bdrv_debug_is_suspended(bs, tag);
310241c695c7SKevin Wolf     }
310341c695c7SKevin Wolf 
310441c695c7SKevin Wolf     return false;
31058b9b0cc2SKevin Wolf }
31068b9b0cc2SKevin Wolf 
3107199630b6SBlue Swirl int bdrv_is_snapshot(BlockDriverState *bs)
3108199630b6SBlue Swirl {
3109199630b6SBlue Swirl     return !!(bs->open_flags & BDRV_O_SNAPSHOT);
3110199630b6SBlue Swirl }
3111199630b6SBlue Swirl 
3112b1b1d783SJeff Cody /* backing_file can either be relative, or absolute, or a protocol.  If it is
3113b1b1d783SJeff Cody  * relative, it must be relative to the chain.  So, passing in bs->filename
3114b1b1d783SJeff Cody  * from a BDS as backing_file should not be done, as that may be relative to
3115b1b1d783SJeff Cody  * the CWD rather than the chain. */
3116e8a6bb9cSMarcelo Tosatti BlockDriverState *bdrv_find_backing_image(BlockDriverState *bs,
3117e8a6bb9cSMarcelo Tosatti         const char *backing_file)
3118e8a6bb9cSMarcelo Tosatti {
3119b1b1d783SJeff Cody     char *filename_full = NULL;
3120b1b1d783SJeff Cody     char *backing_file_full = NULL;
3121b1b1d783SJeff Cody     char *filename_tmp = NULL;
3122b1b1d783SJeff Cody     int is_protocol = 0;
3123b1b1d783SJeff Cody     BlockDriverState *curr_bs = NULL;
3124b1b1d783SJeff Cody     BlockDriverState *retval = NULL;
3125b1b1d783SJeff Cody 
3126b1b1d783SJeff Cody     if (!bs || !bs->drv || !backing_file) {
3127e8a6bb9cSMarcelo Tosatti         return NULL;
3128e8a6bb9cSMarcelo Tosatti     }
3129e8a6bb9cSMarcelo Tosatti 
3130b1b1d783SJeff Cody     filename_full     = g_malloc(PATH_MAX);
3131b1b1d783SJeff Cody     backing_file_full = g_malloc(PATH_MAX);
3132b1b1d783SJeff Cody     filename_tmp      = g_malloc(PATH_MAX);
3133b1b1d783SJeff Cody 
3134b1b1d783SJeff Cody     is_protocol = path_has_protocol(backing_file);
3135b1b1d783SJeff Cody 
3136760e0063SKevin Wolf     for (curr_bs = bs; curr_bs->backing; curr_bs = curr_bs->backing->bs) {
3137b1b1d783SJeff Cody 
3138b1b1d783SJeff Cody         /* If either of the filename paths is actually a protocol, then
3139b1b1d783SJeff Cody          * compare unmodified paths; otherwise make paths relative */
3140b1b1d783SJeff Cody         if (is_protocol || path_has_protocol(curr_bs->backing_file)) {
3141b1b1d783SJeff Cody             if (strcmp(backing_file, curr_bs->backing_file) == 0) {
3142760e0063SKevin Wolf                 retval = curr_bs->backing->bs;
3143b1b1d783SJeff Cody                 break;
3144b1b1d783SJeff Cody             }
3145e8a6bb9cSMarcelo Tosatti         } else {
3146b1b1d783SJeff Cody             /* If not an absolute filename path, make it relative to the current
3147b1b1d783SJeff Cody              * image's filename path */
3148b1b1d783SJeff Cody             path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3149b1b1d783SJeff Cody                          backing_file);
3150b1b1d783SJeff Cody 
3151b1b1d783SJeff Cody             /* We are going to compare absolute pathnames */
3152b1b1d783SJeff Cody             if (!realpath(filename_tmp, filename_full)) {
3153b1b1d783SJeff Cody                 continue;
3154b1b1d783SJeff Cody             }
3155b1b1d783SJeff Cody 
3156b1b1d783SJeff Cody             /* We need to make sure the backing filename we are comparing against
3157b1b1d783SJeff Cody              * is relative to the current image filename (or absolute) */
3158b1b1d783SJeff Cody             path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3159b1b1d783SJeff Cody                          curr_bs->backing_file);
3160b1b1d783SJeff Cody 
3161b1b1d783SJeff Cody             if (!realpath(filename_tmp, backing_file_full)) {
3162b1b1d783SJeff Cody                 continue;
3163b1b1d783SJeff Cody             }
3164b1b1d783SJeff Cody 
3165b1b1d783SJeff Cody             if (strcmp(backing_file_full, filename_full) == 0) {
3166760e0063SKevin Wolf                 retval = curr_bs->backing->bs;
3167b1b1d783SJeff Cody                 break;
3168b1b1d783SJeff Cody             }
3169e8a6bb9cSMarcelo Tosatti         }
3170e8a6bb9cSMarcelo Tosatti     }
3171e8a6bb9cSMarcelo Tosatti 
3172b1b1d783SJeff Cody     g_free(filename_full);
3173b1b1d783SJeff Cody     g_free(backing_file_full);
3174b1b1d783SJeff Cody     g_free(filename_tmp);
3175b1b1d783SJeff Cody     return retval;
3176e8a6bb9cSMarcelo Tosatti }
3177e8a6bb9cSMarcelo Tosatti 
3178f198fd1cSBenoît Canet int bdrv_get_backing_file_depth(BlockDriverState *bs)
3179f198fd1cSBenoît Canet {
3180f198fd1cSBenoît Canet     if (!bs->drv) {
3181f198fd1cSBenoît Canet         return 0;
3182f198fd1cSBenoît Canet     }
3183f198fd1cSBenoît Canet 
3184760e0063SKevin Wolf     if (!bs->backing) {
3185f198fd1cSBenoît Canet         return 0;
3186f198fd1cSBenoît Canet     }
3187f198fd1cSBenoît Canet 
3188760e0063SKevin Wolf     return 1 + bdrv_get_backing_file_depth(bs->backing->bs);
3189f198fd1cSBenoît Canet }
3190f198fd1cSBenoît Canet 
3191ea2384d3Sbellard void bdrv_init(void)
3192ea2384d3Sbellard {
31935efa9d5aSAnthony Liguori     module_call_init(MODULE_INIT_BLOCK);
3194ea2384d3Sbellard }
3195ce1a14dcSpbrook 
3196eb852011SMarkus Armbruster void bdrv_init_with_whitelist(void)
3197eb852011SMarkus Armbruster {
3198eb852011SMarkus Armbruster     use_bdrv_whitelist = 1;
3199eb852011SMarkus Armbruster     bdrv_init();
3200eb852011SMarkus Armbruster }
3201eb852011SMarkus Armbruster 
32025a8a30dbSKevin Wolf void bdrv_invalidate_cache(BlockDriverState *bs, Error **errp)
32030f15423cSAnthony Liguori {
32045a8a30dbSKevin Wolf     Error *local_err = NULL;
32055a8a30dbSKevin Wolf     int ret;
32065a8a30dbSKevin Wolf 
32073456a8d1SKevin Wolf     if (!bs->drv)  {
32083456a8d1SKevin Wolf         return;
32090f15423cSAnthony Liguori     }
32103456a8d1SKevin Wolf 
321104c01a5cSKevin Wolf     if (!(bs->open_flags & BDRV_O_INACTIVE)) {
32127ea2d269SAlexey Kardashevskiy         return;
32137ea2d269SAlexey Kardashevskiy     }
321404c01a5cSKevin Wolf     bs->open_flags &= ~BDRV_O_INACTIVE;
32157ea2d269SAlexey Kardashevskiy 
32163456a8d1SKevin Wolf     if (bs->drv->bdrv_invalidate_cache) {
32175a8a30dbSKevin Wolf         bs->drv->bdrv_invalidate_cache(bs, &local_err);
32183456a8d1SKevin Wolf     } else if (bs->file) {
32199a4f4c31SKevin Wolf         bdrv_invalidate_cache(bs->file->bs, &local_err);
32205a8a30dbSKevin Wolf     }
32215a8a30dbSKevin Wolf     if (local_err) {
322204c01a5cSKevin Wolf         bs->open_flags |= BDRV_O_INACTIVE;
32235a8a30dbSKevin Wolf         error_propagate(errp, local_err);
32245a8a30dbSKevin Wolf         return;
32253456a8d1SKevin Wolf     }
32263456a8d1SKevin Wolf 
32275a8a30dbSKevin Wolf     ret = refresh_total_sectors(bs, bs->total_sectors);
32285a8a30dbSKevin Wolf     if (ret < 0) {
322904c01a5cSKevin Wolf         bs->open_flags |= BDRV_O_INACTIVE;
32305a8a30dbSKevin Wolf         error_setg_errno(errp, -ret, "Could not refresh total sector count");
32315a8a30dbSKevin Wolf         return;
32325a8a30dbSKevin Wolf     }
32330f15423cSAnthony Liguori }
32340f15423cSAnthony Liguori 
32355a8a30dbSKevin Wolf void bdrv_invalidate_cache_all(Error **errp)
32360f15423cSAnthony Liguori {
323779720af6SMax Reitz     BlockDriverState *bs = NULL;
32385a8a30dbSKevin Wolf     Error *local_err = NULL;
32390f15423cSAnthony Liguori 
324079720af6SMax Reitz     while ((bs = bdrv_next(bs)) != NULL) {
3241ed78cda3SStefan Hajnoczi         AioContext *aio_context = bdrv_get_aio_context(bs);
3242ed78cda3SStefan Hajnoczi 
3243ed78cda3SStefan Hajnoczi         aio_context_acquire(aio_context);
32445a8a30dbSKevin Wolf         bdrv_invalidate_cache(bs, &local_err);
3245ed78cda3SStefan Hajnoczi         aio_context_release(aio_context);
32465a8a30dbSKevin Wolf         if (local_err) {
32475a8a30dbSKevin Wolf             error_propagate(errp, local_err);
32485a8a30dbSKevin Wolf             return;
32495a8a30dbSKevin Wolf         }
32500f15423cSAnthony Liguori     }
32510f15423cSAnthony Liguori }
32520f15423cSAnthony Liguori 
325376b1c7feSKevin Wolf static int bdrv_inactivate(BlockDriverState *bs)
325476b1c7feSKevin Wolf {
325576b1c7feSKevin Wolf     int ret;
325676b1c7feSKevin Wolf 
325776b1c7feSKevin Wolf     if (bs->drv->bdrv_inactivate) {
325876b1c7feSKevin Wolf         ret = bs->drv->bdrv_inactivate(bs);
325976b1c7feSKevin Wolf         if (ret < 0) {
326076b1c7feSKevin Wolf             return ret;
326176b1c7feSKevin Wolf         }
326276b1c7feSKevin Wolf     }
326376b1c7feSKevin Wolf 
326476b1c7feSKevin Wolf     bs->open_flags |= BDRV_O_INACTIVE;
326576b1c7feSKevin Wolf     return 0;
326676b1c7feSKevin Wolf }
326776b1c7feSKevin Wolf 
326876b1c7feSKevin Wolf int bdrv_inactivate_all(void)
326976b1c7feSKevin Wolf {
327079720af6SMax Reitz     BlockDriverState *bs = NULL;
327176b1c7feSKevin Wolf     int ret;
327276b1c7feSKevin Wolf 
327379720af6SMax Reitz     while ((bs = bdrv_next(bs)) != NULL) {
327476b1c7feSKevin Wolf         AioContext *aio_context = bdrv_get_aio_context(bs);
327576b1c7feSKevin Wolf 
327676b1c7feSKevin Wolf         aio_context_acquire(aio_context);
327776b1c7feSKevin Wolf         ret = bdrv_inactivate(bs);
327876b1c7feSKevin Wolf         aio_context_release(aio_context);
327976b1c7feSKevin Wolf         if (ret < 0) {
328076b1c7feSKevin Wolf             return ret;
328176b1c7feSKevin Wolf         }
328276b1c7feSKevin Wolf     }
328376b1c7feSKevin Wolf 
328476b1c7feSKevin Wolf     return 0;
328576b1c7feSKevin Wolf }
328676b1c7feSKevin Wolf 
3287f9f05dc5SKevin Wolf /**************************************************************/
328819cb3738Sbellard /* removable device support */
328919cb3738Sbellard 
329019cb3738Sbellard /**
329119cb3738Sbellard  * Return TRUE if the media is present
329219cb3738Sbellard  */
3293e031f750SMax Reitz bool bdrv_is_inserted(BlockDriverState *bs)
329419cb3738Sbellard {
329519cb3738Sbellard     BlockDriver *drv = bs->drv;
329628d7a789SMax Reitz     BdrvChild *child;
3297a1aff5bfSMarkus Armbruster 
3298e031f750SMax Reitz     if (!drv) {
3299e031f750SMax Reitz         return false;
3300e031f750SMax Reitz     }
330128d7a789SMax Reitz     if (drv->bdrv_is_inserted) {
3302a1aff5bfSMarkus Armbruster         return drv->bdrv_is_inserted(bs);
330319cb3738Sbellard     }
330428d7a789SMax Reitz     QLIST_FOREACH(child, &bs->children, next) {
330528d7a789SMax Reitz         if (!bdrv_is_inserted(child->bs)) {
330628d7a789SMax Reitz             return false;
330728d7a789SMax Reitz         }
330828d7a789SMax Reitz     }
330928d7a789SMax Reitz     return true;
331028d7a789SMax Reitz }
331119cb3738Sbellard 
331219cb3738Sbellard /**
33138e49ca46SMarkus Armbruster  * Return whether the media changed since the last call to this
33148e49ca46SMarkus Armbruster  * function, or -ENOTSUP if we don't know.  Most drivers don't know.
331519cb3738Sbellard  */
331619cb3738Sbellard int bdrv_media_changed(BlockDriverState *bs)
331719cb3738Sbellard {
331819cb3738Sbellard     BlockDriver *drv = bs->drv;
331919cb3738Sbellard 
33208e49ca46SMarkus Armbruster     if (drv && drv->bdrv_media_changed) {
33218e49ca46SMarkus Armbruster         return drv->bdrv_media_changed(bs);
33228e49ca46SMarkus Armbruster     }
33238e49ca46SMarkus Armbruster     return -ENOTSUP;
332419cb3738Sbellard }
332519cb3738Sbellard 
332619cb3738Sbellard /**
332719cb3738Sbellard  * If eject_flag is TRUE, eject the media. Otherwise, close the tray
332819cb3738Sbellard  */
3329f36f3949SLuiz Capitulino void bdrv_eject(BlockDriverState *bs, bool eject_flag)
333019cb3738Sbellard {
333119cb3738Sbellard     BlockDriver *drv = bs->drv;
3332bfb197e0SMarkus Armbruster     const char *device_name;
333319cb3738Sbellard 
3334822e1cd1SMarkus Armbruster     if (drv && drv->bdrv_eject) {
3335822e1cd1SMarkus Armbruster         drv->bdrv_eject(bs, eject_flag);
333619cb3738Sbellard     }
33376f382ed2SLuiz Capitulino 
3338bfb197e0SMarkus Armbruster     device_name = bdrv_get_device_name(bs);
3339bfb197e0SMarkus Armbruster     if (device_name[0] != '\0') {
3340bfb197e0SMarkus Armbruster         qapi_event_send_device_tray_moved(device_name,
3341a5ee7bd4SWenchao Xia                                           eject_flag, &error_abort);
33426f382ed2SLuiz Capitulino     }
334319cb3738Sbellard }
334419cb3738Sbellard 
334519cb3738Sbellard /**
334619cb3738Sbellard  * Lock or unlock the media (if it is locked, the user won't be able
334719cb3738Sbellard  * to eject it manually).
334819cb3738Sbellard  */
3349025e849aSMarkus Armbruster void bdrv_lock_medium(BlockDriverState *bs, bool locked)
335019cb3738Sbellard {
335119cb3738Sbellard     BlockDriver *drv = bs->drv;
335219cb3738Sbellard 
3353025e849aSMarkus Armbruster     trace_bdrv_lock_medium(bs, locked);
3354b8c6d095SStefan Hajnoczi 
3355025e849aSMarkus Armbruster     if (drv && drv->bdrv_lock_medium) {
3356025e849aSMarkus Armbruster         drv->bdrv_lock_medium(bs, locked);
335719cb3738Sbellard     }
335819cb3738Sbellard }
3359985a03b0Sths 
33609fcb0251SFam Zheng /* Get a reference to bs */
33619fcb0251SFam Zheng void bdrv_ref(BlockDriverState *bs)
33629fcb0251SFam Zheng {
33639fcb0251SFam Zheng     bs->refcnt++;
33649fcb0251SFam Zheng }
33659fcb0251SFam Zheng 
33669fcb0251SFam Zheng /* Release a previously grabbed reference to bs.
33679fcb0251SFam Zheng  * If after releasing, reference count is zero, the BlockDriverState is
33689fcb0251SFam Zheng  * deleted. */
33699fcb0251SFam Zheng void bdrv_unref(BlockDriverState *bs)
33709fcb0251SFam Zheng {
33719a4d5ca6SJeff Cody     if (!bs) {
33729a4d5ca6SJeff Cody         return;
33739a4d5ca6SJeff Cody     }
33749fcb0251SFam Zheng     assert(bs->refcnt > 0);
33759fcb0251SFam Zheng     if (--bs->refcnt == 0) {
33769fcb0251SFam Zheng         bdrv_delete(bs);
33779fcb0251SFam Zheng     }
33789fcb0251SFam Zheng }
33799fcb0251SFam Zheng 
/* One entry in a node's per-operation list of blockers (bs->op_blockers[]). */
struct BdrvOpBlocker {
    /*
     * Error describing why the operation is blocked.  The pointer is stored
     * as passed to bdrv_op_block() and doubles as the identity that
     * bdrv_op_unblock() matches against.
     */
    Error *reason;
    /* Linkage within the op_blockers list for one operation type */
    QLIST_ENTRY(BdrvOpBlocker) list;
};
3384fbe40ff7SFam Zheng 
3385fbe40ff7SFam Zheng bool bdrv_op_is_blocked(BlockDriverState *bs, BlockOpType op, Error **errp)
3386fbe40ff7SFam Zheng {
3387fbe40ff7SFam Zheng     BdrvOpBlocker *blocker;
3388fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3389fbe40ff7SFam Zheng     if (!QLIST_EMPTY(&bs->op_blockers[op])) {
3390fbe40ff7SFam Zheng         blocker = QLIST_FIRST(&bs->op_blockers[op]);
3391fbe40ff7SFam Zheng         if (errp) {
3392e43bfd9cSMarkus Armbruster             *errp = error_copy(blocker->reason);
3393e43bfd9cSMarkus Armbruster             error_prepend(errp, "Node '%s' is busy: ",
3394e43bfd9cSMarkus Armbruster                           bdrv_get_device_or_node_name(bs));
3395fbe40ff7SFam Zheng         }
3396fbe40ff7SFam Zheng         return true;
3397fbe40ff7SFam Zheng     }
3398fbe40ff7SFam Zheng     return false;
3399fbe40ff7SFam Zheng }
3400fbe40ff7SFam Zheng 
3401fbe40ff7SFam Zheng void bdrv_op_block(BlockDriverState *bs, BlockOpType op, Error *reason)
3402fbe40ff7SFam Zheng {
3403fbe40ff7SFam Zheng     BdrvOpBlocker *blocker;
3404fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3405fbe40ff7SFam Zheng 
34065839e53bSMarkus Armbruster     blocker = g_new0(BdrvOpBlocker, 1);
3407fbe40ff7SFam Zheng     blocker->reason = reason;
3408fbe40ff7SFam Zheng     QLIST_INSERT_HEAD(&bs->op_blockers[op], blocker, list);
3409fbe40ff7SFam Zheng }
3410fbe40ff7SFam Zheng 
3411fbe40ff7SFam Zheng void bdrv_op_unblock(BlockDriverState *bs, BlockOpType op, Error *reason)
3412fbe40ff7SFam Zheng {
3413fbe40ff7SFam Zheng     BdrvOpBlocker *blocker, *next;
3414fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3415fbe40ff7SFam Zheng     QLIST_FOREACH_SAFE(blocker, &bs->op_blockers[op], list, next) {
3416fbe40ff7SFam Zheng         if (blocker->reason == reason) {
3417fbe40ff7SFam Zheng             QLIST_REMOVE(blocker, list);
3418fbe40ff7SFam Zheng             g_free(blocker);
3419fbe40ff7SFam Zheng         }
3420fbe40ff7SFam Zheng     }
3421fbe40ff7SFam Zheng }
3422fbe40ff7SFam Zheng 
3423fbe40ff7SFam Zheng void bdrv_op_block_all(BlockDriverState *bs, Error *reason)
3424fbe40ff7SFam Zheng {
3425fbe40ff7SFam Zheng     int i;
3426fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3427fbe40ff7SFam Zheng         bdrv_op_block(bs, i, reason);
3428fbe40ff7SFam Zheng     }
3429fbe40ff7SFam Zheng }
3430fbe40ff7SFam Zheng 
3431fbe40ff7SFam Zheng void bdrv_op_unblock_all(BlockDriverState *bs, Error *reason)
3432fbe40ff7SFam Zheng {
3433fbe40ff7SFam Zheng     int i;
3434fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3435fbe40ff7SFam Zheng         bdrv_op_unblock(bs, i, reason);
3436fbe40ff7SFam Zheng     }
3437fbe40ff7SFam Zheng }
3438fbe40ff7SFam Zheng 
3439fbe40ff7SFam Zheng bool bdrv_op_blocker_is_empty(BlockDriverState *bs)
3440fbe40ff7SFam Zheng {
3441fbe40ff7SFam Zheng     int i;
3442fbe40ff7SFam Zheng 
3443fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3444fbe40ff7SFam Zheng         if (!QLIST_EMPTY(&bs->op_blockers[i])) {
3445fbe40ff7SFam Zheng             return false;
3446fbe40ff7SFam Zheng         }
3447fbe40ff7SFam Zheng     }
3448fbe40ff7SFam Zheng     return true;
3449fbe40ff7SFam Zheng }
3450fbe40ff7SFam Zheng 
3451d92ada22SLuiz Capitulino void bdrv_img_create(const char *filename, const char *fmt,
3452f88e1a42SJes Sorensen                      const char *base_filename, const char *base_fmt,
3453f382d43aSMiroslav Rezanina                      char *options, uint64_t img_size, int flags,
3454f382d43aSMiroslav Rezanina                      Error **errp, bool quiet)
3455f88e1a42SJes Sorensen {
345683d0521aSChunyan Liu     QemuOptsList *create_opts = NULL;
345783d0521aSChunyan Liu     QemuOpts *opts = NULL;
345883d0521aSChunyan Liu     const char *backing_fmt, *backing_file;
345983d0521aSChunyan Liu     int64_t size;
3460f88e1a42SJes Sorensen     BlockDriver *drv, *proto_drv;
3461cc84d90fSMax Reitz     Error *local_err = NULL;
3462f88e1a42SJes Sorensen     int ret = 0;
3463f88e1a42SJes Sorensen 
3464f88e1a42SJes Sorensen     /* Find driver and parse its options */
3465f88e1a42SJes Sorensen     drv = bdrv_find_format(fmt);
3466f88e1a42SJes Sorensen     if (!drv) {
346771c79813SLuiz Capitulino         error_setg(errp, "Unknown file format '%s'", fmt);
3468d92ada22SLuiz Capitulino         return;
3469f88e1a42SJes Sorensen     }
3470f88e1a42SJes Sorensen 
3471b65a5e12SMax Reitz     proto_drv = bdrv_find_protocol(filename, true, errp);
3472f88e1a42SJes Sorensen     if (!proto_drv) {
3473d92ada22SLuiz Capitulino         return;
3474f88e1a42SJes Sorensen     }
3475f88e1a42SJes Sorensen 
3476c6149724SMax Reitz     if (!drv->create_opts) {
3477c6149724SMax Reitz         error_setg(errp, "Format driver '%s' does not support image creation",
3478c6149724SMax Reitz                    drv->format_name);
3479c6149724SMax Reitz         return;
3480c6149724SMax Reitz     }
3481c6149724SMax Reitz 
3482c6149724SMax Reitz     if (!proto_drv->create_opts) {
3483c6149724SMax Reitz         error_setg(errp, "Protocol driver '%s' does not support image creation",
3484c6149724SMax Reitz                    proto_drv->format_name);
3485c6149724SMax Reitz         return;
3486c6149724SMax Reitz     }
3487c6149724SMax Reitz 
3488c282e1fdSChunyan Liu     create_opts = qemu_opts_append(create_opts, drv->create_opts);
3489c282e1fdSChunyan Liu     create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
3490f88e1a42SJes Sorensen 
3491f88e1a42SJes Sorensen     /* Create parameter list with default values */
349283d0521aSChunyan Liu     opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
349339101f25SMarkus Armbruster     qemu_opt_set_number(opts, BLOCK_OPT_SIZE, img_size, &error_abort);
3494f88e1a42SJes Sorensen 
3495f88e1a42SJes Sorensen     /* Parse -o options */
3496f88e1a42SJes Sorensen     if (options) {
3497dc523cd3SMarkus Armbruster         qemu_opts_do_parse(opts, options, NULL, &local_err);
3498dc523cd3SMarkus Armbruster         if (local_err) {
3499dc523cd3SMarkus Armbruster             error_report_err(local_err);
3500dc523cd3SMarkus Armbruster             local_err = NULL;
350183d0521aSChunyan Liu             error_setg(errp, "Invalid options for file format '%s'", fmt);
3502f88e1a42SJes Sorensen             goto out;
3503f88e1a42SJes Sorensen         }
3504f88e1a42SJes Sorensen     }
3505f88e1a42SJes Sorensen 
3506f88e1a42SJes Sorensen     if (base_filename) {
3507f43e47dbSMarkus Armbruster         qemu_opt_set(opts, BLOCK_OPT_BACKING_FILE, base_filename, &local_err);
35086be4194bSMarkus Armbruster         if (local_err) {
350971c79813SLuiz Capitulino             error_setg(errp, "Backing file not supported for file format '%s'",
351071c79813SLuiz Capitulino                        fmt);
3511f88e1a42SJes Sorensen             goto out;
3512f88e1a42SJes Sorensen         }
3513f88e1a42SJes Sorensen     }
3514f88e1a42SJes Sorensen 
3515f88e1a42SJes Sorensen     if (base_fmt) {
3516f43e47dbSMarkus Armbruster         qemu_opt_set(opts, BLOCK_OPT_BACKING_FMT, base_fmt, &local_err);
35176be4194bSMarkus Armbruster         if (local_err) {
351871c79813SLuiz Capitulino             error_setg(errp, "Backing file format not supported for file "
351971c79813SLuiz Capitulino                              "format '%s'", fmt);
3520f88e1a42SJes Sorensen             goto out;
3521f88e1a42SJes Sorensen         }
3522f88e1a42SJes Sorensen     }
3523f88e1a42SJes Sorensen 
352483d0521aSChunyan Liu     backing_file = qemu_opt_get(opts, BLOCK_OPT_BACKING_FILE);
352583d0521aSChunyan Liu     if (backing_file) {
352683d0521aSChunyan Liu         if (!strcmp(filename, backing_file)) {
352771c79813SLuiz Capitulino             error_setg(errp, "Error: Trying to create an image with the "
352871c79813SLuiz Capitulino                              "same filename as the backing file");
3529792da93aSJes Sorensen             goto out;
3530792da93aSJes Sorensen         }
3531792da93aSJes Sorensen     }
3532792da93aSJes Sorensen 
353383d0521aSChunyan Liu     backing_fmt = qemu_opt_get(opts, BLOCK_OPT_BACKING_FMT);
3534f88e1a42SJes Sorensen 
3535f88e1a42SJes Sorensen     // The size for the image must always be specified, with one exception:
3536f88e1a42SJes Sorensen     // If we are using a backing file, we can obtain the size from there
353783d0521aSChunyan Liu     size = qemu_opt_get_size(opts, BLOCK_OPT_SIZE, 0);
353883d0521aSChunyan Liu     if (size == -1) {
353983d0521aSChunyan Liu         if (backing_file) {
354066f6b814SMax Reitz             BlockDriverState *bs;
354129168018SMax Reitz             char *full_backing = g_new0(char, PATH_MAX);
354252bf1e72SMarkus Armbruster             int64_t size;
354363090dacSPaolo Bonzini             int back_flags;
3544e6641719SMax Reitz             QDict *backing_options = NULL;
354563090dacSPaolo Bonzini 
354629168018SMax Reitz             bdrv_get_full_backing_filename_from_filename(filename, backing_file,
354729168018SMax Reitz                                                          full_backing, PATH_MAX,
354829168018SMax Reitz                                                          &local_err);
354929168018SMax Reitz             if (local_err) {
355029168018SMax Reitz                 g_free(full_backing);
355129168018SMax Reitz                 goto out;
355229168018SMax Reitz             }
355329168018SMax Reitz 
355463090dacSPaolo Bonzini             /* backing files always opened read-only */
355561de4c68SKevin Wolf             back_flags = flags;
3556bfd18d1eSKevin Wolf             back_flags &= ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
3557f88e1a42SJes Sorensen 
3558e6641719SMax Reitz             if (backing_fmt) {
3559e6641719SMax Reitz                 backing_options = qdict_new();
3560e6641719SMax Reitz                 qdict_put(backing_options, "driver",
3561e6641719SMax Reitz                           qstring_from_str(backing_fmt));
3562e6641719SMax Reitz             }
3563e6641719SMax Reitz 
3564f67503e5SMax Reitz             bs = NULL;
3565e6641719SMax Reitz             ret = bdrv_open(&bs, full_backing, NULL, backing_options,
35666ebf9aa2SMax Reitz                             back_flags, &local_err);
356729168018SMax Reitz             g_free(full_backing);
3568f88e1a42SJes Sorensen             if (ret < 0) {
3569f88e1a42SJes Sorensen                 goto out;
3570f88e1a42SJes Sorensen             }
357152bf1e72SMarkus Armbruster             size = bdrv_getlength(bs);
357252bf1e72SMarkus Armbruster             if (size < 0) {
357352bf1e72SMarkus Armbruster                 error_setg_errno(errp, -size, "Could not get size of '%s'",
357452bf1e72SMarkus Armbruster                                  backing_file);
357552bf1e72SMarkus Armbruster                 bdrv_unref(bs);
357652bf1e72SMarkus Armbruster                 goto out;
357752bf1e72SMarkus Armbruster             }
3578f88e1a42SJes Sorensen 
357939101f25SMarkus Armbruster             qemu_opt_set_number(opts, BLOCK_OPT_SIZE, size, &error_abort);
358066f6b814SMax Reitz 
358166f6b814SMax Reitz             bdrv_unref(bs);
3582f88e1a42SJes Sorensen         } else {
358371c79813SLuiz Capitulino             error_setg(errp, "Image creation needs a size parameter");
3584f88e1a42SJes Sorensen             goto out;
3585f88e1a42SJes Sorensen         }
3586f88e1a42SJes Sorensen     }
3587f88e1a42SJes Sorensen 
3588f382d43aSMiroslav Rezanina     if (!quiet) {
3589f88e1a42SJes Sorensen         printf("Formatting '%s', fmt=%s ", filename, fmt);
359043c5d8f8SFam Zheng         qemu_opts_print(opts, " ");
3591f88e1a42SJes Sorensen         puts("");
3592f382d43aSMiroslav Rezanina     }
359383d0521aSChunyan Liu 
3594c282e1fdSChunyan Liu     ret = bdrv_create(drv, filename, opts, &local_err);
359583d0521aSChunyan Liu 
3596cc84d90fSMax Reitz     if (ret == -EFBIG) {
3597cc84d90fSMax Reitz         /* This is generally a better message than whatever the driver would
3598cc84d90fSMax Reitz          * deliver (especially because of the cluster_size_hint), since that
3599cc84d90fSMax Reitz          * is most probably not much different from "image too large". */
3600f3f4d2c0SKevin Wolf         const char *cluster_size_hint = "";
360183d0521aSChunyan Liu         if (qemu_opt_get_size(opts, BLOCK_OPT_CLUSTER_SIZE, 0)) {
3602f3f4d2c0SKevin Wolf             cluster_size_hint = " (try using a larger cluster size)";
3603f3f4d2c0SKevin Wolf         }
3604cc84d90fSMax Reitz         error_setg(errp, "The image size is too large for file format '%s'"
3605cc84d90fSMax Reitz                    "%s", fmt, cluster_size_hint);
3606cc84d90fSMax Reitz         error_free(local_err);
3607cc84d90fSMax Reitz         local_err = NULL;
3608f88e1a42SJes Sorensen     }
3609f88e1a42SJes Sorensen 
3610f88e1a42SJes Sorensen out:
361183d0521aSChunyan Liu     qemu_opts_del(opts);
361283d0521aSChunyan Liu     qemu_opts_free(create_opts);
361384d18f06SMarkus Armbruster     if (local_err) {
3614cc84d90fSMax Reitz         error_propagate(errp, local_err);
3615cc84d90fSMax Reitz     }
3616f88e1a42SJes Sorensen }
361785d126f3SStefan Hajnoczi 
361885d126f3SStefan Hajnoczi AioContext *bdrv_get_aio_context(BlockDriverState *bs)
361985d126f3SStefan Hajnoczi {
3620dcd04228SStefan Hajnoczi     return bs->aio_context;
3621dcd04228SStefan Hajnoczi }
3622dcd04228SStefan Hajnoczi 
3623dcd04228SStefan Hajnoczi void bdrv_detach_aio_context(BlockDriverState *bs)
3624dcd04228SStefan Hajnoczi {
362533384421SMax Reitz     BdrvAioNotifier *baf;
362633384421SMax Reitz 
3627dcd04228SStefan Hajnoczi     if (!bs->drv) {
3628dcd04228SStefan Hajnoczi         return;
3629dcd04228SStefan Hajnoczi     }
3630dcd04228SStefan Hajnoczi 
363133384421SMax Reitz     QLIST_FOREACH(baf, &bs->aio_notifiers, list) {
363233384421SMax Reitz         baf->detach_aio_context(baf->opaque);
363333384421SMax Reitz     }
363433384421SMax Reitz 
3635a0d64a61SAlberto Garcia     if (bs->throttle_state) {
36360e5b0a2dSBenoît Canet         throttle_timers_detach_aio_context(&bs->throttle_timers);
363713af91ebSStefan Hajnoczi     }
3638dcd04228SStefan Hajnoczi     if (bs->drv->bdrv_detach_aio_context) {
3639dcd04228SStefan Hajnoczi         bs->drv->bdrv_detach_aio_context(bs);
3640dcd04228SStefan Hajnoczi     }
3641dcd04228SStefan Hajnoczi     if (bs->file) {
36429a4f4c31SKevin Wolf         bdrv_detach_aio_context(bs->file->bs);
3643dcd04228SStefan Hajnoczi     }
3644760e0063SKevin Wolf     if (bs->backing) {
3645760e0063SKevin Wolf         bdrv_detach_aio_context(bs->backing->bs);
3646dcd04228SStefan Hajnoczi     }
3647dcd04228SStefan Hajnoczi 
3648dcd04228SStefan Hajnoczi     bs->aio_context = NULL;
3649dcd04228SStefan Hajnoczi }
3650dcd04228SStefan Hajnoczi 
3651dcd04228SStefan Hajnoczi void bdrv_attach_aio_context(BlockDriverState *bs,
3652dcd04228SStefan Hajnoczi                              AioContext *new_context)
3653dcd04228SStefan Hajnoczi {
365433384421SMax Reitz     BdrvAioNotifier *ban;
365533384421SMax Reitz 
3656dcd04228SStefan Hajnoczi     if (!bs->drv) {
3657dcd04228SStefan Hajnoczi         return;
3658dcd04228SStefan Hajnoczi     }
3659dcd04228SStefan Hajnoczi 
3660dcd04228SStefan Hajnoczi     bs->aio_context = new_context;
3661dcd04228SStefan Hajnoczi 
3662760e0063SKevin Wolf     if (bs->backing) {
3663760e0063SKevin Wolf         bdrv_attach_aio_context(bs->backing->bs, new_context);
3664dcd04228SStefan Hajnoczi     }
3665dcd04228SStefan Hajnoczi     if (bs->file) {
36669a4f4c31SKevin Wolf         bdrv_attach_aio_context(bs->file->bs, new_context);
3667dcd04228SStefan Hajnoczi     }
3668dcd04228SStefan Hajnoczi     if (bs->drv->bdrv_attach_aio_context) {
3669dcd04228SStefan Hajnoczi         bs->drv->bdrv_attach_aio_context(bs, new_context);
3670dcd04228SStefan Hajnoczi     }
3671a0d64a61SAlberto Garcia     if (bs->throttle_state) {
36720e5b0a2dSBenoît Canet         throttle_timers_attach_aio_context(&bs->throttle_timers, new_context);
367313af91ebSStefan Hajnoczi     }
367433384421SMax Reitz 
367533384421SMax Reitz     QLIST_FOREACH(ban, &bs->aio_notifiers, list) {
367633384421SMax Reitz         ban->attached_aio_context(new_context, ban->opaque);
367733384421SMax Reitz     }
3678dcd04228SStefan Hajnoczi }
3679dcd04228SStefan Hajnoczi 
3680dcd04228SStefan Hajnoczi void bdrv_set_aio_context(BlockDriverState *bs, AioContext *new_context)
3681dcd04228SStefan Hajnoczi {
368253ec73e2SFam Zheng     bdrv_drain(bs); /* ensure there are no in-flight requests */
3683dcd04228SStefan Hajnoczi 
3684dcd04228SStefan Hajnoczi     bdrv_detach_aio_context(bs);
3685dcd04228SStefan Hajnoczi 
3686dcd04228SStefan Hajnoczi     /* This function executes in the old AioContext so acquire the new one in
3687dcd04228SStefan Hajnoczi      * case it runs in a different thread.
3688dcd04228SStefan Hajnoczi      */
3689dcd04228SStefan Hajnoczi     aio_context_acquire(new_context);
3690dcd04228SStefan Hajnoczi     bdrv_attach_aio_context(bs, new_context);
3691dcd04228SStefan Hajnoczi     aio_context_release(new_context);
369285d126f3SStefan Hajnoczi }
3693d616b224SStefan Hajnoczi 
369433384421SMax Reitz void bdrv_add_aio_context_notifier(BlockDriverState *bs,
369533384421SMax Reitz         void (*attached_aio_context)(AioContext *new_context, void *opaque),
369633384421SMax Reitz         void (*detach_aio_context)(void *opaque), void *opaque)
369733384421SMax Reitz {
369833384421SMax Reitz     BdrvAioNotifier *ban = g_new(BdrvAioNotifier, 1);
369933384421SMax Reitz     *ban = (BdrvAioNotifier){
370033384421SMax Reitz         .attached_aio_context = attached_aio_context,
370133384421SMax Reitz         .detach_aio_context   = detach_aio_context,
370233384421SMax Reitz         .opaque               = opaque
370333384421SMax Reitz     };
370433384421SMax Reitz 
370533384421SMax Reitz     QLIST_INSERT_HEAD(&bs->aio_notifiers, ban, list);
370633384421SMax Reitz }
370733384421SMax Reitz 
370833384421SMax Reitz void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
370933384421SMax Reitz                                       void (*attached_aio_context)(AioContext *,
371033384421SMax Reitz                                                                    void *),
371133384421SMax Reitz                                       void (*detach_aio_context)(void *),
371233384421SMax Reitz                                       void *opaque)
371333384421SMax Reitz {
371433384421SMax Reitz     BdrvAioNotifier *ban, *ban_next;
371533384421SMax Reitz 
371633384421SMax Reitz     QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
371733384421SMax Reitz         if (ban->attached_aio_context == attached_aio_context &&
371833384421SMax Reitz             ban->detach_aio_context   == detach_aio_context   &&
371933384421SMax Reitz             ban->opaque               == opaque)
372033384421SMax Reitz         {
372133384421SMax Reitz             QLIST_REMOVE(ban, list);
372233384421SMax Reitz             g_free(ban);
372333384421SMax Reitz 
372433384421SMax Reitz             return;
372533384421SMax Reitz         }
372633384421SMax Reitz     }
372733384421SMax Reitz 
372833384421SMax Reitz     abort();
372933384421SMax Reitz }
373033384421SMax Reitz 
373177485434SMax Reitz int bdrv_amend_options(BlockDriverState *bs, QemuOpts *opts,
37328b13976dSMax Reitz                        BlockDriverAmendStatusCB *status_cb, void *cb_opaque)
37336f176b48SMax Reitz {
3734c282e1fdSChunyan Liu     if (!bs->drv->bdrv_amend_options) {
37356f176b48SMax Reitz         return -ENOTSUP;
37366f176b48SMax Reitz     }
37378b13976dSMax Reitz     return bs->drv->bdrv_amend_options(bs, opts, status_cb, cb_opaque);
37386f176b48SMax Reitz }
3739f6186f49SBenoît Canet 
3740b5042a36SBenoît Canet /* This function will be called by the bdrv_recurse_is_first_non_filter method
3741b5042a36SBenoît Canet  * of block filter and by bdrv_is_first_non_filter.
3742b5042a36SBenoît Canet  * It is used to test if the given bs is the candidate or recurse more in the
3743b5042a36SBenoît Canet  * node graph.
3744212a5a8fSBenoît Canet  */
3745212a5a8fSBenoît Canet bool bdrv_recurse_is_first_non_filter(BlockDriverState *bs,
3746212a5a8fSBenoît Canet                                       BlockDriverState *candidate)
3747f6186f49SBenoît Canet {
3748b5042a36SBenoît Canet     /* return false if basic checks fails */
3749b5042a36SBenoît Canet     if (!bs || !bs->drv) {
3750b5042a36SBenoît Canet         return false;
3751b5042a36SBenoît Canet     }
3752b5042a36SBenoît Canet 
3753b5042a36SBenoît Canet     /* the code reached a non block filter driver -> check if the bs is
3754b5042a36SBenoît Canet      * the same as the candidate. It's the recursion termination condition.
3755b5042a36SBenoît Canet      */
3756b5042a36SBenoît Canet     if (!bs->drv->is_filter) {
3757b5042a36SBenoît Canet         return bs == candidate;
3758b5042a36SBenoît Canet     }
3759b5042a36SBenoît Canet     /* Down this path the driver is a block filter driver */
3760b5042a36SBenoît Canet 
3761b5042a36SBenoît Canet     /* If the block filter recursion method is defined use it to recurse down
3762b5042a36SBenoît Canet      * the node graph.
3763b5042a36SBenoît Canet      */
3764b5042a36SBenoît Canet     if (bs->drv->bdrv_recurse_is_first_non_filter) {
3765212a5a8fSBenoît Canet         return bs->drv->bdrv_recurse_is_first_non_filter(bs, candidate);
3766212a5a8fSBenoît Canet     }
3767212a5a8fSBenoît Canet 
3768b5042a36SBenoît Canet     /* the driver is a block filter but don't allow to recurse -> return false
3769b5042a36SBenoît Canet      */
3770b5042a36SBenoît Canet     return false;
3771212a5a8fSBenoît Canet }
3772212a5a8fSBenoît Canet 
3773212a5a8fSBenoît Canet /* This function checks if the candidate is the first non filter bs down it's
3774212a5a8fSBenoît Canet  * bs chain. Since we don't have pointers to parents it explore all bs chains
3775212a5a8fSBenoît Canet  * from the top. Some filters can choose not to pass down the recursion.
3776212a5a8fSBenoît Canet  */
3777212a5a8fSBenoît Canet bool bdrv_is_first_non_filter(BlockDriverState *candidate)
3778212a5a8fSBenoît Canet {
377979720af6SMax Reitz     BlockDriverState *bs = NULL;
3780212a5a8fSBenoît Canet 
3781212a5a8fSBenoît Canet     /* walk down the bs forest recursively */
378279720af6SMax Reitz     while ((bs = bdrv_next(bs)) != NULL) {
3783212a5a8fSBenoît Canet         bool perm;
3784212a5a8fSBenoît Canet 
3785b5042a36SBenoît Canet         /* try to recurse in this top level bs */
3786e6dc8a1fSKevin Wolf         perm = bdrv_recurse_is_first_non_filter(bs, candidate);
3787212a5a8fSBenoît Canet 
3788212a5a8fSBenoît Canet         /* candidate is the first non filter */
3789212a5a8fSBenoît Canet         if (perm) {
3790212a5a8fSBenoît Canet             return true;
3791212a5a8fSBenoît Canet         }
3792212a5a8fSBenoît Canet     }
3793212a5a8fSBenoît Canet 
3794212a5a8fSBenoît Canet     return false;
3795f6186f49SBenoît Canet }
379609158f00SBenoît Canet 
3797e12f3784SWen Congyang BlockDriverState *check_to_replace_node(BlockDriverState *parent_bs,
3798e12f3784SWen Congyang                                         const char *node_name, Error **errp)
379909158f00SBenoît Canet {
380009158f00SBenoît Canet     BlockDriverState *to_replace_bs = bdrv_find_node(node_name);
38015a7e7a0bSStefan Hajnoczi     AioContext *aio_context;
38025a7e7a0bSStefan Hajnoczi 
380309158f00SBenoît Canet     if (!to_replace_bs) {
380409158f00SBenoît Canet         error_setg(errp, "Node name '%s' not found", node_name);
380509158f00SBenoît Canet         return NULL;
380609158f00SBenoît Canet     }
380709158f00SBenoît Canet 
38085a7e7a0bSStefan Hajnoczi     aio_context = bdrv_get_aio_context(to_replace_bs);
38095a7e7a0bSStefan Hajnoczi     aio_context_acquire(aio_context);
38105a7e7a0bSStefan Hajnoczi 
381109158f00SBenoît Canet     if (bdrv_op_is_blocked(to_replace_bs, BLOCK_OP_TYPE_REPLACE, errp)) {
38125a7e7a0bSStefan Hajnoczi         to_replace_bs = NULL;
38135a7e7a0bSStefan Hajnoczi         goto out;
381409158f00SBenoît Canet     }
381509158f00SBenoît Canet 
381609158f00SBenoît Canet     /* We don't want arbitrary node of the BDS chain to be replaced only the top
381709158f00SBenoît Canet      * most non filter in order to prevent data corruption.
381809158f00SBenoît Canet      * Another benefit is that this tests exclude backing files which are
381909158f00SBenoît Canet      * blocked by the backing blockers.
382009158f00SBenoît Canet      */
3821e12f3784SWen Congyang     if (!bdrv_recurse_is_first_non_filter(parent_bs, to_replace_bs)) {
382209158f00SBenoît Canet         error_setg(errp, "Only top most non filter can be replaced");
38235a7e7a0bSStefan Hajnoczi         to_replace_bs = NULL;
38245a7e7a0bSStefan Hajnoczi         goto out;
382509158f00SBenoît Canet     }
382609158f00SBenoît Canet 
38275a7e7a0bSStefan Hajnoczi out:
38285a7e7a0bSStefan Hajnoczi     aio_context_release(aio_context);
382909158f00SBenoît Canet     return to_replace_bs;
383009158f00SBenoît Canet }
3831448ad91dSMing Lei 
383291af7014SMax Reitz static bool append_open_options(QDict *d, BlockDriverState *bs)
383391af7014SMax Reitz {
383491af7014SMax Reitz     const QDictEntry *entry;
38359e700c1aSKevin Wolf     QemuOptDesc *desc;
3836260fecf1SKevin Wolf     BdrvChild *child;
383791af7014SMax Reitz     bool found_any = false;
3838260fecf1SKevin Wolf     const char *p;
383991af7014SMax Reitz 
384091af7014SMax Reitz     for (entry = qdict_first(bs->options); entry;
384191af7014SMax Reitz          entry = qdict_next(bs->options, entry))
384291af7014SMax Reitz     {
3843260fecf1SKevin Wolf         /* Exclude options for children */
3844260fecf1SKevin Wolf         QLIST_FOREACH(child, &bs->children, next) {
3845260fecf1SKevin Wolf             if (strstart(qdict_entry_key(entry), child->name, &p)
3846260fecf1SKevin Wolf                 && (!*p || *p == '.'))
3847260fecf1SKevin Wolf             {
3848260fecf1SKevin Wolf                 break;
3849260fecf1SKevin Wolf             }
3850260fecf1SKevin Wolf         }
3851260fecf1SKevin Wolf         if (child) {
38529e700c1aSKevin Wolf             continue;
38539e700c1aSKevin Wolf         }
38549e700c1aSKevin Wolf 
38559e700c1aSKevin Wolf         /* And exclude all non-driver-specific options */
38569e700c1aSKevin Wolf         for (desc = bdrv_runtime_opts.desc; desc->name; desc++) {
38579e700c1aSKevin Wolf             if (!strcmp(qdict_entry_key(entry), desc->name)) {
38589e700c1aSKevin Wolf                 break;
38599e700c1aSKevin Wolf             }
38609e700c1aSKevin Wolf         }
38619e700c1aSKevin Wolf         if (desc->name) {
38629e700c1aSKevin Wolf             continue;
38639e700c1aSKevin Wolf         }
38649e700c1aSKevin Wolf 
386591af7014SMax Reitz         qobject_incref(qdict_entry_value(entry));
386691af7014SMax Reitz         qdict_put_obj(d, qdict_entry_key(entry), qdict_entry_value(entry));
386791af7014SMax Reitz         found_any = true;
386891af7014SMax Reitz     }
386991af7014SMax Reitz 
387091af7014SMax Reitz     return found_any;
387191af7014SMax Reitz }
387291af7014SMax Reitz 
387391af7014SMax Reitz /* Updates the following BDS fields:
387491af7014SMax Reitz  *  - exact_filename: A filename which may be used for opening a block device
387591af7014SMax Reitz  *                    which (mostly) equals the given BDS (even without any
387691af7014SMax Reitz  *                    other options; so reading and writing must return the same
387791af7014SMax Reitz  *                    results, but caching etc. may be different)
387891af7014SMax Reitz  *  - full_open_options: Options which, when given when opening a block device
387991af7014SMax Reitz  *                       (without a filename), result in a BDS (mostly)
388091af7014SMax Reitz  *                       equalling the given one
388191af7014SMax Reitz  *  - filename: If exact_filename is set, it is copied here. Otherwise,
388291af7014SMax Reitz  *              full_open_options is converted to a JSON object, prefixed with
388391af7014SMax Reitz  *              "json:" (for use through the JSON pseudo protocol) and put here.
388491af7014SMax Reitz  */
388591af7014SMax Reitz void bdrv_refresh_filename(BlockDriverState *bs)
388691af7014SMax Reitz {
388791af7014SMax Reitz     BlockDriver *drv = bs->drv;
388891af7014SMax Reitz     QDict *opts;
388991af7014SMax Reitz 
389091af7014SMax Reitz     if (!drv) {
389191af7014SMax Reitz         return;
389291af7014SMax Reitz     }
389391af7014SMax Reitz 
389491af7014SMax Reitz     /* This BDS's file name will most probably depend on its file's name, so
389591af7014SMax Reitz      * refresh that first */
389691af7014SMax Reitz     if (bs->file) {
38979a4f4c31SKevin Wolf         bdrv_refresh_filename(bs->file->bs);
389891af7014SMax Reitz     }
389991af7014SMax Reitz 
390091af7014SMax Reitz     if (drv->bdrv_refresh_filename) {
390191af7014SMax Reitz         /* Obsolete information is of no use here, so drop the old file name
390291af7014SMax Reitz          * information before refreshing it */
390391af7014SMax Reitz         bs->exact_filename[0] = '\0';
390491af7014SMax Reitz         if (bs->full_open_options) {
390591af7014SMax Reitz             QDECREF(bs->full_open_options);
390691af7014SMax Reitz             bs->full_open_options = NULL;
390791af7014SMax Reitz         }
390891af7014SMax Reitz 
39094cdd01d3SKevin Wolf         opts = qdict_new();
39104cdd01d3SKevin Wolf         append_open_options(opts, bs);
39114cdd01d3SKevin Wolf         drv->bdrv_refresh_filename(bs, opts);
39124cdd01d3SKevin Wolf         QDECREF(opts);
391391af7014SMax Reitz     } else if (bs->file) {
391491af7014SMax Reitz         /* Try to reconstruct valid information from the underlying file */
391591af7014SMax Reitz         bool has_open_options;
391691af7014SMax Reitz 
391791af7014SMax Reitz         bs->exact_filename[0] = '\0';
391891af7014SMax Reitz         if (bs->full_open_options) {
391991af7014SMax Reitz             QDECREF(bs->full_open_options);
392091af7014SMax Reitz             bs->full_open_options = NULL;
392191af7014SMax Reitz         }
392291af7014SMax Reitz 
392391af7014SMax Reitz         opts = qdict_new();
392491af7014SMax Reitz         has_open_options = append_open_options(opts, bs);
392591af7014SMax Reitz 
392691af7014SMax Reitz         /* If no specific options have been given for this BDS, the filename of
392791af7014SMax Reitz          * the underlying file should suffice for this one as well */
39289a4f4c31SKevin Wolf         if (bs->file->bs->exact_filename[0] && !has_open_options) {
39299a4f4c31SKevin Wolf             strcpy(bs->exact_filename, bs->file->bs->exact_filename);
393091af7014SMax Reitz         }
393191af7014SMax Reitz         /* Reconstructing the full options QDict is simple for most format block
393291af7014SMax Reitz          * drivers, as long as the full options are known for the underlying
393391af7014SMax Reitz          * file BDS. The full options QDict of that file BDS should somehow
393491af7014SMax Reitz          * contain a representation of the filename, therefore the following
393591af7014SMax Reitz          * suffices without querying the (exact_)filename of this BDS. */
39369a4f4c31SKevin Wolf         if (bs->file->bs->full_open_options) {
393791af7014SMax Reitz             qdict_put_obj(opts, "driver",
393891af7014SMax Reitz                           QOBJECT(qstring_from_str(drv->format_name)));
39399a4f4c31SKevin Wolf             QINCREF(bs->file->bs->full_open_options);
39409a4f4c31SKevin Wolf             qdict_put_obj(opts, "file",
39419a4f4c31SKevin Wolf                           QOBJECT(bs->file->bs->full_open_options));
394291af7014SMax Reitz 
394391af7014SMax Reitz             bs->full_open_options = opts;
394491af7014SMax Reitz         } else {
394591af7014SMax Reitz             QDECREF(opts);
394691af7014SMax Reitz         }
394791af7014SMax Reitz     } else if (!bs->full_open_options && qdict_size(bs->options)) {
394891af7014SMax Reitz         /* There is no underlying file BDS (at least referenced by BDS.file),
394991af7014SMax Reitz          * so the full options QDict should be equal to the options given
395091af7014SMax Reitz          * specifically for this block device when it was opened (plus the
395191af7014SMax Reitz          * driver specification).
395291af7014SMax Reitz          * Because those options don't change, there is no need to update
395391af7014SMax Reitz          * full_open_options when it's already set. */
395491af7014SMax Reitz 
395591af7014SMax Reitz         opts = qdict_new();
395691af7014SMax Reitz         append_open_options(opts, bs);
395791af7014SMax Reitz         qdict_put_obj(opts, "driver",
395891af7014SMax Reitz                       QOBJECT(qstring_from_str(drv->format_name)));
395991af7014SMax Reitz 
396091af7014SMax Reitz         if (bs->exact_filename[0]) {
396191af7014SMax Reitz             /* This may not work for all block protocol drivers (some may
396291af7014SMax Reitz              * require this filename to be parsed), but we have to find some
396391af7014SMax Reitz              * default solution here, so just include it. If some block driver
396491af7014SMax Reitz              * does not support pure options without any filename at all or
396591af7014SMax Reitz              * needs some special format of the options QDict, it needs to
396691af7014SMax Reitz              * implement the driver-specific bdrv_refresh_filename() function.
396791af7014SMax Reitz              */
396891af7014SMax Reitz             qdict_put_obj(opts, "filename",
396991af7014SMax Reitz                           QOBJECT(qstring_from_str(bs->exact_filename)));
397091af7014SMax Reitz         }
397191af7014SMax Reitz 
397291af7014SMax Reitz         bs->full_open_options = opts;
397391af7014SMax Reitz     }
397491af7014SMax Reitz 
397591af7014SMax Reitz     if (bs->exact_filename[0]) {
397691af7014SMax Reitz         pstrcpy(bs->filename, sizeof(bs->filename), bs->exact_filename);
397791af7014SMax Reitz     } else if (bs->full_open_options) {
397891af7014SMax Reitz         QString *json = qobject_to_json(QOBJECT(bs->full_open_options));
397991af7014SMax Reitz         snprintf(bs->filename, sizeof(bs->filename), "json:%s",
398091af7014SMax Reitz                  qstring_get_str(json));
398191af7014SMax Reitz         QDECREF(json);
398291af7014SMax Reitz     }
398391af7014SMax Reitz }
3984