xref: /openbmc/qemu/block.c (revision d0e46a55776a59c8fdbb75620e7c5fcf0d6aa029)
1fc01f7e7Sbellard /*
2fc01f7e7Sbellard  * QEMU System Emulator block driver
3fc01f7e7Sbellard  *
4fc01f7e7Sbellard  * Copyright (c) 2003 Fabrice Bellard
5fc01f7e7Sbellard  *
6fc01f7e7Sbellard  * Permission is hereby granted, free of charge, to any person obtaining a copy
7fc01f7e7Sbellard  * of this software and associated documentation files (the "Software"), to deal
8fc01f7e7Sbellard  * in the Software without restriction, including without limitation the rights
9fc01f7e7Sbellard  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10fc01f7e7Sbellard  * copies of the Software, and to permit persons to whom the Software is
11fc01f7e7Sbellard  * furnished to do so, subject to the following conditions:
12fc01f7e7Sbellard  *
13fc01f7e7Sbellard  * The above copyright notice and this permission notice shall be included in
14fc01f7e7Sbellard  * all copies or substantial portions of the Software.
15fc01f7e7Sbellard  *
16fc01f7e7Sbellard  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17fc01f7e7Sbellard  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18fc01f7e7Sbellard  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19fc01f7e7Sbellard  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20fc01f7e7Sbellard  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21fc01f7e7Sbellard  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22fc01f7e7Sbellard  * THE SOFTWARE.
23fc01f7e7Sbellard  */
24d38ea87aSPeter Maydell #include "qemu/osdep.h"
25faf07963Spbrook #include "qemu-common.h"
266d519a5fSStefan Hajnoczi #include "trace.h"
27737e150eSPaolo Bonzini #include "block/block_int.h"
28737e150eSPaolo Bonzini #include "block/blockjob.h"
29d49b6836SMarkus Armbruster #include "qemu/error-report.h"
301de7afc9SPaolo Bonzini #include "qemu/module.h"
31cc7a8ea7SMarkus Armbruster #include "qapi/qmp/qerror.h"
3291a097e7SKevin Wolf #include "qapi/qmp/qbool.h"
337b1b5d19SPaolo Bonzini #include "qapi/qmp/qjson.h"
34bfb197e0SMarkus Armbruster #include "sysemu/block-backend.h"
359c17d615SPaolo Bonzini #include "sysemu/sysemu.h"
361de7afc9SPaolo Bonzini #include "qemu/notify.h"
3710817bf0SDaniel P. Berrange #include "qemu/coroutine.h"
38c13163fbSBenoît Canet #include "block/qapi.h"
39b2023818SLuiz Capitulino #include "qmp-commands.h"
401de7afc9SPaolo Bonzini #include "qemu/timer.h"
41a5ee7bd4SWenchao Xia #include "qapi-event.h"
42db628338SAlberto Garcia #include "block/throttle-groups.h"
43fc01f7e7Sbellard 
4471e72a19SJuan Quintela #ifdef CONFIG_BSD
457674e7bfSbellard #include <sys/ioctl.h>
4672cf2d4fSBlue Swirl #include <sys/queue.h>
47c5e97233Sblueswir1 #ifndef __DragonFly__
487674e7bfSbellard #include <sys/disk.h>
497674e7bfSbellard #endif
50c5e97233Sblueswir1 #endif
517674e7bfSbellard 
5249dc768dSaliguori #ifdef _WIN32
5349dc768dSaliguori #include <windows.h>
5449dc768dSaliguori #endif
5549dc768dSaliguori 
561c9805a3SStefan Hajnoczi #define NOT_DONE 0x7fffffff /* used while emulated sync operation in progress */
571c9805a3SStefan Hajnoczi 
58c69a4dd8SMax Reitz struct BdrvStates bdrv_states = QTAILQ_HEAD_INITIALIZER(bdrv_states);
597ee930d0Sblueswir1 
60dc364f4cSBenoît Canet static QTAILQ_HEAD(, BlockDriverState) graph_bdrv_states =
61dc364f4cSBenoît Canet     QTAILQ_HEAD_INITIALIZER(graph_bdrv_states);
62dc364f4cSBenoît Canet 
632c1d04e0SMax Reitz static QTAILQ_HEAD(, BlockDriverState) all_bdrv_states =
642c1d04e0SMax Reitz     QTAILQ_HEAD_INITIALIZER(all_bdrv_states);
652c1d04e0SMax Reitz 
668a22f02aSStefan Hajnoczi static QLIST_HEAD(, BlockDriver) bdrv_drivers =
678a22f02aSStefan Hajnoczi     QLIST_HEAD_INITIALIZER(bdrv_drivers);
68ea2384d3Sbellard 
69f3930ed0SKevin Wolf static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
70f3930ed0SKevin Wolf                              const char *reference, QDict *options, int flags,
71f3930ed0SKevin Wolf                              BlockDriverState *parent,
72ce343771SMax Reitz                              const BdrvChildRole *child_role, Error **errp);
73f3930ed0SKevin Wolf 
74eb852011SMarkus Armbruster /* If non-zero, use only whitelisted block drivers */
75eb852011SMarkus Armbruster static int use_bdrv_whitelist;
76eb852011SMarkus Armbruster 
7764dff520SMax Reitz static void bdrv_close(BlockDriverState *bs);
7864dff520SMax Reitz 
799e0b22f4SStefan Hajnoczi #ifdef _WIN32
/*
 * Return 1 if @filename begins with an ASCII letter immediately followed
 * by a colon (for example "c:" or "D:\dir"), 0 otherwise.
 */
static int is_windows_drive_prefix(const char *filename)
{
    const char letter = filename[0];
    int is_lower = (letter >= 'a' && letter <= 'z');
    int is_upper = (letter >= 'A' && letter <= 'Z');

    if (!is_lower && !is_upper) {
        /* do not look at filename[1]: the string may be empty */
        return 0;
    }
    return filename[1] == ':';
}
869e0b22f4SStefan Hajnoczi 
/*
 * Return 1 if @filename is exactly a drive letter plus colon ("c:"), or
 * if it starts with one of the prefixes "\\.\" and "//./" (checked with
 * strstart()).  Return 0 otherwise.
 */
int is_windows_drive(const char *filename)
{
    if (is_windows_drive_prefix(filename) && filename[2] == '\0') {
        return 1;
    }
    if (strstart(filename, "\\\\.\\", NULL)) {
        return 1;
    }
    if (strstart(filename, "//./", NULL)) {
        return 1;
    }
    return 0;
}
979e0b22f4SStefan Hajnoczi #endif
989e0b22f4SStefan Hajnoczi 
99339064d5SKevin Wolf size_t bdrv_opt_mem_align(BlockDriverState *bs)
100339064d5SKevin Wolf {
101339064d5SKevin Wolf     if (!bs || !bs->drv) {
102459b4e66SDenis V. Lunev         /* page size or 4k (hdd sector size) should be on the safe side */
103459b4e66SDenis V. Lunev         return MAX(4096, getpagesize());
104339064d5SKevin Wolf     }
105339064d5SKevin Wolf 
106339064d5SKevin Wolf     return bs->bl.opt_mem_alignment;
107339064d5SKevin Wolf }
108339064d5SKevin Wolf 
1094196d2f0SDenis V. Lunev size_t bdrv_min_mem_align(BlockDriverState *bs)
1104196d2f0SDenis V. Lunev {
1114196d2f0SDenis V. Lunev     if (!bs || !bs->drv) {
112459b4e66SDenis V. Lunev         /* page size or 4k (hdd sector size) should be on the safe side */
113459b4e66SDenis V. Lunev         return MAX(4096, getpagesize());
1144196d2f0SDenis V. Lunev     }
1154196d2f0SDenis V. Lunev 
1164196d2f0SDenis V. Lunev     return bs->bl.min_mem_alignment;
1174196d2f0SDenis V. Lunev }
1184196d2f0SDenis V. Lunev 
/*
 * Check if the path starts with "<protocol>:".
 *
 * The answer is non-zero only when a ':' occurs before any '/' (and, on
 * Windows, before any backslash).  On Windows, anything accepted by
 * is_windows_drive() or is_windows_drive_prefix() is never a protocol.
 */
int path_has_protocol(const char *path)
{
#ifdef _WIN32
    static const char stop_chars[] = ":/\\";

    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 0;
    }
#else
    static const char stop_chars[] = ":/";
#endif

    /* strcspn() lands on the first stop character or on the final NUL */
    return path[strcspn(path, stop_chars)] == ':';
}
1369e0b22f4SStefan Hajnoczi 
/*
 * Return 1 if @path is absolute, 0 otherwise.
 *
 * A path is absolute when it starts with '/'.  On Windows a leading
 * backslash, a drive name and a drive-letter prefix count as well.
 */
int path_is_absolute(const char *path)
{
#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 1;
    }
    if (path[0] == '\\') {
        return 1;
    }
#endif
    return path[0] == '/';
}
14983f64091Sbellard 
/*
 * If @filename is absolute, just copy it to @dest.  Otherwise build a path
 * to it by treating it as relative to @base_path.  URLs are supported.
 *
 * The prefix kept from @base_path ends just after its last '/' (or, on
 * Windows, its last backslash if that comes later) or just after its first
 * ':', whichever lies further into the string.  At most @dest_size - 1
 * bytes of prefix are copied before @filename is appended with pstrcat().
 * Nothing is written when @dest_size <= 0.
 */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *colon, *sep;
    const char *after_colon, *after_sep, *prefix_end;
    int prefix_len;

    if (dest_size <= 0) {
        return;
    }
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    colon = strchr(base_path, ':');
    after_colon = colon ? colon + 1 : base_path;

    sep = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *backslash = strrchr(base_path, '\\');

        if (!sep || backslash > sep) {
            sep = backslash;
        }
    }
#endif
    after_sep = sep ? sep + 1 : base_path;

    /* keep everything up to whichever marker lies further into base_path */
    prefix_end = after_sep > after_colon ? after_sep : after_colon;
    prefix_len = prefix_end - base_path;
    if (prefix_len > dest_size - 1) {
        prefix_len = dest_size - 1;
    }
    memcpy(dest, base_path, prefix_len);
    dest[prefix_len] = '\0';
    pstrcat(dest, dest_size, filename);
}
19383f64091Sbellard 
1940a82855aSMax Reitz void bdrv_get_full_backing_filename_from_filename(const char *backed,
1950a82855aSMax Reitz                                                   const char *backing,
1969f07429eSMax Reitz                                                   char *dest, size_t sz,
1979f07429eSMax Reitz                                                   Error **errp)
1980a82855aSMax Reitz {
1999f07429eSMax Reitz     if (backing[0] == '\0' || path_has_protocol(backing) ||
2009f07429eSMax Reitz         path_is_absolute(backing))
2019f07429eSMax Reitz     {
2020a82855aSMax Reitz         pstrcpy(dest, sz, backing);
2039f07429eSMax Reitz     } else if (backed[0] == '\0' || strstart(backed, "json:", NULL)) {
2049f07429eSMax Reitz         error_setg(errp, "Cannot use relative backing file names for '%s'",
2059f07429eSMax Reitz                    backed);
2060a82855aSMax Reitz     } else {
2070a82855aSMax Reitz         path_combine(dest, sz, backed, backing);
2080a82855aSMax Reitz     }
2090a82855aSMax Reitz }
2100a82855aSMax Reitz 
2119f07429eSMax Reitz void bdrv_get_full_backing_filename(BlockDriverState *bs, char *dest, size_t sz,
2129f07429eSMax Reitz                                     Error **errp)
213dc5a1371SPaolo Bonzini {
2149f07429eSMax Reitz     char *backed = bs->exact_filename[0] ? bs->exact_filename : bs->filename;
2159f07429eSMax Reitz 
2169f07429eSMax Reitz     bdrv_get_full_backing_filename_from_filename(backed, bs->backing_file,
2179f07429eSMax Reitz                                                  dest, sz, errp);
218dc5a1371SPaolo Bonzini }
219dc5a1371SPaolo Bonzini 
2200eb7217eSStefan Hajnoczi void bdrv_register(BlockDriver *bdrv)
2210eb7217eSStefan Hajnoczi {
2220eb7217eSStefan Hajnoczi     bdrv_setup_io_funcs(bdrv);
223b2e12bc6SChristoph Hellwig 
2248a22f02aSStefan Hajnoczi     QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list);
225ea2384d3Sbellard }
226b338082bSbellard 
2277f06d47eSMarkus Armbruster BlockDriverState *bdrv_new_root(void)
228fc01f7e7Sbellard {
2297f06d47eSMarkus Armbruster     BlockDriverState *bs = bdrv_new();
230e4e9986bSMarkus Armbruster 
231e4e9986bSMarkus Armbruster     QTAILQ_INSERT_TAIL(&bdrv_states, bs, device_list);
232e4e9986bSMarkus Armbruster     return bs;
233e4e9986bSMarkus Armbruster }
234e4e9986bSMarkus Armbruster 
235e4e9986bSMarkus Armbruster BlockDriverState *bdrv_new(void)
236e4e9986bSMarkus Armbruster {
237e4e9986bSMarkus Armbruster     BlockDriverState *bs;
238e4e9986bSMarkus Armbruster     int i;
239e4e9986bSMarkus Armbruster 
2405839e53bSMarkus Armbruster     bs = g_new0(BlockDriverState, 1);
241e4654d2dSFam Zheng     QLIST_INIT(&bs->dirty_bitmaps);
242fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
243fbe40ff7SFam Zheng         QLIST_INIT(&bs->op_blockers[i]);
244fbe40ff7SFam Zheng     }
245d616b224SStefan Hajnoczi     notifier_with_return_list_init(&bs->before_write_notifiers);
246cc0681c4SBenoît Canet     qemu_co_queue_init(&bs->throttled_reqs[0]);
247cc0681c4SBenoît Canet     qemu_co_queue_init(&bs->throttled_reqs[1]);
2489fcb0251SFam Zheng     bs->refcnt = 1;
249dcd04228SStefan Hajnoczi     bs->aio_context = qemu_get_aio_context();
250d7d512f6SPaolo Bonzini 
2512c1d04e0SMax Reitz     QTAILQ_INSERT_TAIL(&all_bdrv_states, bs, bs_list);
2522c1d04e0SMax Reitz 
253b338082bSbellard     return bs;
254b338082bSbellard }
255b338082bSbellard 
256ea2384d3Sbellard BlockDriver *bdrv_find_format(const char *format_name)
257ea2384d3Sbellard {
258ea2384d3Sbellard     BlockDriver *drv1;
2598a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
2608a22f02aSStefan Hajnoczi         if (!strcmp(drv1->format_name, format_name)) {
261ea2384d3Sbellard             return drv1;
262ea2384d3Sbellard         }
2638a22f02aSStefan Hajnoczi     }
264ea2384d3Sbellard     return NULL;
265ea2384d3Sbellard }
266ea2384d3Sbellard 
267b64ec4e4SFam Zheng static int bdrv_is_whitelisted(BlockDriver *drv, bool read_only)
268eb852011SMarkus Armbruster {
269b64ec4e4SFam Zheng     static const char *whitelist_rw[] = {
270b64ec4e4SFam Zheng         CONFIG_BDRV_RW_WHITELIST
271b64ec4e4SFam Zheng     };
272b64ec4e4SFam Zheng     static const char *whitelist_ro[] = {
273b64ec4e4SFam Zheng         CONFIG_BDRV_RO_WHITELIST
274eb852011SMarkus Armbruster     };
275eb852011SMarkus Armbruster     const char **p;
276eb852011SMarkus Armbruster 
277b64ec4e4SFam Zheng     if (!whitelist_rw[0] && !whitelist_ro[0]) {
278eb852011SMarkus Armbruster         return 1;               /* no whitelist, anything goes */
279b64ec4e4SFam Zheng     }
280eb852011SMarkus Armbruster 
281b64ec4e4SFam Zheng     for (p = whitelist_rw; *p; p++) {
282eb852011SMarkus Armbruster         if (!strcmp(drv->format_name, *p)) {
283eb852011SMarkus Armbruster             return 1;
284eb852011SMarkus Armbruster         }
285eb852011SMarkus Armbruster     }
286b64ec4e4SFam Zheng     if (read_only) {
287b64ec4e4SFam Zheng         for (p = whitelist_ro; *p; p++) {
288b64ec4e4SFam Zheng             if (!strcmp(drv->format_name, *p)) {
289b64ec4e4SFam Zheng                 return 1;
290b64ec4e4SFam Zheng             }
291b64ec4e4SFam Zheng         }
292b64ec4e4SFam Zheng     }
293eb852011SMarkus Armbruster     return 0;
294eb852011SMarkus Armbruster }
295eb852011SMarkus Armbruster 
2965b7e1542SZhi Yong Wu typedef struct CreateCo {
2975b7e1542SZhi Yong Wu     BlockDriver *drv;
2985b7e1542SZhi Yong Wu     char *filename;
29983d0521aSChunyan Liu     QemuOpts *opts;
3005b7e1542SZhi Yong Wu     int ret;
301cc84d90fSMax Reitz     Error *err;
3025b7e1542SZhi Yong Wu } CreateCo;
3035b7e1542SZhi Yong Wu 
3045b7e1542SZhi Yong Wu static void coroutine_fn bdrv_create_co_entry(void *opaque)
3055b7e1542SZhi Yong Wu {
306cc84d90fSMax Reitz     Error *local_err = NULL;
307cc84d90fSMax Reitz     int ret;
308cc84d90fSMax Reitz 
3095b7e1542SZhi Yong Wu     CreateCo *cco = opaque;
3105b7e1542SZhi Yong Wu     assert(cco->drv);
3115b7e1542SZhi Yong Wu 
312c282e1fdSChunyan Liu     ret = cco->drv->bdrv_create(cco->filename, cco->opts, &local_err);
31384d18f06SMarkus Armbruster     if (local_err) {
314cc84d90fSMax Reitz         error_propagate(&cco->err, local_err);
315cc84d90fSMax Reitz     }
316cc84d90fSMax Reitz     cco->ret = ret;
3175b7e1542SZhi Yong Wu }
3185b7e1542SZhi Yong Wu 
3190e7e1989SKevin Wolf int bdrv_create(BlockDriver *drv, const char* filename,
32083d0521aSChunyan Liu                 QemuOpts *opts, Error **errp)
321ea2384d3Sbellard {
3225b7e1542SZhi Yong Wu     int ret;
3230e7e1989SKevin Wolf 
3245b7e1542SZhi Yong Wu     Coroutine *co;
3255b7e1542SZhi Yong Wu     CreateCo cco = {
3265b7e1542SZhi Yong Wu         .drv = drv,
3275b7e1542SZhi Yong Wu         .filename = g_strdup(filename),
32883d0521aSChunyan Liu         .opts = opts,
3295b7e1542SZhi Yong Wu         .ret = NOT_DONE,
330cc84d90fSMax Reitz         .err = NULL,
3315b7e1542SZhi Yong Wu     };
3325b7e1542SZhi Yong Wu 
333c282e1fdSChunyan Liu     if (!drv->bdrv_create) {
334cc84d90fSMax Reitz         error_setg(errp, "Driver '%s' does not support image creation", drv->format_name);
33580168bffSLuiz Capitulino         ret = -ENOTSUP;
33680168bffSLuiz Capitulino         goto out;
3375b7e1542SZhi Yong Wu     }
3385b7e1542SZhi Yong Wu 
3395b7e1542SZhi Yong Wu     if (qemu_in_coroutine()) {
3405b7e1542SZhi Yong Wu         /* Fast-path if already in coroutine context */
3415b7e1542SZhi Yong Wu         bdrv_create_co_entry(&cco);
3425b7e1542SZhi Yong Wu     } else {
3435b7e1542SZhi Yong Wu         co = qemu_coroutine_create(bdrv_create_co_entry);
3445b7e1542SZhi Yong Wu         qemu_coroutine_enter(co, &cco);
3455b7e1542SZhi Yong Wu         while (cco.ret == NOT_DONE) {
346b47ec2c4SPaolo Bonzini             aio_poll(qemu_get_aio_context(), true);
3475b7e1542SZhi Yong Wu         }
3485b7e1542SZhi Yong Wu     }
3495b7e1542SZhi Yong Wu 
3505b7e1542SZhi Yong Wu     ret = cco.ret;
351cc84d90fSMax Reitz     if (ret < 0) {
35284d18f06SMarkus Armbruster         if (cco.err) {
353cc84d90fSMax Reitz             error_propagate(errp, cco.err);
354cc84d90fSMax Reitz         } else {
355cc84d90fSMax Reitz             error_setg_errno(errp, -ret, "Could not create image");
356cc84d90fSMax Reitz         }
357cc84d90fSMax Reitz     }
3585b7e1542SZhi Yong Wu 
35980168bffSLuiz Capitulino out:
36080168bffSLuiz Capitulino     g_free(cco.filename);
3615b7e1542SZhi Yong Wu     return ret;
362ea2384d3Sbellard }
363ea2384d3Sbellard 
364c282e1fdSChunyan Liu int bdrv_create_file(const char *filename, QemuOpts *opts, Error **errp)
36584a12e66SChristoph Hellwig {
36684a12e66SChristoph Hellwig     BlockDriver *drv;
367cc84d90fSMax Reitz     Error *local_err = NULL;
368cc84d90fSMax Reitz     int ret;
36984a12e66SChristoph Hellwig 
370b65a5e12SMax Reitz     drv = bdrv_find_protocol(filename, true, errp);
37184a12e66SChristoph Hellwig     if (drv == NULL) {
37216905d71SStefan Hajnoczi         return -ENOENT;
37384a12e66SChristoph Hellwig     }
37484a12e66SChristoph Hellwig 
375c282e1fdSChunyan Liu     ret = bdrv_create(drv, filename, opts, &local_err);
37684d18f06SMarkus Armbruster     if (local_err) {
377cc84d90fSMax Reitz         error_propagate(errp, local_err);
378cc84d90fSMax Reitz     }
379cc84d90fSMax Reitz     return ret;
38084a12e66SChristoph Hellwig }
38184a12e66SChristoph Hellwig 
382892b7de8SEkaterina Tumanova /**
383892b7de8SEkaterina Tumanova  * Try to get @bs's logical and physical block size.
384892b7de8SEkaterina Tumanova  * On success, store them in @bsz struct and return 0.
385892b7de8SEkaterina Tumanova  * On failure return -errno.
386892b7de8SEkaterina Tumanova  * @bs must not be empty.
387892b7de8SEkaterina Tumanova  */
388892b7de8SEkaterina Tumanova int bdrv_probe_blocksizes(BlockDriverState *bs, BlockSizes *bsz)
389892b7de8SEkaterina Tumanova {
390892b7de8SEkaterina Tumanova     BlockDriver *drv = bs->drv;
391892b7de8SEkaterina Tumanova 
392892b7de8SEkaterina Tumanova     if (drv && drv->bdrv_probe_blocksizes) {
393892b7de8SEkaterina Tumanova         return drv->bdrv_probe_blocksizes(bs, bsz);
394892b7de8SEkaterina Tumanova     }
395892b7de8SEkaterina Tumanova 
396892b7de8SEkaterina Tumanova     return -ENOTSUP;
397892b7de8SEkaterina Tumanova }
398892b7de8SEkaterina Tumanova 
399892b7de8SEkaterina Tumanova /**
400892b7de8SEkaterina Tumanova  * Try to get @bs's geometry (cyls, heads, sectors).
401892b7de8SEkaterina Tumanova  * On success, store them in @geo struct and return 0.
402892b7de8SEkaterina Tumanova  * On failure return -errno.
403892b7de8SEkaterina Tumanova  * @bs must not be empty.
404892b7de8SEkaterina Tumanova  */
405892b7de8SEkaterina Tumanova int bdrv_probe_geometry(BlockDriverState *bs, HDGeometry *geo)
406892b7de8SEkaterina Tumanova {
407892b7de8SEkaterina Tumanova     BlockDriver *drv = bs->drv;
408892b7de8SEkaterina Tumanova 
409892b7de8SEkaterina Tumanova     if (drv && drv->bdrv_probe_geometry) {
410892b7de8SEkaterina Tumanova         return drv->bdrv_probe_geometry(bs, geo);
411892b7de8SEkaterina Tumanova     }
412892b7de8SEkaterina Tumanova 
413892b7de8SEkaterina Tumanova     return -ENOTSUP;
414892b7de8SEkaterina Tumanova }
415892b7de8SEkaterina Tumanova 
/*
 * Create a uniquely-named empty temporary file.
 * Return 0 upon success, otherwise a negative errno value.
 *
 * @filename receives the name of the created file; @size is the capacity
 * of that buffer in bytes.
 *
 * On non-Windows hosts the file is created as "vl.XXXXXX" (template filled
 * in by mkstemp()) inside $TMPDIR, or /var/tmp when TMPDIR is unset.
 * -EOVERFLOW is returned when the template does not fit into @size bytes.
 *
 * NOTE(review): the Windows branch returns the negated GetLastError()
 * value, which is not an errno code - confirm callers only test for < 0.
 */
int get_tmp_filename(char *filename, int size)
{
#ifdef _WIN32
    char temp_dir[MAX_PATH];
    /* GetTempFileName requires that its output buffer (4th param)
       have length MAX_PATH or greater.  */
    assert(size >= MAX_PATH);
    return (GetTempPath(MAX_PATH, temp_dir)
            && GetTempFileName(temp_dir, "qem", 0, filename)
            ? 0 : -GetLastError());
#else
    int fd;
    const char *tmpdir;
    tmpdir = getenv("TMPDIR");
    if (!tmpdir) {
        tmpdir = "/var/tmp";
    }
    if (snprintf(filename, size, "%s/vl.XXXXXX", tmpdir) >= size) {
        return -EOVERFLOW;
    }
    fd = mkstemp(filename);
    if (fd < 0) {
        return -errno;
    }
    if (close(fd) != 0) {
        /*
         * Remember why close() failed before cleaning up: unlink() may
         * itself fail and overwrite errno with an unrelated code.
         */
        int close_errno = errno;

        unlink(filename);
        return -close_errno;
    }
    return 0;
#endif
}
451ea2384d3Sbellard 
452f3a5d3f8SChristoph Hellwig /*
453f3a5d3f8SChristoph Hellwig  * Detect host devices. By convention, /dev/cdrom[N] is always
454f3a5d3f8SChristoph Hellwig  * recognized as a host CDROM.
455f3a5d3f8SChristoph Hellwig  */
456f3a5d3f8SChristoph Hellwig static BlockDriver *find_hdev_driver(const char *filename)
457f3a5d3f8SChristoph Hellwig {
458508c7cb3SChristoph Hellwig     int score_max = 0, score;
459508c7cb3SChristoph Hellwig     BlockDriver *drv = NULL, *d;
460f3a5d3f8SChristoph Hellwig 
4618a22f02aSStefan Hajnoczi     QLIST_FOREACH(d, &bdrv_drivers, list) {
462508c7cb3SChristoph Hellwig         if (d->bdrv_probe_device) {
463508c7cb3SChristoph Hellwig             score = d->bdrv_probe_device(filename);
464508c7cb3SChristoph Hellwig             if (score > score_max) {
465508c7cb3SChristoph Hellwig                 score_max = score;
466508c7cb3SChristoph Hellwig                 drv = d;
467f3a5d3f8SChristoph Hellwig             }
468508c7cb3SChristoph Hellwig         }
469f3a5d3f8SChristoph Hellwig     }
470f3a5d3f8SChristoph Hellwig 
471508c7cb3SChristoph Hellwig     return drv;
472f3a5d3f8SChristoph Hellwig }
473f3a5d3f8SChristoph Hellwig 
47498289620SKevin Wolf BlockDriver *bdrv_find_protocol(const char *filename,
475b65a5e12SMax Reitz                                 bool allow_protocol_prefix,
476b65a5e12SMax Reitz                                 Error **errp)
47784a12e66SChristoph Hellwig {
47884a12e66SChristoph Hellwig     BlockDriver *drv1;
47984a12e66SChristoph Hellwig     char protocol[128];
48084a12e66SChristoph Hellwig     int len;
48184a12e66SChristoph Hellwig     const char *p;
48284a12e66SChristoph Hellwig 
48366f82ceeSKevin Wolf     /* TODO Drivers without bdrv_file_open must be specified explicitly */
48466f82ceeSKevin Wolf 
48539508e7aSChristoph Hellwig     /*
48639508e7aSChristoph Hellwig      * XXX(hch): we really should not let host device detection
48739508e7aSChristoph Hellwig      * override an explicit protocol specification, but moving this
48839508e7aSChristoph Hellwig      * later breaks access to device names with colons in them.
48939508e7aSChristoph Hellwig      * Thanks to the brain-dead persistent naming schemes on udev-
49039508e7aSChristoph Hellwig      * based Linux systems those actually are quite common.
49139508e7aSChristoph Hellwig      */
49284a12e66SChristoph Hellwig     drv1 = find_hdev_driver(filename);
49339508e7aSChristoph Hellwig     if (drv1) {
49484a12e66SChristoph Hellwig         return drv1;
49584a12e66SChristoph Hellwig     }
49639508e7aSChristoph Hellwig 
49798289620SKevin Wolf     if (!path_has_protocol(filename) || !allow_protocol_prefix) {
498ef810437SMax Reitz         return &bdrv_file;
49939508e7aSChristoph Hellwig     }
50098289620SKevin Wolf 
5019e0b22f4SStefan Hajnoczi     p = strchr(filename, ':');
5029e0b22f4SStefan Hajnoczi     assert(p != NULL);
50384a12e66SChristoph Hellwig     len = p - filename;
50484a12e66SChristoph Hellwig     if (len > sizeof(protocol) - 1)
50584a12e66SChristoph Hellwig         len = sizeof(protocol) - 1;
50684a12e66SChristoph Hellwig     memcpy(protocol, filename, len);
50784a12e66SChristoph Hellwig     protocol[len] = '\0';
50884a12e66SChristoph Hellwig     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
50984a12e66SChristoph Hellwig         if (drv1->protocol_name &&
51084a12e66SChristoph Hellwig             !strcmp(drv1->protocol_name, protocol)) {
51184a12e66SChristoph Hellwig             return drv1;
51284a12e66SChristoph Hellwig         }
51384a12e66SChristoph Hellwig     }
514b65a5e12SMax Reitz 
515b65a5e12SMax Reitz     error_setg(errp, "Unknown protocol '%s'", protocol);
51684a12e66SChristoph Hellwig     return NULL;
51784a12e66SChristoph Hellwig }
51884a12e66SChristoph Hellwig 
519c6684249SMarkus Armbruster /*
520c6684249SMarkus Armbruster  * Guess image format by probing its contents.
521c6684249SMarkus Armbruster  * This is not a good idea when your image is raw (CVE-2008-2004), but
522c6684249SMarkus Armbruster  * we do it anyway for backward compatibility.
523c6684249SMarkus Armbruster  *
524c6684249SMarkus Armbruster  * @buf         contains the image's first @buf_size bytes.
5257cddd372SKevin Wolf  * @buf_size    is the buffer size in bytes (generally BLOCK_PROBE_BUF_SIZE,
5267cddd372SKevin Wolf  *              but can be smaller if the image file is smaller)
527c6684249SMarkus Armbruster  * @filename    is its filename.
528c6684249SMarkus Armbruster  *
529c6684249SMarkus Armbruster  * For all block drivers, call the bdrv_probe() method to get its
530c6684249SMarkus Armbruster  * probing score.
531c6684249SMarkus Armbruster  * Return the first block driver with the highest probing score.
532c6684249SMarkus Armbruster  */
53338f3ef57SKevin Wolf BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
534c6684249SMarkus Armbruster                             const char *filename)
535c6684249SMarkus Armbruster {
536c6684249SMarkus Armbruster     int score_max = 0, score;
537c6684249SMarkus Armbruster     BlockDriver *drv = NULL, *d;
538c6684249SMarkus Armbruster 
539c6684249SMarkus Armbruster     QLIST_FOREACH(d, &bdrv_drivers, list) {
540c6684249SMarkus Armbruster         if (d->bdrv_probe) {
541c6684249SMarkus Armbruster             score = d->bdrv_probe(buf, buf_size, filename);
542c6684249SMarkus Armbruster             if (score > score_max) {
543c6684249SMarkus Armbruster                 score_max = score;
544c6684249SMarkus Armbruster                 drv = d;
545c6684249SMarkus Armbruster             }
546c6684249SMarkus Armbruster         }
547c6684249SMarkus Armbruster     }
548c6684249SMarkus Armbruster 
549c6684249SMarkus Armbruster     return drv;
550c6684249SMarkus Armbruster }
551c6684249SMarkus Armbruster 
552f500a6d3SKevin Wolf static int find_image_format(BlockDriverState *bs, const char *filename,
55334b5d2c6SMax Reitz                              BlockDriver **pdrv, Error **errp)
554ea2384d3Sbellard {
555c6684249SMarkus Armbruster     BlockDriver *drv;
5567cddd372SKevin Wolf     uint8_t buf[BLOCK_PROBE_BUF_SIZE];
557f500a6d3SKevin Wolf     int ret = 0;
558f8ea0b00SNicholas Bellinger 
55908a00559SKevin Wolf     /* Return the raw BlockDriver * to scsi-generic devices or empty drives */
560b192af8aSDimitris Aragiorgis     if (bdrv_is_sg(bs) || !bdrv_is_inserted(bs) || bdrv_getlength(bs) == 0) {
561ef810437SMax Reitz         *pdrv = &bdrv_raw;
562c98ac35dSStefan Weil         return ret;
5631a396859SNicholas A. Bellinger     }
564f8ea0b00SNicholas Bellinger 
56583f64091Sbellard     ret = bdrv_pread(bs, 0, buf, sizeof(buf));
566ea2384d3Sbellard     if (ret < 0) {
56734b5d2c6SMax Reitz         error_setg_errno(errp, -ret, "Could not read image for determining its "
56834b5d2c6SMax Reitz                          "format");
569c98ac35dSStefan Weil         *pdrv = NULL;
570c98ac35dSStefan Weil         return ret;
571ea2384d3Sbellard     }
572ea2384d3Sbellard 
573c6684249SMarkus Armbruster     drv = bdrv_probe_all(buf, ret, filename);
574c98ac35dSStefan Weil     if (!drv) {
57534b5d2c6SMax Reitz         error_setg(errp, "Could not determine image format: No compatible "
57634b5d2c6SMax Reitz                    "driver found");
577c98ac35dSStefan Weil         ret = -ENOENT;
578c98ac35dSStefan Weil     }
579c98ac35dSStefan Weil     *pdrv = drv;
580c98ac35dSStefan Weil     return ret;
581ea2384d3Sbellard }
582ea2384d3Sbellard 
58351762288SStefan Hajnoczi /**
58451762288SStefan Hajnoczi  * Set the current 'total_sectors' value
58565a9bb25SMarkus Armbruster  * Return 0 on success, -errno on error.
58651762288SStefan Hajnoczi  */
58751762288SStefan Hajnoczi static int refresh_total_sectors(BlockDriverState *bs, int64_t hint)
58851762288SStefan Hajnoczi {
58951762288SStefan Hajnoczi     BlockDriver *drv = bs->drv;
59051762288SStefan Hajnoczi 
591396759adSNicholas Bellinger     /* Do not attempt drv->bdrv_getlength() on scsi-generic devices */
592b192af8aSDimitris Aragiorgis     if (bdrv_is_sg(bs))
593396759adSNicholas Bellinger         return 0;
594396759adSNicholas Bellinger 
59551762288SStefan Hajnoczi     /* query actual device if possible, otherwise just trust the hint */
59651762288SStefan Hajnoczi     if (drv->bdrv_getlength) {
59751762288SStefan Hajnoczi         int64_t length = drv->bdrv_getlength(bs);
59851762288SStefan Hajnoczi         if (length < 0) {
59951762288SStefan Hajnoczi             return length;
60051762288SStefan Hajnoczi         }
6017e382003SFam Zheng         hint = DIV_ROUND_UP(length, BDRV_SECTOR_SIZE);
60251762288SStefan Hajnoczi     }
60351762288SStefan Hajnoczi 
60451762288SStefan Hajnoczi     bs->total_sectors = hint;
60551762288SStefan Hajnoczi     return 0;
60651762288SStefan Hajnoczi }
60751762288SStefan Hajnoczi 
608c3993cdcSStefan Hajnoczi /**
609cddff5baSKevin Wolf  * Combines a QDict of new block driver @options with any missing options taken
610cddff5baSKevin Wolf  * from @old_options, so that leaving out an option defaults to its old value.
611cddff5baSKevin Wolf  */
612cddff5baSKevin Wolf static void bdrv_join_options(BlockDriverState *bs, QDict *options,
613cddff5baSKevin Wolf                               QDict *old_options)
614cddff5baSKevin Wolf {
615cddff5baSKevin Wolf     if (bs->drv && bs->drv->bdrv_join_options) {
616cddff5baSKevin Wolf         bs->drv->bdrv_join_options(options, old_options);
617cddff5baSKevin Wolf     } else {
618cddff5baSKevin Wolf         qdict_join(options, old_options, false);
619cddff5baSKevin Wolf     }
620cddff5baSKevin Wolf }
621cddff5baSKevin Wolf 
622cddff5baSKevin Wolf /**
6239e8f1835SPaolo Bonzini  * Set open flags for a given discard mode
6249e8f1835SPaolo Bonzini  *
6259e8f1835SPaolo Bonzini  * Return 0 on success, -1 if the discard mode was invalid.
6269e8f1835SPaolo Bonzini  */
6279e8f1835SPaolo Bonzini int bdrv_parse_discard_flags(const char *mode, int *flags)
6289e8f1835SPaolo Bonzini {
6299e8f1835SPaolo Bonzini     *flags &= ~BDRV_O_UNMAP;
6309e8f1835SPaolo Bonzini 
6319e8f1835SPaolo Bonzini     if (!strcmp(mode, "off") || !strcmp(mode, "ignore")) {
6329e8f1835SPaolo Bonzini         /* do nothing */
6339e8f1835SPaolo Bonzini     } else if (!strcmp(mode, "on") || !strcmp(mode, "unmap")) {
6349e8f1835SPaolo Bonzini         *flags |= BDRV_O_UNMAP;
6359e8f1835SPaolo Bonzini     } else {
6369e8f1835SPaolo Bonzini         return -1;
6379e8f1835SPaolo Bonzini     }
6389e8f1835SPaolo Bonzini 
6399e8f1835SPaolo Bonzini     return 0;
6409e8f1835SPaolo Bonzini }
6419e8f1835SPaolo Bonzini 
6429e8f1835SPaolo Bonzini /**
643c3993cdcSStefan Hajnoczi  * Set open flags for a given cache mode
644c3993cdcSStefan Hajnoczi  *
645c3993cdcSStefan Hajnoczi  * Return 0 on success, -1 if the cache mode was invalid.
646c3993cdcSStefan Hajnoczi  */
647c3993cdcSStefan Hajnoczi int bdrv_parse_cache_flags(const char *mode, int *flags)
648c3993cdcSStefan Hajnoczi {
649c3993cdcSStefan Hajnoczi     *flags &= ~BDRV_O_CACHE_MASK;
650c3993cdcSStefan Hajnoczi 
651c3993cdcSStefan Hajnoczi     if (!strcmp(mode, "off") || !strcmp(mode, "none")) {
652c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_NOCACHE | BDRV_O_CACHE_WB;
65392196b2fSStefan Hajnoczi     } else if (!strcmp(mode, "directsync")) {
65492196b2fSStefan Hajnoczi         *flags |= BDRV_O_NOCACHE;
655c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "writeback")) {
656c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_CACHE_WB;
657c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "unsafe")) {
658c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_CACHE_WB;
659c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_NO_FLUSH;
660c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "writethrough")) {
661c3993cdcSStefan Hajnoczi         /* this is the default */
662c3993cdcSStefan Hajnoczi     } else {
663c3993cdcSStefan Hajnoczi         return -1;
664c3993cdcSStefan Hajnoczi     }
665c3993cdcSStefan Hajnoczi 
666c3993cdcSStefan Hajnoczi     return 0;
667c3993cdcSStefan Hajnoczi }
668c3993cdcSStefan Hajnoczi 
6690b50cc88SKevin Wolf /*
67073176beeSKevin Wolf  * Returns the options and flags that a temporary snapshot should get, based on
67173176beeSKevin Wolf  * the originally requested flags (the originally requested image will have
67273176beeSKevin Wolf  * flags like a backing file)
673b1e6fc08SKevin Wolf  */
67473176beeSKevin Wolf static void bdrv_temp_snapshot_options(int *child_flags, QDict *child_options,
67573176beeSKevin Wolf                                        int parent_flags, QDict *parent_options)
676b1e6fc08SKevin Wolf {
67773176beeSKevin Wolf     *child_flags = (parent_flags & ~BDRV_O_SNAPSHOT) | BDRV_O_TEMPORARY;
67873176beeSKevin Wolf 
67973176beeSKevin Wolf     /* For temporary files, unconditional cache=unsafe is fine */
68073176beeSKevin Wolf     qdict_set_default_str(child_options, BDRV_OPT_CACHE_WB, "on");
68173176beeSKevin Wolf     qdict_set_default_str(child_options, BDRV_OPT_CACHE_DIRECT, "off");
68273176beeSKevin Wolf     qdict_set_default_str(child_options, BDRV_OPT_CACHE_NO_FLUSH, "on");
683b1e6fc08SKevin Wolf }
684b1e6fc08SKevin Wolf 
685b1e6fc08SKevin Wolf /*
6868e2160e2SKevin Wolf  * Returns the options and flags that bs->file should get if a protocol driver
6878e2160e2SKevin Wolf  * is expected, based on the given options and flags for the parent BDS
6880b50cc88SKevin Wolf  */
6898e2160e2SKevin Wolf static void bdrv_inherited_options(int *child_flags, QDict *child_options,
6908e2160e2SKevin Wolf                                    int parent_flags, QDict *parent_options)
6910b50cc88SKevin Wolf {
6928e2160e2SKevin Wolf     int flags = parent_flags;
6938e2160e2SKevin Wolf 
6940b50cc88SKevin Wolf     /* Enable protocol handling, disable format probing for bs->file */
6950b50cc88SKevin Wolf     flags |= BDRV_O_PROTOCOL;
6960b50cc88SKevin Wolf 
69791a097e7SKevin Wolf     /* If the cache mode isn't explicitly set, inherit direct and no-flush from
69891a097e7SKevin Wolf      * the parent. */
69991a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_DIRECT);
70091a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_NO_FLUSH);
70191a097e7SKevin Wolf 
7020b50cc88SKevin Wolf     /* Our block drivers take care to send flushes and respect unmap policy,
70391a097e7SKevin Wolf      * so we can default to enable both on lower layers regardless of the
70491a097e7SKevin Wolf      * corresponding parent options. */
70591a097e7SKevin Wolf     qdict_set_default_str(child_options, BDRV_OPT_CACHE_WB, "on");
70691a097e7SKevin Wolf     flags |= BDRV_O_UNMAP;
7070b50cc88SKevin Wolf 
7080b50cc88SKevin Wolf     /* Clear flags that only apply to the top layer */
7095669b44dSKevin Wolf     flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_COPY_ON_READ);
7100b50cc88SKevin Wolf 
7118e2160e2SKevin Wolf     *child_flags = flags;
7120b50cc88SKevin Wolf }
7130b50cc88SKevin Wolf 
714f3930ed0SKevin Wolf const BdrvChildRole child_file = {
7158e2160e2SKevin Wolf     .inherit_options = bdrv_inherited_options,
716f3930ed0SKevin Wolf };
717f3930ed0SKevin Wolf 
718f3930ed0SKevin Wolf /*
7198e2160e2SKevin Wolf  * Returns the options and flags that bs->file should get if the use of formats
7208e2160e2SKevin Wolf  * (and not only protocols) is permitted for it, based on the given options and
7218e2160e2SKevin Wolf  * flags for the parent BDS
722f3930ed0SKevin Wolf  */
7238e2160e2SKevin Wolf static void bdrv_inherited_fmt_options(int *child_flags, QDict *child_options,
7248e2160e2SKevin Wolf                                        int parent_flags, QDict *parent_options)
725f3930ed0SKevin Wolf {
7268e2160e2SKevin Wolf     child_file.inherit_options(child_flags, child_options,
7278e2160e2SKevin Wolf                                parent_flags, parent_options);
7288e2160e2SKevin Wolf 
7298e2160e2SKevin Wolf     *child_flags &= ~BDRV_O_PROTOCOL;
730f3930ed0SKevin Wolf }
731f3930ed0SKevin Wolf 
732f3930ed0SKevin Wolf const BdrvChildRole child_format = {
7338e2160e2SKevin Wolf     .inherit_options = bdrv_inherited_fmt_options,
734f3930ed0SKevin Wolf };
735f3930ed0SKevin Wolf 
736317fc44eSKevin Wolf /*
7378e2160e2SKevin Wolf  * Returns the options and flags that bs->backing should get, based on the
7388e2160e2SKevin Wolf  * given options and flags for the parent BDS
739317fc44eSKevin Wolf  */
7408e2160e2SKevin Wolf static void bdrv_backing_options(int *child_flags, QDict *child_options,
7418e2160e2SKevin Wolf                                  int parent_flags, QDict *parent_options)
742317fc44eSKevin Wolf {
7438e2160e2SKevin Wolf     int flags = parent_flags;
7448e2160e2SKevin Wolf 
74591a097e7SKevin Wolf     /* The cache mode is inherited unmodified for backing files */
74691a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_WB);
74791a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_DIRECT);
74891a097e7SKevin Wolf     qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_NO_FLUSH);
74991a097e7SKevin Wolf 
750317fc44eSKevin Wolf     /* backing files always opened read-only */
751317fc44eSKevin Wolf     flags &= ~(BDRV_O_RDWR | BDRV_O_COPY_ON_READ);
752317fc44eSKevin Wolf 
753317fc44eSKevin Wolf     /* snapshot=on is handled on the top layer */
7548bfea15dSKevin Wolf     flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_TEMPORARY);
755317fc44eSKevin Wolf 
7568e2160e2SKevin Wolf     *child_flags = flags;
757317fc44eSKevin Wolf }
758317fc44eSKevin Wolf 
759f3930ed0SKevin Wolf static const BdrvChildRole child_backing = {
7608e2160e2SKevin Wolf     .inherit_options = bdrv_backing_options,
761f3930ed0SKevin Wolf };
762f3930ed0SKevin Wolf 
7637b272452SKevin Wolf static int bdrv_open_flags(BlockDriverState *bs, int flags)
7647b272452SKevin Wolf {
7657b272452SKevin Wolf     int open_flags = flags | BDRV_O_CACHE_WB;
7667b272452SKevin Wolf 
7677b272452SKevin Wolf     /*
7687b272452SKevin Wolf      * Clear flags that are internal to the block layer before opening the
7697b272452SKevin Wolf      * image.
7707b272452SKevin Wolf      */
77120cca275SKevin Wolf     open_flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_PROTOCOL);
7727b272452SKevin Wolf 
7737b272452SKevin Wolf     /*
7747b272452SKevin Wolf      * Snapshots should be writable.
7757b272452SKevin Wolf      */
7768bfea15dSKevin Wolf     if (flags & BDRV_O_TEMPORARY) {
7777b272452SKevin Wolf         open_flags |= BDRV_O_RDWR;
7787b272452SKevin Wolf     }
7797b272452SKevin Wolf 
7807b272452SKevin Wolf     return open_flags;
7817b272452SKevin Wolf }
7827b272452SKevin Wolf 
78391a097e7SKevin Wolf static void update_flags_from_options(int *flags, QemuOpts *opts)
78491a097e7SKevin Wolf {
78591a097e7SKevin Wolf     *flags &= ~BDRV_O_CACHE_MASK;
78691a097e7SKevin Wolf 
78791a097e7SKevin Wolf     assert(qemu_opt_find(opts, BDRV_OPT_CACHE_WB));
78891a097e7SKevin Wolf     if (qemu_opt_get_bool(opts, BDRV_OPT_CACHE_WB, false)) {
78991a097e7SKevin Wolf         *flags |= BDRV_O_CACHE_WB;
79091a097e7SKevin Wolf     }
79191a097e7SKevin Wolf 
79291a097e7SKevin Wolf     assert(qemu_opt_find(opts, BDRV_OPT_CACHE_NO_FLUSH));
79391a097e7SKevin Wolf     if (qemu_opt_get_bool(opts, BDRV_OPT_CACHE_NO_FLUSH, false)) {
79491a097e7SKevin Wolf         *flags |= BDRV_O_NO_FLUSH;
79591a097e7SKevin Wolf     }
79691a097e7SKevin Wolf 
79791a097e7SKevin Wolf     assert(qemu_opt_find(opts, BDRV_OPT_CACHE_DIRECT));
79891a097e7SKevin Wolf     if (qemu_opt_get_bool(opts, BDRV_OPT_CACHE_DIRECT, false)) {
79991a097e7SKevin Wolf         *flags |= BDRV_O_NOCACHE;
80091a097e7SKevin Wolf     }
80191a097e7SKevin Wolf }
80291a097e7SKevin Wolf 
80391a097e7SKevin Wolf static void update_options_from_flags(QDict *options, int flags)
80491a097e7SKevin Wolf {
80591a097e7SKevin Wolf     if (!qdict_haskey(options, BDRV_OPT_CACHE_WB)) {
80691a097e7SKevin Wolf         qdict_put(options, BDRV_OPT_CACHE_WB,
80791a097e7SKevin Wolf                   qbool_from_bool(flags & BDRV_O_CACHE_WB));
80891a097e7SKevin Wolf     }
80991a097e7SKevin Wolf     if (!qdict_haskey(options, BDRV_OPT_CACHE_DIRECT)) {
81091a097e7SKevin Wolf         qdict_put(options, BDRV_OPT_CACHE_DIRECT,
81191a097e7SKevin Wolf                   qbool_from_bool(flags & BDRV_O_NOCACHE));
81291a097e7SKevin Wolf     }
81391a097e7SKevin Wolf     if (!qdict_haskey(options, BDRV_OPT_CACHE_NO_FLUSH)) {
81491a097e7SKevin Wolf         qdict_put(options, BDRV_OPT_CACHE_NO_FLUSH,
81591a097e7SKevin Wolf                   qbool_from_bool(flags & BDRV_O_NO_FLUSH));
81691a097e7SKevin Wolf     }
81791a097e7SKevin Wolf }
81891a097e7SKevin Wolf 
819636ea370SKevin Wolf static void bdrv_assign_node_name(BlockDriverState *bs,
8206913c0c2SBenoît Canet                                   const char *node_name,
8216913c0c2SBenoît Canet                                   Error **errp)
8226913c0c2SBenoît Canet {
82315489c76SJeff Cody     char *gen_node_name = NULL;
8246913c0c2SBenoît Canet 
82515489c76SJeff Cody     if (!node_name) {
82615489c76SJeff Cody         node_name = gen_node_name = id_generate(ID_BLOCK);
82715489c76SJeff Cody     } else if (!id_wellformed(node_name)) {
82815489c76SJeff Cody         /*
82915489c76SJeff Cody          * Check for empty string or invalid characters, but not if it is
83015489c76SJeff Cody          * generated (generated names use characters not available to the user)
83115489c76SJeff Cody          */
8329aebf3b8SKevin Wolf         error_setg(errp, "Invalid node name");
833636ea370SKevin Wolf         return;
8346913c0c2SBenoît Canet     }
8356913c0c2SBenoît Canet 
8360c5e94eeSBenoît Canet     /* takes care of avoiding namespaces collisions */
8377f06d47eSMarkus Armbruster     if (blk_by_name(node_name)) {
8380c5e94eeSBenoît Canet         error_setg(errp, "node-name=%s is conflicting with a device id",
8390c5e94eeSBenoît Canet                    node_name);
84015489c76SJeff Cody         goto out;
8410c5e94eeSBenoît Canet     }
8420c5e94eeSBenoît Canet 
8436913c0c2SBenoît Canet     /* takes care of avoiding duplicates node names */
8446913c0c2SBenoît Canet     if (bdrv_find_node(node_name)) {
8456913c0c2SBenoît Canet         error_setg(errp, "Duplicate node name");
84615489c76SJeff Cody         goto out;
8476913c0c2SBenoît Canet     }
8486913c0c2SBenoît Canet 
8496913c0c2SBenoît Canet     /* copy node name into the bs and insert it into the graph list */
8506913c0c2SBenoît Canet     pstrcpy(bs->node_name, sizeof(bs->node_name), node_name);
8516913c0c2SBenoît Canet     QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs, node_list);
85215489c76SJeff Cody out:
85315489c76SJeff Cody     g_free(gen_node_name);
8546913c0c2SBenoît Canet }
8556913c0c2SBenoît Canet 
85618edf289SKevin Wolf static QemuOptsList bdrv_runtime_opts = {
85718edf289SKevin Wolf     .name = "bdrv_common",
85818edf289SKevin Wolf     .head = QTAILQ_HEAD_INITIALIZER(bdrv_runtime_opts.head),
85918edf289SKevin Wolf     .desc = {
86018edf289SKevin Wolf         {
86118edf289SKevin Wolf             .name = "node-name",
86218edf289SKevin Wolf             .type = QEMU_OPT_STRING,
86318edf289SKevin Wolf             .help = "Node name of the block device node",
86418edf289SKevin Wolf         },
86562392ebbSKevin Wolf         {
86662392ebbSKevin Wolf             .name = "driver",
86762392ebbSKevin Wolf             .type = QEMU_OPT_STRING,
86862392ebbSKevin Wolf             .help = "Block driver to use for the node",
86962392ebbSKevin Wolf         },
87091a097e7SKevin Wolf         {
87191a097e7SKevin Wolf             .name = BDRV_OPT_CACHE_WB,
87291a097e7SKevin Wolf             .type = QEMU_OPT_BOOL,
87391a097e7SKevin Wolf             .help = "Enable writeback mode",
87491a097e7SKevin Wolf         },
87591a097e7SKevin Wolf         {
87691a097e7SKevin Wolf             .name = BDRV_OPT_CACHE_DIRECT,
87791a097e7SKevin Wolf             .type = QEMU_OPT_BOOL,
87891a097e7SKevin Wolf             .help = "Bypass software writeback cache on the host",
87991a097e7SKevin Wolf         },
88091a097e7SKevin Wolf         {
88191a097e7SKevin Wolf             .name = BDRV_OPT_CACHE_NO_FLUSH,
88291a097e7SKevin Wolf             .type = QEMU_OPT_BOOL,
88391a097e7SKevin Wolf             .help = "Ignore flush requests",
88491a097e7SKevin Wolf         },
88518edf289SKevin Wolf         { /* end of list */ }
88618edf289SKevin Wolf     },
88718edf289SKevin Wolf };
88818edf289SKevin Wolf 
889b6ce07aaSKevin Wolf /*
89057915332SKevin Wolf  * Common part for opening disk images and files
891b6ad491aSKevin Wolf  *
892b6ad491aSKevin Wolf  * Removes all processed options from *options.
89357915332SKevin Wolf  */
8949a4f4c31SKevin Wolf static int bdrv_open_common(BlockDriverState *bs, BdrvChild *file,
89582dc8b41SKevin Wolf                             QDict *options, Error **errp)
89657915332SKevin Wolf {
89757915332SKevin Wolf     int ret, open_flags;
898035fccdfSKevin Wolf     const char *filename;
89962392ebbSKevin Wolf     const char *driver_name = NULL;
9006913c0c2SBenoît Canet     const char *node_name = NULL;
90118edf289SKevin Wolf     QemuOpts *opts;
90262392ebbSKevin Wolf     BlockDriver *drv;
90334b5d2c6SMax Reitz     Error *local_err = NULL;
90457915332SKevin Wolf 
9056405875cSPaolo Bonzini     assert(bs->file == NULL);
906707ff828SKevin Wolf     assert(options != NULL && bs->options != options);
90757915332SKevin Wolf 
90862392ebbSKevin Wolf     opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
90962392ebbSKevin Wolf     qemu_opts_absorb_qdict(opts, options, &local_err);
91062392ebbSKevin Wolf     if (local_err) {
91162392ebbSKevin Wolf         error_propagate(errp, local_err);
91262392ebbSKevin Wolf         ret = -EINVAL;
91362392ebbSKevin Wolf         goto fail_opts;
91462392ebbSKevin Wolf     }
91562392ebbSKevin Wolf 
91662392ebbSKevin Wolf     driver_name = qemu_opt_get(opts, "driver");
91762392ebbSKevin Wolf     drv = bdrv_find_format(driver_name);
91862392ebbSKevin Wolf     assert(drv != NULL);
91962392ebbSKevin Wolf 
92045673671SKevin Wolf     if (file != NULL) {
9219a4f4c31SKevin Wolf         filename = file->bs->filename;
92245673671SKevin Wolf     } else {
92345673671SKevin Wolf         filename = qdict_get_try_str(options, "filename");
92445673671SKevin Wolf     }
92545673671SKevin Wolf 
926765003dbSKevin Wolf     if (drv->bdrv_needs_filename && !filename) {
927765003dbSKevin Wolf         error_setg(errp, "The '%s' block driver requires a file name",
928765003dbSKevin Wolf                    drv->format_name);
92918edf289SKevin Wolf         ret = -EINVAL;
93018edf289SKevin Wolf         goto fail_opts;
93118edf289SKevin Wolf     }
93218edf289SKevin Wolf 
93382dc8b41SKevin Wolf     trace_bdrv_open_common(bs, filename ?: "", bs->open_flags,
93482dc8b41SKevin Wolf                            drv->format_name);
93562392ebbSKevin Wolf 
93618edf289SKevin Wolf     node_name = qemu_opt_get(opts, "node-name");
937636ea370SKevin Wolf     bdrv_assign_node_name(bs, node_name, &local_err);
9380fb6395cSMarkus Armbruster     if (local_err) {
939636ea370SKevin Wolf         error_propagate(errp, local_err);
94018edf289SKevin Wolf         ret = -EINVAL;
94118edf289SKevin Wolf         goto fail_opts;
9425d186eb0SKevin Wolf     }
9435d186eb0SKevin Wolf 
944c25f53b0SPaolo Bonzini     bs->request_alignment = 512;
9450d51b4deSAsias He     bs->zero_beyond_eof = true;
94682dc8b41SKevin Wolf     bs->read_only = !(bs->open_flags & BDRV_O_RDWR);
947b64ec4e4SFam Zheng 
948b64ec4e4SFam Zheng     if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv, bs->read_only)) {
9498f94a6e4SKevin Wolf         error_setg(errp,
9508f94a6e4SKevin Wolf                    !bs->read_only && bdrv_is_whitelisted(drv, true)
9518f94a6e4SKevin Wolf                         ? "Driver '%s' can only be used for read-only devices"
9528f94a6e4SKevin Wolf                         : "Driver '%s' is not whitelisted",
9538f94a6e4SKevin Wolf                    drv->format_name);
95418edf289SKevin Wolf         ret = -ENOTSUP;
95518edf289SKevin Wolf         goto fail_opts;
956b64ec4e4SFam Zheng     }
95757915332SKevin Wolf 
95853fec9d3SStefan Hajnoczi     assert(bs->copy_on_read == 0); /* bdrv_new() and bdrv_close() make it so */
95982dc8b41SKevin Wolf     if (bs->open_flags & BDRV_O_COPY_ON_READ) {
9600ebd24e0SKevin Wolf         if (!bs->read_only) {
96153fec9d3SStefan Hajnoczi             bdrv_enable_copy_on_read(bs);
9620ebd24e0SKevin Wolf         } else {
9630ebd24e0SKevin Wolf             error_setg(errp, "Can't use copy-on-read on read-only device");
96418edf289SKevin Wolf             ret = -EINVAL;
96518edf289SKevin Wolf             goto fail_opts;
9660ebd24e0SKevin Wolf         }
96753fec9d3SStefan Hajnoczi     }
96853fec9d3SStefan Hajnoczi 
969c2ad1b0cSKevin Wolf     if (filename != NULL) {
97057915332SKevin Wolf         pstrcpy(bs->filename, sizeof(bs->filename), filename);
971c2ad1b0cSKevin Wolf     } else {
972c2ad1b0cSKevin Wolf         bs->filename[0] = '\0';
973c2ad1b0cSKevin Wolf     }
97491af7014SMax Reitz     pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), bs->filename);
97557915332SKevin Wolf 
97657915332SKevin Wolf     bs->drv = drv;
9777267c094SAnthony Liguori     bs->opaque = g_malloc0(drv->instance_size);
97857915332SKevin Wolf 
97991a097e7SKevin Wolf     /* Apply cache mode options */
98091a097e7SKevin Wolf     update_flags_from_options(&bs->open_flags, opts);
98191a097e7SKevin Wolf     bdrv_set_enable_write_cache(bs, bs->open_flags & BDRV_O_CACHE_WB);
982e7c63796SStefan Hajnoczi 
98366f82ceeSKevin Wolf     /* Open the image, either directly or using a protocol */
98482dc8b41SKevin Wolf     open_flags = bdrv_open_flags(bs, bs->open_flags);
98566f82ceeSKevin Wolf     if (drv->bdrv_file_open) {
9865d186eb0SKevin Wolf         assert(file == NULL);
987030be321SBenoît Canet         assert(!drv->bdrv_needs_filename || filename != NULL);
98834b5d2c6SMax Reitz         ret = drv->bdrv_file_open(bs, options, open_flags, &local_err);
989f500a6d3SKevin Wolf     } else {
9902af5ef70SKevin Wolf         if (file == NULL) {
99134b5d2c6SMax Reitz             error_setg(errp, "Can't use '%s' as a block driver for the "
99234b5d2c6SMax Reitz                        "protocol level", drv->format_name);
9932af5ef70SKevin Wolf             ret = -EINVAL;
9942af5ef70SKevin Wolf             goto free_and_fail;
9952af5ef70SKevin Wolf         }
996f500a6d3SKevin Wolf         bs->file = file;
99734b5d2c6SMax Reitz         ret = drv->bdrv_open(bs, options, open_flags, &local_err);
99866f82ceeSKevin Wolf     }
99966f82ceeSKevin Wolf 
100057915332SKevin Wolf     if (ret < 0) {
100184d18f06SMarkus Armbruster         if (local_err) {
100234b5d2c6SMax Reitz             error_propagate(errp, local_err);
10032fa9aa59SDunrong Huang         } else if (bs->filename[0]) {
10042fa9aa59SDunrong Huang             error_setg_errno(errp, -ret, "Could not open '%s'", bs->filename);
100534b5d2c6SMax Reitz         } else {
100634b5d2c6SMax Reitz             error_setg_errno(errp, -ret, "Could not open image");
100734b5d2c6SMax Reitz         }
100857915332SKevin Wolf         goto free_and_fail;
100957915332SKevin Wolf     }
101057915332SKevin Wolf 
1011a1f688f4SMarkus Armbruster     if (bs->encrypted) {
1012a1f688f4SMarkus Armbruster         error_report("Encrypted images are deprecated");
1013a1f688f4SMarkus Armbruster         error_printf("Support for them will be removed in a future release.\n"
1014a1f688f4SMarkus Armbruster                      "You can use 'qemu-img convert' to convert your image"
1015a1f688f4SMarkus Armbruster                      " to an unencrypted one.\n");
1016a1f688f4SMarkus Armbruster     }
1017a1f688f4SMarkus Armbruster 
101851762288SStefan Hajnoczi     ret = refresh_total_sectors(bs, bs->total_sectors);
101951762288SStefan Hajnoczi     if (ret < 0) {
102034b5d2c6SMax Reitz         error_setg_errno(errp, -ret, "Could not refresh total sector count");
102151762288SStefan Hajnoczi         goto free_and_fail;
102257915332SKevin Wolf     }
102351762288SStefan Hajnoczi 
10243baca891SKevin Wolf     bdrv_refresh_limits(bs, &local_err);
10253baca891SKevin Wolf     if (local_err) {
10263baca891SKevin Wolf         error_propagate(errp, local_err);
10273baca891SKevin Wolf         ret = -EINVAL;
10283baca891SKevin Wolf         goto free_and_fail;
10293baca891SKevin Wolf     }
10303baca891SKevin Wolf 
1031c25f53b0SPaolo Bonzini     assert(bdrv_opt_mem_align(bs) != 0);
10324196d2f0SDenis V. Lunev     assert(bdrv_min_mem_align(bs) != 0);
1033b192af8aSDimitris Aragiorgis     assert((bs->request_alignment != 0) || bdrv_is_sg(bs));
103418edf289SKevin Wolf 
103518edf289SKevin Wolf     qemu_opts_del(opts);
103657915332SKevin Wolf     return 0;
103757915332SKevin Wolf 
103857915332SKevin Wolf free_and_fail:
103966f82ceeSKevin Wolf     bs->file = NULL;
10407267c094SAnthony Liguori     g_free(bs->opaque);
104157915332SKevin Wolf     bs->opaque = NULL;
104257915332SKevin Wolf     bs->drv = NULL;
104318edf289SKevin Wolf fail_opts:
104418edf289SKevin Wolf     qemu_opts_del(opts);
104557915332SKevin Wolf     return ret;
104657915332SKevin Wolf }
104757915332SKevin Wolf 
10485e5c4f63SKevin Wolf static QDict *parse_json_filename(const char *filename, Error **errp)
10495e5c4f63SKevin Wolf {
10505e5c4f63SKevin Wolf     QObject *options_obj;
10515e5c4f63SKevin Wolf     QDict *options;
10525e5c4f63SKevin Wolf     int ret;
10535e5c4f63SKevin Wolf 
10545e5c4f63SKevin Wolf     ret = strstart(filename, "json:", &filename);
10555e5c4f63SKevin Wolf     assert(ret);
10565e5c4f63SKevin Wolf 
10575e5c4f63SKevin Wolf     options_obj = qobject_from_json(filename);
10585e5c4f63SKevin Wolf     if (!options_obj) {
10595e5c4f63SKevin Wolf         error_setg(errp, "Could not parse the JSON options");
10605e5c4f63SKevin Wolf         return NULL;
10615e5c4f63SKevin Wolf     }
10625e5c4f63SKevin Wolf 
10635e5c4f63SKevin Wolf     if (qobject_type(options_obj) != QTYPE_QDICT) {
10645e5c4f63SKevin Wolf         qobject_decref(options_obj);
10655e5c4f63SKevin Wolf         error_setg(errp, "Invalid JSON object given");
10665e5c4f63SKevin Wolf         return NULL;
10675e5c4f63SKevin Wolf     }
10685e5c4f63SKevin Wolf 
10695e5c4f63SKevin Wolf     options = qobject_to_qdict(options_obj);
10705e5c4f63SKevin Wolf     qdict_flatten(options);
10715e5c4f63SKevin Wolf 
10725e5c4f63SKevin Wolf     return options;
10735e5c4f63SKevin Wolf }
10745e5c4f63SKevin Wolf 
1075de3b53f0SKevin Wolf static void parse_json_protocol(QDict *options, const char **pfilename,
1076de3b53f0SKevin Wolf                                 Error **errp)
1077de3b53f0SKevin Wolf {
1078de3b53f0SKevin Wolf     QDict *json_options;
1079de3b53f0SKevin Wolf     Error *local_err = NULL;
1080de3b53f0SKevin Wolf 
1081de3b53f0SKevin Wolf     /* Parse json: pseudo-protocol */
1082de3b53f0SKevin Wolf     if (!*pfilename || !g_str_has_prefix(*pfilename, "json:")) {
1083de3b53f0SKevin Wolf         return;
1084de3b53f0SKevin Wolf     }
1085de3b53f0SKevin Wolf 
1086de3b53f0SKevin Wolf     json_options = parse_json_filename(*pfilename, &local_err);
1087de3b53f0SKevin Wolf     if (local_err) {
1088de3b53f0SKevin Wolf         error_propagate(errp, local_err);
1089de3b53f0SKevin Wolf         return;
1090de3b53f0SKevin Wolf     }
1091de3b53f0SKevin Wolf 
1092de3b53f0SKevin Wolf     /* Options given in the filename have lower priority than options
1093de3b53f0SKevin Wolf      * specified directly */
1094de3b53f0SKevin Wolf     qdict_join(options, json_options, false);
1095de3b53f0SKevin Wolf     QDECREF(json_options);
1096de3b53f0SKevin Wolf     *pfilename = NULL;
1097de3b53f0SKevin Wolf }
1098de3b53f0SKevin Wolf 
109957915332SKevin Wolf /*
1100f54120ffSKevin Wolf  * Fills in default options for opening images and converts the legacy
1101f54120ffSKevin Wolf  * filename/flags pair to option QDict entries.
110253a29513SMax Reitz  * The BDRV_O_PROTOCOL flag in *flags will be set or cleared accordingly if a
110353a29513SMax Reitz  * block driver has been specified explicitly.
1104f54120ffSKevin Wolf  */
1105de3b53f0SKevin Wolf static int bdrv_fill_options(QDict **options, const char *filename,
1106053e1578SMax Reitz                              int *flags, Error **errp)
1107f54120ffSKevin Wolf {
1108f54120ffSKevin Wolf     const char *drvname;
110953a29513SMax Reitz     bool protocol = *flags & BDRV_O_PROTOCOL;
1110f54120ffSKevin Wolf     bool parse_filename = false;
1111053e1578SMax Reitz     BlockDriver *drv = NULL;
1112f54120ffSKevin Wolf     Error *local_err = NULL;
1113f54120ffSKevin Wolf 
111453a29513SMax Reitz     drvname = qdict_get_try_str(*options, "driver");
1115053e1578SMax Reitz     if (drvname) {
1116053e1578SMax Reitz         drv = bdrv_find_format(drvname);
1117053e1578SMax Reitz         if (!drv) {
1118053e1578SMax Reitz             error_setg(errp, "Unknown driver '%s'", drvname);
1119053e1578SMax Reitz             return -ENOENT;
1120053e1578SMax Reitz         }
112153a29513SMax Reitz         /* If the user has explicitly specified the driver, this choice should
112253a29513SMax Reitz          * override the BDRV_O_PROTOCOL flag */
1123053e1578SMax Reitz         protocol = drv->bdrv_file_open;
112453a29513SMax Reitz     }
112553a29513SMax Reitz 
112653a29513SMax Reitz     if (protocol) {
112753a29513SMax Reitz         *flags |= BDRV_O_PROTOCOL;
112853a29513SMax Reitz     } else {
112953a29513SMax Reitz         *flags &= ~BDRV_O_PROTOCOL;
113053a29513SMax Reitz     }
113153a29513SMax Reitz 
113291a097e7SKevin Wolf     /* Translate cache options from flags into options */
113391a097e7SKevin Wolf     update_options_from_flags(*options, *flags);
113491a097e7SKevin Wolf 
1135f54120ffSKevin Wolf     /* Fetch the file name from the options QDict if necessary */
113617b005f1SKevin Wolf     if (protocol && filename) {
1137f54120ffSKevin Wolf         if (!qdict_haskey(*options, "filename")) {
1138f54120ffSKevin Wolf             qdict_put(*options, "filename", qstring_from_str(filename));
1139f54120ffSKevin Wolf             parse_filename = true;
1140f54120ffSKevin Wolf         } else {
1141f54120ffSKevin Wolf             error_setg(errp, "Can't specify 'file' and 'filename' options at "
1142f54120ffSKevin Wolf                              "the same time");
1143f54120ffSKevin Wolf             return -EINVAL;
1144f54120ffSKevin Wolf         }
1145f54120ffSKevin Wolf     }
1146f54120ffSKevin Wolf 
1147f54120ffSKevin Wolf     /* Find the right block driver */
1148f54120ffSKevin Wolf     filename = qdict_get_try_str(*options, "filename");
1149f54120ffSKevin Wolf 
115017b005f1SKevin Wolf     if (!drvname && protocol) {
1151f54120ffSKevin Wolf         if (filename) {
1152b65a5e12SMax Reitz             drv = bdrv_find_protocol(filename, parse_filename, errp);
1153f54120ffSKevin Wolf             if (!drv) {
1154f54120ffSKevin Wolf                 return -EINVAL;
1155f54120ffSKevin Wolf             }
1156f54120ffSKevin Wolf 
1157f54120ffSKevin Wolf             drvname = drv->format_name;
1158f54120ffSKevin Wolf             qdict_put(*options, "driver", qstring_from_str(drvname));
1159f54120ffSKevin Wolf         } else {
1160f54120ffSKevin Wolf             error_setg(errp, "Must specify either driver or file");
1161f54120ffSKevin Wolf             return -EINVAL;
1162f54120ffSKevin Wolf         }
116317b005f1SKevin Wolf     }
116417b005f1SKevin Wolf 
116517b005f1SKevin Wolf     assert(drv || !protocol);
1166f54120ffSKevin Wolf 
1167f54120ffSKevin Wolf     /* Driver-specific filename parsing */
116817b005f1SKevin Wolf     if (drv && drv->bdrv_parse_filename && parse_filename) {
1169f54120ffSKevin Wolf         drv->bdrv_parse_filename(filename, *options, &local_err);
1170f54120ffSKevin Wolf         if (local_err) {
1171f54120ffSKevin Wolf             error_propagate(errp, local_err);
1172f54120ffSKevin Wolf             return -EINVAL;
1173f54120ffSKevin Wolf         }
1174f54120ffSKevin Wolf 
1175f54120ffSKevin Wolf         if (!drv->bdrv_needs_filename) {
1176f54120ffSKevin Wolf             qdict_del(*options, "filename");
1177f54120ffSKevin Wolf         }
1178f54120ffSKevin Wolf     }
1179f54120ffSKevin Wolf 
1180f54120ffSKevin Wolf     return 0;
1181f54120ffSKevin Wolf }
1182f54120ffSKevin Wolf 
1183b4b059f6SKevin Wolf static BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
1184df581792SKevin Wolf                                     BlockDriverState *child_bs,
1185260fecf1SKevin Wolf                                     const char *child_name,
1186df581792SKevin Wolf                                     const BdrvChildRole *child_role)
1187df581792SKevin Wolf {
1188df581792SKevin Wolf     BdrvChild *child = g_new(BdrvChild, 1);
1189df581792SKevin Wolf     *child = (BdrvChild) {
1190df581792SKevin Wolf         .bs     = child_bs,
1191260fecf1SKevin Wolf         .name   = g_strdup(child_name),
1192df581792SKevin Wolf         .role   = child_role,
1193df581792SKevin Wolf     };
1194df581792SKevin Wolf 
1195df581792SKevin Wolf     QLIST_INSERT_HEAD(&parent_bs->children, child, next);
1196d42a8a93SKevin Wolf     QLIST_INSERT_HEAD(&child_bs->parents, child, next_parent);
1197b4b059f6SKevin Wolf 
1198b4b059f6SKevin Wolf     return child;
1199df581792SKevin Wolf }
1200df581792SKevin Wolf 
12013f09bfbcSKevin Wolf static void bdrv_detach_child(BdrvChild *child)
120233a60407SKevin Wolf {
120333a60407SKevin Wolf     QLIST_REMOVE(child, next);
1204d42a8a93SKevin Wolf     QLIST_REMOVE(child, next_parent);
1205260fecf1SKevin Wolf     g_free(child->name);
120633a60407SKevin Wolf     g_free(child);
120733a60407SKevin Wolf }
120833a60407SKevin Wolf 
120933a60407SKevin Wolf void bdrv_unref_child(BlockDriverState *parent, BdrvChild *child)
121033a60407SKevin Wolf {
1211779020cbSKevin Wolf     BlockDriverState *child_bs;
1212779020cbSKevin Wolf 
1213779020cbSKevin Wolf     if (child == NULL) {
1214779020cbSKevin Wolf         return;
1215779020cbSKevin Wolf     }
121633a60407SKevin Wolf 
121733a60407SKevin Wolf     if (child->bs->inherits_from == parent) {
121833a60407SKevin Wolf         child->bs->inherits_from = NULL;
121933a60407SKevin Wolf     }
122033a60407SKevin Wolf 
1221779020cbSKevin Wolf     child_bs = child->bs;
122233a60407SKevin Wolf     bdrv_detach_child(child);
122333a60407SKevin Wolf     bdrv_unref(child_bs);
122433a60407SKevin Wolf }
122533a60407SKevin Wolf 
12265db15a57SKevin Wolf /*
12275db15a57SKevin Wolf  * Sets the backing file link of a BDS. A new reference is created; callers
12285db15a57SKevin Wolf  * which don't need their own reference any more must call bdrv_unref().
12295db15a57SKevin Wolf  */
12308d24cce1SFam Zheng void bdrv_set_backing_hd(BlockDriverState *bs, BlockDriverState *backing_hd)
12318d24cce1SFam Zheng {
12325db15a57SKevin Wolf     if (backing_hd) {
12335db15a57SKevin Wolf         bdrv_ref(backing_hd);
12345db15a57SKevin Wolf     }
12358d24cce1SFam Zheng 
1236760e0063SKevin Wolf     if (bs->backing) {
1237826b6ca0SFam Zheng         assert(bs->backing_blocker);
1238760e0063SKevin Wolf         bdrv_op_unblock_all(bs->backing->bs, bs->backing_blocker);
12395db15a57SKevin Wolf         bdrv_unref_child(bs, bs->backing);
1240826b6ca0SFam Zheng     } else if (backing_hd) {
1241826b6ca0SFam Zheng         error_setg(&bs->backing_blocker,
124281e5f78aSAlberto Garcia                    "node is used as backing hd of '%s'",
124381e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(bs));
1244826b6ca0SFam Zheng     }
1245826b6ca0SFam Zheng 
12468d24cce1SFam Zheng     if (!backing_hd) {
1247826b6ca0SFam Zheng         error_free(bs->backing_blocker);
1248826b6ca0SFam Zheng         bs->backing_blocker = NULL;
1249760e0063SKevin Wolf         bs->backing = NULL;
12508d24cce1SFam Zheng         goto out;
12518d24cce1SFam Zheng     }
1252260fecf1SKevin Wolf     bs->backing = bdrv_attach_child(bs, backing_hd, "backing", &child_backing);
12538d24cce1SFam Zheng     bs->open_flags &= ~BDRV_O_NO_BACKING;
12548d24cce1SFam Zheng     pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_hd->filename);
12558d24cce1SFam Zheng     pstrcpy(bs->backing_format, sizeof(bs->backing_format),
12568d24cce1SFam Zheng             backing_hd->drv ? backing_hd->drv->format_name : "");
1257826b6ca0SFam Zheng 
1258760e0063SKevin Wolf     bdrv_op_block_all(backing_hd, bs->backing_blocker);
1259826b6ca0SFam Zheng     /* Otherwise we won't be able to commit due to check in bdrv_commit */
1260760e0063SKevin Wolf     bdrv_op_unblock(backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET,
1261826b6ca0SFam Zheng                     bs->backing_blocker);
12628d24cce1SFam Zheng out:
12633baca891SKevin Wolf     bdrv_refresh_limits(bs, NULL);
12648d24cce1SFam Zheng }
12658d24cce1SFam Zheng 
126631ca6d07SKevin Wolf /*
126731ca6d07SKevin Wolf  * Opens the backing file for a BlockDriverState if not yet open
126831ca6d07SKevin Wolf  *
1269d9b7b057SKevin Wolf  * bdref_key specifies the key for the image's BlockdevRef in the options QDict.
1270d9b7b057SKevin Wolf  * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1271d9b7b057SKevin Wolf  * itself, all options starting with "${bdref_key}." are considered part of the
1272d9b7b057SKevin Wolf  * BlockdevRef.
1273d9b7b057SKevin Wolf  *
1274d9b7b057SKevin Wolf  * TODO Can this be unified with bdrv_open_image()?
127531ca6d07SKevin Wolf  */
1276d9b7b057SKevin Wolf int bdrv_open_backing_file(BlockDriverState *bs, QDict *parent_options,
1277d9b7b057SKevin Wolf                            const char *bdref_key, Error **errp)
12789156df12SPaolo Bonzini {
12791ba4b6a5SBenoît Canet     char *backing_filename = g_malloc0(PATH_MAX);
1280d9b7b057SKevin Wolf     char *bdref_key_dot;
1281d9b7b057SKevin Wolf     const char *reference = NULL;
1282317fc44eSKevin Wolf     int ret = 0;
12838d24cce1SFam Zheng     BlockDriverState *backing_hd;
1284d9b7b057SKevin Wolf     QDict *options;
1285d9b7b057SKevin Wolf     QDict *tmp_parent_options = NULL;
128634b5d2c6SMax Reitz     Error *local_err = NULL;
12879156df12SPaolo Bonzini 
1288760e0063SKevin Wolf     if (bs->backing != NULL) {
12891ba4b6a5SBenoît Canet         goto free_exit;
12909156df12SPaolo Bonzini     }
12919156df12SPaolo Bonzini 
129231ca6d07SKevin Wolf     /* NULL means an empty set of options */
1293d9b7b057SKevin Wolf     if (parent_options == NULL) {
1294d9b7b057SKevin Wolf         tmp_parent_options = qdict_new();
1295d9b7b057SKevin Wolf         parent_options = tmp_parent_options;
129631ca6d07SKevin Wolf     }
129731ca6d07SKevin Wolf 
12989156df12SPaolo Bonzini     bs->open_flags &= ~BDRV_O_NO_BACKING;
1299d9b7b057SKevin Wolf 
1300d9b7b057SKevin Wolf     bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1301d9b7b057SKevin Wolf     qdict_extract_subqdict(parent_options, &options, bdref_key_dot);
1302d9b7b057SKevin Wolf     g_free(bdref_key_dot);
1303d9b7b057SKevin Wolf 
1304d9b7b057SKevin Wolf     reference = qdict_get_try_str(parent_options, bdref_key);
1305d9b7b057SKevin Wolf     if (reference || qdict_haskey(options, "file.filename")) {
13061cb6f506SKevin Wolf         backing_filename[0] = '\0';
13071cb6f506SKevin Wolf     } else if (bs->backing_file[0] == '\0' && qdict_size(options) == 0) {
130831ca6d07SKevin Wolf         QDECREF(options);
13091ba4b6a5SBenoît Canet         goto free_exit;
1310dbecebddSFam Zheng     } else {
13119f07429eSMax Reitz         bdrv_get_full_backing_filename(bs, backing_filename, PATH_MAX,
13129f07429eSMax Reitz                                        &local_err);
13139f07429eSMax Reitz         if (local_err) {
13149f07429eSMax Reitz             ret = -EINVAL;
13159f07429eSMax Reitz             error_propagate(errp, local_err);
13169f07429eSMax Reitz             QDECREF(options);
13179f07429eSMax Reitz             goto free_exit;
13189f07429eSMax Reitz         }
13199156df12SPaolo Bonzini     }
13209156df12SPaolo Bonzini 
13218ee79e70SKevin Wolf     if (!bs->drv || !bs->drv->supports_backing) {
13228ee79e70SKevin Wolf         ret = -EINVAL;
13238ee79e70SKevin Wolf         error_setg(errp, "Driver doesn't support backing files");
13248ee79e70SKevin Wolf         QDECREF(options);
13258ee79e70SKevin Wolf         goto free_exit;
13268ee79e70SKevin Wolf     }
13278ee79e70SKevin Wolf 
1328c5f6e493SKevin Wolf     if (bs->backing_format[0] != '\0' && !qdict_haskey(options, "driver")) {
1329c5f6e493SKevin Wolf         qdict_put(options, "driver", qstring_from_str(bs->backing_format));
13309156df12SPaolo Bonzini     }
13319156df12SPaolo Bonzini 
1332d9b7b057SKevin Wolf     backing_hd = NULL;
1333f3930ed0SKevin Wolf     ret = bdrv_open_inherit(&backing_hd,
1334f3930ed0SKevin Wolf                             *backing_filename ? backing_filename : NULL,
1335d9b7b057SKevin Wolf                             reference, options, 0, bs, &child_backing,
1336e43bfd9cSMarkus Armbruster                             errp);
13379156df12SPaolo Bonzini     if (ret < 0) {
13389156df12SPaolo Bonzini         bs->open_flags |= BDRV_O_NO_BACKING;
1339e43bfd9cSMarkus Armbruster         error_prepend(errp, "Could not open backing file: ");
13401ba4b6a5SBenoît Canet         goto free_exit;
13419156df12SPaolo Bonzini     }
1342df581792SKevin Wolf 
13435db15a57SKevin Wolf     /* Hook up the backing file link; drop our reference, bs owns the
13445db15a57SKevin Wolf      * backing_hd reference now */
13458d24cce1SFam Zheng     bdrv_set_backing_hd(bs, backing_hd);
13465db15a57SKevin Wolf     bdrv_unref(backing_hd);
1347d80ac658SPeter Feiner 
1348d9b7b057SKevin Wolf     qdict_del(parent_options, bdref_key);
1349d9b7b057SKevin Wolf 
13501ba4b6a5SBenoît Canet free_exit:
13511ba4b6a5SBenoît Canet     g_free(backing_filename);
1352d9b7b057SKevin Wolf     QDECREF(tmp_parent_options);
13531ba4b6a5SBenoît Canet     return ret;
13549156df12SPaolo Bonzini }
13559156df12SPaolo Bonzini 
1356b6ce07aaSKevin Wolf /*
1357da557aacSMax Reitz  * Opens a disk image whose options are given as BlockdevRef in another block
1358da557aacSMax Reitz  * device's options.
1359da557aacSMax Reitz  *
1360da557aacSMax Reitz  * If allow_none is true, no image will be opened if filename is false and no
1361b4b059f6SKevin Wolf  * BlockdevRef is given. NULL will be returned, but errp remains unset.
1362da557aacSMax Reitz  *
1363da557aacSMax Reitz  * bdrev_key specifies the key for the image's BlockdevRef in the options QDict.
1364da557aacSMax Reitz  * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1365da557aacSMax Reitz  * itself, all options starting with "${bdref_key}." are considered part of the
1366da557aacSMax Reitz  * BlockdevRef.
1367da557aacSMax Reitz  *
1368da557aacSMax Reitz  * The BlockdevRef will be removed from the options QDict.
1369da557aacSMax Reitz  */
1370b4b059f6SKevin Wolf BdrvChild *bdrv_open_child(const char *filename,
1371f3930ed0SKevin Wolf                            QDict *options, const char *bdref_key,
1372b4b059f6SKevin Wolf                            BlockDriverState* parent,
1373b4b059f6SKevin Wolf                            const BdrvChildRole *child_role,
1374f7d9fd8cSMax Reitz                            bool allow_none, Error **errp)
1375da557aacSMax Reitz {
1376b4b059f6SKevin Wolf     BdrvChild *c = NULL;
1377b4b059f6SKevin Wolf     BlockDriverState *bs;
1378da557aacSMax Reitz     QDict *image_options;
1379da557aacSMax Reitz     int ret;
1380da557aacSMax Reitz     char *bdref_key_dot;
1381da557aacSMax Reitz     const char *reference;
1382da557aacSMax Reitz 
1383df581792SKevin Wolf     assert(child_role != NULL);
1384f67503e5SMax Reitz 
1385da557aacSMax Reitz     bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1386da557aacSMax Reitz     qdict_extract_subqdict(options, &image_options, bdref_key_dot);
1387da557aacSMax Reitz     g_free(bdref_key_dot);
1388da557aacSMax Reitz 
1389da557aacSMax Reitz     reference = qdict_get_try_str(options, bdref_key);
1390da557aacSMax Reitz     if (!filename && !reference && !qdict_size(image_options)) {
1391b4b059f6SKevin Wolf         if (!allow_none) {
1392da557aacSMax Reitz             error_setg(errp, "A block device must be specified for \"%s\"",
1393da557aacSMax Reitz                        bdref_key);
1394da557aacSMax Reitz         }
1395b20e61e0SMarkus Armbruster         QDECREF(image_options);
1396da557aacSMax Reitz         goto done;
1397da557aacSMax Reitz     }
1398da557aacSMax Reitz 
1399b4b059f6SKevin Wolf     bs = NULL;
1400b4b059f6SKevin Wolf     ret = bdrv_open_inherit(&bs, filename, reference, image_options, 0,
1401ce343771SMax Reitz                             parent, child_role, errp);
1402df581792SKevin Wolf     if (ret < 0) {
1403df581792SKevin Wolf         goto done;
1404df581792SKevin Wolf     }
1405df581792SKevin Wolf 
1406260fecf1SKevin Wolf     c = bdrv_attach_child(parent, bs, bdref_key, child_role);
1407da557aacSMax Reitz 
1408da557aacSMax Reitz done:
1409da557aacSMax Reitz     qdict_del(options, bdref_key);
1410b4b059f6SKevin Wolf     return c;
1411b4b059f6SKevin Wolf }
1412b4b059f6SKevin Wolf 
141373176beeSKevin Wolf static int bdrv_append_temp_snapshot(BlockDriverState *bs, int flags,
141473176beeSKevin Wolf                                      QDict *snapshot_options, Error **errp)
1415b998875dSKevin Wolf {
1416b998875dSKevin Wolf     /* TODO: extra byte is a hack to ensure MAX_PATH space on Windows. */
14171ba4b6a5SBenoît Canet     char *tmp_filename = g_malloc0(PATH_MAX + 1);
1418b998875dSKevin Wolf     int64_t total_size;
141983d0521aSChunyan Liu     QemuOpts *opts = NULL;
1420b998875dSKevin Wolf     BlockDriverState *bs_snapshot;
1421c2e0dbbfSFam Zheng     Error *local_err = NULL;
1422b998875dSKevin Wolf     int ret;
1423b998875dSKevin Wolf 
1424b998875dSKevin Wolf     /* if snapshot, we create a temporary backing file and open it
1425b998875dSKevin Wolf        instead of opening 'filename' directly */
1426b998875dSKevin Wolf 
1427b998875dSKevin Wolf     /* Get the required size from the image */
1428f187743aSKevin Wolf     total_size = bdrv_getlength(bs);
1429f187743aSKevin Wolf     if (total_size < 0) {
14306b8aeca5SChen Gang         ret = total_size;
1431f187743aSKevin Wolf         error_setg_errno(errp, -total_size, "Could not get image size");
14321ba4b6a5SBenoît Canet         goto out;
1433f187743aSKevin Wolf     }
1434b998875dSKevin Wolf 
1435b998875dSKevin Wolf     /* Create the temporary image */
14361ba4b6a5SBenoît Canet     ret = get_tmp_filename(tmp_filename, PATH_MAX + 1);
1437b998875dSKevin Wolf     if (ret < 0) {
1438b998875dSKevin Wolf         error_setg_errno(errp, -ret, "Could not get temporary filename");
14391ba4b6a5SBenoît Canet         goto out;
1440b998875dSKevin Wolf     }
1441b998875dSKevin Wolf 
1442ef810437SMax Reitz     opts = qemu_opts_create(bdrv_qcow2.create_opts, NULL, 0,
1443c282e1fdSChunyan Liu                             &error_abort);
144439101f25SMarkus Armbruster     qemu_opt_set_number(opts, BLOCK_OPT_SIZE, total_size, &error_abort);
1445e43bfd9cSMarkus Armbruster     ret = bdrv_create(&bdrv_qcow2, tmp_filename, opts, errp);
144683d0521aSChunyan Liu     qemu_opts_del(opts);
1447b998875dSKevin Wolf     if (ret < 0) {
1448e43bfd9cSMarkus Armbruster         error_prepend(errp, "Could not create temporary overlay '%s': ",
1449e43bfd9cSMarkus Armbruster                       tmp_filename);
14501ba4b6a5SBenoît Canet         goto out;
1451b998875dSKevin Wolf     }
1452b998875dSKevin Wolf 
145373176beeSKevin Wolf     /* Prepare options QDict for the temporary file */
1454b998875dSKevin Wolf     qdict_put(snapshot_options, "file.driver",
1455b998875dSKevin Wolf               qstring_from_str("file"));
1456b998875dSKevin Wolf     qdict_put(snapshot_options, "file.filename",
1457b998875dSKevin Wolf               qstring_from_str(tmp_filename));
1458e6641719SMax Reitz     qdict_put(snapshot_options, "driver",
1459e6641719SMax Reitz               qstring_from_str("qcow2"));
1460b998875dSKevin Wolf 
1461e4e9986bSMarkus Armbruster     bs_snapshot = bdrv_new();
1462b998875dSKevin Wolf 
1463b998875dSKevin Wolf     ret = bdrv_open(&bs_snapshot, NULL, NULL, snapshot_options,
14646ebf9aa2SMax Reitz                     flags, &local_err);
146573176beeSKevin Wolf     snapshot_options = NULL;
1466b998875dSKevin Wolf     if (ret < 0) {
1467b998875dSKevin Wolf         error_propagate(errp, local_err);
14681ba4b6a5SBenoît Canet         goto out;
1469b998875dSKevin Wolf     }
1470b998875dSKevin Wolf 
1471b998875dSKevin Wolf     bdrv_append(bs_snapshot, bs);
14721ba4b6a5SBenoît Canet 
14731ba4b6a5SBenoît Canet out:
147473176beeSKevin Wolf     QDECREF(snapshot_options);
14751ba4b6a5SBenoît Canet     g_free(tmp_filename);
14766b8aeca5SChen Gang     return ret;
1477b998875dSKevin Wolf }
1478b998875dSKevin Wolf 
1479da557aacSMax Reitz /*
1480b6ce07aaSKevin Wolf  * Opens a disk image (raw, qcow2, vmdk, ...)
1481de9c0cecSKevin Wolf  *
1482de9c0cecSKevin Wolf  * options is a QDict of options to pass to the block drivers, or NULL for an
1483de9c0cecSKevin Wolf  * empty set of options. The reference to the QDict belongs to the block layer
1484de9c0cecSKevin Wolf  * after the call (even on failure), so if the caller intends to reuse the
1485de9c0cecSKevin Wolf  * dictionary, it needs to use QINCREF() before calling bdrv_open.
1486f67503e5SMax Reitz  *
1487f67503e5SMax Reitz  * If *pbs is NULL, a new BDS will be created with a pointer to it stored there.
1488f67503e5SMax Reitz  * If it is not NULL, the referenced BDS will be reused.
1489ddf5636dSMax Reitz  *
1490ddf5636dSMax Reitz  * The reference parameter may be used to specify an existing block device which
1491ddf5636dSMax Reitz  * should be opened. If specified, neither options nor a filename may be given,
1492ddf5636dSMax Reitz  * nor can an existing BDS be reused (that is, *pbs has to be NULL).
1493b6ce07aaSKevin Wolf  */
1494f3930ed0SKevin Wolf static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
1495ddf5636dSMax Reitz                              const char *reference, QDict *options, int flags,
1496f3930ed0SKevin Wolf                              BlockDriverState *parent,
1497ce343771SMax Reitz                              const BdrvChildRole *child_role, Error **errp)
1498ea2384d3Sbellard {
1499b6ce07aaSKevin Wolf     int ret;
15009a4f4c31SKevin Wolf     BdrvChild *file = NULL;
15019a4f4c31SKevin Wolf     BlockDriverState *bs;
1502ce343771SMax Reitz     BlockDriver *drv = NULL;
150374fe54f2SKevin Wolf     const char *drvname;
15043e8c2e57SAlberto Garcia     const char *backing;
150534b5d2c6SMax Reitz     Error *local_err = NULL;
150673176beeSKevin Wolf     QDict *snapshot_options = NULL;
1507b1e6fc08SKevin Wolf     int snapshot_flags = 0;
150833e3963eSbellard 
1509f67503e5SMax Reitz     assert(pbs);
1510f3930ed0SKevin Wolf     assert(!child_role || !flags);
1511f3930ed0SKevin Wolf     assert(!child_role == !parent);
1512f67503e5SMax Reitz 
1513ddf5636dSMax Reitz     if (reference) {
1514ddf5636dSMax Reitz         bool options_non_empty = options ? qdict_size(options) : false;
1515ddf5636dSMax Reitz         QDECREF(options);
1516ddf5636dSMax Reitz 
1517ddf5636dSMax Reitz         if (*pbs) {
1518ddf5636dSMax Reitz             error_setg(errp, "Cannot reuse an existing BDS when referencing "
1519ddf5636dSMax Reitz                        "another block device");
1520ddf5636dSMax Reitz             return -EINVAL;
1521ddf5636dSMax Reitz         }
1522ddf5636dSMax Reitz 
1523ddf5636dSMax Reitz         if (filename || options_non_empty) {
1524ddf5636dSMax Reitz             error_setg(errp, "Cannot reference an existing block device with "
1525ddf5636dSMax Reitz                        "additional options or a new filename");
1526ddf5636dSMax Reitz             return -EINVAL;
1527ddf5636dSMax Reitz         }
1528ddf5636dSMax Reitz 
1529ddf5636dSMax Reitz         bs = bdrv_lookup_bs(reference, reference, errp);
1530ddf5636dSMax Reitz         if (!bs) {
1531ddf5636dSMax Reitz             return -ENODEV;
1532ddf5636dSMax Reitz         }
1533ddf5636dSMax Reitz         bdrv_ref(bs);
1534ddf5636dSMax Reitz         *pbs = bs;
1535ddf5636dSMax Reitz         return 0;
1536ddf5636dSMax Reitz     }
1537ddf5636dSMax Reitz 
1538f67503e5SMax Reitz     if (*pbs) {
1539f67503e5SMax Reitz         bs = *pbs;
1540f67503e5SMax Reitz     } else {
1541e4e9986bSMarkus Armbruster         bs = bdrv_new();
1542f67503e5SMax Reitz     }
1543f67503e5SMax Reitz 
1544de9c0cecSKevin Wolf     /* NULL means an empty set of options */
1545de9c0cecSKevin Wolf     if (options == NULL) {
1546de9c0cecSKevin Wolf         options = qdict_new();
1547de9c0cecSKevin Wolf     }
1548de9c0cecSKevin Wolf 
1549145f598eSKevin Wolf     /* json: syntax counts as explicit options, as if in the QDict */
1550de3b53f0SKevin Wolf     parse_json_protocol(options, &filename, &local_err);
1551de3b53f0SKevin Wolf     if (local_err) {
1552de3b53f0SKevin Wolf         ret = -EINVAL;
1553de3b53f0SKevin Wolf         goto fail;
1554de3b53f0SKevin Wolf     }
1555de3b53f0SKevin Wolf 
1556145f598eSKevin Wolf     bs->explicit_options = qdict_clone_shallow(options);
1557145f598eSKevin Wolf 
1558f3930ed0SKevin Wolf     if (child_role) {
1559bddcec37SKevin Wolf         bs->inherits_from = parent;
15608e2160e2SKevin Wolf         child_role->inherit_options(&flags, options,
15618e2160e2SKevin Wolf                                     parent->open_flags, parent->options);
1562f3930ed0SKevin Wolf     }
1563f3930ed0SKevin Wolf 
1564de3b53f0SKevin Wolf     ret = bdrv_fill_options(&options, filename, &flags, &local_err);
1565462f5bcfSKevin Wolf     if (local_err) {
1566462f5bcfSKevin Wolf         goto fail;
1567462f5bcfSKevin Wolf     }
1568462f5bcfSKevin Wolf 
156962392ebbSKevin Wolf     bs->open_flags = flags;
157062392ebbSKevin Wolf     bs->options = options;
157162392ebbSKevin Wolf     options = qdict_clone_shallow(options);
157262392ebbSKevin Wolf 
157376c591b0SKevin Wolf     /* Find the right image format driver */
157476c591b0SKevin Wolf     drvname = qdict_get_try_str(options, "driver");
157576c591b0SKevin Wolf     if (drvname) {
157676c591b0SKevin Wolf         drv = bdrv_find_format(drvname);
157776c591b0SKevin Wolf         if (!drv) {
157876c591b0SKevin Wolf             error_setg(errp, "Unknown driver: '%s'", drvname);
157976c591b0SKevin Wolf             ret = -EINVAL;
158076c591b0SKevin Wolf             goto fail;
158176c591b0SKevin Wolf         }
158276c591b0SKevin Wolf     }
158376c591b0SKevin Wolf 
158476c591b0SKevin Wolf     assert(drvname || !(flags & BDRV_O_PROTOCOL));
158576c591b0SKevin Wolf 
15863e8c2e57SAlberto Garcia     backing = qdict_get_try_str(options, "backing");
15873e8c2e57SAlberto Garcia     if (backing && *backing == '\0') {
15883e8c2e57SAlberto Garcia         flags |= BDRV_O_NO_BACKING;
15893e8c2e57SAlberto Garcia         qdict_del(options, "backing");
15903e8c2e57SAlberto Garcia     }
15913e8c2e57SAlberto Garcia 
1592f500a6d3SKevin Wolf     /* Open image file without format layer */
1593f4788adcSKevin Wolf     if ((flags & BDRV_O_PROTOCOL) == 0) {
1594be028adcSJeff Cody         if (flags & BDRV_O_RDWR) {
1595be028adcSJeff Cody             flags |= BDRV_O_ALLOW_RDWR;
1596be028adcSJeff Cody         }
1597b1e6fc08SKevin Wolf         if (flags & BDRV_O_SNAPSHOT) {
159873176beeSKevin Wolf             snapshot_options = qdict_new();
159973176beeSKevin Wolf             bdrv_temp_snapshot_options(&snapshot_flags, snapshot_options,
160073176beeSKevin Wolf                                        flags, options);
16018e2160e2SKevin Wolf             bdrv_backing_options(&flags, options, flags, options);
1602b1e6fc08SKevin Wolf         }
1603be028adcSJeff Cody 
1604f3930ed0SKevin Wolf         bs->open_flags = flags;
16051fdd6933SKevin Wolf 
16069a4f4c31SKevin Wolf         file = bdrv_open_child(filename, options, "file", bs,
16071fdd6933SKevin Wolf                                &child_file, true, &local_err);
16081fdd6933SKevin Wolf         if (local_err) {
16091fdd6933SKevin Wolf             ret = -EINVAL;
16108bfea15dSKevin Wolf             goto fail;
1611f500a6d3SKevin Wolf         }
1612f4788adcSKevin Wolf     }
1613f500a6d3SKevin Wolf 
161476c591b0SKevin Wolf     /* Image format probing */
161538f3ef57SKevin Wolf     bs->probed = !drv;
161676c591b0SKevin Wolf     if (!drv && file) {
16179a4f4c31SKevin Wolf         ret = find_image_format(file->bs, filename, &drv, &local_err);
161817b005f1SKevin Wolf         if (ret < 0) {
161917b005f1SKevin Wolf             goto fail;
162017b005f1SKevin Wolf         }
162162392ebbSKevin Wolf         /*
162262392ebbSKevin Wolf          * This option update would logically belong in bdrv_fill_options(),
162362392ebbSKevin Wolf          * but we first need to open bs->file for the probing to work, while
162462392ebbSKevin Wolf          * opening bs->file already requires the (mostly) final set of options
162562392ebbSKevin Wolf          * so that cache mode etc. can be inherited.
162662392ebbSKevin Wolf          *
162762392ebbSKevin Wolf          * Adding the driver later is somewhat ugly, but it's not an option
162862392ebbSKevin Wolf          * that would ever be inherited, so it's correct. We just need to make
162962392ebbSKevin Wolf          * sure to update both bs->options (which has the full effective
163062392ebbSKevin Wolf          * options for bs) and options (which has file.* already removed).
163162392ebbSKevin Wolf          */
163262392ebbSKevin Wolf         qdict_put(bs->options, "driver", qstring_from_str(drv->format_name));
163362392ebbSKevin Wolf         qdict_put(options, "driver", qstring_from_str(drv->format_name));
163476c591b0SKevin Wolf     } else if (!drv) {
16352a05cbe4SMax Reitz         error_setg(errp, "Must specify either driver or file");
16362a05cbe4SMax Reitz         ret = -EINVAL;
16378bfea15dSKevin Wolf         goto fail;
16382a05cbe4SMax Reitz     }
1639f500a6d3SKevin Wolf 
164053a29513SMax Reitz     /* BDRV_O_PROTOCOL must be set iff a protocol BDS is about to be created */
164153a29513SMax Reitz     assert(!!(flags & BDRV_O_PROTOCOL) == !!drv->bdrv_file_open);
164253a29513SMax Reitz     /* file must be NULL if a protocol BDS is about to be created
164353a29513SMax Reitz      * (the inverse results in an error message from bdrv_open_common()) */
164453a29513SMax Reitz     assert(!(flags & BDRV_O_PROTOCOL) || !file);
164553a29513SMax Reitz 
1646b6ce07aaSKevin Wolf     /* Open the image */
164782dc8b41SKevin Wolf     ret = bdrv_open_common(bs, file, options, &local_err);
1648b6ce07aaSKevin Wolf     if (ret < 0) {
16498bfea15dSKevin Wolf         goto fail;
16506987307cSChristoph Hellwig     }
16516987307cSChristoph Hellwig 
16522a05cbe4SMax Reitz     if (file && (bs->file != file)) {
16539a4f4c31SKevin Wolf         bdrv_unref_child(bs, file);
1654f500a6d3SKevin Wolf         file = NULL;
1655f500a6d3SKevin Wolf     }
1656f500a6d3SKevin Wolf 
1657b6ce07aaSKevin Wolf     /* If there is a backing file, use it */
16589156df12SPaolo Bonzini     if ((flags & BDRV_O_NO_BACKING) == 0) {
1659d9b7b057SKevin Wolf         ret = bdrv_open_backing_file(bs, options, "backing", &local_err);
1660b6ce07aaSKevin Wolf         if (ret < 0) {
1661b6ad491aSKevin Wolf             goto close_and_fail;
1662b6ce07aaSKevin Wolf         }
1663b6ce07aaSKevin Wolf     }
1664b6ce07aaSKevin Wolf 
166591af7014SMax Reitz     bdrv_refresh_filename(bs);
166691af7014SMax Reitz 
1667b6ad491aSKevin Wolf     /* Check if any unknown options were used */
16685acd9d81SMax Reitz     if (options && (qdict_size(options) != 0)) {
1669b6ad491aSKevin Wolf         const QDictEntry *entry = qdict_first(options);
16705acd9d81SMax Reitz         if (flags & BDRV_O_PROTOCOL) {
16715acd9d81SMax Reitz             error_setg(errp, "Block protocol '%s' doesn't support the option "
16725acd9d81SMax Reitz                        "'%s'", drv->format_name, entry->key);
16735acd9d81SMax Reitz         } else {
1674*d0e46a55SMax Reitz             error_setg(errp,
1675*d0e46a55SMax Reitz                        "Block format '%s' does not support the option '%s'",
1676*d0e46a55SMax Reitz                        drv->format_name, entry->key);
16775acd9d81SMax Reitz         }
1678b6ad491aSKevin Wolf 
1679b6ad491aSKevin Wolf         ret = -EINVAL;
1680b6ad491aSKevin Wolf         goto close_and_fail;
1681b6ad491aSKevin Wolf     }
1682b6ad491aSKevin Wolf 
1683b6ce07aaSKevin Wolf     if (!bdrv_key_required(bs)) {
1684a7f53e26SMarkus Armbruster         if (bs->blk) {
1685a7f53e26SMarkus Armbruster             blk_dev_change_media_cb(bs->blk, true);
1686a7f53e26SMarkus Armbruster         }
1687c3adb58fSMarkus Armbruster     } else if (!runstate_check(RUN_STATE_PRELAUNCH)
1688c3adb58fSMarkus Armbruster                && !runstate_check(RUN_STATE_INMIGRATE)
1689c3adb58fSMarkus Armbruster                && !runstate_check(RUN_STATE_PAUSED)) { /* HACK */
1690c3adb58fSMarkus Armbruster         error_setg(errp,
1691c3adb58fSMarkus Armbruster                    "Guest must be stopped for opening of encrypted image");
1692c3adb58fSMarkus Armbruster         ret = -EBUSY;
1693c3adb58fSMarkus Armbruster         goto close_and_fail;
1694b6ce07aaSKevin Wolf     }
1695b6ce07aaSKevin Wolf 
1696c3adb58fSMarkus Armbruster     QDECREF(options);
1697f67503e5SMax Reitz     *pbs = bs;
1698dd62f1caSKevin Wolf 
1699dd62f1caSKevin Wolf     /* For snapshot=on, create a temporary qcow2 overlay. bs points to the
1700dd62f1caSKevin Wolf      * temporary snapshot afterwards. */
1701dd62f1caSKevin Wolf     if (snapshot_flags) {
170273176beeSKevin Wolf         ret = bdrv_append_temp_snapshot(bs, snapshot_flags, snapshot_options,
170373176beeSKevin Wolf                                         &local_err);
170473176beeSKevin Wolf         snapshot_options = NULL;
1705dd62f1caSKevin Wolf         if (local_err) {
1706dd62f1caSKevin Wolf             goto close_and_fail;
1707dd62f1caSKevin Wolf         }
1708dd62f1caSKevin Wolf     }
1709dd62f1caSKevin Wolf 
1710b6ce07aaSKevin Wolf     return 0;
1711b6ce07aaSKevin Wolf 
17128bfea15dSKevin Wolf fail:
1713f500a6d3SKevin Wolf     if (file != NULL) {
17149a4f4c31SKevin Wolf         bdrv_unref_child(bs, file);
1715f500a6d3SKevin Wolf     }
171673176beeSKevin Wolf     QDECREF(snapshot_options);
1717145f598eSKevin Wolf     QDECREF(bs->explicit_options);
1718de9c0cecSKevin Wolf     QDECREF(bs->options);
1719b6ad491aSKevin Wolf     QDECREF(options);
1720de9c0cecSKevin Wolf     bs->options = NULL;
1721f67503e5SMax Reitz     if (!*pbs) {
1722f67503e5SMax Reitz         /* If *pbs is NULL, a new BDS has been created in this function and
1723f67503e5SMax Reitz            needs to be freed now. Otherwise, it does not need to be closed,
1724f67503e5SMax Reitz            since it has not really been opened yet. */
1725f67503e5SMax Reitz         bdrv_unref(bs);
1726f67503e5SMax Reitz     }
172784d18f06SMarkus Armbruster     if (local_err) {
172834b5d2c6SMax Reitz         error_propagate(errp, local_err);
172934b5d2c6SMax Reitz     }
1730b6ad491aSKevin Wolf     return ret;
1731de9c0cecSKevin Wolf 
1732b6ad491aSKevin Wolf close_and_fail:
1733f67503e5SMax Reitz     /* See fail path, but now the BDS has to be always closed */
1734f67503e5SMax Reitz     if (*pbs) {
1735b6ad491aSKevin Wolf         bdrv_close(bs);
1736f67503e5SMax Reitz     } else {
1737f67503e5SMax Reitz         bdrv_unref(bs);
1738f67503e5SMax Reitz     }
173973176beeSKevin Wolf     QDECREF(snapshot_options);
1740b6ad491aSKevin Wolf     QDECREF(options);
174184d18f06SMarkus Armbruster     if (local_err) {
174234b5d2c6SMax Reitz         error_propagate(errp, local_err);
174334b5d2c6SMax Reitz     }
1744b6ce07aaSKevin Wolf     return ret;
1745b6ce07aaSKevin Wolf }
1746b6ce07aaSKevin Wolf 
1747f3930ed0SKevin Wolf int bdrv_open(BlockDriverState **pbs, const char *filename,
17486ebf9aa2SMax Reitz               const char *reference, QDict *options, int flags, Error **errp)
1749f3930ed0SKevin Wolf {
1750f3930ed0SKevin Wolf     return bdrv_open_inherit(pbs, filename, reference, options, flags, NULL,
1751ce343771SMax Reitz                              NULL, errp);
1752f3930ed0SKevin Wolf }
1753f3930ed0SKevin Wolf 
1754e971aa12SJeff Cody typedef struct BlockReopenQueueEntry {
1755e971aa12SJeff Cody      bool prepared;
1756e971aa12SJeff Cody      BDRVReopenState state;
1757e971aa12SJeff Cody      QSIMPLEQ_ENTRY(BlockReopenQueueEntry) entry;
1758e971aa12SJeff Cody } BlockReopenQueueEntry;
1759e971aa12SJeff Cody 
1760e971aa12SJeff Cody /*
1761e971aa12SJeff Cody  * Adds a BlockDriverState to a simple queue for an atomic, transactional
1762e971aa12SJeff Cody  * reopen of multiple devices.
1763e971aa12SJeff Cody  *
 * bs_queue can either be an existing BlockReopenQueue that has had
 * QSIMPLEQ_INIT already performed, or alternatively may be NULL, in which
 * case a new BlockReopenQueue will be created and initialized. This newly
 * created BlockReopenQueue should be passed back in for subsequent calls that
 * are intended to be of the same atomic 'set'.
1769e971aa12SJeff Cody  *
1770e971aa12SJeff Cody  * bs is the BlockDriverState to add to the reopen queue.
1771e971aa12SJeff Cody  *
17724d2cb092SKevin Wolf  * options contains the changed options for the associated bs
17734d2cb092SKevin Wolf  * (the BlockReopenQueue takes ownership)
17744d2cb092SKevin Wolf  *
1775e971aa12SJeff Cody  * flags contains the open flags for the associated bs
1776e971aa12SJeff Cody  *
1777e971aa12SJeff Cody  * returns a pointer to bs_queue, which is either the newly allocated
1778e971aa12SJeff Cody  * bs_queue, or the existing bs_queue being used.
1779e971aa12SJeff Cody  *
1780e971aa12SJeff Cody  */
178128518102SKevin Wolf static BlockReopenQueue *bdrv_reopen_queue_child(BlockReopenQueue *bs_queue,
17824d2cb092SKevin Wolf                                                  BlockDriverState *bs,
178328518102SKevin Wolf                                                  QDict *options,
178428518102SKevin Wolf                                                  int flags,
178528518102SKevin Wolf                                                  const BdrvChildRole *role,
178628518102SKevin Wolf                                                  QDict *parent_options,
178728518102SKevin Wolf                                                  int parent_flags)
1788e971aa12SJeff Cody {
1789e971aa12SJeff Cody     assert(bs != NULL);
1790e971aa12SJeff Cody 
1791e971aa12SJeff Cody     BlockReopenQueueEntry *bs_entry;
179267251a31SKevin Wolf     BdrvChild *child;
1793145f598eSKevin Wolf     QDict *old_options, *explicit_options;
179467251a31SKevin Wolf 
1795e971aa12SJeff Cody     if (bs_queue == NULL) {
1796e971aa12SJeff Cody         bs_queue = g_new0(BlockReopenQueue, 1);
1797e971aa12SJeff Cody         QSIMPLEQ_INIT(bs_queue);
1798e971aa12SJeff Cody     }
1799e971aa12SJeff Cody 
18004d2cb092SKevin Wolf     if (!options) {
18014d2cb092SKevin Wolf         options = qdict_new();
18024d2cb092SKevin Wolf     }
18034d2cb092SKevin Wolf 
180428518102SKevin Wolf     /*
180528518102SKevin Wolf      * Precedence of options:
180628518102SKevin Wolf      * 1. Explicitly passed in options (highest)
180791a097e7SKevin Wolf      * 2. Set in flags (only for top level)
1808145f598eSKevin Wolf      * 3. Retained from explicitly set options of bs
18098e2160e2SKevin Wolf      * 4. Inherited from parent node
181028518102SKevin Wolf      * 5. Retained from effective options of bs
181128518102SKevin Wolf      */
181228518102SKevin Wolf 
181391a097e7SKevin Wolf     if (!parent_options) {
181491a097e7SKevin Wolf         /*
181591a097e7SKevin Wolf          * Any setting represented by flags is always updated. If the
181691a097e7SKevin Wolf          * corresponding QDict option is set, it takes precedence. Otherwise
181791a097e7SKevin Wolf          * the flag is translated into a QDict option. The old setting of bs is
181891a097e7SKevin Wolf          * not considered.
181991a097e7SKevin Wolf          */
182091a097e7SKevin Wolf         update_options_from_flags(options, flags);
182191a097e7SKevin Wolf     }
182291a097e7SKevin Wolf 
1823145f598eSKevin Wolf     /* Old explicitly set values (don't overwrite by inherited value) */
1824145f598eSKevin Wolf     old_options = qdict_clone_shallow(bs->explicit_options);
1825145f598eSKevin Wolf     bdrv_join_options(bs, options, old_options);
1826145f598eSKevin Wolf     QDECREF(old_options);
1827145f598eSKevin Wolf 
1828145f598eSKevin Wolf     explicit_options = qdict_clone_shallow(options);
1829145f598eSKevin Wolf 
183028518102SKevin Wolf     /* Inherit from parent node */
183128518102SKevin Wolf     if (parent_options) {
183228518102SKevin Wolf         assert(!flags);
18338e2160e2SKevin Wolf         role->inherit_options(&flags, options, parent_flags, parent_options);
183428518102SKevin Wolf     }
183528518102SKevin Wolf 
183628518102SKevin Wolf     /* Old values are used for options that aren't set yet */
18374d2cb092SKevin Wolf     old_options = qdict_clone_shallow(bs->options);
1838cddff5baSKevin Wolf     bdrv_join_options(bs, options, old_options);
18394d2cb092SKevin Wolf     QDECREF(old_options);
18404d2cb092SKevin Wolf 
1841f1f25a2eSKevin Wolf     /* bdrv_open() masks this flag out */
1842f1f25a2eSKevin Wolf     flags &= ~BDRV_O_PROTOCOL;
1843f1f25a2eSKevin Wolf 
184467251a31SKevin Wolf     QLIST_FOREACH(child, &bs->children, next) {
18454c9dfe5dSKevin Wolf         QDict *new_child_options;
18464c9dfe5dSKevin Wolf         char *child_key_dot;
184767251a31SKevin Wolf 
18484c9dfe5dSKevin Wolf         /* reopen can only change the options of block devices that were
18494c9dfe5dSKevin Wolf          * implicitly created and inherited options. For other (referenced)
18504c9dfe5dSKevin Wolf          * block devices, a syntax like "backing.foo" results in an error. */
185167251a31SKevin Wolf         if (child->bs->inherits_from != bs) {
185267251a31SKevin Wolf             continue;
185367251a31SKevin Wolf         }
185467251a31SKevin Wolf 
18554c9dfe5dSKevin Wolf         child_key_dot = g_strdup_printf("%s.", child->name);
18564c9dfe5dSKevin Wolf         qdict_extract_subqdict(options, &new_child_options, child_key_dot);
18574c9dfe5dSKevin Wolf         g_free(child_key_dot);
18584c9dfe5dSKevin Wolf 
185928518102SKevin Wolf         bdrv_reopen_queue_child(bs_queue, child->bs, new_child_options, 0,
186028518102SKevin Wolf                                 child->role, options, flags);
1861e971aa12SJeff Cody     }
1862e971aa12SJeff Cody 
1863e971aa12SJeff Cody     bs_entry = g_new0(BlockReopenQueueEntry, 1);
1864e971aa12SJeff Cody     QSIMPLEQ_INSERT_TAIL(bs_queue, bs_entry, entry);
1865e971aa12SJeff Cody 
1866e971aa12SJeff Cody     bs_entry->state.bs = bs;
18674d2cb092SKevin Wolf     bs_entry->state.options = options;
1868145f598eSKevin Wolf     bs_entry->state.explicit_options = explicit_options;
1869e971aa12SJeff Cody     bs_entry->state.flags = flags;
1870e971aa12SJeff Cody 
1871e971aa12SJeff Cody     return bs_queue;
1872e971aa12SJeff Cody }
1873e971aa12SJeff Cody 
187428518102SKevin Wolf BlockReopenQueue *bdrv_reopen_queue(BlockReopenQueue *bs_queue,
187528518102SKevin Wolf                                     BlockDriverState *bs,
187628518102SKevin Wolf                                     QDict *options, int flags)
187728518102SKevin Wolf {
187828518102SKevin Wolf     return bdrv_reopen_queue_child(bs_queue, bs, options, flags,
187928518102SKevin Wolf                                    NULL, NULL, 0);
188028518102SKevin Wolf }
188128518102SKevin Wolf 
1882e971aa12SJeff Cody /*
1883e971aa12SJeff Cody  * Reopen multiple BlockDriverStates atomically & transactionally.
1884e971aa12SJeff Cody  *
1885e971aa12SJeff Cody  * The queue passed in (bs_queue) must have been built up previous
1886e971aa12SJeff Cody  * via bdrv_reopen_queue().
1887e971aa12SJeff Cody  *
1888e971aa12SJeff Cody  * Reopens all BDS specified in the queue, with the appropriate
1889e971aa12SJeff Cody  * flags.  All devices are prepared for reopen, and failure of any
1890e971aa12SJeff Cody  * device will cause all device changes to be abandonded, and intermediate
1891e971aa12SJeff Cody  * data cleaned up.
1892e971aa12SJeff Cody  *
1893e971aa12SJeff Cody  * If all devices prepare successfully, then the changes are committed
1894e971aa12SJeff Cody  * to all devices.
1895e971aa12SJeff Cody  *
1896e971aa12SJeff Cody  */
1897e971aa12SJeff Cody int bdrv_reopen_multiple(BlockReopenQueue *bs_queue, Error **errp)
1898e971aa12SJeff Cody {
1899e971aa12SJeff Cody     int ret = -1;
1900e971aa12SJeff Cody     BlockReopenQueueEntry *bs_entry, *next;
1901e971aa12SJeff Cody     Error *local_err = NULL;
1902e971aa12SJeff Cody 
1903e971aa12SJeff Cody     assert(bs_queue != NULL);
1904e971aa12SJeff Cody 
1905e971aa12SJeff Cody     bdrv_drain_all();
1906e971aa12SJeff Cody 
1907e971aa12SJeff Cody     QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1908e971aa12SJeff Cody         if (bdrv_reopen_prepare(&bs_entry->state, bs_queue, &local_err)) {
1909e971aa12SJeff Cody             error_propagate(errp, local_err);
1910e971aa12SJeff Cody             goto cleanup;
1911e971aa12SJeff Cody         }
1912e971aa12SJeff Cody         bs_entry->prepared = true;
1913e971aa12SJeff Cody     }
1914e971aa12SJeff Cody 
1915e971aa12SJeff Cody     /* If we reach this point, we have success and just need to apply the
1916e971aa12SJeff Cody      * changes
1917e971aa12SJeff Cody      */
1918e971aa12SJeff Cody     QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1919e971aa12SJeff Cody         bdrv_reopen_commit(&bs_entry->state);
1920e971aa12SJeff Cody     }
1921e971aa12SJeff Cody 
1922e971aa12SJeff Cody     ret = 0;
1923e971aa12SJeff Cody 
1924e971aa12SJeff Cody cleanup:
1925e971aa12SJeff Cody     QSIMPLEQ_FOREACH_SAFE(bs_entry, bs_queue, entry, next) {
1926e971aa12SJeff Cody         if (ret && bs_entry->prepared) {
1927e971aa12SJeff Cody             bdrv_reopen_abort(&bs_entry->state);
1928145f598eSKevin Wolf         } else if (ret) {
1929145f598eSKevin Wolf             QDECREF(bs_entry->state.explicit_options);
1930e971aa12SJeff Cody         }
19314d2cb092SKevin Wolf         QDECREF(bs_entry->state.options);
1932e971aa12SJeff Cody         g_free(bs_entry);
1933e971aa12SJeff Cody     }
1934e971aa12SJeff Cody     g_free(bs_queue);
1935e971aa12SJeff Cody     return ret;
1936e971aa12SJeff Cody }
1937e971aa12SJeff Cody 
1938e971aa12SJeff Cody 
1939e971aa12SJeff Cody /* Reopen a single BlockDriverState with the specified flags. */
1940e971aa12SJeff Cody int bdrv_reopen(BlockDriverState *bs, int bdrv_flags, Error **errp)
1941e971aa12SJeff Cody {
1942e971aa12SJeff Cody     int ret = -1;
1943e971aa12SJeff Cody     Error *local_err = NULL;
19444d2cb092SKevin Wolf     BlockReopenQueue *queue = bdrv_reopen_queue(NULL, bs, NULL, bdrv_flags);
1945e971aa12SJeff Cody 
1946e971aa12SJeff Cody     ret = bdrv_reopen_multiple(queue, &local_err);
1947e971aa12SJeff Cody     if (local_err != NULL) {
1948e971aa12SJeff Cody         error_propagate(errp, local_err);
1949e971aa12SJeff Cody     }
1950e971aa12SJeff Cody     return ret;
1951e971aa12SJeff Cody }
1952e971aa12SJeff Cody 
1953e971aa12SJeff Cody 
1954e971aa12SJeff Cody /*
1955e971aa12SJeff Cody  * Prepares a BlockDriverState for reopen. All changes are staged in the
1956e971aa12SJeff Cody  * 'opaque' field of the BDRVReopenState, which is used and allocated by
1957e971aa12SJeff Cody  * the block driver layer .bdrv_reopen_prepare()
1958e971aa12SJeff Cody  *
1959e971aa12SJeff Cody  * bs is the BlockDriverState to reopen
1960e971aa12SJeff Cody  * flags are the new open flags
1961e971aa12SJeff Cody  * queue is the reopen queue
1962e971aa12SJeff Cody  *
1963e971aa12SJeff Cody  * Returns 0 on success, non-zero on error.  On error errp will be set
1964e971aa12SJeff Cody  * as well.
1965e971aa12SJeff Cody  *
1966e971aa12SJeff Cody  * On failure, bdrv_reopen_abort() will be called to clean up any data.
1967e971aa12SJeff Cody  * It is the responsibility of the caller to then call the abort() or
1968e971aa12SJeff Cody  * commit() for any other BDS that have been left in a prepare() state
1969e971aa12SJeff Cody  *
1970e971aa12SJeff Cody  */
1971e971aa12SJeff Cody int bdrv_reopen_prepare(BDRVReopenState *reopen_state, BlockReopenQueue *queue,
1972e971aa12SJeff Cody                         Error **errp)
1973e971aa12SJeff Cody {
1974e971aa12SJeff Cody     int ret = -1;
1975e971aa12SJeff Cody     Error *local_err = NULL;
1976e971aa12SJeff Cody     BlockDriver *drv;
1977ccf9dc07SKevin Wolf     QemuOpts *opts;
1978ccf9dc07SKevin Wolf     const char *value;
1979e971aa12SJeff Cody 
1980e971aa12SJeff Cody     assert(reopen_state != NULL);
1981e971aa12SJeff Cody     assert(reopen_state->bs->drv != NULL);
1982e971aa12SJeff Cody     drv = reopen_state->bs->drv;
1983e971aa12SJeff Cody 
1984ccf9dc07SKevin Wolf     /* Process generic block layer options */
1985ccf9dc07SKevin Wolf     opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
1986ccf9dc07SKevin Wolf     qemu_opts_absorb_qdict(opts, reopen_state->options, &local_err);
1987ccf9dc07SKevin Wolf     if (local_err) {
1988ccf9dc07SKevin Wolf         error_propagate(errp, local_err);
1989ccf9dc07SKevin Wolf         ret = -EINVAL;
1990ccf9dc07SKevin Wolf         goto error;
1991ccf9dc07SKevin Wolf     }
1992ccf9dc07SKevin Wolf 
199391a097e7SKevin Wolf     update_flags_from_options(&reopen_state->flags, opts);
199491a097e7SKevin Wolf 
199591a097e7SKevin Wolf     /* If a guest device is attached, it owns WCE */
199691a097e7SKevin Wolf     if (reopen_state->bs->blk && blk_get_attached_dev(reopen_state->bs->blk)) {
199791a097e7SKevin Wolf         bool old_wce = bdrv_enable_write_cache(reopen_state->bs);
199891a097e7SKevin Wolf         bool new_wce = (reopen_state->flags & BDRV_O_CACHE_WB);
199991a097e7SKevin Wolf         if (old_wce != new_wce) {
200091a097e7SKevin Wolf             error_setg(errp, "Cannot change cache.writeback: Device attached");
200191a097e7SKevin Wolf             ret = -EINVAL;
200291a097e7SKevin Wolf             goto error;
200391a097e7SKevin Wolf         }
200491a097e7SKevin Wolf     }
200591a097e7SKevin Wolf 
2006ccf9dc07SKevin Wolf     /* node-name and driver must be unchanged. Put them back into the QDict, so
2007ccf9dc07SKevin Wolf      * that they are checked at the end of this function. */
2008ccf9dc07SKevin Wolf     value = qemu_opt_get(opts, "node-name");
2009ccf9dc07SKevin Wolf     if (value) {
2010ccf9dc07SKevin Wolf         qdict_put(reopen_state->options, "node-name", qstring_from_str(value));
2011ccf9dc07SKevin Wolf     }
2012ccf9dc07SKevin Wolf 
2013ccf9dc07SKevin Wolf     value = qemu_opt_get(opts, "driver");
2014ccf9dc07SKevin Wolf     if (value) {
2015ccf9dc07SKevin Wolf         qdict_put(reopen_state->options, "driver", qstring_from_str(value));
2016ccf9dc07SKevin Wolf     }
2017ccf9dc07SKevin Wolf 
2018e971aa12SJeff Cody     /* if we are to stay read-only, do not allow permission change
2019e971aa12SJeff Cody      * to r/w */
2020e971aa12SJeff Cody     if (!(reopen_state->bs->open_flags & BDRV_O_ALLOW_RDWR) &&
2021e971aa12SJeff Cody         reopen_state->flags & BDRV_O_RDWR) {
202281e5f78aSAlberto Garcia         error_setg(errp, "Node '%s' is read only",
202381e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(reopen_state->bs));
2024e971aa12SJeff Cody         goto error;
2025e971aa12SJeff Cody     }
2026e971aa12SJeff Cody 
2027e971aa12SJeff Cody 
2028e971aa12SJeff Cody     ret = bdrv_flush(reopen_state->bs);
2029e971aa12SJeff Cody     if (ret) {
2030455b0fdeSEric Blake         error_setg_errno(errp, -ret, "Error flushing drive");
2031e971aa12SJeff Cody         goto error;
2032e971aa12SJeff Cody     }
2033e971aa12SJeff Cody 
2034e971aa12SJeff Cody     if (drv->bdrv_reopen_prepare) {
2035e971aa12SJeff Cody         ret = drv->bdrv_reopen_prepare(reopen_state, queue, &local_err);
2036e971aa12SJeff Cody         if (ret) {
2037e971aa12SJeff Cody             if (local_err != NULL) {
2038e971aa12SJeff Cody                 error_propagate(errp, local_err);
2039e971aa12SJeff Cody             } else {
2040d8b6895fSLuiz Capitulino                 error_setg(errp, "failed while preparing to reopen image '%s'",
2041e971aa12SJeff Cody                            reopen_state->bs->filename);
2042e971aa12SJeff Cody             }
2043e971aa12SJeff Cody             goto error;
2044e971aa12SJeff Cody         }
2045e971aa12SJeff Cody     } else {
2046e971aa12SJeff Cody         /* It is currently mandatory to have a bdrv_reopen_prepare()
2047e971aa12SJeff Cody          * handler for each supported drv. */
204881e5f78aSAlberto Garcia         error_setg(errp, "Block format '%s' used by node '%s' "
204981e5f78aSAlberto Garcia                    "does not support reopening files", drv->format_name,
205081e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(reopen_state->bs));
2051e971aa12SJeff Cody         ret = -1;
2052e971aa12SJeff Cody         goto error;
2053e971aa12SJeff Cody     }
2054e971aa12SJeff Cody 
20554d2cb092SKevin Wolf     /* Options that are not handled are only okay if they are unchanged
20564d2cb092SKevin Wolf      * compared to the old state. It is expected that some options are only
20574d2cb092SKevin Wolf      * used for the initial open, but not reopen (e.g. filename) */
20584d2cb092SKevin Wolf     if (qdict_size(reopen_state->options)) {
20594d2cb092SKevin Wolf         const QDictEntry *entry = qdict_first(reopen_state->options);
20604d2cb092SKevin Wolf 
20614d2cb092SKevin Wolf         do {
20624d2cb092SKevin Wolf             QString *new_obj = qobject_to_qstring(entry->value);
20634d2cb092SKevin Wolf             const char *new = qstring_get_str(new_obj);
20644d2cb092SKevin Wolf             const char *old = qdict_get_try_str(reopen_state->bs->options,
20654d2cb092SKevin Wolf                                                 entry->key);
20664d2cb092SKevin Wolf 
20674d2cb092SKevin Wolf             if (!old || strcmp(new, old)) {
20684d2cb092SKevin Wolf                 error_setg(errp, "Cannot change the option '%s'", entry->key);
20694d2cb092SKevin Wolf                 ret = -EINVAL;
20704d2cb092SKevin Wolf                 goto error;
20714d2cb092SKevin Wolf             }
20724d2cb092SKevin Wolf         } while ((entry = qdict_next(reopen_state->options, entry)));
20734d2cb092SKevin Wolf     }
20744d2cb092SKevin Wolf 
2075e971aa12SJeff Cody     ret = 0;
2076e971aa12SJeff Cody 
2077e971aa12SJeff Cody error:
2078ccf9dc07SKevin Wolf     qemu_opts_del(opts);
2079e971aa12SJeff Cody     return ret;
2080e971aa12SJeff Cody }
2081e971aa12SJeff Cody 
2082e971aa12SJeff Cody /*
2083e971aa12SJeff Cody  * Takes the staged changes for the reopen from bdrv_reopen_prepare(), and
2084e971aa12SJeff Cody  * makes them final by swapping the staging BlockDriverState contents into
2085e971aa12SJeff Cody  * the active BlockDriverState contents.
2086e971aa12SJeff Cody  */
2087e971aa12SJeff Cody void bdrv_reopen_commit(BDRVReopenState *reopen_state)
2088e971aa12SJeff Cody {
2089e971aa12SJeff Cody     BlockDriver *drv;
2090e971aa12SJeff Cody 
2091e971aa12SJeff Cody     assert(reopen_state != NULL);
2092e971aa12SJeff Cody     drv = reopen_state->bs->drv;
2093e971aa12SJeff Cody     assert(drv != NULL);
2094e971aa12SJeff Cody 
2095e971aa12SJeff Cody     /* If there are any driver level actions to take */
2096e971aa12SJeff Cody     if (drv->bdrv_reopen_commit) {
2097e971aa12SJeff Cody         drv->bdrv_reopen_commit(reopen_state);
2098e971aa12SJeff Cody     }
2099e971aa12SJeff Cody 
2100e971aa12SJeff Cody     /* set BDS specific flags now */
2101145f598eSKevin Wolf     QDECREF(reopen_state->bs->explicit_options);
2102145f598eSKevin Wolf 
2103145f598eSKevin Wolf     reopen_state->bs->explicit_options   = reopen_state->explicit_options;
2104e971aa12SJeff Cody     reopen_state->bs->open_flags         = reopen_state->flags;
2105e971aa12SJeff Cody     reopen_state->bs->enable_write_cache = !!(reopen_state->flags &
2106e971aa12SJeff Cody                                               BDRV_O_CACHE_WB);
2107e971aa12SJeff Cody     reopen_state->bs->read_only = !(reopen_state->flags & BDRV_O_RDWR);
2108355ef4acSKevin Wolf 
21093baca891SKevin Wolf     bdrv_refresh_limits(reopen_state->bs, NULL);
2110e971aa12SJeff Cody }
2111e971aa12SJeff Cody 
2112e971aa12SJeff Cody /*
2113e971aa12SJeff Cody  * Abort the reopen, and delete and free the staged changes in
2114e971aa12SJeff Cody  * reopen_state
2115e971aa12SJeff Cody  */
2116e971aa12SJeff Cody void bdrv_reopen_abort(BDRVReopenState *reopen_state)
2117e971aa12SJeff Cody {
2118e971aa12SJeff Cody     BlockDriver *drv;
2119e971aa12SJeff Cody 
2120e971aa12SJeff Cody     assert(reopen_state != NULL);
2121e971aa12SJeff Cody     drv = reopen_state->bs->drv;
2122e971aa12SJeff Cody     assert(drv != NULL);
2123e971aa12SJeff Cody 
2124e971aa12SJeff Cody     if (drv->bdrv_reopen_abort) {
2125e971aa12SJeff Cody         drv->bdrv_reopen_abort(reopen_state);
2126e971aa12SJeff Cody     }
2127145f598eSKevin Wolf 
2128145f598eSKevin Wolf     QDECREF(reopen_state->explicit_options);
2129e971aa12SJeff Cody }
2130e971aa12SJeff Cody 
2131e971aa12SJeff Cody 
213264dff520SMax Reitz static void bdrv_close(BlockDriverState *bs)
2133fc01f7e7Sbellard {
213433384421SMax Reitz     BdrvAioNotifier *ban, *ban_next;
213533384421SMax Reitz 
2136ca9bd24cSMax Reitz     assert(!bs->job);
213799b7e775SAlberto Garcia 
213899b7e775SAlberto Garcia     /* Disable I/O limits and drain all pending throttled requests */
2139a0d64a61SAlberto Garcia     if (bs->throttle_state) {
214099b7e775SAlberto Garcia         bdrv_io_limits_disable(bs);
214199b7e775SAlberto Garcia     }
214299b7e775SAlberto Garcia 
2143fc27291dSPaolo Bonzini     bdrv_drained_begin(bs); /* complete I/O */
214458fda173SStefan Hajnoczi     bdrv_flush(bs);
214553ec73e2SFam Zheng     bdrv_drain(bs); /* in case flush left pending I/O */
2146fc27291dSPaolo Bonzini 
2147c5acdc9aSMax Reitz     bdrv_release_named_dirty_bitmaps(bs);
2148c5acdc9aSMax Reitz     assert(QLIST_EMPTY(&bs->dirty_bitmaps));
2149c5acdc9aSMax Reitz 
2150b4d02820SMax Reitz     if (bs->blk) {
2151b4d02820SMax Reitz         blk_dev_change_media_cb(bs->blk, false);
2152b4d02820SMax Reitz     }
2153b4d02820SMax Reitz 
21543cbc002cSPaolo Bonzini     if (bs->drv) {
21556e93e7c4SKevin Wolf         BdrvChild *child, *next;
21566e93e7c4SKevin Wolf 
21579a7dedbcSKevin Wolf         bs->drv->bdrv_close(bs);
21589a4f4c31SKevin Wolf         bs->drv = NULL;
21599a7dedbcSKevin Wolf 
21609a7dedbcSKevin Wolf         bdrv_set_backing_hd(bs, NULL);
21619a7dedbcSKevin Wolf 
21629a4f4c31SKevin Wolf         if (bs->file != NULL) {
21639a4f4c31SKevin Wolf             bdrv_unref_child(bs, bs->file);
21649a4f4c31SKevin Wolf             bs->file = NULL;
21659a4f4c31SKevin Wolf         }
21669a4f4c31SKevin Wolf 
21676e93e7c4SKevin Wolf         QLIST_FOREACH_SAFE(child, &bs->children, next, next) {
216833a60407SKevin Wolf             /* TODO Remove bdrv_unref() from drivers' close function and use
216933a60407SKevin Wolf              * bdrv_unref_child() here */
2170bddcec37SKevin Wolf             if (child->bs->inherits_from == bs) {
2171bddcec37SKevin Wolf                 child->bs->inherits_from = NULL;
2172bddcec37SKevin Wolf             }
217333a60407SKevin Wolf             bdrv_detach_child(child);
21746e93e7c4SKevin Wolf         }
21756e93e7c4SKevin Wolf 
21767267c094SAnthony Liguori         g_free(bs->opaque);
2177ea2384d3Sbellard         bs->opaque = NULL;
217853fec9d3SStefan Hajnoczi         bs->copy_on_read = 0;
2179a275fa42SPaolo Bonzini         bs->backing_file[0] = '\0';
2180a275fa42SPaolo Bonzini         bs->backing_format[0] = '\0';
21816405875cSPaolo Bonzini         bs->total_sectors = 0;
21826405875cSPaolo Bonzini         bs->encrypted = 0;
21836405875cSPaolo Bonzini         bs->valid_key = 0;
21846405875cSPaolo Bonzini         bs->sg = 0;
21850d51b4deSAsias He         bs->zero_beyond_eof = false;
2186de9c0cecSKevin Wolf         QDECREF(bs->options);
2187145f598eSKevin Wolf         QDECREF(bs->explicit_options);
2188de9c0cecSKevin Wolf         bs->options = NULL;
218991af7014SMax Reitz         QDECREF(bs->full_open_options);
219091af7014SMax Reitz         bs->full_open_options = NULL;
21919ca11154SPavel Hrdina     }
219266f82ceeSKevin Wolf 
219333384421SMax Reitz     QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
219433384421SMax Reitz         g_free(ban);
219533384421SMax Reitz     }
219633384421SMax Reitz     QLIST_INIT(&bs->aio_notifiers);
2197fc27291dSPaolo Bonzini     bdrv_drained_end(bs);
2198b338082bSbellard }
2199b338082bSbellard 
22002bc93fedSMORITA Kazutaka void bdrv_close_all(void)
22012bc93fedSMORITA Kazutaka {
22022bc93fedSMORITA Kazutaka     BlockDriverState *bs;
2203ca9bd24cSMax Reitz     AioContext *aio_context;
22042bc93fedSMORITA Kazutaka 
2205ca9bd24cSMax Reitz     /* Drop references from requests still in flight, such as canceled block
2206ca9bd24cSMax Reitz      * jobs whose AIO context has not been polled yet */
2207ca9bd24cSMax Reitz     bdrv_drain_all();
2208ca9bd24cSMax Reitz 
2209ca9bd24cSMax Reitz     blk_remove_all_bs();
2210ca9bd24cSMax Reitz     blockdev_close_all_bdrv_states();
2211ca9bd24cSMax Reitz 
2212ca9bd24cSMax Reitz     /* Cancel all block jobs */
2213ca9bd24cSMax Reitz     while (!QTAILQ_EMPTY(&all_bdrv_states)) {
2214ca9bd24cSMax Reitz         QTAILQ_FOREACH(bs, &all_bdrv_states, bs_list) {
2215ca9bd24cSMax Reitz             aio_context = bdrv_get_aio_context(bs);
2216ed78cda3SStefan Hajnoczi 
2217ed78cda3SStefan Hajnoczi             aio_context_acquire(aio_context);
2218ca9bd24cSMax Reitz             if (bs->job) {
2219ca9bd24cSMax Reitz                 block_job_cancel_sync(bs->job);
2220ed78cda3SStefan Hajnoczi                 aio_context_release(aio_context);
2221ca9bd24cSMax Reitz                 break;
2222ca9bd24cSMax Reitz             }
2223ca9bd24cSMax Reitz             aio_context_release(aio_context);
2224ca9bd24cSMax Reitz         }
2225ca9bd24cSMax Reitz 
2226ca9bd24cSMax Reitz         /* All the remaining BlockDriverStates are referenced directly or
2227ca9bd24cSMax Reitz          * indirectly from block jobs, so there needs to be at least one BDS
2228ca9bd24cSMax Reitz          * directly used by a block job */
2229ca9bd24cSMax Reitz         assert(bs);
22302bc93fedSMORITA Kazutaka     }
22312bc93fedSMORITA Kazutaka }
22322bc93fedSMORITA Kazutaka 
2233f8aa905aSJeff Cody /* Note that bs->device_list.tqe_prev is initially null,
2234f8aa905aSJeff Cody  * and gets set to non-null by QTAILQ_INSERT_TAIL().  Establish
2235f8aa905aSJeff Cody  * the useful invariant "bs in bdrv_states iff bs->tqe_prev" by
2236f8aa905aSJeff Cody  * resetting it to null on remove.  */
2237f8aa905aSJeff Cody void bdrv_device_remove(BlockDriverState *bs)
2238f8aa905aSJeff Cody {
2239f8aa905aSJeff Cody     QTAILQ_REMOVE(&bdrv_states, bs, device_list);
2240f8aa905aSJeff Cody     bs->device_list.tqe_prev = NULL;
2241f8aa905aSJeff Cody }
2242f8aa905aSJeff Cody 
2243dc364f4cSBenoît Canet /* make a BlockDriverState anonymous by removing from bdrv_state and
2244dc364f4cSBenoît Canet  * graph_bdrv_state list.
2245d22b2f41SRyan Harper    Also, NULL terminate the device_name to prevent double remove */
2246d22b2f41SRyan Harper void bdrv_make_anon(BlockDriverState *bs)
2247d22b2f41SRyan Harper {
2248f8aa905aSJeff Cody     /* Take care to remove bs from bdrv_states only when it's actually
2249f8aa905aSJeff Cody      * in it. */
2250bfb197e0SMarkus Armbruster     if (bs->device_list.tqe_prev) {
2251f8aa905aSJeff Cody         bdrv_device_remove(bs);
2252d22b2f41SRyan Harper     }
2253dc364f4cSBenoît Canet     if (bs->node_name[0] != '\0') {
2254dc364f4cSBenoît Canet         QTAILQ_REMOVE(&graph_bdrv_states, bs, node_list);
2255dc364f4cSBenoît Canet     }
2256dc364f4cSBenoît Canet     bs->node_name[0] = '\0';
2257d22b2f41SRyan Harper }
2258d22b2f41SRyan Harper 
22598e419aefSKevin Wolf /* Fields that need to stay with the top-level BDS */
22604ddc07caSPaolo Bonzini static void bdrv_move_feature_fields(BlockDriverState *bs_dest,
22614ddc07caSPaolo Bonzini                                      BlockDriverState *bs_src)
22624ddc07caSPaolo Bonzini {
22634ddc07caSPaolo Bonzini     /* move some fields that need to stay attached to the device */
22644ddc07caSPaolo Bonzini 
22654ddc07caSPaolo Bonzini     /* dev info */
22664ddc07caSPaolo Bonzini     bs_dest->copy_on_read       = bs_src->copy_on_read;
22674ddc07caSPaolo Bonzini 
22684ddc07caSPaolo Bonzini     bs_dest->enable_write_cache = bs_src->enable_write_cache;
22694ddc07caSPaolo Bonzini 
2270dd62f1caSKevin Wolf     /* dirty bitmap */
2271dd62f1caSKevin Wolf     bs_dest->dirty_bitmaps      = bs_src->dirty_bitmaps;
2272dd62f1caSKevin Wolf }
2273dd62f1caSKevin Wolf 
2274dd62f1caSKevin Wolf static void change_parent_backing_link(BlockDriverState *from,
2275dd62f1caSKevin Wolf                                        BlockDriverState *to)
2276dd62f1caSKevin Wolf {
2277dd62f1caSKevin Wolf     BdrvChild *c, *next;
2278dd62f1caSKevin Wolf 
2279dd62f1caSKevin Wolf     QLIST_FOREACH_SAFE(c, &from->parents, next_parent, next) {
2280dd62f1caSKevin Wolf         assert(c->role != &child_backing);
2281dd62f1caSKevin Wolf         c->bs = to;
2282dd62f1caSKevin Wolf         QLIST_REMOVE(c, next_parent);
2283dd62f1caSKevin Wolf         QLIST_INSERT_HEAD(&to->parents, c, next_parent);
2284dd62f1caSKevin Wolf         bdrv_ref(to);
2285dd62f1caSKevin Wolf         bdrv_unref(from);
2286dd62f1caSKevin Wolf     }
2287dd62f1caSKevin Wolf     if (from->blk) {
2288dd62f1caSKevin Wolf         blk_set_bs(from->blk, to);
2289dd62f1caSKevin Wolf         if (!to->device_list.tqe_prev) {
2290dd62f1caSKevin Wolf             QTAILQ_INSERT_BEFORE(from, to, device_list);
2291dd62f1caSKevin Wolf         }
2292f8aa905aSJeff Cody         bdrv_device_remove(from);
2293dd62f1caSKevin Wolf     }
2294dd62f1caSKevin Wolf }
2295dd62f1caSKevin Wolf 
2296dd62f1caSKevin Wolf static void swap_feature_fields(BlockDriverState *bs_top,
2297dd62f1caSKevin Wolf                                 BlockDriverState *bs_new)
2298dd62f1caSKevin Wolf {
2299dd62f1caSKevin Wolf     BlockDriverState tmp;
2300dd62f1caSKevin Wolf 
2301dd62f1caSKevin Wolf     bdrv_move_feature_fields(&tmp, bs_top);
2302dd62f1caSKevin Wolf     bdrv_move_feature_fields(bs_top, bs_new);
2303dd62f1caSKevin Wolf     bdrv_move_feature_fields(bs_new, &tmp);
2304dd62f1caSKevin Wolf 
2305dd62f1caSKevin Wolf     assert(!bs_new->throttle_state);
2306dd62f1caSKevin Wolf     if (bs_top->throttle_state) {
2307dd62f1caSKevin Wolf         assert(bs_top->io_limits_enabled);
2308dd62f1caSKevin Wolf         bdrv_io_limits_enable(bs_new, throttle_group_get_name(bs_top));
2309dd62f1caSKevin Wolf         bdrv_io_limits_disable(bs_top);
2310dd62f1caSKevin Wolf     }
2311dd62f1caSKevin Wolf }
2312dd62f1caSKevin Wolf 
23138802d1fdSJeff Cody /*
23148802d1fdSJeff Cody  * Add new bs contents at the top of an image chain while the chain is
23158802d1fdSJeff Cody  * live, while keeping required fields on the top layer.
23168802d1fdSJeff Cody  *
23178802d1fdSJeff Cody  * This will modify the BlockDriverState fields, and swap contents
23188802d1fdSJeff Cody  * between bs_new and bs_top. Both bs_new and bs_top are modified.
23198802d1fdSJeff Cody  *
2320bfb197e0SMarkus Armbruster  * bs_new must not be attached to a BlockBackend.
2321f6801b83SJeff Cody  *
23228802d1fdSJeff Cody  * This function does not create any image files.
2323dd62f1caSKevin Wolf  *
2324dd62f1caSKevin Wolf  * bdrv_append() takes ownership of a bs_new reference and unrefs it because
2325dd62f1caSKevin Wolf  * that's what the callers commonly need. bs_new will be referenced by the old
2326dd62f1caSKevin Wolf  * parents of bs_top after bdrv_append() returns. If the caller needs to keep a
2327dd62f1caSKevin Wolf  * reference of its own, it must call bdrv_ref().
23288802d1fdSJeff Cody  */
23298802d1fdSJeff Cody void bdrv_append(BlockDriverState *bs_new, BlockDriverState *bs_top)
23308802d1fdSJeff Cody {
2331dd62f1caSKevin Wolf     assert(!bdrv_requests_pending(bs_top));
2332dd62f1caSKevin Wolf     assert(!bdrv_requests_pending(bs_new));
23338802d1fdSJeff Cody 
2334dd62f1caSKevin Wolf     bdrv_ref(bs_top);
2335dd62f1caSKevin Wolf     change_parent_backing_link(bs_top, bs_new);
2336dd62f1caSKevin Wolf 
2337dd62f1caSKevin Wolf     /* Some fields always stay on top of the backing file chain */
2338dd62f1caSKevin Wolf     swap_feature_fields(bs_top, bs_new);
2339dd62f1caSKevin Wolf 
2340dd62f1caSKevin Wolf     bdrv_set_backing_hd(bs_new, bs_top);
2341dd62f1caSKevin Wolf     bdrv_unref(bs_top);
2342dd62f1caSKevin Wolf 
2343dd62f1caSKevin Wolf     /* bs_new is now referenced by its new parents, we don't need the
2344dd62f1caSKevin Wolf      * additional reference any more. */
2345dd62f1caSKevin Wolf     bdrv_unref(bs_new);
23468802d1fdSJeff Cody }
23478802d1fdSJeff Cody 
23483f09bfbcSKevin Wolf void bdrv_replace_in_backing_chain(BlockDriverState *old, BlockDriverState *new)
23493f09bfbcSKevin Wolf {
23503f09bfbcSKevin Wolf     assert(!bdrv_requests_pending(old));
23513f09bfbcSKevin Wolf     assert(!bdrv_requests_pending(new));
23523f09bfbcSKevin Wolf 
23533f09bfbcSKevin Wolf     bdrv_ref(old);
23543f09bfbcSKevin Wolf 
23553f09bfbcSKevin Wolf     if (old->blk) {
23563f09bfbcSKevin Wolf         /* As long as these fields aren't in BlockBackend, but in the top-level
23573f09bfbcSKevin Wolf          * BlockDriverState, it's not possible for a BDS to have two BBs.
23583f09bfbcSKevin Wolf          *
23593f09bfbcSKevin Wolf          * We really want to copy the fields from old to new, but we go for a
23603f09bfbcSKevin Wolf          * swap instead so that pointers aren't duplicated and cause trouble.
23613f09bfbcSKevin Wolf          * (Also, bdrv_swap() used to do the same.) */
23623f09bfbcSKevin Wolf         assert(!new->blk);
23633f09bfbcSKevin Wolf         swap_feature_fields(old, new);
23643f09bfbcSKevin Wolf     }
23653f09bfbcSKevin Wolf     change_parent_backing_link(old, new);
23663f09bfbcSKevin Wolf 
23673f09bfbcSKevin Wolf     /* Change backing files if a previously independent node is added to the
23683f09bfbcSKevin Wolf      * chain. For active commit, we replace top by its own (indirect) backing
23693f09bfbcSKevin Wolf      * file and don't do anything here so we don't build a loop. */
23703f09bfbcSKevin Wolf     if (new->backing == NULL && !bdrv_chain_contains(backing_bs(old), new)) {
23713f09bfbcSKevin Wolf         bdrv_set_backing_hd(new, backing_bs(old));
23723f09bfbcSKevin Wolf         bdrv_set_backing_hd(old, NULL);
23733f09bfbcSKevin Wolf     }
23743f09bfbcSKevin Wolf 
23753f09bfbcSKevin Wolf     bdrv_unref(old);
23763f09bfbcSKevin Wolf }
23773f09bfbcSKevin Wolf 
23784f6fd349SFam Zheng static void bdrv_delete(BlockDriverState *bs)
2379b338082bSbellard {
23803e914655SPaolo Bonzini     assert(!bs->job);
23813718d8abSFam Zheng     assert(bdrv_op_blocker_is_empty(bs));
23824f6fd349SFam Zheng     assert(!bs->refcnt);
238318846deeSMarkus Armbruster 
2384e1b5c52eSStefan Hajnoczi     bdrv_close(bs);
2385e1b5c52eSStefan Hajnoczi 
23861b7bdbc1SStefan Hajnoczi     /* remove from list, if necessary */
2387d22b2f41SRyan Harper     bdrv_make_anon(bs);
238834c6f050Saurel32 
23892c1d04e0SMax Reitz     QTAILQ_REMOVE(&all_bdrv_states, bs, bs_list);
23902c1d04e0SMax Reitz 
23917267c094SAnthony Liguori     g_free(bs);
2392fc01f7e7Sbellard }
2393fc01f7e7Sbellard 
2394e97fc193Saliguori /*
2395e97fc193Saliguori  * Run consistency checks on an image
2396e97fc193Saliguori  *
2397e076f338SKevin Wolf  * Returns 0 if the check could be completed (it doesn't mean that the image is
2398a1c7273bSStefan Weil  * free of errors) or -errno when an internal error occurred. The results of the
2399e076f338SKevin Wolf  * check are stored in res.
2400e97fc193Saliguori  */
24014534ff54SKevin Wolf int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res, BdrvCheckMode fix)
2402e97fc193Saliguori {
2403908bcd54SMax Reitz     if (bs->drv == NULL) {
2404908bcd54SMax Reitz         return -ENOMEDIUM;
2405908bcd54SMax Reitz     }
2406e97fc193Saliguori     if (bs->drv->bdrv_check == NULL) {
2407e97fc193Saliguori         return -ENOTSUP;
2408e97fc193Saliguori     }
2409e97fc193Saliguori 
2410e076f338SKevin Wolf     memset(res, 0, sizeof(*res));
24114534ff54SKevin Wolf     return bs->drv->bdrv_check(bs, res, fix);
2412e97fc193Saliguori }
2413e97fc193Saliguori 
24148a426614SKevin Wolf #define COMMIT_BUF_SECTORS 2048
24158a426614SKevin Wolf 
241633e3963eSbellard /* commit COW file into the raw image */
241733e3963eSbellard int bdrv_commit(BlockDriverState *bs)
241833e3963eSbellard {
241919cb3738Sbellard     BlockDriver *drv = bs->drv;
242072706ea4SJeff Cody     int64_t sector, total_sectors, length, backing_length;
24218a426614SKevin Wolf     int n, ro, open_flags;
24220bce597dSJeff Cody     int ret = 0;
242372706ea4SJeff Cody     uint8_t *buf = NULL;
242433e3963eSbellard 
242519cb3738Sbellard     if (!drv)
242619cb3738Sbellard         return -ENOMEDIUM;
242733e3963eSbellard 
2428760e0063SKevin Wolf     if (!bs->backing) {
24294dca4b63SNaphtali Sprei         return -ENOTSUP;
24304dca4b63SNaphtali Sprei     }
24314dca4b63SNaphtali Sprei 
2432bb00021dSFam Zheng     if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, NULL) ||
2433760e0063SKevin Wolf         bdrv_op_is_blocked(bs->backing->bs, BLOCK_OP_TYPE_COMMIT_TARGET, NULL)) {
24342d3735d3SStefan Hajnoczi         return -EBUSY;
24352d3735d3SStefan Hajnoczi     }
24362d3735d3SStefan Hajnoczi 
2437760e0063SKevin Wolf     ro = bs->backing->bs->read_only;
2438760e0063SKevin Wolf     open_flags =  bs->backing->bs->open_flags;
24394dca4b63SNaphtali Sprei 
24404dca4b63SNaphtali Sprei     if (ro) {
2441760e0063SKevin Wolf         if (bdrv_reopen(bs->backing->bs, open_flags | BDRV_O_RDWR, NULL)) {
24420bce597dSJeff Cody             return -EACCES;
24434dca4b63SNaphtali Sprei         }
2444ea2384d3Sbellard     }
2445ea2384d3Sbellard 
244672706ea4SJeff Cody     length = bdrv_getlength(bs);
244772706ea4SJeff Cody     if (length < 0) {
244872706ea4SJeff Cody         ret = length;
244972706ea4SJeff Cody         goto ro_cleanup;
245072706ea4SJeff Cody     }
245172706ea4SJeff Cody 
2452760e0063SKevin Wolf     backing_length = bdrv_getlength(bs->backing->bs);
245372706ea4SJeff Cody     if (backing_length < 0) {
245472706ea4SJeff Cody         ret = backing_length;
245572706ea4SJeff Cody         goto ro_cleanup;
245672706ea4SJeff Cody     }
245772706ea4SJeff Cody 
245872706ea4SJeff Cody     /* If our top snapshot is larger than the backing file image,
245972706ea4SJeff Cody      * grow the backing file image if possible.  If not possible,
246072706ea4SJeff Cody      * we must return an error */
246172706ea4SJeff Cody     if (length > backing_length) {
2462760e0063SKevin Wolf         ret = bdrv_truncate(bs->backing->bs, length);
246372706ea4SJeff Cody         if (ret < 0) {
246472706ea4SJeff Cody             goto ro_cleanup;
246572706ea4SJeff Cody         }
246672706ea4SJeff Cody     }
246772706ea4SJeff Cody 
246872706ea4SJeff Cody     total_sectors = length >> BDRV_SECTOR_BITS;
2469857d4f46SKevin Wolf 
2470857d4f46SKevin Wolf     /* qemu_try_blockalign() for bs will choose an alignment that works for
2471760e0063SKevin Wolf      * bs->backing->bs as well, so no need to compare the alignment manually. */
2472857d4f46SKevin Wolf     buf = qemu_try_blockalign(bs, COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE);
2473857d4f46SKevin Wolf     if (buf == NULL) {
2474857d4f46SKevin Wolf         ret = -ENOMEM;
2475857d4f46SKevin Wolf         goto ro_cleanup;
2476857d4f46SKevin Wolf     }
24778a426614SKevin Wolf 
24788a426614SKevin Wolf     for (sector = 0; sector < total_sectors; sector += n) {
2479d663640cSPaolo Bonzini         ret = bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n);
2480d663640cSPaolo Bonzini         if (ret < 0) {
2481d663640cSPaolo Bonzini             goto ro_cleanup;
2482d663640cSPaolo Bonzini         }
2483d663640cSPaolo Bonzini         if (ret) {
2484dabfa6ccSKevin Wolf             ret = bdrv_read(bs, sector, buf, n);
2485dabfa6ccSKevin Wolf             if (ret < 0) {
24864dca4b63SNaphtali Sprei                 goto ro_cleanup;
248733e3963eSbellard             }
248833e3963eSbellard 
2489760e0063SKevin Wolf             ret = bdrv_write(bs->backing->bs, sector, buf, n);
2490dabfa6ccSKevin Wolf             if (ret < 0) {
24914dca4b63SNaphtali Sprei                 goto ro_cleanup;
249233e3963eSbellard             }
249333e3963eSbellard         }
249433e3963eSbellard     }
249595389c86Sbellard 
24961d44952fSChristoph Hellwig     if (drv->bdrv_make_empty) {
24971d44952fSChristoph Hellwig         ret = drv->bdrv_make_empty(bs);
2498dabfa6ccSKevin Wolf         if (ret < 0) {
2499dabfa6ccSKevin Wolf             goto ro_cleanup;
2500dabfa6ccSKevin Wolf         }
25011d44952fSChristoph Hellwig         bdrv_flush(bs);
25021d44952fSChristoph Hellwig     }
250395389c86Sbellard 
25043f5075aeSChristoph Hellwig     /*
25053f5075aeSChristoph Hellwig      * Make sure all data we wrote to the backing device is actually
25063f5075aeSChristoph Hellwig      * stable on disk.
25073f5075aeSChristoph Hellwig      */
2508760e0063SKevin Wolf     if (bs->backing) {
2509760e0063SKevin Wolf         bdrv_flush(bs->backing->bs);
2510dabfa6ccSKevin Wolf     }
25114dca4b63SNaphtali Sprei 
2512dabfa6ccSKevin Wolf     ret = 0;
25134dca4b63SNaphtali Sprei ro_cleanup:
2514857d4f46SKevin Wolf     qemu_vfree(buf);
25154dca4b63SNaphtali Sprei 
25164dca4b63SNaphtali Sprei     if (ro) {
25170bce597dSJeff Cody         /* ignoring error return here */
2518760e0063SKevin Wolf         bdrv_reopen(bs->backing->bs, open_flags & ~BDRV_O_RDWR, NULL);
25194dca4b63SNaphtali Sprei     }
25204dca4b63SNaphtali Sprei 
25211d44952fSChristoph Hellwig     return ret;
252233e3963eSbellard }
252333e3963eSbellard 
2524e8877497SStefan Hajnoczi int bdrv_commit_all(void)
25256ab4b5abSMarkus Armbruster {
25266ab4b5abSMarkus Armbruster     BlockDriverState *bs;
25276ab4b5abSMarkus Armbruster 
2528dc364f4cSBenoît Canet     QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
2529ed78cda3SStefan Hajnoczi         AioContext *aio_context = bdrv_get_aio_context(bs);
2530ed78cda3SStefan Hajnoczi 
2531ed78cda3SStefan Hajnoczi         aio_context_acquire(aio_context);
2532760e0063SKevin Wolf         if (bs->drv && bs->backing) {
2533e8877497SStefan Hajnoczi             int ret = bdrv_commit(bs);
2534e8877497SStefan Hajnoczi             if (ret < 0) {
2535ed78cda3SStefan Hajnoczi                 aio_context_release(aio_context);
2536e8877497SStefan Hajnoczi                 return ret;
25376ab4b5abSMarkus Armbruster             }
25386ab4b5abSMarkus Armbruster         }
2539ed78cda3SStefan Hajnoczi         aio_context_release(aio_context);
2540272d2d8eSJeff Cody     }
2541e8877497SStefan Hajnoczi     return 0;
2542e8877497SStefan Hajnoczi }
25436ab4b5abSMarkus Armbruster 
2544756e6736SKevin Wolf /*
2545756e6736SKevin Wolf  * Return values:
2546756e6736SKevin Wolf  * 0        - success
2547756e6736SKevin Wolf  * -EINVAL  - backing format specified, but no file
2548756e6736SKevin Wolf  * -ENOSPC  - can't update the backing file because no space is left in the
2549756e6736SKevin Wolf  *            image file header
2550756e6736SKevin Wolf  * -ENOTSUP - format driver doesn't support changing the backing file
2551756e6736SKevin Wolf  */
2552756e6736SKevin Wolf int bdrv_change_backing_file(BlockDriverState *bs,
2553756e6736SKevin Wolf     const char *backing_file, const char *backing_fmt)
2554756e6736SKevin Wolf {
2555756e6736SKevin Wolf     BlockDriver *drv = bs->drv;
2556469ef350SPaolo Bonzini     int ret;
2557756e6736SKevin Wolf 
25585f377794SPaolo Bonzini     /* Backing file format doesn't make sense without a backing file */
25595f377794SPaolo Bonzini     if (backing_fmt && !backing_file) {
25605f377794SPaolo Bonzini         return -EINVAL;
25615f377794SPaolo Bonzini     }
25625f377794SPaolo Bonzini 
2563756e6736SKevin Wolf     if (drv->bdrv_change_backing_file != NULL) {
2564469ef350SPaolo Bonzini         ret = drv->bdrv_change_backing_file(bs, backing_file, backing_fmt);
2565756e6736SKevin Wolf     } else {
2566469ef350SPaolo Bonzini         ret = -ENOTSUP;
2567756e6736SKevin Wolf     }
2568469ef350SPaolo Bonzini 
2569469ef350SPaolo Bonzini     if (ret == 0) {
2570469ef350SPaolo Bonzini         pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_file ?: "");
2571469ef350SPaolo Bonzini         pstrcpy(bs->backing_format, sizeof(bs->backing_format), backing_fmt ?: "");
2572469ef350SPaolo Bonzini     }
2573469ef350SPaolo Bonzini     return ret;
2574756e6736SKevin Wolf }
2575756e6736SKevin Wolf 
25766ebdcee2SJeff Cody /*
25776ebdcee2SJeff Cody  * Finds the image layer in the chain that has 'bs' as its backing file.
25786ebdcee2SJeff Cody  *
25796ebdcee2SJeff Cody  * active is the current topmost image.
25806ebdcee2SJeff Cody  *
25816ebdcee2SJeff Cody  * Returns NULL if bs is not found in active's image chain,
25826ebdcee2SJeff Cody  * or if active == bs.
25834caf0fcdSJeff Cody  *
25844caf0fcdSJeff Cody  * Returns the bottommost base image if bs == NULL.
25856ebdcee2SJeff Cody  */
25866ebdcee2SJeff Cody BlockDriverState *bdrv_find_overlay(BlockDriverState *active,
25876ebdcee2SJeff Cody                                     BlockDriverState *bs)
25886ebdcee2SJeff Cody {
2589760e0063SKevin Wolf     while (active && bs != backing_bs(active)) {
2590760e0063SKevin Wolf         active = backing_bs(active);
25916ebdcee2SJeff Cody     }
25926ebdcee2SJeff Cody 
25934caf0fcdSJeff Cody     return active;
25946ebdcee2SJeff Cody }
25956ebdcee2SJeff Cody 
25964caf0fcdSJeff Cody /* Given a BDS, searches for the base layer. */
25974caf0fcdSJeff Cody BlockDriverState *bdrv_find_base(BlockDriverState *bs)
25984caf0fcdSJeff Cody {
25994caf0fcdSJeff Cody     return bdrv_find_overlay(bs, NULL);
26006ebdcee2SJeff Cody }
26016ebdcee2SJeff Cody 
26026ebdcee2SJeff Cody /*
26036ebdcee2SJeff Cody  * Drops images above 'base' up to and including 'top', and sets the image
26046ebdcee2SJeff Cody  * above 'top' to have base as its backing file.
26056ebdcee2SJeff Cody  *
26066ebdcee2SJeff Cody  * Requires that the overlay to 'top' is opened r/w, so that the backing file
26076ebdcee2SJeff Cody  * information in 'bs' can be properly updated.
26086ebdcee2SJeff Cody  *
26096ebdcee2SJeff Cody  * E.g., this will convert the following chain:
26106ebdcee2SJeff Cody  * bottom <- base <- intermediate <- top <- active
26116ebdcee2SJeff Cody  *
26126ebdcee2SJeff Cody  * to
26136ebdcee2SJeff Cody  *
26146ebdcee2SJeff Cody  * bottom <- base <- active
26156ebdcee2SJeff Cody  *
26166ebdcee2SJeff Cody  * It is allowed for bottom==base, in which case it converts:
26176ebdcee2SJeff Cody  *
26186ebdcee2SJeff Cody  * base <- intermediate <- top <- active
26196ebdcee2SJeff Cody  *
26206ebdcee2SJeff Cody  * to
26216ebdcee2SJeff Cody  *
26226ebdcee2SJeff Cody  * base <- active
26236ebdcee2SJeff Cody  *
262454e26900SJeff Cody  * If backing_file_str is non-NULL, it will be used when modifying top's
262554e26900SJeff Cody  * overlay image metadata.
262654e26900SJeff Cody  *
26276ebdcee2SJeff Cody  * Error conditions:
26286ebdcee2SJeff Cody  *  if active == top, that is considered an error
26296ebdcee2SJeff Cody  *
26306ebdcee2SJeff Cody  */
26316ebdcee2SJeff Cody int bdrv_drop_intermediate(BlockDriverState *active, BlockDriverState *top,
263254e26900SJeff Cody                            BlockDriverState *base, const char *backing_file_str)
26336ebdcee2SJeff Cody {
26346ebdcee2SJeff Cody     BlockDriverState *new_top_bs = NULL;
26356ebdcee2SJeff Cody     int ret = -EIO;
26366ebdcee2SJeff Cody 
26376ebdcee2SJeff Cody     if (!top->drv || !base->drv) {
26386ebdcee2SJeff Cody         goto exit;
26396ebdcee2SJeff Cody     }
26406ebdcee2SJeff Cody 
26416ebdcee2SJeff Cody     new_top_bs = bdrv_find_overlay(active, top);
26426ebdcee2SJeff Cody 
26436ebdcee2SJeff Cody     if (new_top_bs == NULL) {
26446ebdcee2SJeff Cody         /* we could not find the image above 'top', this is an error */
26456ebdcee2SJeff Cody         goto exit;
26466ebdcee2SJeff Cody     }
26476ebdcee2SJeff Cody 
2648760e0063SKevin Wolf     /* special case of new_top_bs->backing->bs already pointing to base - nothing
26496ebdcee2SJeff Cody      * to do, no intermediate images */
2650760e0063SKevin Wolf     if (backing_bs(new_top_bs) == base) {
26516ebdcee2SJeff Cody         ret = 0;
26526ebdcee2SJeff Cody         goto exit;
26536ebdcee2SJeff Cody     }
26546ebdcee2SJeff Cody 
26555db15a57SKevin Wolf     /* Make sure that base is in the backing chain of top */
26565db15a57SKevin Wolf     if (!bdrv_chain_contains(top, base)) {
26576ebdcee2SJeff Cody         goto exit;
26586ebdcee2SJeff Cody     }
26596ebdcee2SJeff Cody 
26606ebdcee2SJeff Cody     /* success - we can delete the intermediate states, and link top->base */
26615db15a57SKevin Wolf     backing_file_str = backing_file_str ? backing_file_str : base->filename;
266254e26900SJeff Cody     ret = bdrv_change_backing_file(new_top_bs, backing_file_str,
26635db15a57SKevin Wolf                                    base->drv ? base->drv->format_name : "");
26646ebdcee2SJeff Cody     if (ret) {
26656ebdcee2SJeff Cody         goto exit;
26666ebdcee2SJeff Cody     }
26675db15a57SKevin Wolf     bdrv_set_backing_hd(new_top_bs, base);
26686ebdcee2SJeff Cody 
26696ebdcee2SJeff Cody     ret = 0;
26706ebdcee2SJeff Cody exit:
26716ebdcee2SJeff Cody     return ret;
26726ebdcee2SJeff Cody }
26736ebdcee2SJeff Cody 
267483f64091Sbellard /**
267583f64091Sbellard  * Truncate file to 'offset' bytes (needed only for file protocols)
267683f64091Sbellard  */
267783f64091Sbellard int bdrv_truncate(BlockDriverState *bs, int64_t offset)
267883f64091Sbellard {
267983f64091Sbellard     BlockDriver *drv = bs->drv;
268051762288SStefan Hajnoczi     int ret;
268183f64091Sbellard     if (!drv)
268219cb3738Sbellard         return -ENOMEDIUM;
268383f64091Sbellard     if (!drv->bdrv_truncate)
268483f64091Sbellard         return -ENOTSUP;
268559f2689dSNaphtali Sprei     if (bs->read_only)
268659f2689dSNaphtali Sprei         return -EACCES;
26879c75e168SJeff Cody 
268851762288SStefan Hajnoczi     ret = drv->bdrv_truncate(bs, offset);
268951762288SStefan Hajnoczi     if (ret == 0) {
269051762288SStefan Hajnoczi         ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS);
2691ce1ffea8SJohn Snow         bdrv_dirty_bitmap_truncate(bs);
2692a7f53e26SMarkus Armbruster         if (bs->blk) {
2693a7f53e26SMarkus Armbruster             blk_dev_resize_cb(bs->blk);
2694a7f53e26SMarkus Armbruster         }
269551762288SStefan Hajnoczi     }
269651762288SStefan Hajnoczi     return ret;
269783f64091Sbellard }
269883f64091Sbellard 
269983f64091Sbellard /**
27004a1d5e1fSFam Zheng  * Length of a allocated file in bytes. Sparse files are counted by actual
27014a1d5e1fSFam Zheng  * allocated space. Return < 0 if error or unknown.
27024a1d5e1fSFam Zheng  */
27034a1d5e1fSFam Zheng int64_t bdrv_get_allocated_file_size(BlockDriverState *bs)
27044a1d5e1fSFam Zheng {
27054a1d5e1fSFam Zheng     BlockDriver *drv = bs->drv;
27064a1d5e1fSFam Zheng     if (!drv) {
27074a1d5e1fSFam Zheng         return -ENOMEDIUM;
27084a1d5e1fSFam Zheng     }
27094a1d5e1fSFam Zheng     if (drv->bdrv_get_allocated_file_size) {
27104a1d5e1fSFam Zheng         return drv->bdrv_get_allocated_file_size(bs);
27114a1d5e1fSFam Zheng     }
27124a1d5e1fSFam Zheng     if (bs->file) {
27139a4f4c31SKevin Wolf         return bdrv_get_allocated_file_size(bs->file->bs);
27144a1d5e1fSFam Zheng     }
27154a1d5e1fSFam Zheng     return -ENOTSUP;
27164a1d5e1fSFam Zheng }
27174a1d5e1fSFam Zheng 
27184a1d5e1fSFam Zheng /**
271965a9bb25SMarkus Armbruster  * Return number of sectors on success, -errno on error.
272083f64091Sbellard  */
272165a9bb25SMarkus Armbruster int64_t bdrv_nb_sectors(BlockDriverState *bs)
272283f64091Sbellard {
272383f64091Sbellard     BlockDriver *drv = bs->drv;
272465a9bb25SMarkus Armbruster 
272583f64091Sbellard     if (!drv)
272619cb3738Sbellard         return -ENOMEDIUM;
272751762288SStefan Hajnoczi 
2728b94a2610SKevin Wolf     if (drv->has_variable_length) {
2729b94a2610SKevin Wolf         int ret = refresh_total_sectors(bs, bs->total_sectors);
2730b94a2610SKevin Wolf         if (ret < 0) {
2731b94a2610SKevin Wolf             return ret;
2732fc01f7e7Sbellard         }
273346a4e4e6SStefan Hajnoczi     }
273465a9bb25SMarkus Armbruster     return bs->total_sectors;
273565a9bb25SMarkus Armbruster }
273665a9bb25SMarkus Armbruster 
273765a9bb25SMarkus Armbruster /**
273865a9bb25SMarkus Armbruster  * Return length in bytes on success, -errno on error.
273965a9bb25SMarkus Armbruster  * The length is always a multiple of BDRV_SECTOR_SIZE.
274065a9bb25SMarkus Armbruster  */
274165a9bb25SMarkus Armbruster int64_t bdrv_getlength(BlockDriverState *bs)
274265a9bb25SMarkus Armbruster {
274365a9bb25SMarkus Armbruster     int64_t ret = bdrv_nb_sectors(bs);
274465a9bb25SMarkus Armbruster 
27454a9c9ea0SFam Zheng     ret = ret > INT64_MAX / BDRV_SECTOR_SIZE ? -EFBIG : ret;
274665a9bb25SMarkus Armbruster     return ret < 0 ? ret : ret * BDRV_SECTOR_SIZE;
274746a4e4e6SStefan Hajnoczi }
2748fc01f7e7Sbellard 
274919cb3738Sbellard /* return 0 as number of sectors if no device present or error */
275096b8f136Sths void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
2751fc01f7e7Sbellard {
275265a9bb25SMarkus Armbruster     int64_t nb_sectors = bdrv_nb_sectors(bs);
275365a9bb25SMarkus Armbruster 
275465a9bb25SMarkus Armbruster     *nb_sectors_ptr = nb_sectors < 0 ? 0 : nb_sectors;
2755fc01f7e7Sbellard }
2756cf98951bSbellard 
2757b338082bSbellard int bdrv_is_read_only(BlockDriverState *bs)
2758b338082bSbellard {
2759b338082bSbellard     return bs->read_only;
2760b338082bSbellard }
2761b338082bSbellard 
2762985a03b0Sths int bdrv_is_sg(BlockDriverState *bs)
2763985a03b0Sths {
2764985a03b0Sths     return bs->sg;
2765985a03b0Sths }
2766985a03b0Sths 
2767e900a7b7SChristoph Hellwig int bdrv_enable_write_cache(BlockDriverState *bs)
2768e900a7b7SChristoph Hellwig {
2769e900a7b7SChristoph Hellwig     return bs->enable_write_cache;
2770e900a7b7SChristoph Hellwig }
2771e900a7b7SChristoph Hellwig 
2772425b0148SPaolo Bonzini void bdrv_set_enable_write_cache(BlockDriverState *bs, bool wce)
2773425b0148SPaolo Bonzini {
2774425b0148SPaolo Bonzini     bs->enable_write_cache = wce;
277555b110f2SJeff Cody 
277655b110f2SJeff Cody     /* so a reopen() will preserve wce */
277755b110f2SJeff Cody     if (wce) {
277855b110f2SJeff Cody         bs->open_flags |= BDRV_O_CACHE_WB;
277955b110f2SJeff Cody     } else {
278055b110f2SJeff Cody         bs->open_flags &= ~BDRV_O_CACHE_WB;
278155b110f2SJeff Cody     }
2782425b0148SPaolo Bonzini }
2783425b0148SPaolo Bonzini 
2784ea2384d3Sbellard int bdrv_is_encrypted(BlockDriverState *bs)
2785ea2384d3Sbellard {
2786760e0063SKevin Wolf     if (bs->backing && bs->backing->bs->encrypted) {
2787ea2384d3Sbellard         return 1;
2788760e0063SKevin Wolf     }
2789ea2384d3Sbellard     return bs->encrypted;
2790ea2384d3Sbellard }
2791ea2384d3Sbellard 
2792c0f4ce77Saliguori int bdrv_key_required(BlockDriverState *bs)
2793c0f4ce77Saliguori {
2794760e0063SKevin Wolf     BdrvChild *backing = bs->backing;
2795c0f4ce77Saliguori 
2796760e0063SKevin Wolf     if (backing && backing->bs->encrypted && !backing->bs->valid_key) {
2797c0f4ce77Saliguori         return 1;
2798760e0063SKevin Wolf     }
2799c0f4ce77Saliguori     return (bs->encrypted && !bs->valid_key);
2800c0f4ce77Saliguori }
2801c0f4ce77Saliguori 
2802ea2384d3Sbellard int bdrv_set_key(BlockDriverState *bs, const char *key)
2803ea2384d3Sbellard {
2804ea2384d3Sbellard     int ret;
2805760e0063SKevin Wolf     if (bs->backing && bs->backing->bs->encrypted) {
2806760e0063SKevin Wolf         ret = bdrv_set_key(bs->backing->bs, key);
2807ea2384d3Sbellard         if (ret < 0)
2808ea2384d3Sbellard             return ret;
2809ea2384d3Sbellard         if (!bs->encrypted)
2810ea2384d3Sbellard             return 0;
2811ea2384d3Sbellard     }
2812fd04a2aeSShahar Havivi     if (!bs->encrypted) {
2813fd04a2aeSShahar Havivi         return -EINVAL;
2814fd04a2aeSShahar Havivi     } else if (!bs->drv || !bs->drv->bdrv_set_key) {
2815fd04a2aeSShahar Havivi         return -ENOMEDIUM;
2816fd04a2aeSShahar Havivi     }
2817c0f4ce77Saliguori     ret = bs->drv->bdrv_set_key(bs, key);
2818bb5fc20fSaliguori     if (ret < 0) {
2819bb5fc20fSaliguori         bs->valid_key = 0;
2820bb5fc20fSaliguori     } else if (!bs->valid_key) {
2821bb5fc20fSaliguori         bs->valid_key = 1;
2822a7f53e26SMarkus Armbruster         if (bs->blk) {
2823bb5fc20fSaliguori             /* call the change callback now, we skipped it on open */
2824a7f53e26SMarkus Armbruster             blk_dev_change_media_cb(bs->blk, true);
2825a7f53e26SMarkus Armbruster         }
2826bb5fc20fSaliguori     }
2827c0f4ce77Saliguori     return ret;
2828ea2384d3Sbellard }
2829ea2384d3Sbellard 
28304d2855a3SMarkus Armbruster /*
28314d2855a3SMarkus Armbruster  * Provide an encryption key for @bs.
28324d2855a3SMarkus Armbruster  * If @key is non-null:
28334d2855a3SMarkus Armbruster  *     If @bs is not encrypted, fail.
28344d2855a3SMarkus Armbruster  *     Else if the key is invalid, fail.
28354d2855a3SMarkus Armbruster  *     Else set @bs's key to @key, replacing the existing key, if any.
28364d2855a3SMarkus Armbruster  * If @key is null:
28374d2855a3SMarkus Armbruster  *     If @bs is encrypted and still lacks a key, fail.
28384d2855a3SMarkus Armbruster  *     Else do nothing.
28394d2855a3SMarkus Armbruster  * On failure, store an error object through @errp if non-null.
28404d2855a3SMarkus Armbruster  */
28414d2855a3SMarkus Armbruster void bdrv_add_key(BlockDriverState *bs, const char *key, Error **errp)
28424d2855a3SMarkus Armbruster {
28434d2855a3SMarkus Armbruster     if (key) {
28444d2855a3SMarkus Armbruster         if (!bdrv_is_encrypted(bs)) {
284581e5f78aSAlberto Garcia             error_setg(errp, "Node '%s' is not encrypted",
284681e5f78aSAlberto Garcia                       bdrv_get_device_or_node_name(bs));
28474d2855a3SMarkus Armbruster         } else if (bdrv_set_key(bs, key) < 0) {
2848c6bd8c70SMarkus Armbruster             error_setg(errp, QERR_INVALID_PASSWORD);
28494d2855a3SMarkus Armbruster         }
28504d2855a3SMarkus Armbruster     } else {
28514d2855a3SMarkus Armbruster         if (bdrv_key_required(bs)) {
2852b1ca6391SMarkus Armbruster             error_set(errp, ERROR_CLASS_DEVICE_ENCRYPTED,
2853b1ca6391SMarkus Armbruster                       "'%s' (%s) is encrypted",
285481e5f78aSAlberto Garcia                       bdrv_get_device_or_node_name(bs),
28554d2855a3SMarkus Armbruster                       bdrv_get_encrypted_filename(bs));
28564d2855a3SMarkus Armbruster         }
28574d2855a3SMarkus Armbruster     }
28584d2855a3SMarkus Armbruster }
28594d2855a3SMarkus Armbruster 
2860f8d6bba1SMarkus Armbruster const char *bdrv_get_format_name(BlockDriverState *bs)
2861ea2384d3Sbellard {
2862f8d6bba1SMarkus Armbruster     return bs->drv ? bs->drv->format_name : NULL;
2863ea2384d3Sbellard }
2864ea2384d3Sbellard 
/*
 * qsort() comparison function for an array of C string pointers.
 *
 * qsort() passes pointers to the array elements, so for an array of
 * 'const char *' both arguments are really 'const char *const *' and have to
 * be dereferenced once before the strings can be compared. Handing them to
 * strcmp() directly would compare the bytes of the pointers instead.
 */
static int qsort_strcmp(const void *a, const void *b)
{
    const char *const *lhs = a;
    const char *const *rhs = b;

    return strcmp(*lhs, *rhs);
}
2869ada42401SStefan Hajnoczi 
2870ea2384d3Sbellard void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
2871ea2384d3Sbellard                          void *opaque)
2872ea2384d3Sbellard {
2873ea2384d3Sbellard     BlockDriver *drv;
2874e855e4fbSJeff Cody     int count = 0;
2875ada42401SStefan Hajnoczi     int i;
2876e855e4fbSJeff Cody     const char **formats = NULL;
2877ea2384d3Sbellard 
28788a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv, &bdrv_drivers, list) {
2879e855e4fbSJeff Cody         if (drv->format_name) {
2880e855e4fbSJeff Cody             bool found = false;
2881e855e4fbSJeff Cody             int i = count;
2882e855e4fbSJeff Cody             while (formats && i && !found) {
2883e855e4fbSJeff Cody                 found = !strcmp(formats[--i], drv->format_name);
2884e855e4fbSJeff Cody             }
2885e855e4fbSJeff Cody 
2886e855e4fbSJeff Cody             if (!found) {
28875839e53bSMarkus Armbruster                 formats = g_renew(const char *, formats, count + 1);
2888e855e4fbSJeff Cody                 formats[count++] = drv->format_name;
2889ea2384d3Sbellard             }
2890ea2384d3Sbellard         }
2891e855e4fbSJeff Cody     }
2892ada42401SStefan Hajnoczi 
2893ada42401SStefan Hajnoczi     qsort(formats, count, sizeof(formats[0]), qsort_strcmp);
2894ada42401SStefan Hajnoczi 
2895ada42401SStefan Hajnoczi     for (i = 0; i < count; i++) {
2896ada42401SStefan Hajnoczi         it(opaque, formats[i]);
2897ada42401SStefan Hajnoczi     }
2898ada42401SStefan Hajnoczi 
2899e855e4fbSJeff Cody     g_free(formats);
2900e855e4fbSJeff Cody }
2901ea2384d3Sbellard 
2902dc364f4cSBenoît Canet /* This function is to find a node in the bs graph */
2903dc364f4cSBenoît Canet BlockDriverState *bdrv_find_node(const char *node_name)
2904dc364f4cSBenoît Canet {
2905dc364f4cSBenoît Canet     BlockDriverState *bs;
2906dc364f4cSBenoît Canet 
2907dc364f4cSBenoît Canet     assert(node_name);
2908dc364f4cSBenoît Canet 
2909dc364f4cSBenoît Canet     QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2910dc364f4cSBenoît Canet         if (!strcmp(node_name, bs->node_name)) {
2911dc364f4cSBenoît Canet             return bs;
2912dc364f4cSBenoît Canet         }
2913dc364f4cSBenoît Canet     }
2914dc364f4cSBenoît Canet     return NULL;
2915dc364f4cSBenoît Canet }
2916dc364f4cSBenoît Canet 
2917c13163fbSBenoît Canet /* Put this QMP function here so it can access the static graph_bdrv_states. */
2918d5a8ee60SAlberto Garcia BlockDeviceInfoList *bdrv_named_nodes_list(Error **errp)
2919c13163fbSBenoît Canet {
2920c13163fbSBenoît Canet     BlockDeviceInfoList *list, *entry;
2921c13163fbSBenoît Canet     BlockDriverState *bs;
2922c13163fbSBenoît Canet 
2923c13163fbSBenoît Canet     list = NULL;
2924c13163fbSBenoît Canet     QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2925d5a8ee60SAlberto Garcia         BlockDeviceInfo *info = bdrv_block_device_info(bs, errp);
2926d5a8ee60SAlberto Garcia         if (!info) {
2927d5a8ee60SAlberto Garcia             qapi_free_BlockDeviceInfoList(list);
2928d5a8ee60SAlberto Garcia             return NULL;
2929d5a8ee60SAlberto Garcia         }
2930c13163fbSBenoît Canet         entry = g_malloc0(sizeof(*entry));
2931d5a8ee60SAlberto Garcia         entry->value = info;
2932c13163fbSBenoît Canet         entry->next = list;
2933c13163fbSBenoît Canet         list = entry;
2934c13163fbSBenoît Canet     }
2935c13163fbSBenoît Canet 
2936c13163fbSBenoît Canet     return list;
2937c13163fbSBenoît Canet }
2938c13163fbSBenoît Canet 
293912d3ba82SBenoît Canet BlockDriverState *bdrv_lookup_bs(const char *device,
294012d3ba82SBenoît Canet                                  const char *node_name,
294112d3ba82SBenoît Canet                                  Error **errp)
294212d3ba82SBenoît Canet {
29437f06d47eSMarkus Armbruster     BlockBackend *blk;
29447f06d47eSMarkus Armbruster     BlockDriverState *bs;
294512d3ba82SBenoît Canet 
294612d3ba82SBenoît Canet     if (device) {
29477f06d47eSMarkus Armbruster         blk = blk_by_name(device);
294812d3ba82SBenoît Canet 
29497f06d47eSMarkus Armbruster         if (blk) {
29509f4ed6fbSAlberto Garcia             bs = blk_bs(blk);
29519f4ed6fbSAlberto Garcia             if (!bs) {
29525433c24fSMax Reitz                 error_setg(errp, "Device '%s' has no medium", device);
29535433c24fSMax Reitz             }
29545433c24fSMax Reitz 
29559f4ed6fbSAlberto Garcia             return bs;
295612d3ba82SBenoît Canet         }
2957dd67fa50SBenoît Canet     }
295812d3ba82SBenoît Canet 
2959dd67fa50SBenoît Canet     if (node_name) {
296012d3ba82SBenoît Canet         bs = bdrv_find_node(node_name);
296112d3ba82SBenoît Canet 
2962dd67fa50SBenoît Canet         if (bs) {
2963dd67fa50SBenoît Canet             return bs;
2964dd67fa50SBenoît Canet         }
296512d3ba82SBenoît Canet     }
296612d3ba82SBenoît Canet 
2967dd67fa50SBenoît Canet     error_setg(errp, "Cannot find device=%s nor node_name=%s",
2968dd67fa50SBenoît Canet                      device ? device : "",
2969dd67fa50SBenoît Canet                      node_name ? node_name : "");
2970dd67fa50SBenoît Canet     return NULL;
297112d3ba82SBenoît Canet }
297212d3ba82SBenoît Canet 
29735a6684d2SJeff Cody /* If 'base' is in the same chain as 'top', return true. Otherwise,
29745a6684d2SJeff Cody  * return false.  If either argument is NULL, return false. */
29755a6684d2SJeff Cody bool bdrv_chain_contains(BlockDriverState *top, BlockDriverState *base)
29765a6684d2SJeff Cody {
29775a6684d2SJeff Cody     while (top && top != base) {
2978760e0063SKevin Wolf         top = backing_bs(top);
29795a6684d2SJeff Cody     }
29805a6684d2SJeff Cody 
29815a6684d2SJeff Cody     return top != NULL;
29825a6684d2SJeff Cody }
29835a6684d2SJeff Cody 
298404df765aSFam Zheng BlockDriverState *bdrv_next_node(BlockDriverState *bs)
298504df765aSFam Zheng {
298604df765aSFam Zheng     if (!bs) {
298704df765aSFam Zheng         return QTAILQ_FIRST(&graph_bdrv_states);
298804df765aSFam Zheng     }
298904df765aSFam Zheng     return QTAILQ_NEXT(bs, node_list);
299004df765aSFam Zheng }
299104df765aSFam Zheng 
29922f399b0aSMarkus Armbruster BlockDriverState *bdrv_next(BlockDriverState *bs)
29932f399b0aSMarkus Armbruster {
29942f399b0aSMarkus Armbruster     if (!bs) {
29952f399b0aSMarkus Armbruster         return QTAILQ_FIRST(&bdrv_states);
29962f399b0aSMarkus Armbruster     }
2997dc364f4cSBenoît Canet     return QTAILQ_NEXT(bs, device_list);
29982f399b0aSMarkus Armbruster }
29992f399b0aSMarkus Armbruster 
300020a9e77dSFam Zheng const char *bdrv_get_node_name(const BlockDriverState *bs)
300120a9e77dSFam Zheng {
300220a9e77dSFam Zheng     return bs->node_name;
300320a9e77dSFam Zheng }
300420a9e77dSFam Zheng 
30057f06d47eSMarkus Armbruster /* TODO check what callers really want: bs->node_name or blk_name() */
3006bfb197e0SMarkus Armbruster const char *bdrv_get_device_name(const BlockDriverState *bs)
3007ea2384d3Sbellard {
3008bfb197e0SMarkus Armbruster     return bs->blk ? blk_name(bs->blk) : "";
3009ea2384d3Sbellard }
3010ea2384d3Sbellard 
30119b2aa84fSAlberto Garcia /* This can be used to identify nodes that might not have a device
30129b2aa84fSAlberto Garcia  * name associated. Since node and device names live in the same
30139b2aa84fSAlberto Garcia  * namespace, the result is unambiguous. The exception is if both are
30149b2aa84fSAlberto Garcia  * absent, then this returns an empty (non-null) string. */
30159b2aa84fSAlberto Garcia const char *bdrv_get_device_or_node_name(const BlockDriverState *bs)
30169b2aa84fSAlberto Garcia {
30179b2aa84fSAlberto Garcia     return bs->blk ? blk_name(bs->blk) : bs->node_name;
30189b2aa84fSAlberto Garcia }
30199b2aa84fSAlberto Garcia 
3020c8433287SMarkus Armbruster int bdrv_get_flags(BlockDriverState *bs)
3021c8433287SMarkus Armbruster {
3022c8433287SMarkus Armbruster     return bs->open_flags;
3023c8433287SMarkus Armbruster }
3024c8433287SMarkus Armbruster 
30253ac21627SPeter Lieven int bdrv_has_zero_init_1(BlockDriverState *bs)
30263ac21627SPeter Lieven {
30273ac21627SPeter Lieven     return 1;
30283ac21627SPeter Lieven }
30293ac21627SPeter Lieven 
3030f2feebbdSKevin Wolf int bdrv_has_zero_init(BlockDriverState *bs)
3031f2feebbdSKevin Wolf {
3032f2feebbdSKevin Wolf     assert(bs->drv);
3033f2feebbdSKevin Wolf 
303411212d8fSPaolo Bonzini     /* If BS is a copy on write image, it is initialized to
303511212d8fSPaolo Bonzini        the contents of the base image, which may not be zeroes.  */
3036760e0063SKevin Wolf     if (bs->backing) {
303711212d8fSPaolo Bonzini         return 0;
303811212d8fSPaolo Bonzini     }
3039336c1c12SKevin Wolf     if (bs->drv->bdrv_has_zero_init) {
3040336c1c12SKevin Wolf         return bs->drv->bdrv_has_zero_init(bs);
3041f2feebbdSKevin Wolf     }
3042f2feebbdSKevin Wolf 
30433ac21627SPeter Lieven     /* safe default */
30443ac21627SPeter Lieven     return 0;
3045f2feebbdSKevin Wolf }
3046f2feebbdSKevin Wolf 
30474ce78691SPeter Lieven bool bdrv_unallocated_blocks_are_zero(BlockDriverState *bs)
30484ce78691SPeter Lieven {
30494ce78691SPeter Lieven     BlockDriverInfo bdi;
30504ce78691SPeter Lieven 
3051760e0063SKevin Wolf     if (bs->backing) {
30524ce78691SPeter Lieven         return false;
30534ce78691SPeter Lieven     }
30544ce78691SPeter Lieven 
30554ce78691SPeter Lieven     if (bdrv_get_info(bs, &bdi) == 0) {
30564ce78691SPeter Lieven         return bdi.unallocated_blocks_are_zero;
30574ce78691SPeter Lieven     }
30584ce78691SPeter Lieven 
30594ce78691SPeter Lieven     return false;
30604ce78691SPeter Lieven }
30614ce78691SPeter Lieven 
30624ce78691SPeter Lieven bool bdrv_can_write_zeroes_with_unmap(BlockDriverState *bs)
30634ce78691SPeter Lieven {
30644ce78691SPeter Lieven     BlockDriverInfo bdi;
30654ce78691SPeter Lieven 
3066760e0063SKevin Wolf     if (bs->backing || !(bs->open_flags & BDRV_O_UNMAP)) {
30674ce78691SPeter Lieven         return false;
30684ce78691SPeter Lieven     }
30694ce78691SPeter Lieven 
30704ce78691SPeter Lieven     if (bdrv_get_info(bs, &bdi) == 0) {
30714ce78691SPeter Lieven         return bdi.can_write_zeroes_with_unmap;
30724ce78691SPeter Lieven     }
30734ce78691SPeter Lieven 
30744ce78691SPeter Lieven     return false;
30754ce78691SPeter Lieven }
30764ce78691SPeter Lieven 
3077045df330Saliguori const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
3078045df330Saliguori {
3079760e0063SKevin Wolf     if (bs->backing && bs->backing->bs->encrypted)
3080045df330Saliguori         return bs->backing_file;
3081045df330Saliguori     else if (bs->encrypted)
3082045df330Saliguori         return bs->filename;
3083045df330Saliguori     else
3084045df330Saliguori         return NULL;
3085045df330Saliguori }
3086045df330Saliguori 
308783f64091Sbellard void bdrv_get_backing_filename(BlockDriverState *bs,
308883f64091Sbellard                                char *filename, int filename_size)
308983f64091Sbellard {
309083f64091Sbellard     pstrcpy(filename, filename_size, bs->backing_file);
309183f64091Sbellard }
309283f64091Sbellard 
3093faea38e7Sbellard int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
3094faea38e7Sbellard {
3095faea38e7Sbellard     BlockDriver *drv = bs->drv;
3096faea38e7Sbellard     if (!drv)
309719cb3738Sbellard         return -ENOMEDIUM;
3098faea38e7Sbellard     if (!drv->bdrv_get_info)
3099faea38e7Sbellard         return -ENOTSUP;
3100faea38e7Sbellard     memset(bdi, 0, sizeof(*bdi));
3101faea38e7Sbellard     return drv->bdrv_get_info(bs, bdi);
3102faea38e7Sbellard }
3103faea38e7Sbellard 
3104eae041feSMax Reitz ImageInfoSpecific *bdrv_get_specific_info(BlockDriverState *bs)
3105eae041feSMax Reitz {
3106eae041feSMax Reitz     BlockDriver *drv = bs->drv;
3107eae041feSMax Reitz     if (drv && drv->bdrv_get_specific_info) {
3108eae041feSMax Reitz         return drv->bdrv_get_specific_info(bs);
3109eae041feSMax Reitz     }
3110eae041feSMax Reitz     return NULL;
3111eae041feSMax Reitz }
3112eae041feSMax Reitz 
3113a31939e6SEric Blake void bdrv_debug_event(BlockDriverState *bs, BlkdebugEvent event)
31148b9b0cc2SKevin Wolf {
3115bf736fe3SKevin Wolf     if (!bs || !bs->drv || !bs->drv->bdrv_debug_event) {
31168b9b0cc2SKevin Wolf         return;
31178b9b0cc2SKevin Wolf     }
31188b9b0cc2SKevin Wolf 
3119bf736fe3SKevin Wolf     bs->drv->bdrv_debug_event(bs, event);
312041c695c7SKevin Wolf }
31218b9b0cc2SKevin Wolf 
312241c695c7SKevin Wolf int bdrv_debug_breakpoint(BlockDriverState *bs, const char *event,
312341c695c7SKevin Wolf                           const char *tag)
312441c695c7SKevin Wolf {
312541c695c7SKevin Wolf     while (bs && bs->drv && !bs->drv->bdrv_debug_breakpoint) {
31269a4f4c31SKevin Wolf         bs = bs->file ? bs->file->bs : NULL;
312741c695c7SKevin Wolf     }
312841c695c7SKevin Wolf 
312941c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_breakpoint) {
313041c695c7SKevin Wolf         return bs->drv->bdrv_debug_breakpoint(bs, event, tag);
313141c695c7SKevin Wolf     }
313241c695c7SKevin Wolf 
313341c695c7SKevin Wolf     return -ENOTSUP;
313441c695c7SKevin Wolf }
313541c695c7SKevin Wolf 
31364cc70e93SFam Zheng int bdrv_debug_remove_breakpoint(BlockDriverState *bs, const char *tag)
31374cc70e93SFam Zheng {
31384cc70e93SFam Zheng     while (bs && bs->drv && !bs->drv->bdrv_debug_remove_breakpoint) {
31399a4f4c31SKevin Wolf         bs = bs->file ? bs->file->bs : NULL;
31404cc70e93SFam Zheng     }
31414cc70e93SFam Zheng 
31424cc70e93SFam Zheng     if (bs && bs->drv && bs->drv->bdrv_debug_remove_breakpoint) {
31434cc70e93SFam Zheng         return bs->drv->bdrv_debug_remove_breakpoint(bs, tag);
31444cc70e93SFam Zheng     }
31454cc70e93SFam Zheng 
31464cc70e93SFam Zheng     return -ENOTSUP;
31474cc70e93SFam Zheng }
31484cc70e93SFam Zheng 
314941c695c7SKevin Wolf int bdrv_debug_resume(BlockDriverState *bs, const char *tag)
315041c695c7SKevin Wolf {
3151938789eaSMax Reitz     while (bs && (!bs->drv || !bs->drv->bdrv_debug_resume)) {
31529a4f4c31SKevin Wolf         bs = bs->file ? bs->file->bs : NULL;
315341c695c7SKevin Wolf     }
315441c695c7SKevin Wolf 
315541c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_resume) {
315641c695c7SKevin Wolf         return bs->drv->bdrv_debug_resume(bs, tag);
315741c695c7SKevin Wolf     }
315841c695c7SKevin Wolf 
315941c695c7SKevin Wolf     return -ENOTSUP;
316041c695c7SKevin Wolf }
316141c695c7SKevin Wolf 
316241c695c7SKevin Wolf bool bdrv_debug_is_suspended(BlockDriverState *bs, const char *tag)
316341c695c7SKevin Wolf {
316441c695c7SKevin Wolf     while (bs && bs->drv && !bs->drv->bdrv_debug_is_suspended) {
31659a4f4c31SKevin Wolf         bs = bs->file ? bs->file->bs : NULL;
316641c695c7SKevin Wolf     }
316741c695c7SKevin Wolf 
316841c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_is_suspended) {
316941c695c7SKevin Wolf         return bs->drv->bdrv_debug_is_suspended(bs, tag);
317041c695c7SKevin Wolf     }
317141c695c7SKevin Wolf 
317241c695c7SKevin Wolf     return false;
31738b9b0cc2SKevin Wolf }
31748b9b0cc2SKevin Wolf 
3175199630b6SBlue Swirl int bdrv_is_snapshot(BlockDriverState *bs)
3176199630b6SBlue Swirl {
3177199630b6SBlue Swirl     return !!(bs->open_flags & BDRV_O_SNAPSHOT);
3178199630b6SBlue Swirl }
3179199630b6SBlue Swirl 
3180b1b1d783SJeff Cody /* backing_file can either be relative, or absolute, or a protocol.  If it is
3181b1b1d783SJeff Cody  * relative, it must be relative to the chain.  So, passing in bs->filename
3182b1b1d783SJeff Cody  * from a BDS as backing_file should not be done, as that may be relative to
3183b1b1d783SJeff Cody  * the CWD rather than the chain. */
3184e8a6bb9cSMarcelo Tosatti BlockDriverState *bdrv_find_backing_image(BlockDriverState *bs,
3185e8a6bb9cSMarcelo Tosatti         const char *backing_file)
3186e8a6bb9cSMarcelo Tosatti {
3187b1b1d783SJeff Cody     char *filename_full = NULL;
3188b1b1d783SJeff Cody     char *backing_file_full = NULL;
3189b1b1d783SJeff Cody     char *filename_tmp = NULL;
3190b1b1d783SJeff Cody     int is_protocol = 0;
3191b1b1d783SJeff Cody     BlockDriverState *curr_bs = NULL;
3192b1b1d783SJeff Cody     BlockDriverState *retval = NULL;
3193b1b1d783SJeff Cody 
3194b1b1d783SJeff Cody     if (!bs || !bs->drv || !backing_file) {
3195e8a6bb9cSMarcelo Tosatti         return NULL;
3196e8a6bb9cSMarcelo Tosatti     }
3197e8a6bb9cSMarcelo Tosatti 
3198b1b1d783SJeff Cody     filename_full     = g_malloc(PATH_MAX);
3199b1b1d783SJeff Cody     backing_file_full = g_malloc(PATH_MAX);
3200b1b1d783SJeff Cody     filename_tmp      = g_malloc(PATH_MAX);
3201b1b1d783SJeff Cody 
3202b1b1d783SJeff Cody     is_protocol = path_has_protocol(backing_file);
3203b1b1d783SJeff Cody 
3204760e0063SKevin Wolf     for (curr_bs = bs; curr_bs->backing; curr_bs = curr_bs->backing->bs) {
3205b1b1d783SJeff Cody 
3206b1b1d783SJeff Cody         /* If either of the filename paths is actually a protocol, then
3207b1b1d783SJeff Cody          * compare unmodified paths; otherwise make paths relative */
3208b1b1d783SJeff Cody         if (is_protocol || path_has_protocol(curr_bs->backing_file)) {
3209b1b1d783SJeff Cody             if (strcmp(backing_file, curr_bs->backing_file) == 0) {
3210760e0063SKevin Wolf                 retval = curr_bs->backing->bs;
3211b1b1d783SJeff Cody                 break;
3212b1b1d783SJeff Cody             }
3213e8a6bb9cSMarcelo Tosatti         } else {
3214b1b1d783SJeff Cody             /* If not an absolute filename path, make it relative to the current
3215b1b1d783SJeff Cody              * image's filename path */
3216b1b1d783SJeff Cody             path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3217b1b1d783SJeff Cody                          backing_file);
3218b1b1d783SJeff Cody 
3219b1b1d783SJeff Cody             /* We are going to compare absolute pathnames */
3220b1b1d783SJeff Cody             if (!realpath(filename_tmp, filename_full)) {
3221b1b1d783SJeff Cody                 continue;
3222b1b1d783SJeff Cody             }
3223b1b1d783SJeff Cody 
3224b1b1d783SJeff Cody             /* We need to make sure the backing filename we are comparing against
3225b1b1d783SJeff Cody              * is relative to the current image filename (or absolute) */
3226b1b1d783SJeff Cody             path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3227b1b1d783SJeff Cody                          curr_bs->backing_file);
3228b1b1d783SJeff Cody 
3229b1b1d783SJeff Cody             if (!realpath(filename_tmp, backing_file_full)) {
3230b1b1d783SJeff Cody                 continue;
3231b1b1d783SJeff Cody             }
3232b1b1d783SJeff Cody 
3233b1b1d783SJeff Cody             if (strcmp(backing_file_full, filename_full) == 0) {
3234760e0063SKevin Wolf                 retval = curr_bs->backing->bs;
3235b1b1d783SJeff Cody                 break;
3236b1b1d783SJeff Cody             }
3237e8a6bb9cSMarcelo Tosatti         }
3238e8a6bb9cSMarcelo Tosatti     }
3239e8a6bb9cSMarcelo Tosatti 
3240b1b1d783SJeff Cody     g_free(filename_full);
3241b1b1d783SJeff Cody     g_free(backing_file_full);
3242b1b1d783SJeff Cody     g_free(filename_tmp);
3243b1b1d783SJeff Cody     return retval;
3244e8a6bb9cSMarcelo Tosatti }
3245e8a6bb9cSMarcelo Tosatti 
3246f198fd1cSBenoît Canet int bdrv_get_backing_file_depth(BlockDriverState *bs)
3247f198fd1cSBenoît Canet {
3248f198fd1cSBenoît Canet     if (!bs->drv) {
3249f198fd1cSBenoît Canet         return 0;
3250f198fd1cSBenoît Canet     }
3251f198fd1cSBenoît Canet 
3252760e0063SKevin Wolf     if (!bs->backing) {
3253f198fd1cSBenoît Canet         return 0;
3254f198fd1cSBenoît Canet     }
3255f198fd1cSBenoît Canet 
3256760e0063SKevin Wolf     return 1 + bdrv_get_backing_file_depth(bs->backing->bs);
3257f198fd1cSBenoît Canet }
3258f198fd1cSBenoît Canet 
3259ea2384d3Sbellard void bdrv_init(void)
3260ea2384d3Sbellard {
32615efa9d5aSAnthony Liguori     module_call_init(MODULE_INIT_BLOCK);
3262ea2384d3Sbellard }
3263ce1a14dcSpbrook 
3264eb852011SMarkus Armbruster void bdrv_init_with_whitelist(void)
3265eb852011SMarkus Armbruster {
3266eb852011SMarkus Armbruster     use_bdrv_whitelist = 1;
3267eb852011SMarkus Armbruster     bdrv_init();
3268eb852011SMarkus Armbruster }
3269eb852011SMarkus Armbruster 
32705a8a30dbSKevin Wolf void bdrv_invalidate_cache(BlockDriverState *bs, Error **errp)
32710f15423cSAnthony Liguori {
32725a8a30dbSKevin Wolf     Error *local_err = NULL;
32735a8a30dbSKevin Wolf     int ret;
32745a8a30dbSKevin Wolf 
32753456a8d1SKevin Wolf     if (!bs->drv)  {
32763456a8d1SKevin Wolf         return;
32770f15423cSAnthony Liguori     }
32783456a8d1SKevin Wolf 
327904c01a5cSKevin Wolf     if (!(bs->open_flags & BDRV_O_INACTIVE)) {
32807ea2d269SAlexey Kardashevskiy         return;
32817ea2d269SAlexey Kardashevskiy     }
328204c01a5cSKevin Wolf     bs->open_flags &= ~BDRV_O_INACTIVE;
32837ea2d269SAlexey Kardashevskiy 
32843456a8d1SKevin Wolf     if (bs->drv->bdrv_invalidate_cache) {
32855a8a30dbSKevin Wolf         bs->drv->bdrv_invalidate_cache(bs, &local_err);
32863456a8d1SKevin Wolf     } else if (bs->file) {
32879a4f4c31SKevin Wolf         bdrv_invalidate_cache(bs->file->bs, &local_err);
32885a8a30dbSKevin Wolf     }
32895a8a30dbSKevin Wolf     if (local_err) {
329004c01a5cSKevin Wolf         bs->open_flags |= BDRV_O_INACTIVE;
32915a8a30dbSKevin Wolf         error_propagate(errp, local_err);
32925a8a30dbSKevin Wolf         return;
32933456a8d1SKevin Wolf     }
32943456a8d1SKevin Wolf 
32955a8a30dbSKevin Wolf     ret = refresh_total_sectors(bs, bs->total_sectors);
32965a8a30dbSKevin Wolf     if (ret < 0) {
329704c01a5cSKevin Wolf         bs->open_flags |= BDRV_O_INACTIVE;
32985a8a30dbSKevin Wolf         error_setg_errno(errp, -ret, "Could not refresh total sector count");
32995a8a30dbSKevin Wolf         return;
33005a8a30dbSKevin Wolf     }
33010f15423cSAnthony Liguori }
33020f15423cSAnthony Liguori 
33035a8a30dbSKevin Wolf void bdrv_invalidate_cache_all(Error **errp)
33040f15423cSAnthony Liguori {
33050f15423cSAnthony Liguori     BlockDriverState *bs;
33065a8a30dbSKevin Wolf     Error *local_err = NULL;
33070f15423cSAnthony Liguori 
3308dc364f4cSBenoît Canet     QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
3309ed78cda3SStefan Hajnoczi         AioContext *aio_context = bdrv_get_aio_context(bs);
3310ed78cda3SStefan Hajnoczi 
3311ed78cda3SStefan Hajnoczi         aio_context_acquire(aio_context);
33125a8a30dbSKevin Wolf         bdrv_invalidate_cache(bs, &local_err);
3313ed78cda3SStefan Hajnoczi         aio_context_release(aio_context);
33145a8a30dbSKevin Wolf         if (local_err) {
33155a8a30dbSKevin Wolf             error_propagate(errp, local_err);
33165a8a30dbSKevin Wolf             return;
33175a8a30dbSKevin Wolf         }
33180f15423cSAnthony Liguori     }
33190f15423cSAnthony Liguori }
33200f15423cSAnthony Liguori 
332176b1c7feSKevin Wolf static int bdrv_inactivate(BlockDriverState *bs)
332276b1c7feSKevin Wolf {
332376b1c7feSKevin Wolf     int ret;
332476b1c7feSKevin Wolf 
332576b1c7feSKevin Wolf     if (bs->drv->bdrv_inactivate) {
332676b1c7feSKevin Wolf         ret = bs->drv->bdrv_inactivate(bs);
332776b1c7feSKevin Wolf         if (ret < 0) {
332876b1c7feSKevin Wolf             return ret;
332976b1c7feSKevin Wolf         }
333076b1c7feSKevin Wolf     }
333176b1c7feSKevin Wolf 
333276b1c7feSKevin Wolf     bs->open_flags |= BDRV_O_INACTIVE;
333376b1c7feSKevin Wolf     return 0;
333476b1c7feSKevin Wolf }
333576b1c7feSKevin Wolf 
333676b1c7feSKevin Wolf int bdrv_inactivate_all(void)
333776b1c7feSKevin Wolf {
333876b1c7feSKevin Wolf     BlockDriverState *bs;
333976b1c7feSKevin Wolf     int ret;
334076b1c7feSKevin Wolf 
334176b1c7feSKevin Wolf     QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
334276b1c7feSKevin Wolf         AioContext *aio_context = bdrv_get_aio_context(bs);
334376b1c7feSKevin Wolf 
334476b1c7feSKevin Wolf         aio_context_acquire(aio_context);
334576b1c7feSKevin Wolf         ret = bdrv_inactivate(bs);
334676b1c7feSKevin Wolf         aio_context_release(aio_context);
334776b1c7feSKevin Wolf         if (ret < 0) {
334876b1c7feSKevin Wolf             return ret;
334976b1c7feSKevin Wolf         }
335076b1c7feSKevin Wolf     }
335176b1c7feSKevin Wolf 
335276b1c7feSKevin Wolf     return 0;
335376b1c7feSKevin Wolf }
335476b1c7feSKevin Wolf 
3355f9f05dc5SKevin Wolf /**************************************************************/
335619cb3738Sbellard /* removable device support */
335719cb3738Sbellard 
335819cb3738Sbellard /**
335919cb3738Sbellard  * Return TRUE if the media is present
336019cb3738Sbellard  */
3361e031f750SMax Reitz bool bdrv_is_inserted(BlockDriverState *bs)
336219cb3738Sbellard {
336319cb3738Sbellard     BlockDriver *drv = bs->drv;
336428d7a789SMax Reitz     BdrvChild *child;
3365a1aff5bfSMarkus Armbruster 
3366e031f750SMax Reitz     if (!drv) {
3367e031f750SMax Reitz         return false;
3368e031f750SMax Reitz     }
336928d7a789SMax Reitz     if (drv->bdrv_is_inserted) {
3370a1aff5bfSMarkus Armbruster         return drv->bdrv_is_inserted(bs);
337119cb3738Sbellard     }
337228d7a789SMax Reitz     QLIST_FOREACH(child, &bs->children, next) {
337328d7a789SMax Reitz         if (!bdrv_is_inserted(child->bs)) {
337428d7a789SMax Reitz             return false;
337528d7a789SMax Reitz         }
337628d7a789SMax Reitz     }
337728d7a789SMax Reitz     return true;
337828d7a789SMax Reitz }
337919cb3738Sbellard 
338019cb3738Sbellard /**
33818e49ca46SMarkus Armbruster  * Return whether the media changed since the last call to this
33828e49ca46SMarkus Armbruster  * function, or -ENOTSUP if we don't know.  Most drivers don't know.
338319cb3738Sbellard  */
338419cb3738Sbellard int bdrv_media_changed(BlockDriverState *bs)
338519cb3738Sbellard {
338619cb3738Sbellard     BlockDriver *drv = bs->drv;
338719cb3738Sbellard 
33888e49ca46SMarkus Armbruster     if (drv && drv->bdrv_media_changed) {
33898e49ca46SMarkus Armbruster         return drv->bdrv_media_changed(bs);
33908e49ca46SMarkus Armbruster     }
33918e49ca46SMarkus Armbruster     return -ENOTSUP;
339219cb3738Sbellard }
339319cb3738Sbellard 
339419cb3738Sbellard /**
339519cb3738Sbellard  * If eject_flag is TRUE, eject the media. Otherwise, close the tray
339619cb3738Sbellard  */
3397f36f3949SLuiz Capitulino void bdrv_eject(BlockDriverState *bs, bool eject_flag)
339819cb3738Sbellard {
339919cb3738Sbellard     BlockDriver *drv = bs->drv;
3400bfb197e0SMarkus Armbruster     const char *device_name;
340119cb3738Sbellard 
3402822e1cd1SMarkus Armbruster     if (drv && drv->bdrv_eject) {
3403822e1cd1SMarkus Armbruster         drv->bdrv_eject(bs, eject_flag);
340419cb3738Sbellard     }
34056f382ed2SLuiz Capitulino 
3406bfb197e0SMarkus Armbruster     device_name = bdrv_get_device_name(bs);
3407bfb197e0SMarkus Armbruster     if (device_name[0] != '\0') {
3408bfb197e0SMarkus Armbruster         qapi_event_send_device_tray_moved(device_name,
3409a5ee7bd4SWenchao Xia                                           eject_flag, &error_abort);
34106f382ed2SLuiz Capitulino     }
341119cb3738Sbellard }
341219cb3738Sbellard 
341319cb3738Sbellard /**
341419cb3738Sbellard  * Lock or unlock the media (if it is locked, the user won't be able
341519cb3738Sbellard  * to eject it manually).
341619cb3738Sbellard  */
3417025e849aSMarkus Armbruster void bdrv_lock_medium(BlockDriverState *bs, bool locked)
341819cb3738Sbellard {
341919cb3738Sbellard     BlockDriver *drv = bs->drv;
342019cb3738Sbellard 
3421025e849aSMarkus Armbruster     trace_bdrv_lock_medium(bs, locked);
3422b8c6d095SStefan Hajnoczi 
3423025e849aSMarkus Armbruster     if (drv && drv->bdrv_lock_medium) {
3424025e849aSMarkus Armbruster         drv->bdrv_lock_medium(bs, locked);
342519cb3738Sbellard     }
342619cb3738Sbellard }
3427985a03b0Sths 
34289fcb0251SFam Zheng /* Get a reference to bs */
34299fcb0251SFam Zheng void bdrv_ref(BlockDriverState *bs)
34309fcb0251SFam Zheng {
34319fcb0251SFam Zheng     bs->refcnt++;
34329fcb0251SFam Zheng }
34339fcb0251SFam Zheng 
34349fcb0251SFam Zheng /* Release a previously grabbed reference to bs.
34359fcb0251SFam Zheng  * If after releasing, reference count is zero, the BlockDriverState is
34369fcb0251SFam Zheng  * deleted. */
34379fcb0251SFam Zheng void bdrv_unref(BlockDriverState *bs)
34389fcb0251SFam Zheng {
34399a4d5ca6SJeff Cody     if (!bs) {
34409a4d5ca6SJeff Cody         return;
34419a4d5ca6SJeff Cody     }
34429fcb0251SFam Zheng     assert(bs->refcnt > 0);
34439fcb0251SFam Zheng     if (--bs->refcnt == 0) {
34449fcb0251SFam Zheng         bdrv_delete(bs);
34459fcb0251SFam Zheng     }
34469fcb0251SFam Zheng }
34479fcb0251SFam Zheng 
3448fbe40ff7SFam Zheng struct BdrvOpBlocker {
3449fbe40ff7SFam Zheng     Error *reason;
3450fbe40ff7SFam Zheng     QLIST_ENTRY(BdrvOpBlocker) list;
3451fbe40ff7SFam Zheng };
3452fbe40ff7SFam Zheng 
3453fbe40ff7SFam Zheng bool bdrv_op_is_blocked(BlockDriverState *bs, BlockOpType op, Error **errp)
3454fbe40ff7SFam Zheng {
3455fbe40ff7SFam Zheng     BdrvOpBlocker *blocker;
3456fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3457fbe40ff7SFam Zheng     if (!QLIST_EMPTY(&bs->op_blockers[op])) {
3458fbe40ff7SFam Zheng         blocker = QLIST_FIRST(&bs->op_blockers[op]);
3459fbe40ff7SFam Zheng         if (errp) {
3460e43bfd9cSMarkus Armbruster             *errp = error_copy(blocker->reason);
3461e43bfd9cSMarkus Armbruster             error_prepend(errp, "Node '%s' is busy: ",
3462e43bfd9cSMarkus Armbruster                           bdrv_get_device_or_node_name(bs));
3463fbe40ff7SFam Zheng         }
3464fbe40ff7SFam Zheng         return true;
3465fbe40ff7SFam Zheng     }
3466fbe40ff7SFam Zheng     return false;
3467fbe40ff7SFam Zheng }
3468fbe40ff7SFam Zheng 
3469fbe40ff7SFam Zheng void bdrv_op_block(BlockDriverState *bs, BlockOpType op, Error *reason)
3470fbe40ff7SFam Zheng {
3471fbe40ff7SFam Zheng     BdrvOpBlocker *blocker;
3472fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3473fbe40ff7SFam Zheng 
34745839e53bSMarkus Armbruster     blocker = g_new0(BdrvOpBlocker, 1);
3475fbe40ff7SFam Zheng     blocker->reason = reason;
3476fbe40ff7SFam Zheng     QLIST_INSERT_HEAD(&bs->op_blockers[op], blocker, list);
3477fbe40ff7SFam Zheng }
3478fbe40ff7SFam Zheng 
3479fbe40ff7SFam Zheng void bdrv_op_unblock(BlockDriverState *bs, BlockOpType op, Error *reason)
3480fbe40ff7SFam Zheng {
3481fbe40ff7SFam Zheng     BdrvOpBlocker *blocker, *next;
3482fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3483fbe40ff7SFam Zheng     QLIST_FOREACH_SAFE(blocker, &bs->op_blockers[op], list, next) {
3484fbe40ff7SFam Zheng         if (blocker->reason == reason) {
3485fbe40ff7SFam Zheng             QLIST_REMOVE(blocker, list);
3486fbe40ff7SFam Zheng             g_free(blocker);
3487fbe40ff7SFam Zheng         }
3488fbe40ff7SFam Zheng     }
3489fbe40ff7SFam Zheng }
3490fbe40ff7SFam Zheng 
3491fbe40ff7SFam Zheng void bdrv_op_block_all(BlockDriverState *bs, Error *reason)
3492fbe40ff7SFam Zheng {
3493fbe40ff7SFam Zheng     int i;
3494fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3495fbe40ff7SFam Zheng         bdrv_op_block(bs, i, reason);
3496fbe40ff7SFam Zheng     }
3497fbe40ff7SFam Zheng }
3498fbe40ff7SFam Zheng 
3499fbe40ff7SFam Zheng void bdrv_op_unblock_all(BlockDriverState *bs, Error *reason)
3500fbe40ff7SFam Zheng {
3501fbe40ff7SFam Zheng     int i;
3502fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3503fbe40ff7SFam Zheng         bdrv_op_unblock(bs, i, reason);
3504fbe40ff7SFam Zheng     }
3505fbe40ff7SFam Zheng }
3506fbe40ff7SFam Zheng 
3507fbe40ff7SFam Zheng bool bdrv_op_blocker_is_empty(BlockDriverState *bs)
3508fbe40ff7SFam Zheng {
3509fbe40ff7SFam Zheng     int i;
3510fbe40ff7SFam Zheng 
3511fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3512fbe40ff7SFam Zheng         if (!QLIST_EMPTY(&bs->op_blockers[i])) {
3513fbe40ff7SFam Zheng             return false;
3514fbe40ff7SFam Zheng         }
3515fbe40ff7SFam Zheng     }
3516fbe40ff7SFam Zheng     return true;
3517fbe40ff7SFam Zheng }
3518fbe40ff7SFam Zheng 
3519d92ada22SLuiz Capitulino void bdrv_img_create(const char *filename, const char *fmt,
3520f88e1a42SJes Sorensen                      const char *base_filename, const char *base_fmt,
3521f382d43aSMiroslav Rezanina                      char *options, uint64_t img_size, int flags,
3522f382d43aSMiroslav Rezanina                      Error **errp, bool quiet)
3523f88e1a42SJes Sorensen {
352483d0521aSChunyan Liu     QemuOptsList *create_opts = NULL;
352583d0521aSChunyan Liu     QemuOpts *opts = NULL;
352683d0521aSChunyan Liu     const char *backing_fmt, *backing_file;
352783d0521aSChunyan Liu     int64_t size;
3528f88e1a42SJes Sorensen     BlockDriver *drv, *proto_drv;
3529cc84d90fSMax Reitz     Error *local_err = NULL;
3530f88e1a42SJes Sorensen     int ret = 0;
3531f88e1a42SJes Sorensen 
3532f88e1a42SJes Sorensen     /* Find driver and parse its options */
3533f88e1a42SJes Sorensen     drv = bdrv_find_format(fmt);
3534f88e1a42SJes Sorensen     if (!drv) {
353571c79813SLuiz Capitulino         error_setg(errp, "Unknown file format '%s'", fmt);
3536d92ada22SLuiz Capitulino         return;
3537f88e1a42SJes Sorensen     }
3538f88e1a42SJes Sorensen 
3539b65a5e12SMax Reitz     proto_drv = bdrv_find_protocol(filename, true, errp);
3540f88e1a42SJes Sorensen     if (!proto_drv) {
3541d92ada22SLuiz Capitulino         return;
3542f88e1a42SJes Sorensen     }
3543f88e1a42SJes Sorensen 
3544c6149724SMax Reitz     if (!drv->create_opts) {
3545c6149724SMax Reitz         error_setg(errp, "Format driver '%s' does not support image creation",
3546c6149724SMax Reitz                    drv->format_name);
3547c6149724SMax Reitz         return;
3548c6149724SMax Reitz     }
3549c6149724SMax Reitz 
3550c6149724SMax Reitz     if (!proto_drv->create_opts) {
3551c6149724SMax Reitz         error_setg(errp, "Protocol driver '%s' does not support image creation",
3552c6149724SMax Reitz                    proto_drv->format_name);
3553c6149724SMax Reitz         return;
3554c6149724SMax Reitz     }
3555c6149724SMax Reitz 
3556c282e1fdSChunyan Liu     create_opts = qemu_opts_append(create_opts, drv->create_opts);
3557c282e1fdSChunyan Liu     create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
3558f88e1a42SJes Sorensen 
3559f88e1a42SJes Sorensen     /* Create parameter list with default values */
356083d0521aSChunyan Liu     opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
356139101f25SMarkus Armbruster     qemu_opt_set_number(opts, BLOCK_OPT_SIZE, img_size, &error_abort);
3562f88e1a42SJes Sorensen 
3563f88e1a42SJes Sorensen     /* Parse -o options */
3564f88e1a42SJes Sorensen     if (options) {
3565dc523cd3SMarkus Armbruster         qemu_opts_do_parse(opts, options, NULL, &local_err);
3566dc523cd3SMarkus Armbruster         if (local_err) {
3567dc523cd3SMarkus Armbruster             error_report_err(local_err);
3568dc523cd3SMarkus Armbruster             local_err = NULL;
356983d0521aSChunyan Liu             error_setg(errp, "Invalid options for file format '%s'", fmt);
3570f88e1a42SJes Sorensen             goto out;
3571f88e1a42SJes Sorensen         }
3572f88e1a42SJes Sorensen     }
3573f88e1a42SJes Sorensen 
3574f88e1a42SJes Sorensen     if (base_filename) {
3575f43e47dbSMarkus Armbruster         qemu_opt_set(opts, BLOCK_OPT_BACKING_FILE, base_filename, &local_err);
35766be4194bSMarkus Armbruster         if (local_err) {
357771c79813SLuiz Capitulino             error_setg(errp, "Backing file not supported for file format '%s'",
357871c79813SLuiz Capitulino                        fmt);
3579f88e1a42SJes Sorensen             goto out;
3580f88e1a42SJes Sorensen         }
3581f88e1a42SJes Sorensen     }
3582f88e1a42SJes Sorensen 
3583f88e1a42SJes Sorensen     if (base_fmt) {
3584f43e47dbSMarkus Armbruster         qemu_opt_set(opts, BLOCK_OPT_BACKING_FMT, base_fmt, &local_err);
35856be4194bSMarkus Armbruster         if (local_err) {
358671c79813SLuiz Capitulino             error_setg(errp, "Backing file format not supported for file "
358771c79813SLuiz Capitulino                              "format '%s'", fmt);
3588f88e1a42SJes Sorensen             goto out;
3589f88e1a42SJes Sorensen         }
3590f88e1a42SJes Sorensen     }
3591f88e1a42SJes Sorensen 
359283d0521aSChunyan Liu     backing_file = qemu_opt_get(opts, BLOCK_OPT_BACKING_FILE);
359383d0521aSChunyan Liu     if (backing_file) {
359483d0521aSChunyan Liu         if (!strcmp(filename, backing_file)) {
359571c79813SLuiz Capitulino             error_setg(errp, "Error: Trying to create an image with the "
359671c79813SLuiz Capitulino                              "same filename as the backing file");
3597792da93aSJes Sorensen             goto out;
3598792da93aSJes Sorensen         }
3599792da93aSJes Sorensen     }
3600792da93aSJes Sorensen 
360183d0521aSChunyan Liu     backing_fmt = qemu_opt_get(opts, BLOCK_OPT_BACKING_FMT);
3602f88e1a42SJes Sorensen 
3603f88e1a42SJes Sorensen     // The size for the image must always be specified, with one exception:
3604f88e1a42SJes Sorensen     // If we are using a backing file, we can obtain the size from there
360583d0521aSChunyan Liu     size = qemu_opt_get_size(opts, BLOCK_OPT_SIZE, 0);
360683d0521aSChunyan Liu     if (size == -1) {
360783d0521aSChunyan Liu         if (backing_file) {
360866f6b814SMax Reitz             BlockDriverState *bs;
360929168018SMax Reitz             char *full_backing = g_new0(char, PATH_MAX);
361052bf1e72SMarkus Armbruster             int64_t size;
361163090dacSPaolo Bonzini             int back_flags;
3612e6641719SMax Reitz             QDict *backing_options = NULL;
361363090dacSPaolo Bonzini 
361429168018SMax Reitz             bdrv_get_full_backing_filename_from_filename(filename, backing_file,
361529168018SMax Reitz                                                          full_backing, PATH_MAX,
361629168018SMax Reitz                                                          &local_err);
361729168018SMax Reitz             if (local_err) {
361829168018SMax Reitz                 g_free(full_backing);
361929168018SMax Reitz                 goto out;
362029168018SMax Reitz             }
362129168018SMax Reitz 
362263090dacSPaolo Bonzini             /* backing files always opened read-only */
362363090dacSPaolo Bonzini             back_flags =
362463090dacSPaolo Bonzini                 flags & ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
3625f88e1a42SJes Sorensen 
3626e6641719SMax Reitz             if (backing_fmt) {
3627e6641719SMax Reitz                 backing_options = qdict_new();
3628e6641719SMax Reitz                 qdict_put(backing_options, "driver",
3629e6641719SMax Reitz                           qstring_from_str(backing_fmt));
3630e6641719SMax Reitz             }
3631e6641719SMax Reitz 
3632f67503e5SMax Reitz             bs = NULL;
3633e6641719SMax Reitz             ret = bdrv_open(&bs, full_backing, NULL, backing_options,
36346ebf9aa2SMax Reitz                             back_flags, &local_err);
363529168018SMax Reitz             g_free(full_backing);
3636f88e1a42SJes Sorensen             if (ret < 0) {
3637f88e1a42SJes Sorensen                 goto out;
3638f88e1a42SJes Sorensen             }
363952bf1e72SMarkus Armbruster             size = bdrv_getlength(bs);
364052bf1e72SMarkus Armbruster             if (size < 0) {
364152bf1e72SMarkus Armbruster                 error_setg_errno(errp, -size, "Could not get size of '%s'",
364252bf1e72SMarkus Armbruster                                  backing_file);
364352bf1e72SMarkus Armbruster                 bdrv_unref(bs);
364452bf1e72SMarkus Armbruster                 goto out;
364552bf1e72SMarkus Armbruster             }
3646f88e1a42SJes Sorensen 
364739101f25SMarkus Armbruster             qemu_opt_set_number(opts, BLOCK_OPT_SIZE, size, &error_abort);
364866f6b814SMax Reitz 
364966f6b814SMax Reitz             bdrv_unref(bs);
3650f88e1a42SJes Sorensen         } else {
365171c79813SLuiz Capitulino             error_setg(errp, "Image creation needs a size parameter");
3652f88e1a42SJes Sorensen             goto out;
3653f88e1a42SJes Sorensen         }
3654f88e1a42SJes Sorensen     }
3655f88e1a42SJes Sorensen 
3656f382d43aSMiroslav Rezanina     if (!quiet) {
3657f88e1a42SJes Sorensen         printf("Formatting '%s', fmt=%s ", filename, fmt);
365843c5d8f8SFam Zheng         qemu_opts_print(opts, " ");
3659f88e1a42SJes Sorensen         puts("");
3660f382d43aSMiroslav Rezanina     }
366183d0521aSChunyan Liu 
3662c282e1fdSChunyan Liu     ret = bdrv_create(drv, filename, opts, &local_err);
366383d0521aSChunyan Liu 
3664cc84d90fSMax Reitz     if (ret == -EFBIG) {
3665cc84d90fSMax Reitz         /* This is generally a better message than whatever the driver would
3666cc84d90fSMax Reitz          * deliver (especially because of the cluster_size_hint), since that
3667cc84d90fSMax Reitz          * is most probably not much different from "image too large". */
3668f3f4d2c0SKevin Wolf         const char *cluster_size_hint = "";
366983d0521aSChunyan Liu         if (qemu_opt_get_size(opts, BLOCK_OPT_CLUSTER_SIZE, 0)) {
3670f3f4d2c0SKevin Wolf             cluster_size_hint = " (try using a larger cluster size)";
3671f3f4d2c0SKevin Wolf         }
3672cc84d90fSMax Reitz         error_setg(errp, "The image size is too large for file format '%s'"
3673cc84d90fSMax Reitz                    "%s", fmt, cluster_size_hint);
3674cc84d90fSMax Reitz         error_free(local_err);
3675cc84d90fSMax Reitz         local_err = NULL;
3676f88e1a42SJes Sorensen     }
3677f88e1a42SJes Sorensen 
3678f88e1a42SJes Sorensen out:
367983d0521aSChunyan Liu     qemu_opts_del(opts);
368083d0521aSChunyan Liu     qemu_opts_free(create_opts);
368184d18f06SMarkus Armbruster     if (local_err) {
3682cc84d90fSMax Reitz         error_propagate(errp, local_err);
3683cc84d90fSMax Reitz     }
3684f88e1a42SJes Sorensen }
368585d126f3SStefan Hajnoczi 
368685d126f3SStefan Hajnoczi AioContext *bdrv_get_aio_context(BlockDriverState *bs)
368785d126f3SStefan Hajnoczi {
3688dcd04228SStefan Hajnoczi     return bs->aio_context;
3689dcd04228SStefan Hajnoczi }
3690dcd04228SStefan Hajnoczi 
3691dcd04228SStefan Hajnoczi void bdrv_detach_aio_context(BlockDriverState *bs)
3692dcd04228SStefan Hajnoczi {
369333384421SMax Reitz     BdrvAioNotifier *baf;
369433384421SMax Reitz 
3695dcd04228SStefan Hajnoczi     if (!bs->drv) {
3696dcd04228SStefan Hajnoczi         return;
3697dcd04228SStefan Hajnoczi     }
3698dcd04228SStefan Hajnoczi 
369933384421SMax Reitz     QLIST_FOREACH(baf, &bs->aio_notifiers, list) {
370033384421SMax Reitz         baf->detach_aio_context(baf->opaque);
370133384421SMax Reitz     }
370233384421SMax Reitz 
3703a0d64a61SAlberto Garcia     if (bs->throttle_state) {
37040e5b0a2dSBenoît Canet         throttle_timers_detach_aio_context(&bs->throttle_timers);
370513af91ebSStefan Hajnoczi     }
3706dcd04228SStefan Hajnoczi     if (bs->drv->bdrv_detach_aio_context) {
3707dcd04228SStefan Hajnoczi         bs->drv->bdrv_detach_aio_context(bs);
3708dcd04228SStefan Hajnoczi     }
3709dcd04228SStefan Hajnoczi     if (bs->file) {
37109a4f4c31SKevin Wolf         bdrv_detach_aio_context(bs->file->bs);
3711dcd04228SStefan Hajnoczi     }
3712760e0063SKevin Wolf     if (bs->backing) {
3713760e0063SKevin Wolf         bdrv_detach_aio_context(bs->backing->bs);
3714dcd04228SStefan Hajnoczi     }
3715dcd04228SStefan Hajnoczi 
3716dcd04228SStefan Hajnoczi     bs->aio_context = NULL;
3717dcd04228SStefan Hajnoczi }
3718dcd04228SStefan Hajnoczi 
3719dcd04228SStefan Hajnoczi void bdrv_attach_aio_context(BlockDriverState *bs,
3720dcd04228SStefan Hajnoczi                              AioContext *new_context)
3721dcd04228SStefan Hajnoczi {
372233384421SMax Reitz     BdrvAioNotifier *ban;
372333384421SMax Reitz 
3724dcd04228SStefan Hajnoczi     if (!bs->drv) {
3725dcd04228SStefan Hajnoczi         return;
3726dcd04228SStefan Hajnoczi     }
3727dcd04228SStefan Hajnoczi 
3728dcd04228SStefan Hajnoczi     bs->aio_context = new_context;
3729dcd04228SStefan Hajnoczi 
3730760e0063SKevin Wolf     if (bs->backing) {
3731760e0063SKevin Wolf         bdrv_attach_aio_context(bs->backing->bs, new_context);
3732dcd04228SStefan Hajnoczi     }
3733dcd04228SStefan Hajnoczi     if (bs->file) {
37349a4f4c31SKevin Wolf         bdrv_attach_aio_context(bs->file->bs, new_context);
3735dcd04228SStefan Hajnoczi     }
3736dcd04228SStefan Hajnoczi     if (bs->drv->bdrv_attach_aio_context) {
3737dcd04228SStefan Hajnoczi         bs->drv->bdrv_attach_aio_context(bs, new_context);
3738dcd04228SStefan Hajnoczi     }
3739a0d64a61SAlberto Garcia     if (bs->throttle_state) {
37400e5b0a2dSBenoît Canet         throttle_timers_attach_aio_context(&bs->throttle_timers, new_context);
374113af91ebSStefan Hajnoczi     }
374233384421SMax Reitz 
374333384421SMax Reitz     QLIST_FOREACH(ban, &bs->aio_notifiers, list) {
374433384421SMax Reitz         ban->attached_aio_context(new_context, ban->opaque);
374533384421SMax Reitz     }
3746dcd04228SStefan Hajnoczi }
3747dcd04228SStefan Hajnoczi 
3748dcd04228SStefan Hajnoczi void bdrv_set_aio_context(BlockDriverState *bs, AioContext *new_context)
3749dcd04228SStefan Hajnoczi {
375053ec73e2SFam Zheng     bdrv_drain(bs); /* ensure there are no in-flight requests */
3751dcd04228SStefan Hajnoczi 
3752dcd04228SStefan Hajnoczi     bdrv_detach_aio_context(bs);
3753dcd04228SStefan Hajnoczi 
3754dcd04228SStefan Hajnoczi     /* This function executes in the old AioContext so acquire the new one in
3755dcd04228SStefan Hajnoczi      * case it runs in a different thread.
3756dcd04228SStefan Hajnoczi      */
3757dcd04228SStefan Hajnoczi     aio_context_acquire(new_context);
3758dcd04228SStefan Hajnoczi     bdrv_attach_aio_context(bs, new_context);
3759dcd04228SStefan Hajnoczi     aio_context_release(new_context);
376085d126f3SStefan Hajnoczi }
3761d616b224SStefan Hajnoczi 
376233384421SMax Reitz void bdrv_add_aio_context_notifier(BlockDriverState *bs,
376333384421SMax Reitz         void (*attached_aio_context)(AioContext *new_context, void *opaque),
376433384421SMax Reitz         void (*detach_aio_context)(void *opaque), void *opaque)
376533384421SMax Reitz {
376633384421SMax Reitz     BdrvAioNotifier *ban = g_new(BdrvAioNotifier, 1);
376733384421SMax Reitz     *ban = (BdrvAioNotifier){
376833384421SMax Reitz         .attached_aio_context = attached_aio_context,
376933384421SMax Reitz         .detach_aio_context   = detach_aio_context,
377033384421SMax Reitz         .opaque               = opaque
377133384421SMax Reitz     };
377233384421SMax Reitz 
377333384421SMax Reitz     QLIST_INSERT_HEAD(&bs->aio_notifiers, ban, list);
377433384421SMax Reitz }
377533384421SMax Reitz 
377633384421SMax Reitz void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
377733384421SMax Reitz                                       void (*attached_aio_context)(AioContext *,
377833384421SMax Reitz                                                                    void *),
377933384421SMax Reitz                                       void (*detach_aio_context)(void *),
378033384421SMax Reitz                                       void *opaque)
378133384421SMax Reitz {
378233384421SMax Reitz     BdrvAioNotifier *ban, *ban_next;
378333384421SMax Reitz 
378433384421SMax Reitz     QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
378533384421SMax Reitz         if (ban->attached_aio_context == attached_aio_context &&
378633384421SMax Reitz             ban->detach_aio_context   == detach_aio_context   &&
378733384421SMax Reitz             ban->opaque               == opaque)
378833384421SMax Reitz         {
378933384421SMax Reitz             QLIST_REMOVE(ban, list);
379033384421SMax Reitz             g_free(ban);
379133384421SMax Reitz 
379233384421SMax Reitz             return;
379333384421SMax Reitz         }
379433384421SMax Reitz     }
379533384421SMax Reitz 
379633384421SMax Reitz     abort();
379733384421SMax Reitz }
379833384421SMax Reitz 
379977485434SMax Reitz int bdrv_amend_options(BlockDriverState *bs, QemuOpts *opts,
38008b13976dSMax Reitz                        BlockDriverAmendStatusCB *status_cb, void *cb_opaque)
38016f176b48SMax Reitz {
3802c282e1fdSChunyan Liu     if (!bs->drv->bdrv_amend_options) {
38036f176b48SMax Reitz         return -ENOTSUP;
38046f176b48SMax Reitz     }
38058b13976dSMax Reitz     return bs->drv->bdrv_amend_options(bs, opts, status_cb, cb_opaque);
38066f176b48SMax Reitz }
3807f6186f49SBenoît Canet 
3808b5042a36SBenoît Canet /* This function will be called by the bdrv_recurse_is_first_non_filter method
3809b5042a36SBenoît Canet  * of block filter and by bdrv_is_first_non_filter.
3810b5042a36SBenoît Canet  * It is used to test if the given bs is the candidate or recurse more in the
3811b5042a36SBenoît Canet  * node graph.
3812212a5a8fSBenoît Canet  */
3813212a5a8fSBenoît Canet bool bdrv_recurse_is_first_non_filter(BlockDriverState *bs,
3814212a5a8fSBenoît Canet                                       BlockDriverState *candidate)
3815f6186f49SBenoît Canet {
3816b5042a36SBenoît Canet     /* return false if basic checks fails */
3817b5042a36SBenoît Canet     if (!bs || !bs->drv) {
3818b5042a36SBenoît Canet         return false;
3819b5042a36SBenoît Canet     }
3820b5042a36SBenoît Canet 
3821b5042a36SBenoît Canet     /* the code reached a non block filter driver -> check if the bs is
3822b5042a36SBenoît Canet      * the same as the candidate. It's the recursion termination condition.
3823b5042a36SBenoît Canet      */
3824b5042a36SBenoît Canet     if (!bs->drv->is_filter) {
3825b5042a36SBenoît Canet         return bs == candidate;
3826b5042a36SBenoît Canet     }
3827b5042a36SBenoît Canet     /* Down this path the driver is a block filter driver */
3828b5042a36SBenoît Canet 
3829b5042a36SBenoît Canet     /* If the block filter recursion method is defined use it to recurse down
3830b5042a36SBenoît Canet      * the node graph.
3831b5042a36SBenoît Canet      */
3832b5042a36SBenoît Canet     if (bs->drv->bdrv_recurse_is_first_non_filter) {
3833212a5a8fSBenoît Canet         return bs->drv->bdrv_recurse_is_first_non_filter(bs, candidate);
3834212a5a8fSBenoît Canet     }
3835212a5a8fSBenoît Canet 
3836b5042a36SBenoît Canet     /* the driver is a block filter but don't allow to recurse -> return false
3837b5042a36SBenoît Canet      */
3838b5042a36SBenoît Canet     return false;
3839212a5a8fSBenoît Canet }
3840212a5a8fSBenoît Canet 
3841212a5a8fSBenoît Canet /* This function checks if the candidate is the first non filter bs down it's
3842212a5a8fSBenoît Canet  * bs chain. Since we don't have pointers to parents it explore all bs chains
3843212a5a8fSBenoît Canet  * from the top. Some filters can choose not to pass down the recursion.
3844212a5a8fSBenoît Canet  */
3845212a5a8fSBenoît Canet bool bdrv_is_first_non_filter(BlockDriverState *candidate)
3846212a5a8fSBenoît Canet {
3847212a5a8fSBenoît Canet     BlockDriverState *bs;
3848212a5a8fSBenoît Canet 
3849212a5a8fSBenoît Canet     /* walk down the bs forest recursively */
3850212a5a8fSBenoît Canet     QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
3851212a5a8fSBenoît Canet         bool perm;
3852212a5a8fSBenoît Canet 
3853b5042a36SBenoît Canet         /* try to recurse in this top level bs */
3854e6dc8a1fSKevin Wolf         perm = bdrv_recurse_is_first_non_filter(bs, candidate);
3855212a5a8fSBenoît Canet 
3856212a5a8fSBenoît Canet         /* candidate is the first non filter */
3857212a5a8fSBenoît Canet         if (perm) {
3858212a5a8fSBenoît Canet             return true;
3859212a5a8fSBenoît Canet         }
3860212a5a8fSBenoît Canet     }
3861212a5a8fSBenoît Canet 
3862212a5a8fSBenoît Canet     return false;
3863f6186f49SBenoît Canet }
386409158f00SBenoît Canet 
3865e12f3784SWen Congyang BlockDriverState *check_to_replace_node(BlockDriverState *parent_bs,
3866e12f3784SWen Congyang                                         const char *node_name, Error **errp)
386709158f00SBenoît Canet {
386809158f00SBenoît Canet     BlockDriverState *to_replace_bs = bdrv_find_node(node_name);
38695a7e7a0bSStefan Hajnoczi     AioContext *aio_context;
38705a7e7a0bSStefan Hajnoczi 
387109158f00SBenoît Canet     if (!to_replace_bs) {
387209158f00SBenoît Canet         error_setg(errp, "Node name '%s' not found", node_name);
387309158f00SBenoît Canet         return NULL;
387409158f00SBenoît Canet     }
387509158f00SBenoît Canet 
38765a7e7a0bSStefan Hajnoczi     aio_context = bdrv_get_aio_context(to_replace_bs);
38775a7e7a0bSStefan Hajnoczi     aio_context_acquire(aio_context);
38785a7e7a0bSStefan Hajnoczi 
387909158f00SBenoît Canet     if (bdrv_op_is_blocked(to_replace_bs, BLOCK_OP_TYPE_REPLACE, errp)) {
38805a7e7a0bSStefan Hajnoczi         to_replace_bs = NULL;
38815a7e7a0bSStefan Hajnoczi         goto out;
388209158f00SBenoît Canet     }
388309158f00SBenoît Canet 
388409158f00SBenoît Canet     /* We don't want arbitrary node of the BDS chain to be replaced only the top
388509158f00SBenoît Canet      * most non filter in order to prevent data corruption.
388609158f00SBenoît Canet      * Another benefit is that this tests exclude backing files which are
388709158f00SBenoît Canet      * blocked by the backing blockers.
388809158f00SBenoît Canet      */
3889e12f3784SWen Congyang     if (!bdrv_recurse_is_first_non_filter(parent_bs, to_replace_bs)) {
389009158f00SBenoît Canet         error_setg(errp, "Only top most non filter can be replaced");
38915a7e7a0bSStefan Hajnoczi         to_replace_bs = NULL;
38925a7e7a0bSStefan Hajnoczi         goto out;
389309158f00SBenoît Canet     }
389409158f00SBenoît Canet 
38955a7e7a0bSStefan Hajnoczi out:
38965a7e7a0bSStefan Hajnoczi     aio_context_release(aio_context);
389709158f00SBenoît Canet     return to_replace_bs;
389809158f00SBenoît Canet }
3899448ad91dSMing Lei 
390091af7014SMax Reitz static bool append_open_options(QDict *d, BlockDriverState *bs)
390191af7014SMax Reitz {
390291af7014SMax Reitz     const QDictEntry *entry;
39039e700c1aSKevin Wolf     QemuOptDesc *desc;
3904260fecf1SKevin Wolf     BdrvChild *child;
390591af7014SMax Reitz     bool found_any = false;
3906260fecf1SKevin Wolf     const char *p;
390791af7014SMax Reitz 
390891af7014SMax Reitz     for (entry = qdict_first(bs->options); entry;
390991af7014SMax Reitz          entry = qdict_next(bs->options, entry))
391091af7014SMax Reitz     {
3911260fecf1SKevin Wolf         /* Exclude options for children */
3912260fecf1SKevin Wolf         QLIST_FOREACH(child, &bs->children, next) {
3913260fecf1SKevin Wolf             if (strstart(qdict_entry_key(entry), child->name, &p)
3914260fecf1SKevin Wolf                 && (!*p || *p == '.'))
3915260fecf1SKevin Wolf             {
3916260fecf1SKevin Wolf                 break;
3917260fecf1SKevin Wolf             }
3918260fecf1SKevin Wolf         }
3919260fecf1SKevin Wolf         if (child) {
39209e700c1aSKevin Wolf             continue;
39219e700c1aSKevin Wolf         }
39229e700c1aSKevin Wolf 
39239e700c1aSKevin Wolf         /* And exclude all non-driver-specific options */
39249e700c1aSKevin Wolf         for (desc = bdrv_runtime_opts.desc; desc->name; desc++) {
39259e700c1aSKevin Wolf             if (!strcmp(qdict_entry_key(entry), desc->name)) {
39269e700c1aSKevin Wolf                 break;
39279e700c1aSKevin Wolf             }
39289e700c1aSKevin Wolf         }
39299e700c1aSKevin Wolf         if (desc->name) {
39309e700c1aSKevin Wolf             continue;
39319e700c1aSKevin Wolf         }
39329e700c1aSKevin Wolf 
393391af7014SMax Reitz         qobject_incref(qdict_entry_value(entry));
393491af7014SMax Reitz         qdict_put_obj(d, qdict_entry_key(entry), qdict_entry_value(entry));
393591af7014SMax Reitz         found_any = true;
393691af7014SMax Reitz     }
393791af7014SMax Reitz 
393891af7014SMax Reitz     return found_any;
393991af7014SMax Reitz }
394091af7014SMax Reitz 
394191af7014SMax Reitz /* Updates the following BDS fields:
394291af7014SMax Reitz  *  - exact_filename: A filename which may be used for opening a block device
394391af7014SMax Reitz  *                    which (mostly) equals the given BDS (even without any
394491af7014SMax Reitz  *                    other options; so reading and writing must return the same
394591af7014SMax Reitz  *                    results, but caching etc. may be different)
394691af7014SMax Reitz  *  - full_open_options: Options which, when given when opening a block device
394791af7014SMax Reitz  *                       (without a filename), result in a BDS (mostly)
394891af7014SMax Reitz  *                       equalling the given one
394991af7014SMax Reitz  *  - filename: If exact_filename is set, it is copied here. Otherwise,
395091af7014SMax Reitz  *              full_open_options is converted to a JSON object, prefixed with
395191af7014SMax Reitz  *              "json:" (for use through the JSON pseudo protocol) and put here.
395291af7014SMax Reitz  */
395391af7014SMax Reitz void bdrv_refresh_filename(BlockDriverState *bs)
395491af7014SMax Reitz {
395591af7014SMax Reitz     BlockDriver *drv = bs->drv;
395691af7014SMax Reitz     QDict *opts;
395791af7014SMax Reitz 
395891af7014SMax Reitz     if (!drv) {
395991af7014SMax Reitz         return;
396091af7014SMax Reitz     }
396191af7014SMax Reitz 
396291af7014SMax Reitz     /* This BDS's file name will most probably depend on its file's name, so
396391af7014SMax Reitz      * refresh that first */
396491af7014SMax Reitz     if (bs->file) {
39659a4f4c31SKevin Wolf         bdrv_refresh_filename(bs->file->bs);
396691af7014SMax Reitz     }
396791af7014SMax Reitz 
396891af7014SMax Reitz     if (drv->bdrv_refresh_filename) {
396991af7014SMax Reitz         /* Obsolete information is of no use here, so drop the old file name
397091af7014SMax Reitz          * information before refreshing it */
397191af7014SMax Reitz         bs->exact_filename[0] = '\0';
397291af7014SMax Reitz         if (bs->full_open_options) {
397391af7014SMax Reitz             QDECREF(bs->full_open_options);
397491af7014SMax Reitz             bs->full_open_options = NULL;
397591af7014SMax Reitz         }
397691af7014SMax Reitz 
39774cdd01d3SKevin Wolf         opts = qdict_new();
39784cdd01d3SKevin Wolf         append_open_options(opts, bs);
39794cdd01d3SKevin Wolf         drv->bdrv_refresh_filename(bs, opts);
39804cdd01d3SKevin Wolf         QDECREF(opts);
398191af7014SMax Reitz     } else if (bs->file) {
398291af7014SMax Reitz         /* Try to reconstruct valid information from the underlying file */
398391af7014SMax Reitz         bool has_open_options;
398491af7014SMax Reitz 
398591af7014SMax Reitz         bs->exact_filename[0] = '\0';
398691af7014SMax Reitz         if (bs->full_open_options) {
398791af7014SMax Reitz             QDECREF(bs->full_open_options);
398891af7014SMax Reitz             bs->full_open_options = NULL;
398991af7014SMax Reitz         }
399091af7014SMax Reitz 
399191af7014SMax Reitz         opts = qdict_new();
399291af7014SMax Reitz         has_open_options = append_open_options(opts, bs);
399391af7014SMax Reitz 
399491af7014SMax Reitz         /* If no specific options have been given for this BDS, the filename of
399591af7014SMax Reitz          * the underlying file should suffice for this one as well */
39969a4f4c31SKevin Wolf         if (bs->file->bs->exact_filename[0] && !has_open_options) {
39979a4f4c31SKevin Wolf             strcpy(bs->exact_filename, bs->file->bs->exact_filename);
399891af7014SMax Reitz         }
399991af7014SMax Reitz         /* Reconstructing the full options QDict is simple for most format block
400091af7014SMax Reitz          * drivers, as long as the full options are known for the underlying
400191af7014SMax Reitz          * file BDS. The full options QDict of that file BDS should somehow
400291af7014SMax Reitz          * contain a representation of the filename, therefore the following
400391af7014SMax Reitz          * suffices without querying the (exact_)filename of this BDS. */
40049a4f4c31SKevin Wolf         if (bs->file->bs->full_open_options) {
400591af7014SMax Reitz             qdict_put_obj(opts, "driver",
400691af7014SMax Reitz                           QOBJECT(qstring_from_str(drv->format_name)));
40079a4f4c31SKevin Wolf             QINCREF(bs->file->bs->full_open_options);
40089a4f4c31SKevin Wolf             qdict_put_obj(opts, "file",
40099a4f4c31SKevin Wolf                           QOBJECT(bs->file->bs->full_open_options));
401091af7014SMax Reitz 
401191af7014SMax Reitz             bs->full_open_options = opts;
401291af7014SMax Reitz         } else {
401391af7014SMax Reitz             QDECREF(opts);
401491af7014SMax Reitz         }
401591af7014SMax Reitz     } else if (!bs->full_open_options && qdict_size(bs->options)) {
401691af7014SMax Reitz         /* There is no underlying file BDS (at least referenced by BDS.file),
401791af7014SMax Reitz          * so the full options QDict should be equal to the options given
401891af7014SMax Reitz          * specifically for this block device when it was opened (plus the
401991af7014SMax Reitz          * driver specification).
402091af7014SMax Reitz          * Because those options don't change, there is no need to update
402191af7014SMax Reitz          * full_open_options when it's already set. */
402291af7014SMax Reitz 
402391af7014SMax Reitz         opts = qdict_new();
402491af7014SMax Reitz         append_open_options(opts, bs);
402591af7014SMax Reitz         qdict_put_obj(opts, "driver",
402691af7014SMax Reitz                       QOBJECT(qstring_from_str(drv->format_name)));
402791af7014SMax Reitz 
402891af7014SMax Reitz         if (bs->exact_filename[0]) {
402991af7014SMax Reitz             /* This may not work for all block protocol drivers (some may
403091af7014SMax Reitz              * require this filename to be parsed), but we have to find some
403191af7014SMax Reitz              * default solution here, so just include it. If some block driver
403291af7014SMax Reitz              * does not support pure options without any filename at all or
403391af7014SMax Reitz              * needs some special format of the options QDict, it needs to
403491af7014SMax Reitz              * implement the driver-specific bdrv_refresh_filename() function.
403591af7014SMax Reitz              */
403691af7014SMax Reitz             qdict_put_obj(opts, "filename",
403791af7014SMax Reitz                           QOBJECT(qstring_from_str(bs->exact_filename)));
403891af7014SMax Reitz         }
403991af7014SMax Reitz 
404091af7014SMax Reitz         bs->full_open_options = opts;
404191af7014SMax Reitz     }
404291af7014SMax Reitz 
404391af7014SMax Reitz     if (bs->exact_filename[0]) {
404491af7014SMax Reitz         pstrcpy(bs->filename, sizeof(bs->filename), bs->exact_filename);
404591af7014SMax Reitz     } else if (bs->full_open_options) {
404691af7014SMax Reitz         QString *json = qobject_to_json(QOBJECT(bs->full_open_options));
404791af7014SMax Reitz         snprintf(bs->filename, sizeof(bs->filename), "json:%s",
404891af7014SMax Reitz                  qstring_get_str(json));
404991af7014SMax Reitz         QDECREF(json);
405091af7014SMax Reitz     }
405191af7014SMax Reitz }
4052