xref: /openbmc/qemu/block.c (revision b4b059f628173dd1d722ee8a9c592a80aec1fc2f)
1fc01f7e7Sbellard /*
2fc01f7e7Sbellard  * QEMU System Emulator block driver
3fc01f7e7Sbellard  *
4fc01f7e7Sbellard  * Copyright (c) 2003 Fabrice Bellard
5fc01f7e7Sbellard  *
6fc01f7e7Sbellard  * Permission is hereby granted, free of charge, to any person obtaining a copy
7fc01f7e7Sbellard  * of this software and associated documentation files (the "Software"), to deal
8fc01f7e7Sbellard  * in the Software without restriction, including without limitation the rights
9fc01f7e7Sbellard  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10fc01f7e7Sbellard  * copies of the Software, and to permit persons to whom the Software is
11fc01f7e7Sbellard  * furnished to do so, subject to the following conditions:
12fc01f7e7Sbellard  *
13fc01f7e7Sbellard  * The above copyright notice and this permission notice shall be included in
14fc01f7e7Sbellard  * all copies or substantial portions of the Software.
15fc01f7e7Sbellard  *
16fc01f7e7Sbellard  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17fc01f7e7Sbellard  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18fc01f7e7Sbellard  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19fc01f7e7Sbellard  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20fc01f7e7Sbellard  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21fc01f7e7Sbellard  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22fc01f7e7Sbellard  * THE SOFTWARE.
23fc01f7e7Sbellard  */
243990d09aSblueswir1 #include "config-host.h"
25faf07963Spbrook #include "qemu-common.h"
266d519a5fSStefan Hajnoczi #include "trace.h"
27737e150eSPaolo Bonzini #include "block/block_int.h"
28737e150eSPaolo Bonzini #include "block/blockjob.h"
29d49b6836SMarkus Armbruster #include "qemu/error-report.h"
301de7afc9SPaolo Bonzini #include "qemu/module.h"
31cc7a8ea7SMarkus Armbruster #include "qapi/qmp/qerror.h"
327b1b5d19SPaolo Bonzini #include "qapi/qmp/qjson.h"
33bfb197e0SMarkus Armbruster #include "sysemu/block-backend.h"
349c17d615SPaolo Bonzini #include "sysemu/sysemu.h"
351de7afc9SPaolo Bonzini #include "qemu/notify.h"
36737e150eSPaolo Bonzini #include "block/coroutine.h"
37c13163fbSBenoît Canet #include "block/qapi.h"
38b2023818SLuiz Capitulino #include "qmp-commands.h"
391de7afc9SPaolo Bonzini #include "qemu/timer.h"
40a5ee7bd4SWenchao Xia #include "qapi-event.h"
41db628338SAlberto Garcia #include "block/throttle-groups.h"
42fc01f7e7Sbellard 
4371e72a19SJuan Quintela #ifdef CONFIG_BSD
447674e7bfSbellard #include <sys/types.h>
457674e7bfSbellard #include <sys/stat.h>
467674e7bfSbellard #include <sys/ioctl.h>
4772cf2d4fSBlue Swirl #include <sys/queue.h>
48c5e97233Sblueswir1 #ifndef __DragonFly__
497674e7bfSbellard #include <sys/disk.h>
507674e7bfSbellard #endif
51c5e97233Sblueswir1 #endif
527674e7bfSbellard 
5349dc768dSaliguori #ifdef _WIN32
5449dc768dSaliguori #include <windows.h>
5549dc768dSaliguori #endif
5649dc768dSaliguori 
579bd2b08fSJohn Snow /**
589bd2b08fSJohn Snow  * A BdrvDirtyBitmap can be in three possible states:
599bd2b08fSJohn Snow  * (1) successor is NULL and disabled is false: full r/w mode
609bd2b08fSJohn Snow  * (2) successor is NULL and disabled is true: read only mode ("disabled")
619bd2b08fSJohn Snow  * (3) successor is set: frozen mode.
629bd2b08fSJohn Snow  *     A frozen bitmap cannot be renamed, deleted, anonymized, cleared, set,
639bd2b08fSJohn Snow  *     or enabled. A frozen bitmap can only abdicate() or reclaim().
649bd2b08fSJohn Snow  */
65e4654d2dSFam Zheng struct BdrvDirtyBitmap {
66aa0c7ca5SJohn Snow     HBitmap *bitmap;            /* Dirty sector bitmap implementation */
67aa0c7ca5SJohn Snow     BdrvDirtyBitmap *successor; /* Anonymous child; implies frozen status */
68aa0c7ca5SJohn Snow     char *name;                 /* Optional non-empty unique ID */
69aa0c7ca5SJohn Snow     int64_t size;               /* Size of the bitmap (Number of sectors) */
70aa0c7ca5SJohn Snow     bool disabled;              /* Bitmap is read-only */
71e4654d2dSFam Zheng     QLIST_ENTRY(BdrvDirtyBitmap) list;
72e4654d2dSFam Zheng };
73e4654d2dSFam Zheng 
741c9805a3SStefan Hajnoczi #define NOT_DONE 0x7fffffff /* used while emulated sync operation in progress */
751c9805a3SStefan Hajnoczi 
761b7bdbc1SStefan Hajnoczi static QTAILQ_HEAD(, BlockDriverState) bdrv_states =
771b7bdbc1SStefan Hajnoczi     QTAILQ_HEAD_INITIALIZER(bdrv_states);
787ee930d0Sblueswir1 
79dc364f4cSBenoît Canet static QTAILQ_HEAD(, BlockDriverState) graph_bdrv_states =
80dc364f4cSBenoît Canet     QTAILQ_HEAD_INITIALIZER(graph_bdrv_states);
81dc364f4cSBenoît Canet 
828a22f02aSStefan Hajnoczi static QLIST_HEAD(, BlockDriver) bdrv_drivers =
838a22f02aSStefan Hajnoczi     QLIST_HEAD_INITIALIZER(bdrv_drivers);
84ea2384d3Sbellard 
85f3930ed0SKevin Wolf static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
86f3930ed0SKevin Wolf                              const char *reference, QDict *options, int flags,
87f3930ed0SKevin Wolf                              BlockDriverState *parent,
88f3930ed0SKevin Wolf                              const BdrvChildRole *child_role,
89f3930ed0SKevin Wolf                              BlockDriver *drv, Error **errp);
90f3930ed0SKevin Wolf 
91ce1ffea8SJohn Snow static void bdrv_dirty_bitmap_truncate(BlockDriverState *bs);
92eb852011SMarkus Armbruster /* If non-zero, use only whitelisted block drivers */
93eb852011SMarkus Armbruster static int use_bdrv_whitelist;
94eb852011SMarkus Armbruster 
959e0b22f4SStefan Hajnoczi #ifdef _WIN32
/*
 * Return 1 if @filename starts with an ASCII drive letter followed by ':'
 * (for example "c:" or "D:\dir"), otherwise 0.
 */
static int is_windows_drive_prefix(const char *filename)
{
    const char letter = filename[0];
    const int is_lower = (letter >= 'a' && letter <= 'z');
    const int is_upper = (letter >= 'A' && letter <= 'Z');

    if (!is_lower && !is_upper) {
        /* Do not look at filename[1]: the string may be empty */
        return 0;
    }
    return filename[1] == ':';
}
1029e0b22f4SStefan Hajnoczi 
/*
 * Return 1 if @filename designates a Windows drive or device: either a bare
 * drive specification ("d:") or a name starting with "\\.\" or "//./".
 * Return 0 otherwise.
 */
int is_windows_drive(const char *filename)
{
    /* Exactly a drive letter and a colon, nothing after it */
    if (is_windows_drive_prefix(filename) && filename[2] == '\0') {
        return 1;
    }

    /* Device namespace prefix, with either kind of slash */
    if (strstart(filename, "\\\\.\\", NULL)) {
        return 1;
    }
    if (strstart(filename, "//./", NULL)) {
        return 1;
    }
    return 0;
}
1139e0b22f4SStefan Hajnoczi #endif
1149e0b22f4SStefan Hajnoczi 
115339064d5SKevin Wolf size_t bdrv_opt_mem_align(BlockDriverState *bs)
116339064d5SKevin Wolf {
117339064d5SKevin Wolf     if (!bs || !bs->drv) {
118459b4e66SDenis V. Lunev         /* page size or 4k (hdd sector size) should be on the safe side */
119459b4e66SDenis V. Lunev         return MAX(4096, getpagesize());
120339064d5SKevin Wolf     }
121339064d5SKevin Wolf 
122339064d5SKevin Wolf     return bs->bl.opt_mem_alignment;
123339064d5SKevin Wolf }
124339064d5SKevin Wolf 
1254196d2f0SDenis V. Lunev size_t bdrv_min_mem_align(BlockDriverState *bs)
1264196d2f0SDenis V. Lunev {
1274196d2f0SDenis V. Lunev     if (!bs || !bs->drv) {
128459b4e66SDenis V. Lunev         /* page size or 4k (hdd sector size) should be on the safe side */
129459b4e66SDenis V. Lunev         return MAX(4096, getpagesize());
1304196d2f0SDenis V. Lunev     }
1314196d2f0SDenis V. Lunev 
1324196d2f0SDenis V. Lunev     return bs->bl.min_mem_alignment;
1334196d2f0SDenis V. Lunev }
1344196d2f0SDenis V. Lunev 
/*
 * Check if the path starts with "<protocol>:".
 *
 * The path has a protocol when its first ':' appears before any directory
 * separator. On Windows, drive specifications are never protocols and '\'
 * also counts as a separator.
 *
 * Returns 1 if a protocol prefix is present, 0 otherwise.
 */
int path_has_protocol(const char *path)
{
#ifdef _WIN32
    static const char delimiters[] = ":/\\";

    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 0;
    }
#else
    static const char delimiters[] = ":/";
#endif

    /* Index of the first delimiter, or of the terminating NUL if none */
    return path[strcspn(path, delimiters)] == ':';
}
1529e0b22f4SStefan Hajnoczi 
/*
 * Return 1 if @path is absolute, 0 otherwise.
 *
 * A path starting with '/' is absolute. On Windows a leading '\' and any
 * drive specification (including names like "\\.\d:") are absolute too.
 */
int path_is_absolute(const char *path)
{
#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 1;
    }
    if (*path == '\\') {
        return 1;
    }
#endif
    return *path == '/';
}
16583f64091Sbellard 
/*
 * Build in @dest (capacity @dest_size bytes, always NUL-terminated when
 * @dest_size > 0) the location of @filename relative to @base_path.
 *
 * If @filename is absolute it is copied as is. Otherwise the directory part
 * of @base_path is kept and @filename is appended to it. The directory part
 * ends after the last path separator, or after the first ':' if that comes
 * later. URLs are supported.
 */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *after_colon, *after_sep, *dir_end;
    int prefix_len;

    if (dest_size <= 0) {
        return;
    }

    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    /* Position just past the first ':' (protocol or drive), if any */
    after_colon = strchr(base_path, ':');
    after_colon = after_colon ? after_colon + 1 : base_path;

    /* Position just past the last directory separator, if any */
    after_sep = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *backslash = strrchr(base_path, '\\');

        if (!after_sep || backslash > after_sep) {
            after_sep = backslash;
        }
    }
#endif
    after_sep = after_sep ? after_sep + 1 : base_path;

    /* Keep whichever prefix of base_path is longer */
    dir_end = after_sep > after_colon ? after_sep : after_colon;

    prefix_len = dir_end - base_path;
    if (prefix_len > dest_size - 1) {
        prefix_len = dest_size - 1;
    }
    memcpy(dest, base_path, prefix_len);
    dest[prefix_len] = '\0';
    pstrcat(dest, dest_size, filename);
}
20983f64091Sbellard 
2100a82855aSMax Reitz void bdrv_get_full_backing_filename_from_filename(const char *backed,
2110a82855aSMax Reitz                                                   const char *backing,
2129f07429eSMax Reitz                                                   char *dest, size_t sz,
2139f07429eSMax Reitz                                                   Error **errp)
2140a82855aSMax Reitz {
2159f07429eSMax Reitz     if (backing[0] == '\0' || path_has_protocol(backing) ||
2169f07429eSMax Reitz         path_is_absolute(backing))
2179f07429eSMax Reitz     {
2180a82855aSMax Reitz         pstrcpy(dest, sz, backing);
2199f07429eSMax Reitz     } else if (backed[0] == '\0' || strstart(backed, "json:", NULL)) {
2209f07429eSMax Reitz         error_setg(errp, "Cannot use relative backing file names for '%s'",
2219f07429eSMax Reitz                    backed);
2220a82855aSMax Reitz     } else {
2230a82855aSMax Reitz         path_combine(dest, sz, backed, backing);
2240a82855aSMax Reitz     }
2250a82855aSMax Reitz }
2260a82855aSMax Reitz 
2279f07429eSMax Reitz void bdrv_get_full_backing_filename(BlockDriverState *bs, char *dest, size_t sz,
2289f07429eSMax Reitz                                     Error **errp)
229dc5a1371SPaolo Bonzini {
2309f07429eSMax Reitz     char *backed = bs->exact_filename[0] ? bs->exact_filename : bs->filename;
2319f07429eSMax Reitz 
2329f07429eSMax Reitz     bdrv_get_full_backing_filename_from_filename(backed, bs->backing_file,
2339f07429eSMax Reitz                                                  dest, sz, errp);
234dc5a1371SPaolo Bonzini }
235dc5a1371SPaolo Bonzini 
2360eb7217eSStefan Hajnoczi void bdrv_register(BlockDriver *bdrv)
2370eb7217eSStefan Hajnoczi {
2380eb7217eSStefan Hajnoczi     bdrv_setup_io_funcs(bdrv);
239b2e12bc6SChristoph Hellwig 
2408a22f02aSStefan Hajnoczi     QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list);
241ea2384d3Sbellard }
242b338082bSbellard 
2437f06d47eSMarkus Armbruster BlockDriverState *bdrv_new_root(void)
244fc01f7e7Sbellard {
2457f06d47eSMarkus Armbruster     BlockDriverState *bs = bdrv_new();
246e4e9986bSMarkus Armbruster 
247e4e9986bSMarkus Armbruster     QTAILQ_INSERT_TAIL(&bdrv_states, bs, device_list);
248e4e9986bSMarkus Armbruster     return bs;
249e4e9986bSMarkus Armbruster }
250e4e9986bSMarkus Armbruster 
251e4e9986bSMarkus Armbruster BlockDriverState *bdrv_new(void)
252e4e9986bSMarkus Armbruster {
253e4e9986bSMarkus Armbruster     BlockDriverState *bs;
254e4e9986bSMarkus Armbruster     int i;
255e4e9986bSMarkus Armbruster 
2565839e53bSMarkus Armbruster     bs = g_new0(BlockDriverState, 1);
257e4654d2dSFam Zheng     QLIST_INIT(&bs->dirty_bitmaps);
258fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
259fbe40ff7SFam Zheng         QLIST_INIT(&bs->op_blockers[i]);
260fbe40ff7SFam Zheng     }
26128a7282aSLuiz Capitulino     bdrv_iostatus_disable(bs);
262d7d512f6SPaolo Bonzini     notifier_list_init(&bs->close_notifiers);
263d616b224SStefan Hajnoczi     notifier_with_return_list_init(&bs->before_write_notifiers);
264cc0681c4SBenoît Canet     qemu_co_queue_init(&bs->throttled_reqs[0]);
265cc0681c4SBenoît Canet     qemu_co_queue_init(&bs->throttled_reqs[1]);
2669fcb0251SFam Zheng     bs->refcnt = 1;
267dcd04228SStefan Hajnoczi     bs->aio_context = qemu_get_aio_context();
268d7d512f6SPaolo Bonzini 
269b338082bSbellard     return bs;
270b338082bSbellard }
271b338082bSbellard 
272d7d512f6SPaolo Bonzini void bdrv_add_close_notifier(BlockDriverState *bs, Notifier *notify)
273d7d512f6SPaolo Bonzini {
274d7d512f6SPaolo Bonzini     notifier_list_add(&bs->close_notifiers, notify);
275d7d512f6SPaolo Bonzini }
276d7d512f6SPaolo Bonzini 
277ea2384d3Sbellard BlockDriver *bdrv_find_format(const char *format_name)
278ea2384d3Sbellard {
279ea2384d3Sbellard     BlockDriver *drv1;
2808a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
2818a22f02aSStefan Hajnoczi         if (!strcmp(drv1->format_name, format_name)) {
282ea2384d3Sbellard             return drv1;
283ea2384d3Sbellard         }
2848a22f02aSStefan Hajnoczi     }
285ea2384d3Sbellard     return NULL;
286ea2384d3Sbellard }
287ea2384d3Sbellard 
288b64ec4e4SFam Zheng static int bdrv_is_whitelisted(BlockDriver *drv, bool read_only)
289eb852011SMarkus Armbruster {
290b64ec4e4SFam Zheng     static const char *whitelist_rw[] = {
291b64ec4e4SFam Zheng         CONFIG_BDRV_RW_WHITELIST
292b64ec4e4SFam Zheng     };
293b64ec4e4SFam Zheng     static const char *whitelist_ro[] = {
294b64ec4e4SFam Zheng         CONFIG_BDRV_RO_WHITELIST
295eb852011SMarkus Armbruster     };
296eb852011SMarkus Armbruster     const char **p;
297eb852011SMarkus Armbruster 
298b64ec4e4SFam Zheng     if (!whitelist_rw[0] && !whitelist_ro[0]) {
299eb852011SMarkus Armbruster         return 1;               /* no whitelist, anything goes */
300b64ec4e4SFam Zheng     }
301eb852011SMarkus Armbruster 
302b64ec4e4SFam Zheng     for (p = whitelist_rw; *p; p++) {
303eb852011SMarkus Armbruster         if (!strcmp(drv->format_name, *p)) {
304eb852011SMarkus Armbruster             return 1;
305eb852011SMarkus Armbruster         }
306eb852011SMarkus Armbruster     }
307b64ec4e4SFam Zheng     if (read_only) {
308b64ec4e4SFam Zheng         for (p = whitelist_ro; *p; p++) {
309b64ec4e4SFam Zheng             if (!strcmp(drv->format_name, *p)) {
310b64ec4e4SFam Zheng                 return 1;
311b64ec4e4SFam Zheng             }
312b64ec4e4SFam Zheng         }
313b64ec4e4SFam Zheng     }
314eb852011SMarkus Armbruster     return 0;
315eb852011SMarkus Armbruster }
316eb852011SMarkus Armbruster 
317b64ec4e4SFam Zheng BlockDriver *bdrv_find_whitelisted_format(const char *format_name,
318b64ec4e4SFam Zheng                                           bool read_only)
319eb852011SMarkus Armbruster {
320eb852011SMarkus Armbruster     BlockDriver *drv = bdrv_find_format(format_name);
321b64ec4e4SFam Zheng     return drv && bdrv_is_whitelisted(drv, read_only) ? drv : NULL;
322eb852011SMarkus Armbruster }
323eb852011SMarkus Armbruster 
3245b7e1542SZhi Yong Wu typedef struct CreateCo {
3255b7e1542SZhi Yong Wu     BlockDriver *drv;
3265b7e1542SZhi Yong Wu     char *filename;
32783d0521aSChunyan Liu     QemuOpts *opts;
3285b7e1542SZhi Yong Wu     int ret;
329cc84d90fSMax Reitz     Error *err;
3305b7e1542SZhi Yong Wu } CreateCo;
3315b7e1542SZhi Yong Wu 
3325b7e1542SZhi Yong Wu static void coroutine_fn bdrv_create_co_entry(void *opaque)
3335b7e1542SZhi Yong Wu {
334cc84d90fSMax Reitz     Error *local_err = NULL;
335cc84d90fSMax Reitz     int ret;
336cc84d90fSMax Reitz 
3375b7e1542SZhi Yong Wu     CreateCo *cco = opaque;
3385b7e1542SZhi Yong Wu     assert(cco->drv);
3395b7e1542SZhi Yong Wu 
340c282e1fdSChunyan Liu     ret = cco->drv->bdrv_create(cco->filename, cco->opts, &local_err);
34184d18f06SMarkus Armbruster     if (local_err) {
342cc84d90fSMax Reitz         error_propagate(&cco->err, local_err);
343cc84d90fSMax Reitz     }
344cc84d90fSMax Reitz     cco->ret = ret;
3455b7e1542SZhi Yong Wu }
3465b7e1542SZhi Yong Wu 
3470e7e1989SKevin Wolf int bdrv_create(BlockDriver *drv, const char* filename,
34883d0521aSChunyan Liu                 QemuOpts *opts, Error **errp)
349ea2384d3Sbellard {
3505b7e1542SZhi Yong Wu     int ret;
3510e7e1989SKevin Wolf 
3525b7e1542SZhi Yong Wu     Coroutine *co;
3535b7e1542SZhi Yong Wu     CreateCo cco = {
3545b7e1542SZhi Yong Wu         .drv = drv,
3555b7e1542SZhi Yong Wu         .filename = g_strdup(filename),
35683d0521aSChunyan Liu         .opts = opts,
3575b7e1542SZhi Yong Wu         .ret = NOT_DONE,
358cc84d90fSMax Reitz         .err = NULL,
3595b7e1542SZhi Yong Wu     };
3605b7e1542SZhi Yong Wu 
361c282e1fdSChunyan Liu     if (!drv->bdrv_create) {
362cc84d90fSMax Reitz         error_setg(errp, "Driver '%s' does not support image creation", drv->format_name);
36380168bffSLuiz Capitulino         ret = -ENOTSUP;
36480168bffSLuiz Capitulino         goto out;
3655b7e1542SZhi Yong Wu     }
3665b7e1542SZhi Yong Wu 
3675b7e1542SZhi Yong Wu     if (qemu_in_coroutine()) {
3685b7e1542SZhi Yong Wu         /* Fast-path if already in coroutine context */
3695b7e1542SZhi Yong Wu         bdrv_create_co_entry(&cco);
3705b7e1542SZhi Yong Wu     } else {
3715b7e1542SZhi Yong Wu         co = qemu_coroutine_create(bdrv_create_co_entry);
3725b7e1542SZhi Yong Wu         qemu_coroutine_enter(co, &cco);
3735b7e1542SZhi Yong Wu         while (cco.ret == NOT_DONE) {
374b47ec2c4SPaolo Bonzini             aio_poll(qemu_get_aio_context(), true);
3755b7e1542SZhi Yong Wu         }
3765b7e1542SZhi Yong Wu     }
3775b7e1542SZhi Yong Wu 
3785b7e1542SZhi Yong Wu     ret = cco.ret;
379cc84d90fSMax Reitz     if (ret < 0) {
38084d18f06SMarkus Armbruster         if (cco.err) {
381cc84d90fSMax Reitz             error_propagate(errp, cco.err);
382cc84d90fSMax Reitz         } else {
383cc84d90fSMax Reitz             error_setg_errno(errp, -ret, "Could not create image");
384cc84d90fSMax Reitz         }
385cc84d90fSMax Reitz     }
3865b7e1542SZhi Yong Wu 
38780168bffSLuiz Capitulino out:
38880168bffSLuiz Capitulino     g_free(cco.filename);
3895b7e1542SZhi Yong Wu     return ret;
390ea2384d3Sbellard }
391ea2384d3Sbellard 
392c282e1fdSChunyan Liu int bdrv_create_file(const char *filename, QemuOpts *opts, Error **errp)
39384a12e66SChristoph Hellwig {
39484a12e66SChristoph Hellwig     BlockDriver *drv;
395cc84d90fSMax Reitz     Error *local_err = NULL;
396cc84d90fSMax Reitz     int ret;
39784a12e66SChristoph Hellwig 
398b65a5e12SMax Reitz     drv = bdrv_find_protocol(filename, true, errp);
39984a12e66SChristoph Hellwig     if (drv == NULL) {
40016905d71SStefan Hajnoczi         return -ENOENT;
40184a12e66SChristoph Hellwig     }
40284a12e66SChristoph Hellwig 
403c282e1fdSChunyan Liu     ret = bdrv_create(drv, filename, opts, &local_err);
40484d18f06SMarkus Armbruster     if (local_err) {
405cc84d90fSMax Reitz         error_propagate(errp, local_err);
406cc84d90fSMax Reitz     }
407cc84d90fSMax Reitz     return ret;
40884a12e66SChristoph Hellwig }
40984a12e66SChristoph Hellwig 
410892b7de8SEkaterina Tumanova /**
411892b7de8SEkaterina Tumanova  * Try to get @bs's logical and physical block size.
412892b7de8SEkaterina Tumanova  * On success, store them in @bsz struct and return 0.
413892b7de8SEkaterina Tumanova  * On failure return -errno.
414892b7de8SEkaterina Tumanova  * @bs must not be empty.
415892b7de8SEkaterina Tumanova  */
416892b7de8SEkaterina Tumanova int bdrv_probe_blocksizes(BlockDriverState *bs, BlockSizes *bsz)
417892b7de8SEkaterina Tumanova {
418892b7de8SEkaterina Tumanova     BlockDriver *drv = bs->drv;
419892b7de8SEkaterina Tumanova 
420892b7de8SEkaterina Tumanova     if (drv && drv->bdrv_probe_blocksizes) {
421892b7de8SEkaterina Tumanova         return drv->bdrv_probe_blocksizes(bs, bsz);
422892b7de8SEkaterina Tumanova     }
423892b7de8SEkaterina Tumanova 
424892b7de8SEkaterina Tumanova     return -ENOTSUP;
425892b7de8SEkaterina Tumanova }
426892b7de8SEkaterina Tumanova 
427892b7de8SEkaterina Tumanova /**
428892b7de8SEkaterina Tumanova  * Try to get @bs's geometry (cyls, heads, sectors).
429892b7de8SEkaterina Tumanova  * On success, store them in @geo struct and return 0.
430892b7de8SEkaterina Tumanova  * On failure return -errno.
431892b7de8SEkaterina Tumanova  * @bs must not be empty.
432892b7de8SEkaterina Tumanova  */
433892b7de8SEkaterina Tumanova int bdrv_probe_geometry(BlockDriverState *bs, HDGeometry *geo)
434892b7de8SEkaterina Tumanova {
435892b7de8SEkaterina Tumanova     BlockDriver *drv = bs->drv;
436892b7de8SEkaterina Tumanova 
437892b7de8SEkaterina Tumanova     if (drv && drv->bdrv_probe_geometry) {
438892b7de8SEkaterina Tumanova         return drv->bdrv_probe_geometry(bs, geo);
439892b7de8SEkaterina Tumanova     }
440892b7de8SEkaterina Tumanova 
441892b7de8SEkaterina Tumanova     return -ENOTSUP;
442892b7de8SEkaterina Tumanova }
443892b7de8SEkaterina Tumanova 
/*
 * Create a uniquely-named empty temporary file.
 *
 * @filename receives the name of the new file; @size is the capacity of
 * that buffer in bytes.
 *
 * On POSIX hosts the file is created in $TMPDIR, or in /var/tmp when TMPDIR
 * is unset. -EOVERFLOW is returned when the name does not fit in @size
 * bytes (including when @size is not positive).
 *
 * Return 0 upon success, otherwise a negative errno value (on Windows, the
 * negated GetLastError() code).
 */
int get_tmp_filename(char *filename, int size)
{
#ifdef _WIN32
    char temp_dir[MAX_PATH];
    /* GetTempFileName requires that its output buffer (4th param)
       have length MAX_PATH or greater.  */
    assert(size >= MAX_PATH);
    return (GetTempPath(MAX_PATH, temp_dir)
            && GetTempFileName(temp_dir, "qem", 0, filename)
            ? 0 : -GetLastError());
#else
    const char *tmpdir;
    int fd;
    int len;

    /* A negative size would turn into a huge size_t inside snprintf() */
    if (size <= 0) {
        return -EOVERFLOW;
    }

    tmpdir = getenv("TMPDIR");
    if (!tmpdir) {
        tmpdir = "/var/tmp";
    }

    len = snprintf(filename, size, "%s/vl.XXXXXX", tmpdir);
    if (len < 0 || len >= size) {
        /* Formatting failed or the template was truncated */
        return -EOVERFLOW;
    }

    fd = mkstemp(filename);
    if (fd < 0) {
        return -errno;
    }

    if (close(fd) != 0) {
        /* unlink() may overwrite errno; report the close() failure */
        int saved_errno = errno;

        unlink(filename);
        return -saved_errno;
    }

    return 0;
#endif
}
479ea2384d3Sbellard 
480f3a5d3f8SChristoph Hellwig /*
481f3a5d3f8SChristoph Hellwig  * Detect host devices. By convention, /dev/cdrom[N] is always
482f3a5d3f8SChristoph Hellwig  * recognized as a host CDROM.
483f3a5d3f8SChristoph Hellwig  */
484f3a5d3f8SChristoph Hellwig static BlockDriver *find_hdev_driver(const char *filename)
485f3a5d3f8SChristoph Hellwig {
486508c7cb3SChristoph Hellwig     int score_max = 0, score;
487508c7cb3SChristoph Hellwig     BlockDriver *drv = NULL, *d;
488f3a5d3f8SChristoph Hellwig 
4898a22f02aSStefan Hajnoczi     QLIST_FOREACH(d, &bdrv_drivers, list) {
490508c7cb3SChristoph Hellwig         if (d->bdrv_probe_device) {
491508c7cb3SChristoph Hellwig             score = d->bdrv_probe_device(filename);
492508c7cb3SChristoph Hellwig             if (score > score_max) {
493508c7cb3SChristoph Hellwig                 score_max = score;
494508c7cb3SChristoph Hellwig                 drv = d;
495f3a5d3f8SChristoph Hellwig             }
496508c7cb3SChristoph Hellwig         }
497f3a5d3f8SChristoph Hellwig     }
498f3a5d3f8SChristoph Hellwig 
499508c7cb3SChristoph Hellwig     return drv;
500f3a5d3f8SChristoph Hellwig }
501f3a5d3f8SChristoph Hellwig 
50298289620SKevin Wolf BlockDriver *bdrv_find_protocol(const char *filename,
503b65a5e12SMax Reitz                                 bool allow_protocol_prefix,
504b65a5e12SMax Reitz                                 Error **errp)
50584a12e66SChristoph Hellwig {
50684a12e66SChristoph Hellwig     BlockDriver *drv1;
50784a12e66SChristoph Hellwig     char protocol[128];
50884a12e66SChristoph Hellwig     int len;
50984a12e66SChristoph Hellwig     const char *p;
51084a12e66SChristoph Hellwig 
51166f82ceeSKevin Wolf     /* TODO Drivers without bdrv_file_open must be specified explicitly */
51266f82ceeSKevin Wolf 
51339508e7aSChristoph Hellwig     /*
51439508e7aSChristoph Hellwig      * XXX(hch): we really should not let host device detection
51539508e7aSChristoph Hellwig      * override an explicit protocol specification, but moving this
51639508e7aSChristoph Hellwig      * later breaks access to device names with colons in them.
51739508e7aSChristoph Hellwig      * Thanks to the brain-dead persistent naming schemes on udev-
51839508e7aSChristoph Hellwig      * based Linux systems those actually are quite common.
51939508e7aSChristoph Hellwig      */
52084a12e66SChristoph Hellwig     drv1 = find_hdev_driver(filename);
52139508e7aSChristoph Hellwig     if (drv1) {
52284a12e66SChristoph Hellwig         return drv1;
52384a12e66SChristoph Hellwig     }
52439508e7aSChristoph Hellwig 
52598289620SKevin Wolf     if (!path_has_protocol(filename) || !allow_protocol_prefix) {
526ef810437SMax Reitz         return &bdrv_file;
52739508e7aSChristoph Hellwig     }
52898289620SKevin Wolf 
5299e0b22f4SStefan Hajnoczi     p = strchr(filename, ':');
5309e0b22f4SStefan Hajnoczi     assert(p != NULL);
53184a12e66SChristoph Hellwig     len = p - filename;
53284a12e66SChristoph Hellwig     if (len > sizeof(protocol) - 1)
53384a12e66SChristoph Hellwig         len = sizeof(protocol) - 1;
53484a12e66SChristoph Hellwig     memcpy(protocol, filename, len);
53584a12e66SChristoph Hellwig     protocol[len] = '\0';
53684a12e66SChristoph Hellwig     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
53784a12e66SChristoph Hellwig         if (drv1->protocol_name &&
53884a12e66SChristoph Hellwig             !strcmp(drv1->protocol_name, protocol)) {
53984a12e66SChristoph Hellwig             return drv1;
54084a12e66SChristoph Hellwig         }
54184a12e66SChristoph Hellwig     }
542b65a5e12SMax Reitz 
543b65a5e12SMax Reitz     error_setg(errp, "Unknown protocol '%s'", protocol);
54484a12e66SChristoph Hellwig     return NULL;
54584a12e66SChristoph Hellwig }
54684a12e66SChristoph Hellwig 
547c6684249SMarkus Armbruster /*
548c6684249SMarkus Armbruster  * Guess image format by probing its contents.
549c6684249SMarkus Armbruster  * This is not a good idea when your image is raw (CVE-2008-2004), but
550c6684249SMarkus Armbruster  * we do it anyway for backward compatibility.
551c6684249SMarkus Armbruster  *
552c6684249SMarkus Armbruster  * @buf         contains the image's first @buf_size bytes.
5537cddd372SKevin Wolf  * @buf_size    is the buffer size in bytes (generally BLOCK_PROBE_BUF_SIZE,
5547cddd372SKevin Wolf  *              but can be smaller if the image file is smaller)
555c6684249SMarkus Armbruster  * @filename    is its filename.
556c6684249SMarkus Armbruster  *
557c6684249SMarkus Armbruster  * For all block drivers, call the bdrv_probe() method to get its
558c6684249SMarkus Armbruster  * probing score.
559c6684249SMarkus Armbruster  * Return the first block driver with the highest probing score.
560c6684249SMarkus Armbruster  */
56138f3ef57SKevin Wolf BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
562c6684249SMarkus Armbruster                             const char *filename)
563c6684249SMarkus Armbruster {
564c6684249SMarkus Armbruster     int score_max = 0, score;
565c6684249SMarkus Armbruster     BlockDriver *drv = NULL, *d;
566c6684249SMarkus Armbruster 
567c6684249SMarkus Armbruster     QLIST_FOREACH(d, &bdrv_drivers, list) {
568c6684249SMarkus Armbruster         if (d->bdrv_probe) {
569c6684249SMarkus Armbruster             score = d->bdrv_probe(buf, buf_size, filename);
570c6684249SMarkus Armbruster             if (score > score_max) {
571c6684249SMarkus Armbruster                 score_max = score;
572c6684249SMarkus Armbruster                 drv = d;
573c6684249SMarkus Armbruster             }
574c6684249SMarkus Armbruster         }
575c6684249SMarkus Armbruster     }
576c6684249SMarkus Armbruster 
577c6684249SMarkus Armbruster     return drv;
578c6684249SMarkus Armbruster }
579c6684249SMarkus Armbruster 
580f500a6d3SKevin Wolf static int find_image_format(BlockDriverState *bs, const char *filename,
58134b5d2c6SMax Reitz                              BlockDriver **pdrv, Error **errp)
582ea2384d3Sbellard {
583c6684249SMarkus Armbruster     BlockDriver *drv;
5847cddd372SKevin Wolf     uint8_t buf[BLOCK_PROBE_BUF_SIZE];
585f500a6d3SKevin Wolf     int ret = 0;
586f8ea0b00SNicholas Bellinger 
58708a00559SKevin Wolf     /* Return the raw BlockDriver * to scsi-generic devices or empty drives */
588b192af8aSDimitris Aragiorgis     if (bdrv_is_sg(bs) || !bdrv_is_inserted(bs) || bdrv_getlength(bs) == 0) {
589ef810437SMax Reitz         *pdrv = &bdrv_raw;
590c98ac35dSStefan Weil         return ret;
5911a396859SNicholas A. Bellinger     }
592f8ea0b00SNicholas Bellinger 
59383f64091Sbellard     ret = bdrv_pread(bs, 0, buf, sizeof(buf));
594ea2384d3Sbellard     if (ret < 0) {
59534b5d2c6SMax Reitz         error_setg_errno(errp, -ret, "Could not read image for determining its "
59634b5d2c6SMax Reitz                          "format");
597c98ac35dSStefan Weil         *pdrv = NULL;
598c98ac35dSStefan Weil         return ret;
599ea2384d3Sbellard     }
600ea2384d3Sbellard 
601c6684249SMarkus Armbruster     drv = bdrv_probe_all(buf, ret, filename);
602c98ac35dSStefan Weil     if (!drv) {
60334b5d2c6SMax Reitz         error_setg(errp, "Could not determine image format: No compatible "
60434b5d2c6SMax Reitz                    "driver found");
605c98ac35dSStefan Weil         ret = -ENOENT;
606c98ac35dSStefan Weil     }
607c98ac35dSStefan Weil     *pdrv = drv;
608c98ac35dSStefan Weil     return ret;
609ea2384d3Sbellard }
610ea2384d3Sbellard 
61151762288SStefan Hajnoczi /**
61251762288SStefan Hajnoczi  * Set the current 'total_sectors' value
61365a9bb25SMarkus Armbruster  * Return 0 on success, -errno on error.
61451762288SStefan Hajnoczi  */
61551762288SStefan Hajnoczi static int refresh_total_sectors(BlockDriverState *bs, int64_t hint)
61651762288SStefan Hajnoczi {
61751762288SStefan Hajnoczi     BlockDriver *drv = bs->drv;
61851762288SStefan Hajnoczi 
619396759adSNicholas Bellinger     /* Do not attempt drv->bdrv_getlength() on scsi-generic devices */
620b192af8aSDimitris Aragiorgis     if (bdrv_is_sg(bs))
621396759adSNicholas Bellinger         return 0;
622396759adSNicholas Bellinger 
62351762288SStefan Hajnoczi     /* query actual device if possible, otherwise just trust the hint */
62451762288SStefan Hajnoczi     if (drv->bdrv_getlength) {
62551762288SStefan Hajnoczi         int64_t length = drv->bdrv_getlength(bs);
62651762288SStefan Hajnoczi         if (length < 0) {
62751762288SStefan Hajnoczi             return length;
62851762288SStefan Hajnoczi         }
6297e382003SFam Zheng         hint = DIV_ROUND_UP(length, BDRV_SECTOR_SIZE);
63051762288SStefan Hajnoczi     }
63151762288SStefan Hajnoczi 
63251762288SStefan Hajnoczi     bs->total_sectors = hint;
63351762288SStefan Hajnoczi     return 0;
63451762288SStefan Hajnoczi }
63551762288SStefan Hajnoczi 
636c3993cdcSStefan Hajnoczi /**
6379e8f1835SPaolo Bonzini  * Set open flags for a given discard mode
6389e8f1835SPaolo Bonzini  *
6399e8f1835SPaolo Bonzini  * Return 0 on success, -1 if the discard mode was invalid.
6409e8f1835SPaolo Bonzini  */
6419e8f1835SPaolo Bonzini int bdrv_parse_discard_flags(const char *mode, int *flags)
6429e8f1835SPaolo Bonzini {
6439e8f1835SPaolo Bonzini     *flags &= ~BDRV_O_UNMAP;
6449e8f1835SPaolo Bonzini 
6459e8f1835SPaolo Bonzini     if (!strcmp(mode, "off") || !strcmp(mode, "ignore")) {
6469e8f1835SPaolo Bonzini         /* do nothing */
6479e8f1835SPaolo Bonzini     } else if (!strcmp(mode, "on") || !strcmp(mode, "unmap")) {
6489e8f1835SPaolo Bonzini         *flags |= BDRV_O_UNMAP;
6499e8f1835SPaolo Bonzini     } else {
6509e8f1835SPaolo Bonzini         return -1;
6519e8f1835SPaolo Bonzini     }
6529e8f1835SPaolo Bonzini 
6539e8f1835SPaolo Bonzini     return 0;
6549e8f1835SPaolo Bonzini }
6559e8f1835SPaolo Bonzini 
6569e8f1835SPaolo Bonzini /**
657c3993cdcSStefan Hajnoczi  * Set open flags for a given cache mode
658c3993cdcSStefan Hajnoczi  *
659c3993cdcSStefan Hajnoczi  * Return 0 on success, -1 if the cache mode was invalid.
660c3993cdcSStefan Hajnoczi  */
661c3993cdcSStefan Hajnoczi int bdrv_parse_cache_flags(const char *mode, int *flags)
662c3993cdcSStefan Hajnoczi {
663c3993cdcSStefan Hajnoczi     *flags &= ~BDRV_O_CACHE_MASK;
664c3993cdcSStefan Hajnoczi 
665c3993cdcSStefan Hajnoczi     if (!strcmp(mode, "off") || !strcmp(mode, "none")) {
666c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_NOCACHE | BDRV_O_CACHE_WB;
66792196b2fSStefan Hajnoczi     } else if (!strcmp(mode, "directsync")) {
66892196b2fSStefan Hajnoczi         *flags |= BDRV_O_NOCACHE;
669c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "writeback")) {
670c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_CACHE_WB;
671c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "unsafe")) {
672c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_CACHE_WB;
673c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_NO_FLUSH;
674c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "writethrough")) {
675c3993cdcSStefan Hajnoczi         /* this is the default */
676c3993cdcSStefan Hajnoczi     } else {
677c3993cdcSStefan Hajnoczi         return -1;
678c3993cdcSStefan Hajnoczi     }
679c3993cdcSStefan Hajnoczi 
680c3993cdcSStefan Hajnoczi     return 0;
681c3993cdcSStefan Hajnoczi }
682c3993cdcSStefan Hajnoczi 
6830b50cc88SKevin Wolf /*
684b1e6fc08SKevin Wolf  * Returns the flags that a temporary snapshot should get, based on the
685b1e6fc08SKevin Wolf  * originally requested flags (the originally requested image will have flags
686b1e6fc08SKevin Wolf  * like a backing file)
687b1e6fc08SKevin Wolf  */
688b1e6fc08SKevin Wolf static int bdrv_temp_snapshot_flags(int flags)
689b1e6fc08SKevin Wolf {
690b1e6fc08SKevin Wolf     return (flags & ~BDRV_O_SNAPSHOT) | BDRV_O_TEMPORARY;
691b1e6fc08SKevin Wolf }
692b1e6fc08SKevin Wolf 
693b1e6fc08SKevin Wolf /*
694f3930ed0SKevin Wolf  * Returns the flags that bs->file should get if a protocol driver is expected,
695f3930ed0SKevin Wolf  * based on the given flags for the parent BDS
6960b50cc88SKevin Wolf  */
6970b50cc88SKevin Wolf static int bdrv_inherited_flags(int flags)
6980b50cc88SKevin Wolf {
6990b50cc88SKevin Wolf     /* Enable protocol handling, disable format probing for bs->file */
7000b50cc88SKevin Wolf     flags |= BDRV_O_PROTOCOL;
7010b50cc88SKevin Wolf 
7020b50cc88SKevin Wolf     /* Our block drivers take care to send flushes and respect unmap policy,
7030b50cc88SKevin Wolf      * so we can enable both unconditionally on lower layers. */
7040b50cc88SKevin Wolf     flags |= BDRV_O_CACHE_WB | BDRV_O_UNMAP;
7050b50cc88SKevin Wolf 
7060b50cc88SKevin Wolf     /* Clear flags that only apply to the top layer */
7075669b44dSKevin Wolf     flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_COPY_ON_READ);
7080b50cc88SKevin Wolf 
7090b50cc88SKevin Wolf     return flags;
7100b50cc88SKevin Wolf }
7110b50cc88SKevin Wolf 
712f3930ed0SKevin Wolf const BdrvChildRole child_file = {
713f3930ed0SKevin Wolf     .inherit_flags = bdrv_inherited_flags,
714f3930ed0SKevin Wolf };
715f3930ed0SKevin Wolf 
716f3930ed0SKevin Wolf /*
717f3930ed0SKevin Wolf  * Returns the flags that bs->file should get if the use of formats (and not
718f3930ed0SKevin Wolf  * only protocols) is permitted for it, based on the given flags for the parent
719f3930ed0SKevin Wolf  * BDS
720f3930ed0SKevin Wolf  */
721f3930ed0SKevin Wolf static int bdrv_inherited_fmt_flags(int parent_flags)
722f3930ed0SKevin Wolf {
723f3930ed0SKevin Wolf     int flags = child_file.inherit_flags(parent_flags);
724f3930ed0SKevin Wolf     return flags & ~BDRV_O_PROTOCOL;
725f3930ed0SKevin Wolf }
726f3930ed0SKevin Wolf 
727f3930ed0SKevin Wolf const BdrvChildRole child_format = {
728f3930ed0SKevin Wolf     .inherit_flags = bdrv_inherited_fmt_flags,
729f3930ed0SKevin Wolf };
730f3930ed0SKevin Wolf 
731317fc44eSKevin Wolf /*
732317fc44eSKevin Wolf  * Returns the flags that bs->backing_hd should get, based on the given flags
733317fc44eSKevin Wolf  * for the parent BDS
734317fc44eSKevin Wolf  */
735317fc44eSKevin Wolf static int bdrv_backing_flags(int flags)
736317fc44eSKevin Wolf {
737317fc44eSKevin Wolf     /* backing files always opened read-only */
738317fc44eSKevin Wolf     flags &= ~(BDRV_O_RDWR | BDRV_O_COPY_ON_READ);
739317fc44eSKevin Wolf 
740317fc44eSKevin Wolf     /* snapshot=on is handled on the top layer */
7418bfea15dSKevin Wolf     flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_TEMPORARY);
742317fc44eSKevin Wolf 
743317fc44eSKevin Wolf     return flags;
744317fc44eSKevin Wolf }
745317fc44eSKevin Wolf 
746f3930ed0SKevin Wolf static const BdrvChildRole child_backing = {
747f3930ed0SKevin Wolf     .inherit_flags = bdrv_backing_flags,
748f3930ed0SKevin Wolf };
749f3930ed0SKevin Wolf 
7507b272452SKevin Wolf static int bdrv_open_flags(BlockDriverState *bs, int flags)
7517b272452SKevin Wolf {
7527b272452SKevin Wolf     int open_flags = flags | BDRV_O_CACHE_WB;
7537b272452SKevin Wolf 
7547b272452SKevin Wolf     /*
7557b272452SKevin Wolf      * Clear flags that are internal to the block layer before opening the
7567b272452SKevin Wolf      * image.
7577b272452SKevin Wolf      */
75820cca275SKevin Wolf     open_flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_PROTOCOL);
7597b272452SKevin Wolf 
7607b272452SKevin Wolf     /*
7617b272452SKevin Wolf      * Snapshots should be writable.
7627b272452SKevin Wolf      */
7638bfea15dSKevin Wolf     if (flags & BDRV_O_TEMPORARY) {
7647b272452SKevin Wolf         open_flags |= BDRV_O_RDWR;
7657b272452SKevin Wolf     }
7667b272452SKevin Wolf 
7677b272452SKevin Wolf     return open_flags;
7687b272452SKevin Wolf }
7697b272452SKevin Wolf 
770636ea370SKevin Wolf static void bdrv_assign_node_name(BlockDriverState *bs,
7716913c0c2SBenoît Canet                                   const char *node_name,
7726913c0c2SBenoît Canet                                   Error **errp)
7736913c0c2SBenoît Canet {
7746913c0c2SBenoît Canet     if (!node_name) {
775636ea370SKevin Wolf         return;
7766913c0c2SBenoît Canet     }
7776913c0c2SBenoît Canet 
7789aebf3b8SKevin Wolf     /* Check for empty string or invalid characters */
779f5bebbbbSMarkus Armbruster     if (!id_wellformed(node_name)) {
7809aebf3b8SKevin Wolf         error_setg(errp, "Invalid node name");
781636ea370SKevin Wolf         return;
7826913c0c2SBenoît Canet     }
7836913c0c2SBenoît Canet 
7840c5e94eeSBenoît Canet     /* takes care of avoiding namespaces collisions */
7857f06d47eSMarkus Armbruster     if (blk_by_name(node_name)) {
7860c5e94eeSBenoît Canet         error_setg(errp, "node-name=%s is conflicting with a device id",
7870c5e94eeSBenoît Canet                    node_name);
788636ea370SKevin Wolf         return;
7890c5e94eeSBenoît Canet     }
7900c5e94eeSBenoît Canet 
7916913c0c2SBenoît Canet     /* takes care of avoiding duplicates node names */
7926913c0c2SBenoît Canet     if (bdrv_find_node(node_name)) {
7936913c0c2SBenoît Canet         error_setg(errp, "Duplicate node name");
794636ea370SKevin Wolf         return;
7956913c0c2SBenoît Canet     }
7966913c0c2SBenoît Canet 
7976913c0c2SBenoît Canet     /* copy node name into the bs and insert it into the graph list */
7986913c0c2SBenoît Canet     pstrcpy(bs->node_name, sizeof(bs->node_name), node_name);
7996913c0c2SBenoît Canet     QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs, node_list);
8006913c0c2SBenoît Canet }
8016913c0c2SBenoît Canet 
80218edf289SKevin Wolf static QemuOptsList bdrv_runtime_opts = {
80318edf289SKevin Wolf     .name = "bdrv_common",
80418edf289SKevin Wolf     .head = QTAILQ_HEAD_INITIALIZER(bdrv_runtime_opts.head),
80518edf289SKevin Wolf     .desc = {
80618edf289SKevin Wolf         {
80718edf289SKevin Wolf             .name = "node-name",
80818edf289SKevin Wolf             .type = QEMU_OPT_STRING,
80918edf289SKevin Wolf             .help = "Node name of the block device node",
81018edf289SKevin Wolf         },
81118edf289SKevin Wolf         { /* end of list */ }
81218edf289SKevin Wolf     },
81318edf289SKevin Wolf };
81418edf289SKevin Wolf 
815b6ce07aaSKevin Wolf /*
81657915332SKevin Wolf  * Common part for opening disk images and files
817b6ad491aSKevin Wolf  *
818b6ad491aSKevin Wolf  * Removes all processed options from *options.
81957915332SKevin Wolf  */
820f500a6d3SKevin Wolf static int bdrv_open_common(BlockDriverState *bs, BlockDriverState *file,
82134b5d2c6SMax Reitz     QDict *options, int flags, BlockDriver *drv, Error **errp)
82257915332SKevin Wolf {
82357915332SKevin Wolf     int ret, open_flags;
824035fccdfSKevin Wolf     const char *filename;
8256913c0c2SBenoît Canet     const char *node_name = NULL;
82618edf289SKevin Wolf     QemuOpts *opts;
82734b5d2c6SMax Reitz     Error *local_err = NULL;
82857915332SKevin Wolf 
82957915332SKevin Wolf     assert(drv != NULL);
8306405875cSPaolo Bonzini     assert(bs->file == NULL);
831707ff828SKevin Wolf     assert(options != NULL && bs->options != options);
83257915332SKevin Wolf 
83345673671SKevin Wolf     if (file != NULL) {
83445673671SKevin Wolf         filename = file->filename;
83545673671SKevin Wolf     } else {
83645673671SKevin Wolf         filename = qdict_get_try_str(options, "filename");
83745673671SKevin Wolf     }
83845673671SKevin Wolf 
839765003dbSKevin Wolf     if (drv->bdrv_needs_filename && !filename) {
840765003dbSKevin Wolf         error_setg(errp, "The '%s' block driver requires a file name",
841765003dbSKevin Wolf                    drv->format_name);
842765003dbSKevin Wolf         return -EINVAL;
843765003dbSKevin Wolf     }
844765003dbSKevin Wolf 
84545673671SKevin Wolf     trace_bdrv_open_common(bs, filename ?: "", flags, drv->format_name);
84628dcee10SStefan Hajnoczi 
84718edf289SKevin Wolf     opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
84818edf289SKevin Wolf     qemu_opts_absorb_qdict(opts, options, &local_err);
84918edf289SKevin Wolf     if (local_err) {
85018edf289SKevin Wolf         error_propagate(errp, local_err);
85118edf289SKevin Wolf         ret = -EINVAL;
85218edf289SKevin Wolf         goto fail_opts;
85318edf289SKevin Wolf     }
85418edf289SKevin Wolf 
85518edf289SKevin Wolf     node_name = qemu_opt_get(opts, "node-name");
856636ea370SKevin Wolf     bdrv_assign_node_name(bs, node_name, &local_err);
8570fb6395cSMarkus Armbruster     if (local_err) {
858636ea370SKevin Wolf         error_propagate(errp, local_err);
85918edf289SKevin Wolf         ret = -EINVAL;
86018edf289SKevin Wolf         goto fail_opts;
8615d186eb0SKevin Wolf     }
8625d186eb0SKevin Wolf 
8631b7fd729SPaolo Bonzini     bs->guest_block_size = 512;
864c25f53b0SPaolo Bonzini     bs->request_alignment = 512;
8650d51b4deSAsias He     bs->zero_beyond_eof = true;
866b64ec4e4SFam Zheng     open_flags = bdrv_open_flags(bs, flags);
867b64ec4e4SFam Zheng     bs->read_only = !(open_flags & BDRV_O_RDWR);
868b64ec4e4SFam Zheng 
869b64ec4e4SFam Zheng     if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv, bs->read_only)) {
8708f94a6e4SKevin Wolf         error_setg(errp,
8718f94a6e4SKevin Wolf                    !bs->read_only && bdrv_is_whitelisted(drv, true)
8728f94a6e4SKevin Wolf                         ? "Driver '%s' can only be used for read-only devices"
8738f94a6e4SKevin Wolf                         : "Driver '%s' is not whitelisted",
8748f94a6e4SKevin Wolf                    drv->format_name);
87518edf289SKevin Wolf         ret = -ENOTSUP;
87618edf289SKevin Wolf         goto fail_opts;
877b64ec4e4SFam Zheng     }
87857915332SKevin Wolf 
87953fec9d3SStefan Hajnoczi     assert(bs->copy_on_read == 0); /* bdrv_new() and bdrv_close() make it so */
8800ebd24e0SKevin Wolf     if (flags & BDRV_O_COPY_ON_READ) {
8810ebd24e0SKevin Wolf         if (!bs->read_only) {
88253fec9d3SStefan Hajnoczi             bdrv_enable_copy_on_read(bs);
8830ebd24e0SKevin Wolf         } else {
8840ebd24e0SKevin Wolf             error_setg(errp, "Can't use copy-on-read on read-only device");
88518edf289SKevin Wolf             ret = -EINVAL;
88618edf289SKevin Wolf             goto fail_opts;
8870ebd24e0SKevin Wolf         }
88853fec9d3SStefan Hajnoczi     }
88953fec9d3SStefan Hajnoczi 
890c2ad1b0cSKevin Wolf     if (filename != NULL) {
89157915332SKevin Wolf         pstrcpy(bs->filename, sizeof(bs->filename), filename);
892c2ad1b0cSKevin Wolf     } else {
893c2ad1b0cSKevin Wolf         bs->filename[0] = '\0';
894c2ad1b0cSKevin Wolf     }
89591af7014SMax Reitz     pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), bs->filename);
89657915332SKevin Wolf 
89757915332SKevin Wolf     bs->drv = drv;
8987267c094SAnthony Liguori     bs->opaque = g_malloc0(drv->instance_size);
89957915332SKevin Wolf 
90003f541bdSStefan Hajnoczi     bs->enable_write_cache = !!(flags & BDRV_O_CACHE_WB);
901e7c63796SStefan Hajnoczi 
90266f82ceeSKevin Wolf     /* Open the image, either directly or using a protocol */
90366f82ceeSKevin Wolf     if (drv->bdrv_file_open) {
9045d186eb0SKevin Wolf         assert(file == NULL);
905030be321SBenoît Canet         assert(!drv->bdrv_needs_filename || filename != NULL);
90634b5d2c6SMax Reitz         ret = drv->bdrv_file_open(bs, options, open_flags, &local_err);
907f500a6d3SKevin Wolf     } else {
9082af5ef70SKevin Wolf         if (file == NULL) {
90934b5d2c6SMax Reitz             error_setg(errp, "Can't use '%s' as a block driver for the "
91034b5d2c6SMax Reitz                        "protocol level", drv->format_name);
9112af5ef70SKevin Wolf             ret = -EINVAL;
9122af5ef70SKevin Wolf             goto free_and_fail;
9132af5ef70SKevin Wolf         }
914f500a6d3SKevin Wolf         bs->file = file;
91534b5d2c6SMax Reitz         ret = drv->bdrv_open(bs, options, open_flags, &local_err);
91666f82ceeSKevin Wolf     }
91766f82ceeSKevin Wolf 
91857915332SKevin Wolf     if (ret < 0) {
91984d18f06SMarkus Armbruster         if (local_err) {
92034b5d2c6SMax Reitz             error_propagate(errp, local_err);
9212fa9aa59SDunrong Huang         } else if (bs->filename[0]) {
9222fa9aa59SDunrong Huang             error_setg_errno(errp, -ret, "Could not open '%s'", bs->filename);
92334b5d2c6SMax Reitz         } else {
92434b5d2c6SMax Reitz             error_setg_errno(errp, -ret, "Could not open image");
92534b5d2c6SMax Reitz         }
92657915332SKevin Wolf         goto free_and_fail;
92757915332SKevin Wolf     }
92857915332SKevin Wolf 
929a1f688f4SMarkus Armbruster     if (bs->encrypted) {
930a1f688f4SMarkus Armbruster         error_report("Encrypted images are deprecated");
931a1f688f4SMarkus Armbruster         error_printf("Support for them will be removed in a future release.\n"
932a1f688f4SMarkus Armbruster                      "You can use 'qemu-img convert' to convert your image"
933a1f688f4SMarkus Armbruster                      " to an unencrypted one.\n");
934a1f688f4SMarkus Armbruster     }
935a1f688f4SMarkus Armbruster 
93651762288SStefan Hajnoczi     ret = refresh_total_sectors(bs, bs->total_sectors);
93751762288SStefan Hajnoczi     if (ret < 0) {
93834b5d2c6SMax Reitz         error_setg_errno(errp, -ret, "Could not refresh total sector count");
93951762288SStefan Hajnoczi         goto free_and_fail;
94057915332SKevin Wolf     }
94151762288SStefan Hajnoczi 
9423baca891SKevin Wolf     bdrv_refresh_limits(bs, &local_err);
9433baca891SKevin Wolf     if (local_err) {
9443baca891SKevin Wolf         error_propagate(errp, local_err);
9453baca891SKevin Wolf         ret = -EINVAL;
9463baca891SKevin Wolf         goto free_and_fail;
9473baca891SKevin Wolf     }
9483baca891SKevin Wolf 
949c25f53b0SPaolo Bonzini     assert(bdrv_opt_mem_align(bs) != 0);
9504196d2f0SDenis V. Lunev     assert(bdrv_min_mem_align(bs) != 0);
951b192af8aSDimitris Aragiorgis     assert((bs->request_alignment != 0) || bdrv_is_sg(bs));
95218edf289SKevin Wolf 
95318edf289SKevin Wolf     qemu_opts_del(opts);
95457915332SKevin Wolf     return 0;
95557915332SKevin Wolf 
95657915332SKevin Wolf free_and_fail:
95766f82ceeSKevin Wolf     bs->file = NULL;
9587267c094SAnthony Liguori     g_free(bs->opaque);
95957915332SKevin Wolf     bs->opaque = NULL;
96057915332SKevin Wolf     bs->drv = NULL;
96118edf289SKevin Wolf fail_opts:
96218edf289SKevin Wolf     qemu_opts_del(opts);
96357915332SKevin Wolf     return ret;
96457915332SKevin Wolf }
96557915332SKevin Wolf 
9665e5c4f63SKevin Wolf static QDict *parse_json_filename(const char *filename, Error **errp)
9675e5c4f63SKevin Wolf {
9685e5c4f63SKevin Wolf     QObject *options_obj;
9695e5c4f63SKevin Wolf     QDict *options;
9705e5c4f63SKevin Wolf     int ret;
9715e5c4f63SKevin Wolf 
9725e5c4f63SKevin Wolf     ret = strstart(filename, "json:", &filename);
9735e5c4f63SKevin Wolf     assert(ret);
9745e5c4f63SKevin Wolf 
9755e5c4f63SKevin Wolf     options_obj = qobject_from_json(filename);
9765e5c4f63SKevin Wolf     if (!options_obj) {
9775e5c4f63SKevin Wolf         error_setg(errp, "Could not parse the JSON options");
9785e5c4f63SKevin Wolf         return NULL;
9795e5c4f63SKevin Wolf     }
9805e5c4f63SKevin Wolf 
9815e5c4f63SKevin Wolf     if (qobject_type(options_obj) != QTYPE_QDICT) {
9825e5c4f63SKevin Wolf         qobject_decref(options_obj);
9835e5c4f63SKevin Wolf         error_setg(errp, "Invalid JSON object given");
9845e5c4f63SKevin Wolf         return NULL;
9855e5c4f63SKevin Wolf     }
9865e5c4f63SKevin Wolf 
9875e5c4f63SKevin Wolf     options = qobject_to_qdict(options_obj);
9885e5c4f63SKevin Wolf     qdict_flatten(options);
9895e5c4f63SKevin Wolf 
9905e5c4f63SKevin Wolf     return options;
9915e5c4f63SKevin Wolf }
9925e5c4f63SKevin Wolf 
99357915332SKevin Wolf /*
994f54120ffSKevin Wolf  * Fills in default options for opening images and converts the legacy
995f54120ffSKevin Wolf  * filename/flags pair to option QDict entries.
99653a29513SMax Reitz  * The BDRV_O_PROTOCOL flag in *flags will be set or cleared accordingly if a
99753a29513SMax Reitz  * block driver has been specified explicitly.
998f54120ffSKevin Wolf  */
99953a29513SMax Reitz static int bdrv_fill_options(QDict **options, const char **pfilename,
100053a29513SMax Reitz                              int *flags, BlockDriver *drv, Error **errp)
1001f54120ffSKevin Wolf {
10025e5c4f63SKevin Wolf     const char *filename = *pfilename;
1003f54120ffSKevin Wolf     const char *drvname;
100453a29513SMax Reitz     bool protocol = *flags & BDRV_O_PROTOCOL;
1005f54120ffSKevin Wolf     bool parse_filename = false;
100653a29513SMax Reitz     BlockDriver *tmp_drv;
1007f54120ffSKevin Wolf     Error *local_err = NULL;
1008f54120ffSKevin Wolf 
10095e5c4f63SKevin Wolf     /* Parse json: pseudo-protocol */
10105e5c4f63SKevin Wolf     if (filename && g_str_has_prefix(filename, "json:")) {
10115e5c4f63SKevin Wolf         QDict *json_options = parse_json_filename(filename, &local_err);
10125e5c4f63SKevin Wolf         if (local_err) {
10135e5c4f63SKevin Wolf             error_propagate(errp, local_err);
10145e5c4f63SKevin Wolf             return -EINVAL;
10155e5c4f63SKevin Wolf         }
10165e5c4f63SKevin Wolf 
10175e5c4f63SKevin Wolf         /* Options given in the filename have lower priority than options
10185e5c4f63SKevin Wolf          * specified directly */
10195e5c4f63SKevin Wolf         qdict_join(*options, json_options, false);
10205e5c4f63SKevin Wolf         QDECREF(json_options);
10215e5c4f63SKevin Wolf         *pfilename = filename = NULL;
10225e5c4f63SKevin Wolf     }
10235e5c4f63SKevin Wolf 
102453a29513SMax Reitz     drvname = qdict_get_try_str(*options, "driver");
102553a29513SMax Reitz 
102653a29513SMax Reitz     /* If the user has explicitly specified the driver, this choice should
102753a29513SMax Reitz      * override the BDRV_O_PROTOCOL flag */
102853a29513SMax Reitz     tmp_drv = drv;
102953a29513SMax Reitz     if (!tmp_drv && drvname) {
103053a29513SMax Reitz         tmp_drv = bdrv_find_format(drvname);
103153a29513SMax Reitz     }
103253a29513SMax Reitz     if (tmp_drv) {
103353a29513SMax Reitz         protocol = tmp_drv->bdrv_file_open;
103453a29513SMax Reitz     }
103553a29513SMax Reitz 
103653a29513SMax Reitz     if (protocol) {
103753a29513SMax Reitz         *flags |= BDRV_O_PROTOCOL;
103853a29513SMax Reitz     } else {
103953a29513SMax Reitz         *flags &= ~BDRV_O_PROTOCOL;
104053a29513SMax Reitz     }
104153a29513SMax Reitz 
1042f54120ffSKevin Wolf     /* Fetch the file name from the options QDict if necessary */
104317b005f1SKevin Wolf     if (protocol && filename) {
1044f54120ffSKevin Wolf         if (!qdict_haskey(*options, "filename")) {
1045f54120ffSKevin Wolf             qdict_put(*options, "filename", qstring_from_str(filename));
1046f54120ffSKevin Wolf             parse_filename = true;
1047f54120ffSKevin Wolf         } else {
1048f54120ffSKevin Wolf             error_setg(errp, "Can't specify 'file' and 'filename' options at "
1049f54120ffSKevin Wolf                              "the same time");
1050f54120ffSKevin Wolf             return -EINVAL;
1051f54120ffSKevin Wolf         }
1052f54120ffSKevin Wolf     }
1053f54120ffSKevin Wolf 
1054f54120ffSKevin Wolf     /* Find the right block driver */
1055f54120ffSKevin Wolf     filename = qdict_get_try_str(*options, "filename");
1056f54120ffSKevin Wolf 
105717b005f1SKevin Wolf     if (drv) {
105817b005f1SKevin Wolf         if (drvname) {
105917b005f1SKevin Wolf             error_setg(errp, "Driver specified twice");
106017b005f1SKevin Wolf             return -EINVAL;
106117b005f1SKevin Wolf         }
106217b005f1SKevin Wolf         drvname = drv->format_name;
106317b005f1SKevin Wolf         qdict_put(*options, "driver", qstring_from_str(drvname));
106417b005f1SKevin Wolf     } else {
106517b005f1SKevin Wolf         if (!drvname && protocol) {
1066f54120ffSKevin Wolf             if (filename) {
1067b65a5e12SMax Reitz                 drv = bdrv_find_protocol(filename, parse_filename, errp);
1068f54120ffSKevin Wolf                 if (!drv) {
1069f54120ffSKevin Wolf                     return -EINVAL;
1070f54120ffSKevin Wolf                 }
1071f54120ffSKevin Wolf 
1072f54120ffSKevin Wolf                 drvname = drv->format_name;
1073f54120ffSKevin Wolf                 qdict_put(*options, "driver", qstring_from_str(drvname));
1074f54120ffSKevin Wolf             } else {
1075f54120ffSKevin Wolf                 error_setg(errp, "Must specify either driver or file");
1076f54120ffSKevin Wolf                 return -EINVAL;
1077f54120ffSKevin Wolf             }
107817b005f1SKevin Wolf         } else if (drvname) {
1079f54120ffSKevin Wolf             drv = bdrv_find_format(drvname);
1080f54120ffSKevin Wolf             if (!drv) {
1081f54120ffSKevin Wolf                 error_setg(errp, "Unknown driver '%s'", drvname);
1082f54120ffSKevin Wolf                 return -ENOENT;
1083f54120ffSKevin Wolf             }
108417b005f1SKevin Wolf         }
108517b005f1SKevin Wolf     }
108617b005f1SKevin Wolf 
108717b005f1SKevin Wolf     assert(drv || !protocol);
1088f54120ffSKevin Wolf 
1089f54120ffSKevin Wolf     /* Driver-specific filename parsing */
109017b005f1SKevin Wolf     if (drv && drv->bdrv_parse_filename && parse_filename) {
1091f54120ffSKevin Wolf         drv->bdrv_parse_filename(filename, *options, &local_err);
1092f54120ffSKevin Wolf         if (local_err) {
1093f54120ffSKevin Wolf             error_propagate(errp, local_err);
1094f54120ffSKevin Wolf             return -EINVAL;
1095f54120ffSKevin Wolf         }
1096f54120ffSKevin Wolf 
1097f54120ffSKevin Wolf         if (!drv->bdrv_needs_filename) {
1098f54120ffSKevin Wolf             qdict_del(*options, "filename");
1099f54120ffSKevin Wolf         }
1100f54120ffSKevin Wolf     }
1101f54120ffSKevin Wolf 
1102f54120ffSKevin Wolf     return 0;
1103f54120ffSKevin Wolf }
1104f54120ffSKevin Wolf 
1105*b4b059f6SKevin Wolf static BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
1106df581792SKevin Wolf                                     BlockDriverState *child_bs,
1107df581792SKevin Wolf                                     const BdrvChildRole *child_role)
1108df581792SKevin Wolf {
1109df581792SKevin Wolf     BdrvChild *child = g_new(BdrvChild, 1);
1110df581792SKevin Wolf     *child = (BdrvChild) {
1111df581792SKevin Wolf         .bs     = child_bs,
1112df581792SKevin Wolf         .role   = child_role,
1113df581792SKevin Wolf     };
1114df581792SKevin Wolf 
1115df581792SKevin Wolf     QLIST_INSERT_HEAD(&parent_bs->children, child, next);
1116*b4b059f6SKevin Wolf 
1117*b4b059f6SKevin Wolf     return child;
1118df581792SKevin Wolf }
1119df581792SKevin Wolf 
11208d24cce1SFam Zheng void bdrv_set_backing_hd(BlockDriverState *bs, BlockDriverState *backing_hd)
11218d24cce1SFam Zheng {
11228d24cce1SFam Zheng 
1123826b6ca0SFam Zheng     if (bs->backing_hd) {
1124826b6ca0SFam Zheng         assert(bs->backing_blocker);
1125826b6ca0SFam Zheng         bdrv_op_unblock_all(bs->backing_hd, bs->backing_blocker);
1126826b6ca0SFam Zheng     } else if (backing_hd) {
1127826b6ca0SFam Zheng         error_setg(&bs->backing_blocker,
112881e5f78aSAlberto Garcia                    "node is used as backing hd of '%s'",
112981e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(bs));
1130826b6ca0SFam Zheng     }
1131826b6ca0SFam Zheng 
11328d24cce1SFam Zheng     bs->backing_hd = backing_hd;
11338d24cce1SFam Zheng     if (!backing_hd) {
1134826b6ca0SFam Zheng         error_free(bs->backing_blocker);
1135826b6ca0SFam Zheng         bs->backing_blocker = NULL;
11368d24cce1SFam Zheng         goto out;
11378d24cce1SFam Zheng     }
11388d24cce1SFam Zheng     bs->open_flags &= ~BDRV_O_NO_BACKING;
11398d24cce1SFam Zheng     pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_hd->filename);
11408d24cce1SFam Zheng     pstrcpy(bs->backing_format, sizeof(bs->backing_format),
11418d24cce1SFam Zheng             backing_hd->drv ? backing_hd->drv->format_name : "");
1142826b6ca0SFam Zheng 
1143826b6ca0SFam Zheng     bdrv_op_block_all(bs->backing_hd, bs->backing_blocker);
1144826b6ca0SFam Zheng     /* Otherwise we won't be able to commit due to check in bdrv_commit */
1145bb00021dSFam Zheng     bdrv_op_unblock(bs->backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET,
1146826b6ca0SFam Zheng                     bs->backing_blocker);
11478d24cce1SFam Zheng out:
11483baca891SKevin Wolf     bdrv_refresh_limits(bs, NULL);
11498d24cce1SFam Zheng }
11508d24cce1SFam Zheng 
115131ca6d07SKevin Wolf /*
115231ca6d07SKevin Wolf  * Opens the backing file for a BlockDriverState if not yet open
115331ca6d07SKevin Wolf  *
115431ca6d07SKevin Wolf  * options is a QDict of options to pass to the block drivers, or NULL for an
115531ca6d07SKevin Wolf  * empty set of options. The reference to the QDict is transferred to this
115631ca6d07SKevin Wolf  * function (even on failure), so if the caller intends to reuse the dictionary,
115731ca6d07SKevin Wolf  * it needs to use QINCREF() before calling bdrv_file_open.
115831ca6d07SKevin Wolf  */
115934b5d2c6SMax Reitz int bdrv_open_backing_file(BlockDriverState *bs, QDict *options, Error **errp)
11609156df12SPaolo Bonzini {
11611ba4b6a5SBenoît Canet     char *backing_filename = g_malloc0(PATH_MAX);
1162317fc44eSKevin Wolf     int ret = 0;
11638d24cce1SFam Zheng     BlockDriverState *backing_hd;
116434b5d2c6SMax Reitz     Error *local_err = NULL;
11659156df12SPaolo Bonzini 
11669156df12SPaolo Bonzini     if (bs->backing_hd != NULL) {
116731ca6d07SKevin Wolf         QDECREF(options);
11681ba4b6a5SBenoît Canet         goto free_exit;
11699156df12SPaolo Bonzini     }
11709156df12SPaolo Bonzini 
117131ca6d07SKevin Wolf     /* NULL means an empty set of options */
117231ca6d07SKevin Wolf     if (options == NULL) {
117331ca6d07SKevin Wolf         options = qdict_new();
117431ca6d07SKevin Wolf     }
117531ca6d07SKevin Wolf 
11769156df12SPaolo Bonzini     bs->open_flags &= ~BDRV_O_NO_BACKING;
11771cb6f506SKevin Wolf     if (qdict_haskey(options, "file.filename")) {
11781cb6f506SKevin Wolf         backing_filename[0] = '\0';
11791cb6f506SKevin Wolf     } else if (bs->backing_file[0] == '\0' && qdict_size(options) == 0) {
118031ca6d07SKevin Wolf         QDECREF(options);
11811ba4b6a5SBenoît Canet         goto free_exit;
1182dbecebddSFam Zheng     } else {
11839f07429eSMax Reitz         bdrv_get_full_backing_filename(bs, backing_filename, PATH_MAX,
11849f07429eSMax Reitz                                        &local_err);
11859f07429eSMax Reitz         if (local_err) {
11869f07429eSMax Reitz             ret = -EINVAL;
11879f07429eSMax Reitz             error_propagate(errp, local_err);
11889f07429eSMax Reitz             QDECREF(options);
11899f07429eSMax Reitz             goto free_exit;
11909f07429eSMax Reitz         }
11919156df12SPaolo Bonzini     }
11929156df12SPaolo Bonzini 
11938ee79e70SKevin Wolf     if (!bs->drv || !bs->drv->supports_backing) {
11948ee79e70SKevin Wolf         ret = -EINVAL;
11958ee79e70SKevin Wolf         error_setg(errp, "Driver doesn't support backing files");
11968ee79e70SKevin Wolf         QDECREF(options);
11978ee79e70SKevin Wolf         goto free_exit;
11988ee79e70SKevin Wolf     }
11998ee79e70SKevin Wolf 
1200e4e9986bSMarkus Armbruster     backing_hd = bdrv_new();
12018d24cce1SFam Zheng 
1202c5f6e493SKevin Wolf     if (bs->backing_format[0] != '\0' && !qdict_haskey(options, "driver")) {
1203c5f6e493SKevin Wolf         qdict_put(options, "driver", qstring_from_str(bs->backing_format));
12049156df12SPaolo Bonzini     }
12059156df12SPaolo Bonzini 
1206f67503e5SMax Reitz     assert(bs->backing_hd == NULL);
1207f3930ed0SKevin Wolf     ret = bdrv_open_inherit(&backing_hd,
1208f3930ed0SKevin Wolf                             *backing_filename ? backing_filename : NULL,
1209f3930ed0SKevin Wolf                             NULL, options, 0, bs, &child_backing,
1210f3930ed0SKevin Wolf                             NULL, &local_err);
12119156df12SPaolo Bonzini     if (ret < 0) {
12128d24cce1SFam Zheng         bdrv_unref(backing_hd);
12138d24cce1SFam Zheng         backing_hd = NULL;
12149156df12SPaolo Bonzini         bs->open_flags |= BDRV_O_NO_BACKING;
1215b04b6b6eSFam Zheng         error_setg(errp, "Could not open backing file: %s",
1216b04b6b6eSFam Zheng                    error_get_pretty(local_err));
1217b04b6b6eSFam Zheng         error_free(local_err);
12181ba4b6a5SBenoît Canet         goto free_exit;
12199156df12SPaolo Bonzini     }
1220df581792SKevin Wolf 
1221df581792SKevin Wolf     bdrv_attach_child(bs, backing_hd, &child_backing);
12228d24cce1SFam Zheng     bdrv_set_backing_hd(bs, backing_hd);
1223d80ac658SPeter Feiner 
12241ba4b6a5SBenoît Canet free_exit:
12251ba4b6a5SBenoît Canet     g_free(backing_filename);
12261ba4b6a5SBenoît Canet     return ret;
12279156df12SPaolo Bonzini }
12289156df12SPaolo Bonzini 
1229b6ce07aaSKevin Wolf /*
1230da557aacSMax Reitz  * Opens a disk image whose options are given as BlockdevRef in another block
1231da557aacSMax Reitz  * device's options.
1232da557aacSMax Reitz  *
1233da557aacSMax Reitz  * If allow_none is true, no image will be opened if filename is false and no
1234*b4b059f6SKevin Wolf  * BlockdevRef is given. NULL will be returned, but errp remains unset.
1235da557aacSMax Reitz  *
1236da557aacSMax Reitz  * bdrev_key specifies the key for the image's BlockdevRef in the options QDict.
1237da557aacSMax Reitz  * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1238da557aacSMax Reitz  * itself, all options starting with "${bdref_key}." are considered part of the
1239da557aacSMax Reitz  * BlockdevRef.
1240da557aacSMax Reitz  *
1241da557aacSMax Reitz  * The BlockdevRef will be removed from the options QDict.
1242da557aacSMax Reitz  */
1243*b4b059f6SKevin Wolf BdrvChild *bdrv_open_child(const char *filename,
1244f3930ed0SKevin Wolf                            QDict *options, const char *bdref_key,
1245*b4b059f6SKevin Wolf                            BlockDriverState* parent,
1246*b4b059f6SKevin Wolf                            const BdrvChildRole *child_role,
1247f7d9fd8cSMax Reitz                            bool allow_none, Error **errp)
1248da557aacSMax Reitz {
1249*b4b059f6SKevin Wolf     BdrvChild *c = NULL;
1250*b4b059f6SKevin Wolf     BlockDriverState *bs;
1251da557aacSMax Reitz     QDict *image_options;
1252da557aacSMax Reitz     int ret;
1253da557aacSMax Reitz     char *bdref_key_dot;
1254da557aacSMax Reitz     const char *reference;
1255da557aacSMax Reitz 
1256df581792SKevin Wolf     assert(child_role != NULL);
1257f67503e5SMax Reitz 
1258da557aacSMax Reitz     bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1259da557aacSMax Reitz     qdict_extract_subqdict(options, &image_options, bdref_key_dot);
1260da557aacSMax Reitz     g_free(bdref_key_dot);
1261da557aacSMax Reitz 
1262da557aacSMax Reitz     reference = qdict_get_try_str(options, bdref_key);
1263da557aacSMax Reitz     if (!filename && !reference && !qdict_size(image_options)) {
1264*b4b059f6SKevin Wolf         if (!allow_none) {
1265da557aacSMax Reitz             error_setg(errp, "A block device must be specified for \"%s\"",
1266da557aacSMax Reitz                        bdref_key);
1267da557aacSMax Reitz         }
1268b20e61e0SMarkus Armbruster         QDECREF(image_options);
1269da557aacSMax Reitz         goto done;
1270da557aacSMax Reitz     }
1271da557aacSMax Reitz 
1272*b4b059f6SKevin Wolf     bs = NULL;
1273*b4b059f6SKevin Wolf     ret = bdrv_open_inherit(&bs, filename, reference, image_options, 0,
1274f3930ed0SKevin Wolf                             parent, child_role, NULL, errp);
1275df581792SKevin Wolf     if (ret < 0) {
1276df581792SKevin Wolf         goto done;
1277df581792SKevin Wolf     }
1278df581792SKevin Wolf 
1279*b4b059f6SKevin Wolf     c = bdrv_attach_child(parent, bs, child_role);
1280da557aacSMax Reitz 
1281da557aacSMax Reitz done:
1282da557aacSMax Reitz     qdict_del(options, bdref_key);
1283*b4b059f6SKevin Wolf     return c;
1284*b4b059f6SKevin Wolf }
1285*b4b059f6SKevin Wolf 
1286*b4b059f6SKevin Wolf /*
1287*b4b059f6SKevin Wolf  * This is a version of bdrv_open_child() that returns 0/-EINVAL instead of
1288*b4b059f6SKevin Wolf  * a BdrvChild object.
1289*b4b059f6SKevin Wolf  *
1290*b4b059f6SKevin Wolf  * If allow_none is true, no image will be opened if filename is false and no
1291*b4b059f6SKevin Wolf  * BlockdevRef is given. *pbs will remain unchanged and 0 will be returned.
1292*b4b059f6SKevin Wolf  *
1293*b4b059f6SKevin Wolf  * To conform with the behavior of bdrv_open(), *pbs has to be NULL.
1294*b4b059f6SKevin Wolf  */
1295*b4b059f6SKevin Wolf int bdrv_open_image(BlockDriverState **pbs, const char *filename,
1296*b4b059f6SKevin Wolf                     QDict *options, const char *bdref_key,
1297*b4b059f6SKevin Wolf                     BlockDriverState* parent, const BdrvChildRole *child_role,
1298*b4b059f6SKevin Wolf                     bool allow_none, Error **errp)
1299*b4b059f6SKevin Wolf {
1300*b4b059f6SKevin Wolf     Error *local_err = NULL;
1301*b4b059f6SKevin Wolf     BdrvChild *c;
1302*b4b059f6SKevin Wolf 
1303*b4b059f6SKevin Wolf     assert(pbs);
1304*b4b059f6SKevin Wolf     assert(*pbs == NULL);
1305*b4b059f6SKevin Wolf 
1306*b4b059f6SKevin Wolf     c = bdrv_open_child(filename, options, bdref_key, parent, child_role,
1307*b4b059f6SKevin Wolf                         allow_none, &local_err);
1308*b4b059f6SKevin Wolf     if (local_err) {
1309*b4b059f6SKevin Wolf         error_propagate(errp, local_err);
1310*b4b059f6SKevin Wolf         return -EINVAL;
1311*b4b059f6SKevin Wolf     }
1312*b4b059f6SKevin Wolf 
1313*b4b059f6SKevin Wolf     if (c != NULL) {
1314*b4b059f6SKevin Wolf         *pbs = c->bs;
1315*b4b059f6SKevin Wolf     }
1316*b4b059f6SKevin Wolf 
1317*b4b059f6SKevin Wolf     return 0;
1318da557aacSMax Reitz }
1319da557aacSMax Reitz 
13206b8aeca5SChen Gang int bdrv_append_temp_snapshot(BlockDriverState *bs, int flags, Error **errp)
1321b998875dSKevin Wolf {
1322b998875dSKevin Wolf     /* TODO: extra byte is a hack to ensure MAX_PATH space on Windows. */
13231ba4b6a5SBenoît Canet     char *tmp_filename = g_malloc0(PATH_MAX + 1);
1324b998875dSKevin Wolf     int64_t total_size;
132583d0521aSChunyan Liu     QemuOpts *opts = NULL;
1326b998875dSKevin Wolf     QDict *snapshot_options;
1327b998875dSKevin Wolf     BlockDriverState *bs_snapshot;
1328c2e0dbbfSFam Zheng     Error *local_err = NULL;
1329b998875dSKevin Wolf     int ret;
1330b998875dSKevin Wolf 
1331b998875dSKevin Wolf     /* if snapshot, we create a temporary backing file and open it
1332b998875dSKevin Wolf        instead of opening 'filename' directly */
1333b998875dSKevin Wolf 
1334b998875dSKevin Wolf     /* Get the required size from the image */
1335f187743aSKevin Wolf     total_size = bdrv_getlength(bs);
1336f187743aSKevin Wolf     if (total_size < 0) {
13376b8aeca5SChen Gang         ret = total_size;
1338f187743aSKevin Wolf         error_setg_errno(errp, -total_size, "Could not get image size");
13391ba4b6a5SBenoît Canet         goto out;
1340f187743aSKevin Wolf     }
1341b998875dSKevin Wolf 
1342b998875dSKevin Wolf     /* Create the temporary image */
13431ba4b6a5SBenoît Canet     ret = get_tmp_filename(tmp_filename, PATH_MAX + 1);
1344b998875dSKevin Wolf     if (ret < 0) {
1345b998875dSKevin Wolf         error_setg_errno(errp, -ret, "Could not get temporary filename");
13461ba4b6a5SBenoît Canet         goto out;
1347b998875dSKevin Wolf     }
1348b998875dSKevin Wolf 
1349ef810437SMax Reitz     opts = qemu_opts_create(bdrv_qcow2.create_opts, NULL, 0,
1350c282e1fdSChunyan Liu                             &error_abort);
135139101f25SMarkus Armbruster     qemu_opt_set_number(opts, BLOCK_OPT_SIZE, total_size, &error_abort);
1352ef810437SMax Reitz     ret = bdrv_create(&bdrv_qcow2, tmp_filename, opts, &local_err);
135383d0521aSChunyan Liu     qemu_opts_del(opts);
1354b998875dSKevin Wolf     if (ret < 0) {
1355b998875dSKevin Wolf         error_setg_errno(errp, -ret, "Could not create temporary overlay "
1356b998875dSKevin Wolf                          "'%s': %s", tmp_filename,
1357b998875dSKevin Wolf                          error_get_pretty(local_err));
1358b998875dSKevin Wolf         error_free(local_err);
13591ba4b6a5SBenoît Canet         goto out;
1360b998875dSKevin Wolf     }
1361b998875dSKevin Wolf 
1362b998875dSKevin Wolf     /* Prepare a new options QDict for the temporary file */
1363b998875dSKevin Wolf     snapshot_options = qdict_new();
1364b998875dSKevin Wolf     qdict_put(snapshot_options, "file.driver",
1365b998875dSKevin Wolf               qstring_from_str("file"));
1366b998875dSKevin Wolf     qdict_put(snapshot_options, "file.filename",
1367b998875dSKevin Wolf               qstring_from_str(tmp_filename));
1368b998875dSKevin Wolf 
1369e4e9986bSMarkus Armbruster     bs_snapshot = bdrv_new();
1370b998875dSKevin Wolf 
1371b998875dSKevin Wolf     ret = bdrv_open(&bs_snapshot, NULL, NULL, snapshot_options,
1372ef810437SMax Reitz                     flags, &bdrv_qcow2, &local_err);
1373b998875dSKevin Wolf     if (ret < 0) {
1374b998875dSKevin Wolf         error_propagate(errp, local_err);
13751ba4b6a5SBenoît Canet         goto out;
1376b998875dSKevin Wolf     }
1377b998875dSKevin Wolf 
1378b998875dSKevin Wolf     bdrv_append(bs_snapshot, bs);
13791ba4b6a5SBenoît Canet 
13801ba4b6a5SBenoît Canet out:
13811ba4b6a5SBenoît Canet     g_free(tmp_filename);
13826b8aeca5SChen Gang     return ret;
1383b998875dSKevin Wolf }
1384b998875dSKevin Wolf 
1385da557aacSMax Reitz /*
1386b6ce07aaSKevin Wolf  * Opens a disk image (raw, qcow2, vmdk, ...)
1387de9c0cecSKevin Wolf  *
1388de9c0cecSKevin Wolf  * options is a QDict of options to pass to the block drivers, or NULL for an
1389de9c0cecSKevin Wolf  * empty set of options. The reference to the QDict belongs to the block layer
1390de9c0cecSKevin Wolf  * after the call (even on failure), so if the caller intends to reuse the
1391de9c0cecSKevin Wolf  * dictionary, it needs to use QINCREF() before calling bdrv_open.
1392f67503e5SMax Reitz  *
1393f67503e5SMax Reitz  * If *pbs is NULL, a new BDS will be created with a pointer to it stored there.
1394f67503e5SMax Reitz  * If it is not NULL, the referenced BDS will be reused.
1395ddf5636dSMax Reitz  *
1396ddf5636dSMax Reitz  * The reference parameter may be used to specify an existing block device which
1397ddf5636dSMax Reitz  * should be opened. If specified, neither options nor a filename may be given,
1398ddf5636dSMax Reitz  * nor can an existing BDS be reused (that is, *pbs has to be NULL).
1399b6ce07aaSKevin Wolf  */
1400f3930ed0SKevin Wolf static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
1401ddf5636dSMax Reitz                              const char *reference, QDict *options, int flags,
1402f3930ed0SKevin Wolf                              BlockDriverState *parent,
1403f3930ed0SKevin Wolf                              const BdrvChildRole *child_role,
1404ddf5636dSMax Reitz                              BlockDriver *drv, Error **errp)
1405ea2384d3Sbellard {
1406b6ce07aaSKevin Wolf     int ret;
1407f67503e5SMax Reitz     BlockDriverState *file = NULL, *bs;
140874fe54f2SKevin Wolf     const char *drvname;
140934b5d2c6SMax Reitz     Error *local_err = NULL;
1410b1e6fc08SKevin Wolf     int snapshot_flags = 0;
141133e3963eSbellard 
1412f67503e5SMax Reitz     assert(pbs);
1413f3930ed0SKevin Wolf     assert(!child_role || !flags);
1414f3930ed0SKevin Wolf     assert(!child_role == !parent);
1415f67503e5SMax Reitz 
1416ddf5636dSMax Reitz     if (reference) {
1417ddf5636dSMax Reitz         bool options_non_empty = options ? qdict_size(options) : false;
1418ddf5636dSMax Reitz         QDECREF(options);
1419ddf5636dSMax Reitz 
1420ddf5636dSMax Reitz         if (*pbs) {
1421ddf5636dSMax Reitz             error_setg(errp, "Cannot reuse an existing BDS when referencing "
1422ddf5636dSMax Reitz                        "another block device");
1423ddf5636dSMax Reitz             return -EINVAL;
1424ddf5636dSMax Reitz         }
1425ddf5636dSMax Reitz 
1426ddf5636dSMax Reitz         if (filename || options_non_empty) {
1427ddf5636dSMax Reitz             error_setg(errp, "Cannot reference an existing block device with "
1428ddf5636dSMax Reitz                        "additional options or a new filename");
1429ddf5636dSMax Reitz             return -EINVAL;
1430ddf5636dSMax Reitz         }
1431ddf5636dSMax Reitz 
1432ddf5636dSMax Reitz         bs = bdrv_lookup_bs(reference, reference, errp);
1433ddf5636dSMax Reitz         if (!bs) {
1434ddf5636dSMax Reitz             return -ENODEV;
1435ddf5636dSMax Reitz         }
1436ddf5636dSMax Reitz         bdrv_ref(bs);
1437ddf5636dSMax Reitz         *pbs = bs;
1438ddf5636dSMax Reitz         return 0;
1439ddf5636dSMax Reitz     }
1440ddf5636dSMax Reitz 
1441f67503e5SMax Reitz     if (*pbs) {
1442f67503e5SMax Reitz         bs = *pbs;
1443f67503e5SMax Reitz     } else {
1444e4e9986bSMarkus Armbruster         bs = bdrv_new();
1445f67503e5SMax Reitz     }
1446f67503e5SMax Reitz 
1447de9c0cecSKevin Wolf     /* NULL means an empty set of options */
1448de9c0cecSKevin Wolf     if (options == NULL) {
1449de9c0cecSKevin Wolf         options = qdict_new();
1450de9c0cecSKevin Wolf     }
1451de9c0cecSKevin Wolf 
1452f3930ed0SKevin Wolf     if (child_role) {
1453bddcec37SKevin Wolf         bs->inherits_from = parent;
1454f3930ed0SKevin Wolf         flags = child_role->inherit_flags(parent->open_flags);
1455f3930ed0SKevin Wolf     }
1456f3930ed0SKevin Wolf 
145753a29513SMax Reitz     ret = bdrv_fill_options(&options, &filename, &flags, drv, &local_err);
1458462f5bcfSKevin Wolf     if (local_err) {
1459462f5bcfSKevin Wolf         goto fail;
1460462f5bcfSKevin Wolf     }
1461462f5bcfSKevin Wolf 
146276c591b0SKevin Wolf     /* Find the right image format driver */
146376c591b0SKevin Wolf     drv = NULL;
146476c591b0SKevin Wolf     drvname = qdict_get_try_str(options, "driver");
146576c591b0SKevin Wolf     if (drvname) {
146676c591b0SKevin Wolf         drv = bdrv_find_format(drvname);
146776c591b0SKevin Wolf         qdict_del(options, "driver");
146876c591b0SKevin Wolf         if (!drv) {
146976c591b0SKevin Wolf             error_setg(errp, "Unknown driver: '%s'", drvname);
147076c591b0SKevin Wolf             ret = -EINVAL;
147176c591b0SKevin Wolf             goto fail;
147276c591b0SKevin Wolf         }
147376c591b0SKevin Wolf     }
147476c591b0SKevin Wolf 
147576c591b0SKevin Wolf     assert(drvname || !(flags & BDRV_O_PROTOCOL));
147676c591b0SKevin Wolf 
1477f3930ed0SKevin Wolf     bs->open_flags = flags;
1478de9c0cecSKevin Wolf     bs->options = options;
1479b6ad491aSKevin Wolf     options = qdict_clone_shallow(options);
1480de9c0cecSKevin Wolf 
1481f500a6d3SKevin Wolf     /* Open image file without format layer */
1482f4788adcSKevin Wolf     if ((flags & BDRV_O_PROTOCOL) == 0) {
1483be028adcSJeff Cody         if (flags & BDRV_O_RDWR) {
1484be028adcSJeff Cody             flags |= BDRV_O_ALLOW_RDWR;
1485be028adcSJeff Cody         }
1486b1e6fc08SKevin Wolf         if (flags & BDRV_O_SNAPSHOT) {
1487b1e6fc08SKevin Wolf             snapshot_flags = bdrv_temp_snapshot_flags(flags);
1488b1e6fc08SKevin Wolf             flags = bdrv_backing_flags(flags);
1489b1e6fc08SKevin Wolf         }
1490be028adcSJeff Cody 
1491f67503e5SMax Reitz         assert(file == NULL);
1492f3930ed0SKevin Wolf         bs->open_flags = flags;
1493054963f8SMax Reitz         ret = bdrv_open_image(&file, filename, options, "file",
1494f3930ed0SKevin Wolf                               bs, &child_file, true, &local_err);
1495f500a6d3SKevin Wolf         if (ret < 0) {
14968bfea15dSKevin Wolf             goto fail;
1497f500a6d3SKevin Wolf         }
1498f4788adcSKevin Wolf     }
1499f500a6d3SKevin Wolf 
150076c591b0SKevin Wolf     /* Image format probing */
150138f3ef57SKevin Wolf     bs->probed = !drv;
150276c591b0SKevin Wolf     if (!drv && file) {
150334b5d2c6SMax Reitz         ret = find_image_format(file, filename, &drv, &local_err);
150417b005f1SKevin Wolf         if (ret < 0) {
150517b005f1SKevin Wolf             goto fail;
150617b005f1SKevin Wolf         }
150776c591b0SKevin Wolf     } else if (!drv) {
15082a05cbe4SMax Reitz         error_setg(errp, "Must specify either driver or file");
15092a05cbe4SMax Reitz         ret = -EINVAL;
15108bfea15dSKevin Wolf         goto fail;
15112a05cbe4SMax Reitz     }
1512f500a6d3SKevin Wolf 
151353a29513SMax Reitz     /* BDRV_O_PROTOCOL must be set iff a protocol BDS is about to be created */
151453a29513SMax Reitz     assert(!!(flags & BDRV_O_PROTOCOL) == !!drv->bdrv_file_open);
151553a29513SMax Reitz     /* file must be NULL if a protocol BDS is about to be created
151653a29513SMax Reitz      * (the inverse results in an error message from bdrv_open_common()) */
151753a29513SMax Reitz     assert(!(flags & BDRV_O_PROTOCOL) || !file);
151853a29513SMax Reitz 
1519b6ce07aaSKevin Wolf     /* Open the image */
152034b5d2c6SMax Reitz     ret = bdrv_open_common(bs, file, options, flags, drv, &local_err);
1521b6ce07aaSKevin Wolf     if (ret < 0) {
15228bfea15dSKevin Wolf         goto fail;
15236987307cSChristoph Hellwig     }
15246987307cSChristoph Hellwig 
15252a05cbe4SMax Reitz     if (file && (bs->file != file)) {
15264f6fd349SFam Zheng         bdrv_unref(file);
1527f500a6d3SKevin Wolf         file = NULL;
1528f500a6d3SKevin Wolf     }
1529f500a6d3SKevin Wolf 
1530b6ce07aaSKevin Wolf     /* If there is a backing file, use it */
15319156df12SPaolo Bonzini     if ((flags & BDRV_O_NO_BACKING) == 0) {
153231ca6d07SKevin Wolf         QDict *backing_options;
153331ca6d07SKevin Wolf 
15345726d872SBenoît Canet         qdict_extract_subqdict(options, &backing_options, "backing.");
153534b5d2c6SMax Reitz         ret = bdrv_open_backing_file(bs, backing_options, &local_err);
1536b6ce07aaSKevin Wolf         if (ret < 0) {
1537b6ad491aSKevin Wolf             goto close_and_fail;
1538b6ce07aaSKevin Wolf         }
1539b6ce07aaSKevin Wolf     }
1540b6ce07aaSKevin Wolf 
154191af7014SMax Reitz     bdrv_refresh_filename(bs);
154291af7014SMax Reitz 
1543b998875dSKevin Wolf     /* For snapshot=on, create a temporary qcow2 overlay. bs points to the
1544b998875dSKevin Wolf      * temporary snapshot afterwards. */
1545b1e6fc08SKevin Wolf     if (snapshot_flags) {
15466b8aeca5SChen Gang         ret = bdrv_append_temp_snapshot(bs, snapshot_flags, &local_err);
1547b998875dSKevin Wolf         if (local_err) {
1548b998875dSKevin Wolf             goto close_and_fail;
1549b998875dSKevin Wolf         }
1550b998875dSKevin Wolf     }
1551b998875dSKevin Wolf 
1552b6ad491aSKevin Wolf     /* Check if any unknown options were used */
15535acd9d81SMax Reitz     if (options && (qdict_size(options) != 0)) {
1554b6ad491aSKevin Wolf         const QDictEntry *entry = qdict_first(options);
15555acd9d81SMax Reitz         if (flags & BDRV_O_PROTOCOL) {
15565acd9d81SMax Reitz             error_setg(errp, "Block protocol '%s' doesn't support the option "
15575acd9d81SMax Reitz                        "'%s'", drv->format_name, entry->key);
15585acd9d81SMax Reitz         } else {
155934b5d2c6SMax Reitz             error_setg(errp, "Block format '%s' used by device '%s' doesn't "
15605acd9d81SMax Reitz                        "support the option '%s'", drv->format_name,
1561bfb197e0SMarkus Armbruster                        bdrv_get_device_name(bs), entry->key);
15625acd9d81SMax Reitz         }
1563b6ad491aSKevin Wolf 
1564b6ad491aSKevin Wolf         ret = -EINVAL;
1565b6ad491aSKevin Wolf         goto close_and_fail;
1566b6ad491aSKevin Wolf     }
1567b6ad491aSKevin Wolf 
1568b6ce07aaSKevin Wolf     if (!bdrv_key_required(bs)) {
1569a7f53e26SMarkus Armbruster         if (bs->blk) {
1570a7f53e26SMarkus Armbruster             blk_dev_change_media_cb(bs->blk, true);
1571a7f53e26SMarkus Armbruster         }
1572c3adb58fSMarkus Armbruster     } else if (!runstate_check(RUN_STATE_PRELAUNCH)
1573c3adb58fSMarkus Armbruster                && !runstate_check(RUN_STATE_INMIGRATE)
1574c3adb58fSMarkus Armbruster                && !runstate_check(RUN_STATE_PAUSED)) { /* HACK */
1575c3adb58fSMarkus Armbruster         error_setg(errp,
1576c3adb58fSMarkus Armbruster                    "Guest must be stopped for opening of encrypted image");
1577c3adb58fSMarkus Armbruster         ret = -EBUSY;
1578c3adb58fSMarkus Armbruster         goto close_and_fail;
1579b6ce07aaSKevin Wolf     }
1580b6ce07aaSKevin Wolf 
1581c3adb58fSMarkus Armbruster     QDECREF(options);
1582f67503e5SMax Reitz     *pbs = bs;
1583b6ce07aaSKevin Wolf     return 0;
1584b6ce07aaSKevin Wolf 
15858bfea15dSKevin Wolf fail:
1586f500a6d3SKevin Wolf     if (file != NULL) {
15874f6fd349SFam Zheng         bdrv_unref(file);
1588f500a6d3SKevin Wolf     }
1589de9c0cecSKevin Wolf     QDECREF(bs->options);
1590b6ad491aSKevin Wolf     QDECREF(options);
1591de9c0cecSKevin Wolf     bs->options = NULL;
1592f67503e5SMax Reitz     if (!*pbs) {
1593f67503e5SMax Reitz         /* If *pbs is NULL, a new BDS has been created in this function and
1594f67503e5SMax Reitz            needs to be freed now. Otherwise, it does not need to be closed,
1595f67503e5SMax Reitz            since it has not really been opened yet. */
1596f67503e5SMax Reitz         bdrv_unref(bs);
1597f67503e5SMax Reitz     }
159884d18f06SMarkus Armbruster     if (local_err) {
159934b5d2c6SMax Reitz         error_propagate(errp, local_err);
160034b5d2c6SMax Reitz     }
1601b6ad491aSKevin Wolf     return ret;
1602de9c0cecSKevin Wolf 
1603b6ad491aSKevin Wolf close_and_fail:
1604f67503e5SMax Reitz     /* See fail path, but now the BDS has to be always closed */
1605f67503e5SMax Reitz     if (*pbs) {
1606b6ad491aSKevin Wolf         bdrv_close(bs);
1607f67503e5SMax Reitz     } else {
1608f67503e5SMax Reitz         bdrv_unref(bs);
1609f67503e5SMax Reitz     }
1610b6ad491aSKevin Wolf     QDECREF(options);
161184d18f06SMarkus Armbruster     if (local_err) {
161234b5d2c6SMax Reitz         error_propagate(errp, local_err);
161334b5d2c6SMax Reitz     }
1614b6ce07aaSKevin Wolf     return ret;
1615b6ce07aaSKevin Wolf }
1616b6ce07aaSKevin Wolf 
1617f3930ed0SKevin Wolf int bdrv_open(BlockDriverState **pbs, const char *filename,
1618f3930ed0SKevin Wolf               const char *reference, QDict *options, int flags,
1619f3930ed0SKevin Wolf               BlockDriver *drv, Error **errp)
1620f3930ed0SKevin Wolf {
1621f3930ed0SKevin Wolf     return bdrv_open_inherit(pbs, filename, reference, options, flags, NULL,
1622f3930ed0SKevin Wolf                              NULL, drv, errp);
1623f3930ed0SKevin Wolf }
1624f3930ed0SKevin Wolf 
1625e971aa12SJeff Cody typedef struct BlockReopenQueueEntry {
1626e971aa12SJeff Cody      bool prepared;
1627e971aa12SJeff Cody      BDRVReopenState state;
1628e971aa12SJeff Cody      QSIMPLEQ_ENTRY(BlockReopenQueueEntry) entry;
1629e971aa12SJeff Cody } BlockReopenQueueEntry;
1630e971aa12SJeff Cody 
1631e971aa12SJeff Cody /*
1632e971aa12SJeff Cody  * Adds a BlockDriverState to a simple queue for an atomic, transactional
1633e971aa12SJeff Cody  * reopen of multiple devices.
1634e971aa12SJeff Cody  *
1635e971aa12SJeff Cody  * bs_queue can either be an existing BlockReopenQueue that has had QSIMPLE_INIT
1636e971aa12SJeff Cody  * already performed, or alternatively may be NULL a new BlockReopenQueue will
1637e971aa12SJeff Cody  * be created and initialized. This newly created BlockReopenQueue should be
1638e971aa12SJeff Cody  * passed back in for subsequent calls that are intended to be of the same
1639e971aa12SJeff Cody  * atomic 'set'.
1640e971aa12SJeff Cody  *
1641e971aa12SJeff Cody  * bs is the BlockDriverState to add to the reopen queue.
1642e971aa12SJeff Cody  *
1643e971aa12SJeff Cody  * flags contains the open flags for the associated bs
1644e971aa12SJeff Cody  *
1645e971aa12SJeff Cody  * returns a pointer to bs_queue, which is either the newly allocated
1646e971aa12SJeff Cody  * bs_queue, or the existing bs_queue being used.
1647e971aa12SJeff Cody  *
1648e971aa12SJeff Cody  */
1649e971aa12SJeff Cody BlockReopenQueue *bdrv_reopen_queue(BlockReopenQueue *bs_queue,
1650e971aa12SJeff Cody                                     BlockDriverState *bs, int flags)
1651e971aa12SJeff Cody {
1652e971aa12SJeff Cody     assert(bs != NULL);
1653e971aa12SJeff Cody 
1654e971aa12SJeff Cody     BlockReopenQueueEntry *bs_entry;
165567251a31SKevin Wolf     BdrvChild *child;
165667251a31SKevin Wolf 
1657e971aa12SJeff Cody     if (bs_queue == NULL) {
1658e971aa12SJeff Cody         bs_queue = g_new0(BlockReopenQueue, 1);
1659e971aa12SJeff Cody         QSIMPLEQ_INIT(bs_queue);
1660e971aa12SJeff Cody     }
1661e971aa12SJeff Cody 
1662f1f25a2eSKevin Wolf     /* bdrv_open() masks this flag out */
1663f1f25a2eSKevin Wolf     flags &= ~BDRV_O_PROTOCOL;
1664f1f25a2eSKevin Wolf 
166567251a31SKevin Wolf     QLIST_FOREACH(child, &bs->children, next) {
166667251a31SKevin Wolf         int child_flags;
166767251a31SKevin Wolf 
166867251a31SKevin Wolf         if (child->bs->inherits_from != bs) {
166967251a31SKevin Wolf             continue;
167067251a31SKevin Wolf         }
167167251a31SKevin Wolf 
167267251a31SKevin Wolf         child_flags = child->role->inherit_flags(flags);
167367251a31SKevin Wolf         bdrv_reopen_queue(bs_queue, child->bs, child_flags);
1674e971aa12SJeff Cody     }
1675e971aa12SJeff Cody 
1676e971aa12SJeff Cody     bs_entry = g_new0(BlockReopenQueueEntry, 1);
1677e971aa12SJeff Cody     QSIMPLEQ_INSERT_TAIL(bs_queue, bs_entry, entry);
1678e971aa12SJeff Cody 
1679e971aa12SJeff Cody     bs_entry->state.bs = bs;
1680e971aa12SJeff Cody     bs_entry->state.flags = flags;
1681e971aa12SJeff Cody 
1682e971aa12SJeff Cody     return bs_queue;
1683e971aa12SJeff Cody }
1684e971aa12SJeff Cody 
1685e971aa12SJeff Cody /*
1686e971aa12SJeff Cody  * Reopen multiple BlockDriverStates atomically & transactionally.
1687e971aa12SJeff Cody  *
1688e971aa12SJeff Cody  * The queue passed in (bs_queue) must have been built up previous
1689e971aa12SJeff Cody  * via bdrv_reopen_queue().
1690e971aa12SJeff Cody  *
1691e971aa12SJeff Cody  * Reopens all BDS specified in the queue, with the appropriate
1692e971aa12SJeff Cody  * flags.  All devices are prepared for reopen, and failure of any
1693e971aa12SJeff Cody  * device will cause all device changes to be abandonded, and intermediate
1694e971aa12SJeff Cody  * data cleaned up.
1695e971aa12SJeff Cody  *
1696e971aa12SJeff Cody  * If all devices prepare successfully, then the changes are committed
1697e971aa12SJeff Cody  * to all devices.
1698e971aa12SJeff Cody  *
1699e971aa12SJeff Cody  */
1700e971aa12SJeff Cody int bdrv_reopen_multiple(BlockReopenQueue *bs_queue, Error **errp)
1701e971aa12SJeff Cody {
1702e971aa12SJeff Cody     int ret = -1;
1703e971aa12SJeff Cody     BlockReopenQueueEntry *bs_entry, *next;
1704e971aa12SJeff Cody     Error *local_err = NULL;
1705e971aa12SJeff Cody 
1706e971aa12SJeff Cody     assert(bs_queue != NULL);
1707e971aa12SJeff Cody 
1708e971aa12SJeff Cody     bdrv_drain_all();
1709e971aa12SJeff Cody 
1710e971aa12SJeff Cody     QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1711e971aa12SJeff Cody         if (bdrv_reopen_prepare(&bs_entry->state, bs_queue, &local_err)) {
1712e971aa12SJeff Cody             error_propagate(errp, local_err);
1713e971aa12SJeff Cody             goto cleanup;
1714e971aa12SJeff Cody         }
1715e971aa12SJeff Cody         bs_entry->prepared = true;
1716e971aa12SJeff Cody     }
1717e971aa12SJeff Cody 
1718e971aa12SJeff Cody     /* If we reach this point, we have success and just need to apply the
1719e971aa12SJeff Cody      * changes
1720e971aa12SJeff Cody      */
1721e971aa12SJeff Cody     QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1722e971aa12SJeff Cody         bdrv_reopen_commit(&bs_entry->state);
1723e971aa12SJeff Cody     }
1724e971aa12SJeff Cody 
1725e971aa12SJeff Cody     ret = 0;
1726e971aa12SJeff Cody 
1727e971aa12SJeff Cody cleanup:
1728e971aa12SJeff Cody     QSIMPLEQ_FOREACH_SAFE(bs_entry, bs_queue, entry, next) {
1729e971aa12SJeff Cody         if (ret && bs_entry->prepared) {
1730e971aa12SJeff Cody             bdrv_reopen_abort(&bs_entry->state);
1731e971aa12SJeff Cody         }
1732e971aa12SJeff Cody         g_free(bs_entry);
1733e971aa12SJeff Cody     }
1734e971aa12SJeff Cody     g_free(bs_queue);
1735e971aa12SJeff Cody     return ret;
1736e971aa12SJeff Cody }
1737e971aa12SJeff Cody 
1738e971aa12SJeff Cody 
1739e971aa12SJeff Cody /* Reopen a single BlockDriverState with the specified flags. */
1740e971aa12SJeff Cody int bdrv_reopen(BlockDriverState *bs, int bdrv_flags, Error **errp)
1741e971aa12SJeff Cody {
1742e971aa12SJeff Cody     int ret = -1;
1743e971aa12SJeff Cody     Error *local_err = NULL;
1744e971aa12SJeff Cody     BlockReopenQueue *queue = bdrv_reopen_queue(NULL, bs, bdrv_flags);
1745e971aa12SJeff Cody 
1746e971aa12SJeff Cody     ret = bdrv_reopen_multiple(queue, &local_err);
1747e971aa12SJeff Cody     if (local_err != NULL) {
1748e971aa12SJeff Cody         error_propagate(errp, local_err);
1749e971aa12SJeff Cody     }
1750e971aa12SJeff Cody     return ret;
1751e971aa12SJeff Cody }
1752e971aa12SJeff Cody 
1753e971aa12SJeff Cody 
1754e971aa12SJeff Cody /*
1755e971aa12SJeff Cody  * Prepares a BlockDriverState for reopen. All changes are staged in the
1756e971aa12SJeff Cody  * 'opaque' field of the BDRVReopenState, which is used and allocated by
1757e971aa12SJeff Cody  * the block driver layer .bdrv_reopen_prepare()
1758e971aa12SJeff Cody  *
1759e971aa12SJeff Cody  * bs is the BlockDriverState to reopen
1760e971aa12SJeff Cody  * flags are the new open flags
1761e971aa12SJeff Cody  * queue is the reopen queue
1762e971aa12SJeff Cody  *
1763e971aa12SJeff Cody  * Returns 0 on success, non-zero on error.  On error errp will be set
1764e971aa12SJeff Cody  * as well.
1765e971aa12SJeff Cody  *
1766e971aa12SJeff Cody  * On failure, bdrv_reopen_abort() will be called to clean up any data.
1767e971aa12SJeff Cody  * It is the responsibility of the caller to then call the abort() or
1768e971aa12SJeff Cody  * commit() for any other BDS that have been left in a prepare() state
1769e971aa12SJeff Cody  *
1770e971aa12SJeff Cody  */
1771e971aa12SJeff Cody int bdrv_reopen_prepare(BDRVReopenState *reopen_state, BlockReopenQueue *queue,
1772e971aa12SJeff Cody                         Error **errp)
1773e971aa12SJeff Cody {
1774e971aa12SJeff Cody     int ret = -1;
1775e971aa12SJeff Cody     Error *local_err = NULL;
1776e971aa12SJeff Cody     BlockDriver *drv;
1777e971aa12SJeff Cody 
1778e971aa12SJeff Cody     assert(reopen_state != NULL);
1779e971aa12SJeff Cody     assert(reopen_state->bs->drv != NULL);
1780e971aa12SJeff Cody     drv = reopen_state->bs->drv;
1781e971aa12SJeff Cody 
1782e971aa12SJeff Cody     /* if we are to stay read-only, do not allow permission change
1783e971aa12SJeff Cody      * to r/w */
1784e971aa12SJeff Cody     if (!(reopen_state->bs->open_flags & BDRV_O_ALLOW_RDWR) &&
1785e971aa12SJeff Cody         reopen_state->flags & BDRV_O_RDWR) {
178681e5f78aSAlberto Garcia         error_setg(errp, "Node '%s' is read only",
178781e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(reopen_state->bs));
1788e971aa12SJeff Cody         goto error;
1789e971aa12SJeff Cody     }
1790e971aa12SJeff Cody 
1791e971aa12SJeff Cody 
1792e971aa12SJeff Cody     ret = bdrv_flush(reopen_state->bs);
1793e971aa12SJeff Cody     if (ret) {
1794e971aa12SJeff Cody         error_set(errp, ERROR_CLASS_GENERIC_ERROR, "Error (%s) flushing drive",
1795e971aa12SJeff Cody                   strerror(-ret));
1796e971aa12SJeff Cody         goto error;
1797e971aa12SJeff Cody     }
1798e971aa12SJeff Cody 
1799e971aa12SJeff Cody     if (drv->bdrv_reopen_prepare) {
1800e971aa12SJeff Cody         ret = drv->bdrv_reopen_prepare(reopen_state, queue, &local_err);
1801e971aa12SJeff Cody         if (ret) {
1802e971aa12SJeff Cody             if (local_err != NULL) {
1803e971aa12SJeff Cody                 error_propagate(errp, local_err);
1804e971aa12SJeff Cody             } else {
1805d8b6895fSLuiz Capitulino                 error_setg(errp, "failed while preparing to reopen image '%s'",
1806e971aa12SJeff Cody                            reopen_state->bs->filename);
1807e971aa12SJeff Cody             }
1808e971aa12SJeff Cody             goto error;
1809e971aa12SJeff Cody         }
1810e971aa12SJeff Cody     } else {
1811e971aa12SJeff Cody         /* It is currently mandatory to have a bdrv_reopen_prepare()
1812e971aa12SJeff Cody          * handler for each supported drv. */
181381e5f78aSAlberto Garcia         error_setg(errp, "Block format '%s' used by node '%s' "
181481e5f78aSAlberto Garcia                    "does not support reopening files", drv->format_name,
181581e5f78aSAlberto Garcia                    bdrv_get_device_or_node_name(reopen_state->bs));
1816e971aa12SJeff Cody         ret = -1;
1817e971aa12SJeff Cody         goto error;
1818e971aa12SJeff Cody     }
1819e971aa12SJeff Cody 
1820e971aa12SJeff Cody     ret = 0;
1821e971aa12SJeff Cody 
1822e971aa12SJeff Cody error:
1823e971aa12SJeff Cody     return ret;
1824e971aa12SJeff Cody }
1825e971aa12SJeff Cody 
1826e971aa12SJeff Cody /*
1827e971aa12SJeff Cody  * Takes the staged changes for the reopen from bdrv_reopen_prepare(), and
1828e971aa12SJeff Cody  * makes them final by swapping the staging BlockDriverState contents into
1829e971aa12SJeff Cody  * the active BlockDriverState contents.
1830e971aa12SJeff Cody  */
1831e971aa12SJeff Cody void bdrv_reopen_commit(BDRVReopenState *reopen_state)
1832e971aa12SJeff Cody {
1833e971aa12SJeff Cody     BlockDriver *drv;
1834e971aa12SJeff Cody 
1835e971aa12SJeff Cody     assert(reopen_state != NULL);
1836e971aa12SJeff Cody     drv = reopen_state->bs->drv;
1837e971aa12SJeff Cody     assert(drv != NULL);
1838e971aa12SJeff Cody 
1839e971aa12SJeff Cody     /* If there are any driver level actions to take */
1840e971aa12SJeff Cody     if (drv->bdrv_reopen_commit) {
1841e971aa12SJeff Cody         drv->bdrv_reopen_commit(reopen_state);
1842e971aa12SJeff Cody     }
1843e971aa12SJeff Cody 
1844e971aa12SJeff Cody     /* set BDS specific flags now */
1845e971aa12SJeff Cody     reopen_state->bs->open_flags         = reopen_state->flags;
1846e971aa12SJeff Cody     reopen_state->bs->enable_write_cache = !!(reopen_state->flags &
1847e971aa12SJeff Cody                                               BDRV_O_CACHE_WB);
1848e971aa12SJeff Cody     reopen_state->bs->read_only = !(reopen_state->flags & BDRV_O_RDWR);
1849355ef4acSKevin Wolf 
18503baca891SKevin Wolf     bdrv_refresh_limits(reopen_state->bs, NULL);
1851e971aa12SJeff Cody }
1852e971aa12SJeff Cody 
1853e971aa12SJeff Cody /*
1854e971aa12SJeff Cody  * Abort the reopen, and delete and free the staged changes in
1855e971aa12SJeff Cody  * reopen_state
1856e971aa12SJeff Cody  */
1857e971aa12SJeff Cody void bdrv_reopen_abort(BDRVReopenState *reopen_state)
1858e971aa12SJeff Cody {
1859e971aa12SJeff Cody     BlockDriver *drv;
1860e971aa12SJeff Cody 
1861e971aa12SJeff Cody     assert(reopen_state != NULL);
1862e971aa12SJeff Cody     drv = reopen_state->bs->drv;
1863e971aa12SJeff Cody     assert(drv != NULL);
1864e971aa12SJeff Cody 
1865e971aa12SJeff Cody     if (drv->bdrv_reopen_abort) {
1866e971aa12SJeff Cody         drv->bdrv_reopen_abort(reopen_state);
1867e971aa12SJeff Cody     }
1868e971aa12SJeff Cody }
1869e971aa12SJeff Cody 
1870e971aa12SJeff Cody 
1871fc01f7e7Sbellard void bdrv_close(BlockDriverState *bs)
1872fc01f7e7Sbellard {
187333384421SMax Reitz     BdrvAioNotifier *ban, *ban_next;
187433384421SMax Reitz 
18753e914655SPaolo Bonzini     if (bs->job) {
18763e914655SPaolo Bonzini         block_job_cancel_sync(bs->job);
18773e914655SPaolo Bonzini     }
187853ec73e2SFam Zheng     bdrv_drain(bs); /* complete I/O */
187958fda173SStefan Hajnoczi     bdrv_flush(bs);
188053ec73e2SFam Zheng     bdrv_drain(bs); /* in case flush left pending I/O */
1881d7d512f6SPaolo Bonzini     notifier_list_notify(&bs->close_notifiers, bs);
18827094f12fSKevin Wolf 
18833cbc002cSPaolo Bonzini     if (bs->drv) {
18846e93e7c4SKevin Wolf         BdrvChild *child, *next;
18856e93e7c4SKevin Wolf 
18866e93e7c4SKevin Wolf         QLIST_FOREACH_SAFE(child, &bs->children, next, next) {
1887bddcec37SKevin Wolf             if (child->bs->inherits_from == bs) {
1888bddcec37SKevin Wolf                 child->bs->inherits_from = NULL;
1889bddcec37SKevin Wolf             }
18906e93e7c4SKevin Wolf             QLIST_REMOVE(child, next);
18916e93e7c4SKevin Wolf             g_free(child);
18926e93e7c4SKevin Wolf         }
18936e93e7c4SKevin Wolf 
1894557df6acSStefan Hajnoczi         if (bs->backing_hd) {
1895826b6ca0SFam Zheng             BlockDriverState *backing_hd = bs->backing_hd;
1896826b6ca0SFam Zheng             bdrv_set_backing_hd(bs, NULL);
1897826b6ca0SFam Zheng             bdrv_unref(backing_hd);
1898557df6acSStefan Hajnoczi         }
1899ea2384d3Sbellard         bs->drv->bdrv_close(bs);
19007267c094SAnthony Liguori         g_free(bs->opaque);
1901ea2384d3Sbellard         bs->opaque = NULL;
1902ea2384d3Sbellard         bs->drv = NULL;
190353fec9d3SStefan Hajnoczi         bs->copy_on_read = 0;
1904a275fa42SPaolo Bonzini         bs->backing_file[0] = '\0';
1905a275fa42SPaolo Bonzini         bs->backing_format[0] = '\0';
19066405875cSPaolo Bonzini         bs->total_sectors = 0;
19076405875cSPaolo Bonzini         bs->encrypted = 0;
19086405875cSPaolo Bonzini         bs->valid_key = 0;
19096405875cSPaolo Bonzini         bs->sg = 0;
19100d51b4deSAsias He         bs->zero_beyond_eof = false;
1911de9c0cecSKevin Wolf         QDECREF(bs->options);
1912de9c0cecSKevin Wolf         bs->options = NULL;
191391af7014SMax Reitz         QDECREF(bs->full_open_options);
191491af7014SMax Reitz         bs->full_open_options = NULL;
1915b338082bSbellard 
191666f82ceeSKevin Wolf         if (bs->file != NULL) {
19174f6fd349SFam Zheng             bdrv_unref(bs->file);
19180ac9377dSPaolo Bonzini             bs->file = NULL;
191966f82ceeSKevin Wolf         }
19209ca11154SPavel Hrdina     }
192166f82ceeSKevin Wolf 
1922a7f53e26SMarkus Armbruster     if (bs->blk) {
1923a7f53e26SMarkus Armbruster         blk_dev_change_media_cb(bs->blk, false);
1924a7f53e26SMarkus Armbruster     }
192598f90dbaSZhi Yong Wu 
192698f90dbaSZhi Yong Wu     /*throttling disk I/O limits*/
192798f90dbaSZhi Yong Wu     if (bs->io_limits_enabled) {
192898f90dbaSZhi Yong Wu         bdrv_io_limits_disable(bs);
192998f90dbaSZhi Yong Wu     }
193033384421SMax Reitz 
193133384421SMax Reitz     QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
193233384421SMax Reitz         g_free(ban);
193333384421SMax Reitz     }
193433384421SMax Reitz     QLIST_INIT(&bs->aio_notifiers);
1935b338082bSbellard }
1936b338082bSbellard 
19372bc93fedSMORITA Kazutaka void bdrv_close_all(void)
19382bc93fedSMORITA Kazutaka {
19392bc93fedSMORITA Kazutaka     BlockDriverState *bs;
19402bc93fedSMORITA Kazutaka 
1941dc364f4cSBenoît Canet     QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
1942ed78cda3SStefan Hajnoczi         AioContext *aio_context = bdrv_get_aio_context(bs);
1943ed78cda3SStefan Hajnoczi 
1944ed78cda3SStefan Hajnoczi         aio_context_acquire(aio_context);
19452bc93fedSMORITA Kazutaka         bdrv_close(bs);
1946ed78cda3SStefan Hajnoczi         aio_context_release(aio_context);
19472bc93fedSMORITA Kazutaka     }
19482bc93fedSMORITA Kazutaka }
19492bc93fedSMORITA Kazutaka 
1950dc364f4cSBenoît Canet /* make a BlockDriverState anonymous by removing from bdrv_state and
1951dc364f4cSBenoît Canet  * graph_bdrv_state list.
1952d22b2f41SRyan Harper    Also, NULL terminate the device_name to prevent double remove */
1953d22b2f41SRyan Harper void bdrv_make_anon(BlockDriverState *bs)
1954d22b2f41SRyan Harper {
1955bfb197e0SMarkus Armbruster     /*
1956bfb197e0SMarkus Armbruster      * Take care to remove bs from bdrv_states only when it's actually
1957bfb197e0SMarkus Armbruster      * in it.  Note that bs->device_list.tqe_prev is initially null,
1958bfb197e0SMarkus Armbruster      * and gets set to non-null by QTAILQ_INSERT_TAIL().  Establish
1959bfb197e0SMarkus Armbruster      * the useful invariant "bs in bdrv_states iff bs->tqe_prev" by
1960bfb197e0SMarkus Armbruster      * resetting it to null on remove.
1961bfb197e0SMarkus Armbruster      */
1962bfb197e0SMarkus Armbruster     if (bs->device_list.tqe_prev) {
1963dc364f4cSBenoît Canet         QTAILQ_REMOVE(&bdrv_states, bs, device_list);
1964bfb197e0SMarkus Armbruster         bs->device_list.tqe_prev = NULL;
1965d22b2f41SRyan Harper     }
1966dc364f4cSBenoît Canet     if (bs->node_name[0] != '\0') {
1967dc364f4cSBenoît Canet         QTAILQ_REMOVE(&graph_bdrv_states, bs, node_list);
1968dc364f4cSBenoît Canet     }
1969dc364f4cSBenoît Canet     bs->node_name[0] = '\0';
1970d22b2f41SRyan Harper }
1971d22b2f41SRyan Harper 
1972e023b2e2SPaolo Bonzini static void bdrv_rebind(BlockDriverState *bs)
1973e023b2e2SPaolo Bonzini {
1974e023b2e2SPaolo Bonzini     if (bs->drv && bs->drv->bdrv_rebind) {
1975e023b2e2SPaolo Bonzini         bs->drv->bdrv_rebind(bs);
1976e023b2e2SPaolo Bonzini     }
1977e023b2e2SPaolo Bonzini }
1978e023b2e2SPaolo Bonzini 
19794ddc07caSPaolo Bonzini static void bdrv_move_feature_fields(BlockDriverState *bs_dest,
19804ddc07caSPaolo Bonzini                                      BlockDriverState *bs_src)
19814ddc07caSPaolo Bonzini {
19824ddc07caSPaolo Bonzini     /* move some fields that need to stay attached to the device */
19834ddc07caSPaolo Bonzini 
19844ddc07caSPaolo Bonzini     /* dev info */
19851b7fd729SPaolo Bonzini     bs_dest->guest_block_size   = bs_src->guest_block_size;
19864ddc07caSPaolo Bonzini     bs_dest->copy_on_read       = bs_src->copy_on_read;
19874ddc07caSPaolo Bonzini 
19884ddc07caSPaolo Bonzini     bs_dest->enable_write_cache = bs_src->enable_write_cache;
19894ddc07caSPaolo Bonzini 
1990cc0681c4SBenoît Canet     /* i/o throttled req */
199176f4afb4SAlberto Garcia     bs_dest->throttle_state     = bs_src->throttle_state,
199276f4afb4SAlberto Garcia     bs_dest->io_limits_enabled  = bs_src->io_limits_enabled;
199376f4afb4SAlberto Garcia     bs_dest->pending_reqs[0]    = bs_src->pending_reqs[0];
199476f4afb4SAlberto Garcia     bs_dest->pending_reqs[1]    = bs_src->pending_reqs[1];
199576f4afb4SAlberto Garcia     bs_dest->throttled_reqs[0]  = bs_src->throttled_reqs[0];
199676f4afb4SAlberto Garcia     bs_dest->throttled_reqs[1]  = bs_src->throttled_reqs[1];
199776f4afb4SAlberto Garcia     memcpy(&bs_dest->round_robin,
199876f4afb4SAlberto Garcia            &bs_src->round_robin,
199976f4afb4SAlberto Garcia            sizeof(bs_dest->round_robin));
20000e5b0a2dSBenoît Canet     memcpy(&bs_dest->throttle_timers,
20010e5b0a2dSBenoît Canet            &bs_src->throttle_timers,
20020e5b0a2dSBenoît Canet            sizeof(ThrottleTimers));
20034ddc07caSPaolo Bonzini 
20044ddc07caSPaolo Bonzini     /* r/w error */
20054ddc07caSPaolo Bonzini     bs_dest->on_read_error      = bs_src->on_read_error;
20064ddc07caSPaolo Bonzini     bs_dest->on_write_error     = bs_src->on_write_error;
20074ddc07caSPaolo Bonzini 
20084ddc07caSPaolo Bonzini     /* i/o status */
20094ddc07caSPaolo Bonzini     bs_dest->iostatus_enabled   = bs_src->iostatus_enabled;
20104ddc07caSPaolo Bonzini     bs_dest->iostatus           = bs_src->iostatus;
20114ddc07caSPaolo Bonzini 
20124ddc07caSPaolo Bonzini     /* dirty bitmap */
2013e4654d2dSFam Zheng     bs_dest->dirty_bitmaps      = bs_src->dirty_bitmaps;
20144ddc07caSPaolo Bonzini 
20159fcb0251SFam Zheng     /* reference count */
20169fcb0251SFam Zheng     bs_dest->refcnt             = bs_src->refcnt;
20179fcb0251SFam Zheng 
20184ddc07caSPaolo Bonzini     /* job */
20194ddc07caSPaolo Bonzini     bs_dest->job                = bs_src->job;
20204ddc07caSPaolo Bonzini 
20214ddc07caSPaolo Bonzini     /* keep the same entry in bdrv_states */
2022dc364f4cSBenoît Canet     bs_dest->device_list = bs_src->device_list;
20237e7d56d9SMarkus Armbruster     bs_dest->blk = bs_src->blk;
20247e7d56d9SMarkus Armbruster 
2025fbe40ff7SFam Zheng     memcpy(bs_dest->op_blockers, bs_src->op_blockers,
2026fbe40ff7SFam Zheng            sizeof(bs_dest->op_blockers));
20274ddc07caSPaolo Bonzini }
20284ddc07caSPaolo Bonzini 
20294ddc07caSPaolo Bonzini /*
20304ddc07caSPaolo Bonzini  * Swap bs contents for two image chains while they are live,
20314ddc07caSPaolo Bonzini  * while keeping required fields on the BlockDriverState that is
20324ddc07caSPaolo Bonzini  * actually attached to a device.
20334ddc07caSPaolo Bonzini  *
20344ddc07caSPaolo Bonzini  * This will modify the BlockDriverState fields, and swap contents
20354ddc07caSPaolo Bonzini  * between bs_new and bs_old. Both bs_new and bs_old are modified.
20364ddc07caSPaolo Bonzini  *
2037bfb197e0SMarkus Armbruster  * bs_new must not be attached to a BlockBackend.
20384ddc07caSPaolo Bonzini  *
20394ddc07caSPaolo Bonzini  * This function does not create any image files.
20404ddc07caSPaolo Bonzini  */
20414ddc07caSPaolo Bonzini void bdrv_swap(BlockDriverState *bs_new, BlockDriverState *bs_old)
20424ddc07caSPaolo Bonzini {
20434ddc07caSPaolo Bonzini     BlockDriverState tmp;
2044bddcec37SKevin Wolf     BdrvChild *child;
20454ddc07caSPaolo Bonzini 
20466ee4ce1eSKevin Wolf     bdrv_drain(bs_new);
20476ee4ce1eSKevin Wolf     bdrv_drain(bs_old);
20484ddc07caSPaolo Bonzini 
204990ce8a06SBenoît Canet     /* The code needs to swap the node_name but simply swapping node_list won't
205090ce8a06SBenoît Canet      * work so first remove the nodes from the graph list, do the swap then
205190ce8a06SBenoît Canet      * insert them back if needed.
205290ce8a06SBenoît Canet      */
205390ce8a06SBenoît Canet     if (bs_new->node_name[0] != '\0') {
205490ce8a06SBenoît Canet         QTAILQ_REMOVE(&graph_bdrv_states, bs_new, node_list);
205590ce8a06SBenoît Canet     }
205690ce8a06SBenoît Canet     if (bs_old->node_name[0] != '\0') {
205790ce8a06SBenoît Canet         QTAILQ_REMOVE(&graph_bdrv_states, bs_old, node_list);
205890ce8a06SBenoît Canet     }
205990ce8a06SBenoît Canet 
2060db628338SAlberto Garcia     /* If the BlockDriverState is part of a throttling group acquire
2061db628338SAlberto Garcia      * its lock since we're going to mess with the protected fields.
2062db628338SAlberto Garcia      * Otherwise there's no need to worry since no one else can touch
2063db628338SAlberto Garcia      * them. */
2064db628338SAlberto Garcia     if (bs_old->throttle_state) {
2065db628338SAlberto Garcia         throttle_group_lock(bs_old);
2066db628338SAlberto Garcia     }
2067db628338SAlberto Garcia 
2068bfb197e0SMarkus Armbruster     /* bs_new must be unattached and shouldn't have anything fancy enabled */
20697e7d56d9SMarkus Armbruster     assert(!bs_new->blk);
2070e4654d2dSFam Zheng     assert(QLIST_EMPTY(&bs_new->dirty_bitmaps));
20714ddc07caSPaolo Bonzini     assert(bs_new->job == NULL);
20724ddc07caSPaolo Bonzini     assert(bs_new->io_limits_enabled == false);
2073db628338SAlberto Garcia     assert(bs_new->throttle_state == NULL);
20740e5b0a2dSBenoît Canet     assert(!throttle_timers_are_initialized(&bs_new->throttle_timers));
20754ddc07caSPaolo Bonzini 
20764ddc07caSPaolo Bonzini     tmp = *bs_new;
20774ddc07caSPaolo Bonzini     *bs_new = *bs_old;
20784ddc07caSPaolo Bonzini     *bs_old = tmp;
20794ddc07caSPaolo Bonzini 
20804ddc07caSPaolo Bonzini     /* there are some fields that should not be swapped, move them back */
20814ddc07caSPaolo Bonzini     bdrv_move_feature_fields(&tmp, bs_old);
20824ddc07caSPaolo Bonzini     bdrv_move_feature_fields(bs_old, bs_new);
20834ddc07caSPaolo Bonzini     bdrv_move_feature_fields(bs_new, &tmp);
20844ddc07caSPaolo Bonzini 
2085bfb197e0SMarkus Armbruster     /* bs_new must remain unattached */
20867e7d56d9SMarkus Armbruster     assert(!bs_new->blk);
20874ddc07caSPaolo Bonzini 
20884ddc07caSPaolo Bonzini     /* Check a few fields that should remain attached to the device */
20894ddc07caSPaolo Bonzini     assert(bs_new->job == NULL);
20904ddc07caSPaolo Bonzini     assert(bs_new->io_limits_enabled == false);
2091db628338SAlberto Garcia     assert(bs_new->throttle_state == NULL);
20920e5b0a2dSBenoît Canet     assert(!throttle_timers_are_initialized(&bs_new->throttle_timers));
20934ddc07caSPaolo Bonzini 
2094db628338SAlberto Garcia     /* Release the ThrottleGroup lock */
2095db628338SAlberto Garcia     if (bs_old->throttle_state) {
2096db628338SAlberto Garcia         throttle_group_unlock(bs_old);
2097db628338SAlberto Garcia     }
2098db628338SAlberto Garcia 
209990ce8a06SBenoît Canet     /* insert the nodes back into the graph node list if needed */
210090ce8a06SBenoît Canet     if (bs_new->node_name[0] != '\0') {
210190ce8a06SBenoît Canet         QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs_new, node_list);
210290ce8a06SBenoît Canet     }
210390ce8a06SBenoît Canet     if (bs_old->node_name[0] != '\0') {
210490ce8a06SBenoît Canet         QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs_old, node_list);
210590ce8a06SBenoît Canet     }
210690ce8a06SBenoît Canet 
21076e93e7c4SKevin Wolf     /*
21086e93e7c4SKevin Wolf      * Update lh_first.le_prev for non-empty lists.
21096e93e7c4SKevin Wolf      *
21106e93e7c4SKevin Wolf      * The head of the op blocker list doesn't change because it is moved back
21116e93e7c4SKevin Wolf      * in bdrv_move_feature_fields().
21126e93e7c4SKevin Wolf      */
21136ee4ce1eSKevin Wolf     assert(QLIST_EMPTY(&bs_old->tracked_requests));
21146ee4ce1eSKevin Wolf     assert(QLIST_EMPTY(&bs_new->tracked_requests));
21156ee4ce1eSKevin Wolf 
21166e93e7c4SKevin Wolf     QLIST_FIX_HEAD_PTR(&bs_new->children, next);
21176e93e7c4SKevin Wolf     QLIST_FIX_HEAD_PTR(&bs_old->children, next);
21186e93e7c4SKevin Wolf 
2119bddcec37SKevin Wolf     /* Update references in bs->opaque and children */
2120bddcec37SKevin Wolf     QLIST_FOREACH(child, &bs_old->children, next) {
2121bddcec37SKevin Wolf         if (child->bs->inherits_from == bs_new) {
2122bddcec37SKevin Wolf             child->bs->inherits_from = bs_old;
2123bddcec37SKevin Wolf         }
2124bddcec37SKevin Wolf     }
2125bddcec37SKevin Wolf     QLIST_FOREACH(child, &bs_new->children, next) {
2126bddcec37SKevin Wolf         if (child->bs->inherits_from == bs_old) {
2127bddcec37SKevin Wolf             child->bs->inherits_from = bs_new;
2128bddcec37SKevin Wolf         }
2129bddcec37SKevin Wolf     }
2130bddcec37SKevin Wolf 
21314ddc07caSPaolo Bonzini     bdrv_rebind(bs_new);
21324ddc07caSPaolo Bonzini     bdrv_rebind(bs_old);
21334ddc07caSPaolo Bonzini }
21344ddc07caSPaolo Bonzini 
21358802d1fdSJeff Cody /*
21368802d1fdSJeff Cody  * Add new bs contents at the top of an image chain while the chain is
21378802d1fdSJeff Cody  * live, while keeping required fields on the top layer.
21388802d1fdSJeff Cody  *
21398802d1fdSJeff Cody  * This will modify the BlockDriverState fields, and swap contents
21408802d1fdSJeff Cody  * between bs_new and bs_top. Both bs_new and bs_top are modified.
21418802d1fdSJeff Cody  *
2142bfb197e0SMarkus Armbruster  * bs_new must not be attached to a BlockBackend.
2143f6801b83SJeff Cody  *
21448802d1fdSJeff Cody  * This function does not create any image files.
21458802d1fdSJeff Cody  */
21468802d1fdSJeff Cody void bdrv_append(BlockDriverState *bs_new, BlockDriverState *bs_top)
21478802d1fdSJeff Cody {
21484ddc07caSPaolo Bonzini     bdrv_swap(bs_new, bs_top);
21498802d1fdSJeff Cody 
21508802d1fdSJeff Cody     /* The contents of 'tmp' will become bs_top, as we are
21518802d1fdSJeff Cody      * swapping bs_new and bs_top contents. */
21528d24cce1SFam Zheng     bdrv_set_backing_hd(bs_top, bs_new);
21536e93e7c4SKevin Wolf     bdrv_attach_child(bs_top, bs_new, &child_backing);
21548802d1fdSJeff Cody }
21558802d1fdSJeff Cody 
21564f6fd349SFam Zheng static void bdrv_delete(BlockDriverState *bs)
2157b338082bSbellard {
21583e914655SPaolo Bonzini     assert(!bs->job);
21593718d8abSFam Zheng     assert(bdrv_op_blocker_is_empty(bs));
21604f6fd349SFam Zheng     assert(!bs->refcnt);
2161e4654d2dSFam Zheng     assert(QLIST_EMPTY(&bs->dirty_bitmaps));
216218846deeSMarkus Armbruster 
2163e1b5c52eSStefan Hajnoczi     bdrv_close(bs);
2164e1b5c52eSStefan Hajnoczi 
21651b7bdbc1SStefan Hajnoczi     /* remove from list, if necessary */
2166d22b2f41SRyan Harper     bdrv_make_anon(bs);
216734c6f050Saurel32 
21687267c094SAnthony Liguori     g_free(bs);
2169fc01f7e7Sbellard }
2170fc01f7e7Sbellard 
2171e97fc193Saliguori /*
2172e97fc193Saliguori  * Run consistency checks on an image
2173e97fc193Saliguori  *
2174e076f338SKevin Wolf  * Returns 0 if the check could be completed (it doesn't mean that the image is
2175a1c7273bSStefan Weil  * free of errors) or -errno when an internal error occurred. The results of the
2176e076f338SKevin Wolf  * check are stored in res.
2177e97fc193Saliguori  */
21784534ff54SKevin Wolf int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res, BdrvCheckMode fix)
2179e97fc193Saliguori {
2180908bcd54SMax Reitz     if (bs->drv == NULL) {
2181908bcd54SMax Reitz         return -ENOMEDIUM;
2182908bcd54SMax Reitz     }
2183e97fc193Saliguori     if (bs->drv->bdrv_check == NULL) {
2184e97fc193Saliguori         return -ENOTSUP;
2185e97fc193Saliguori     }
2186e97fc193Saliguori 
2187e076f338SKevin Wolf     memset(res, 0, sizeof(*res));
21884534ff54SKevin Wolf     return bs->drv->bdrv_check(bs, res, fix);
2189e97fc193Saliguori }
2190e97fc193Saliguori 
21918a426614SKevin Wolf #define COMMIT_BUF_SECTORS 2048
21928a426614SKevin Wolf 
219333e3963eSbellard /* commit COW file into the raw image */
219433e3963eSbellard int bdrv_commit(BlockDriverState *bs)
219533e3963eSbellard {
219619cb3738Sbellard     BlockDriver *drv = bs->drv;
219772706ea4SJeff Cody     int64_t sector, total_sectors, length, backing_length;
21988a426614SKevin Wolf     int n, ro, open_flags;
21990bce597dSJeff Cody     int ret = 0;
220072706ea4SJeff Cody     uint8_t *buf = NULL;
220133e3963eSbellard 
220219cb3738Sbellard     if (!drv)
220319cb3738Sbellard         return -ENOMEDIUM;
220433e3963eSbellard 
22054dca4b63SNaphtali Sprei     if (!bs->backing_hd) {
22064dca4b63SNaphtali Sprei         return -ENOTSUP;
22074dca4b63SNaphtali Sprei     }
22084dca4b63SNaphtali Sprei 
2209bb00021dSFam Zheng     if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, NULL) ||
2210bb00021dSFam Zheng         bdrv_op_is_blocked(bs->backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET, NULL)) {
22112d3735d3SStefan Hajnoczi         return -EBUSY;
22122d3735d3SStefan Hajnoczi     }
22132d3735d3SStefan Hajnoczi 
22144dca4b63SNaphtali Sprei     ro = bs->backing_hd->read_only;
22154dca4b63SNaphtali Sprei     open_flags =  bs->backing_hd->open_flags;
22164dca4b63SNaphtali Sprei 
22174dca4b63SNaphtali Sprei     if (ro) {
22180bce597dSJeff Cody         if (bdrv_reopen(bs->backing_hd, open_flags | BDRV_O_RDWR, NULL)) {
22190bce597dSJeff Cody             return -EACCES;
22204dca4b63SNaphtali Sprei         }
2221ea2384d3Sbellard     }
2222ea2384d3Sbellard 
222372706ea4SJeff Cody     length = bdrv_getlength(bs);
222472706ea4SJeff Cody     if (length < 0) {
222572706ea4SJeff Cody         ret = length;
222672706ea4SJeff Cody         goto ro_cleanup;
222772706ea4SJeff Cody     }
222872706ea4SJeff Cody 
222972706ea4SJeff Cody     backing_length = bdrv_getlength(bs->backing_hd);
223072706ea4SJeff Cody     if (backing_length < 0) {
223172706ea4SJeff Cody         ret = backing_length;
223272706ea4SJeff Cody         goto ro_cleanup;
223372706ea4SJeff Cody     }
223472706ea4SJeff Cody 
223572706ea4SJeff Cody     /* If our top snapshot is larger than the backing file image,
223672706ea4SJeff Cody      * grow the backing file image if possible.  If not possible,
223772706ea4SJeff Cody      * we must return an error */
223872706ea4SJeff Cody     if (length > backing_length) {
223972706ea4SJeff Cody         ret = bdrv_truncate(bs->backing_hd, length);
224072706ea4SJeff Cody         if (ret < 0) {
224172706ea4SJeff Cody             goto ro_cleanup;
224272706ea4SJeff Cody         }
224372706ea4SJeff Cody     }
224472706ea4SJeff Cody 
224572706ea4SJeff Cody     total_sectors = length >> BDRV_SECTOR_BITS;
2246857d4f46SKevin Wolf 
2247857d4f46SKevin Wolf     /* qemu_try_blockalign() for bs will choose an alignment that works for
2248857d4f46SKevin Wolf      * bs->backing_hd as well, so no need to compare the alignment manually. */
2249857d4f46SKevin Wolf     buf = qemu_try_blockalign(bs, COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE);
2250857d4f46SKevin Wolf     if (buf == NULL) {
2251857d4f46SKevin Wolf         ret = -ENOMEM;
2252857d4f46SKevin Wolf         goto ro_cleanup;
2253857d4f46SKevin Wolf     }
22548a426614SKevin Wolf 
22558a426614SKevin Wolf     for (sector = 0; sector < total_sectors; sector += n) {
2256d663640cSPaolo Bonzini         ret = bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n);
2257d663640cSPaolo Bonzini         if (ret < 0) {
2258d663640cSPaolo Bonzini             goto ro_cleanup;
2259d663640cSPaolo Bonzini         }
2260d663640cSPaolo Bonzini         if (ret) {
2261dabfa6ccSKevin Wolf             ret = bdrv_read(bs, sector, buf, n);
2262dabfa6ccSKevin Wolf             if (ret < 0) {
22634dca4b63SNaphtali Sprei                 goto ro_cleanup;
226433e3963eSbellard             }
226533e3963eSbellard 
2266dabfa6ccSKevin Wolf             ret = bdrv_write(bs->backing_hd, sector, buf, n);
2267dabfa6ccSKevin Wolf             if (ret < 0) {
22684dca4b63SNaphtali Sprei                 goto ro_cleanup;
226933e3963eSbellard             }
227033e3963eSbellard         }
227133e3963eSbellard     }
227295389c86Sbellard 
22731d44952fSChristoph Hellwig     if (drv->bdrv_make_empty) {
22741d44952fSChristoph Hellwig         ret = drv->bdrv_make_empty(bs);
2275dabfa6ccSKevin Wolf         if (ret < 0) {
2276dabfa6ccSKevin Wolf             goto ro_cleanup;
2277dabfa6ccSKevin Wolf         }
22781d44952fSChristoph Hellwig         bdrv_flush(bs);
22791d44952fSChristoph Hellwig     }
228095389c86Sbellard 
22813f5075aeSChristoph Hellwig     /*
22823f5075aeSChristoph Hellwig      * Make sure all data we wrote to the backing device is actually
22833f5075aeSChristoph Hellwig      * stable on disk.
22843f5075aeSChristoph Hellwig      */
2285dabfa6ccSKevin Wolf     if (bs->backing_hd) {
22863f5075aeSChristoph Hellwig         bdrv_flush(bs->backing_hd);
2287dabfa6ccSKevin Wolf     }
22884dca4b63SNaphtali Sprei 
2289dabfa6ccSKevin Wolf     ret = 0;
22904dca4b63SNaphtali Sprei ro_cleanup:
2291857d4f46SKevin Wolf     qemu_vfree(buf);
22924dca4b63SNaphtali Sprei 
22934dca4b63SNaphtali Sprei     if (ro) {
22940bce597dSJeff Cody         /* ignoring error return here */
22950bce597dSJeff Cody         bdrv_reopen(bs->backing_hd, open_flags & ~BDRV_O_RDWR, NULL);
22964dca4b63SNaphtali Sprei     }
22974dca4b63SNaphtali Sprei 
22981d44952fSChristoph Hellwig     return ret;
229933e3963eSbellard }
230033e3963eSbellard 
2301e8877497SStefan Hajnoczi int bdrv_commit_all(void)
23026ab4b5abSMarkus Armbruster {
23036ab4b5abSMarkus Armbruster     BlockDriverState *bs;
23046ab4b5abSMarkus Armbruster 
2305dc364f4cSBenoît Canet     QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
2306ed78cda3SStefan Hajnoczi         AioContext *aio_context = bdrv_get_aio_context(bs);
2307ed78cda3SStefan Hajnoczi 
2308ed78cda3SStefan Hajnoczi         aio_context_acquire(aio_context);
2309272d2d8eSJeff Cody         if (bs->drv && bs->backing_hd) {
2310e8877497SStefan Hajnoczi             int ret = bdrv_commit(bs);
2311e8877497SStefan Hajnoczi             if (ret < 0) {
2312ed78cda3SStefan Hajnoczi                 aio_context_release(aio_context);
2313e8877497SStefan Hajnoczi                 return ret;
23146ab4b5abSMarkus Armbruster             }
23156ab4b5abSMarkus Armbruster         }
2316ed78cda3SStefan Hajnoczi         aio_context_release(aio_context);
2317272d2d8eSJeff Cody     }
2318e8877497SStefan Hajnoczi     return 0;
2319e8877497SStefan Hajnoczi }
23206ab4b5abSMarkus Armbruster 
2321756e6736SKevin Wolf /*
2322756e6736SKevin Wolf  * Return values:
2323756e6736SKevin Wolf  * 0        - success
2324756e6736SKevin Wolf  * -EINVAL  - backing format specified, but no file
2325756e6736SKevin Wolf  * -ENOSPC  - can't update the backing file because no space is left in the
2326756e6736SKevin Wolf  *            image file header
2327756e6736SKevin Wolf  * -ENOTSUP - format driver doesn't support changing the backing file
2328756e6736SKevin Wolf  */
2329756e6736SKevin Wolf int bdrv_change_backing_file(BlockDriverState *bs,
2330756e6736SKevin Wolf     const char *backing_file, const char *backing_fmt)
2331756e6736SKevin Wolf {
2332756e6736SKevin Wolf     BlockDriver *drv = bs->drv;
2333469ef350SPaolo Bonzini     int ret;
2334756e6736SKevin Wolf 
23355f377794SPaolo Bonzini     /* Backing file format doesn't make sense without a backing file */
23365f377794SPaolo Bonzini     if (backing_fmt && !backing_file) {
23375f377794SPaolo Bonzini         return -EINVAL;
23385f377794SPaolo Bonzini     }
23395f377794SPaolo Bonzini 
2340756e6736SKevin Wolf     if (drv->bdrv_change_backing_file != NULL) {
2341469ef350SPaolo Bonzini         ret = drv->bdrv_change_backing_file(bs, backing_file, backing_fmt);
2342756e6736SKevin Wolf     } else {
2343469ef350SPaolo Bonzini         ret = -ENOTSUP;
2344756e6736SKevin Wolf     }
2345469ef350SPaolo Bonzini 
2346469ef350SPaolo Bonzini     if (ret == 0) {
2347469ef350SPaolo Bonzini         pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_file ?: "");
2348469ef350SPaolo Bonzini         pstrcpy(bs->backing_format, sizeof(bs->backing_format), backing_fmt ?: "");
2349469ef350SPaolo Bonzini     }
2350469ef350SPaolo Bonzini     return ret;
2351756e6736SKevin Wolf }
2352756e6736SKevin Wolf 
23536ebdcee2SJeff Cody /*
23546ebdcee2SJeff Cody  * Finds the image layer in the chain that has 'bs' as its backing file.
23556ebdcee2SJeff Cody  *
23566ebdcee2SJeff Cody  * active is the current topmost image.
23576ebdcee2SJeff Cody  *
23586ebdcee2SJeff Cody  * Returns NULL if bs is not found in active's image chain,
23596ebdcee2SJeff Cody  * or if active == bs.
23604caf0fcdSJeff Cody  *
23614caf0fcdSJeff Cody  * Returns the bottommost base image if bs == NULL.
23626ebdcee2SJeff Cody  */
23636ebdcee2SJeff Cody BlockDriverState *bdrv_find_overlay(BlockDriverState *active,
23646ebdcee2SJeff Cody                                     BlockDriverState *bs)
23656ebdcee2SJeff Cody {
23664caf0fcdSJeff Cody     while (active && bs != active->backing_hd) {
23674caf0fcdSJeff Cody         active = active->backing_hd;
23686ebdcee2SJeff Cody     }
23696ebdcee2SJeff Cody 
23704caf0fcdSJeff Cody     return active;
23716ebdcee2SJeff Cody }
23726ebdcee2SJeff Cody 
23734caf0fcdSJeff Cody /* Given a BDS, searches for the base layer. */
23744caf0fcdSJeff Cody BlockDriverState *bdrv_find_base(BlockDriverState *bs)
23754caf0fcdSJeff Cody {
23764caf0fcdSJeff Cody     return bdrv_find_overlay(bs, NULL);
23776ebdcee2SJeff Cody }
23786ebdcee2SJeff Cody 
23796ebdcee2SJeff Cody typedef struct BlkIntermediateStates {
23806ebdcee2SJeff Cody     BlockDriverState *bs;
23816ebdcee2SJeff Cody     QSIMPLEQ_ENTRY(BlkIntermediateStates) entry;
23826ebdcee2SJeff Cody } BlkIntermediateStates;
23836ebdcee2SJeff Cody 
23846ebdcee2SJeff Cody 
23856ebdcee2SJeff Cody /*
23866ebdcee2SJeff Cody  * Drops images above 'base' up to and including 'top', and sets the image
23876ebdcee2SJeff Cody  * above 'top' to have base as its backing file.
23886ebdcee2SJeff Cody  *
23896ebdcee2SJeff Cody  * Requires that the overlay to 'top' is opened r/w, so that the backing file
23906ebdcee2SJeff Cody  * information in 'bs' can be properly updated.
23916ebdcee2SJeff Cody  *
23926ebdcee2SJeff Cody  * E.g., this will convert the following chain:
23936ebdcee2SJeff Cody  * bottom <- base <- intermediate <- top <- active
23946ebdcee2SJeff Cody  *
23956ebdcee2SJeff Cody  * to
23966ebdcee2SJeff Cody  *
23976ebdcee2SJeff Cody  * bottom <- base <- active
23986ebdcee2SJeff Cody  *
23996ebdcee2SJeff Cody  * It is allowed for bottom==base, in which case it converts:
24006ebdcee2SJeff Cody  *
24016ebdcee2SJeff Cody  * base <- intermediate <- top <- active
24026ebdcee2SJeff Cody  *
24036ebdcee2SJeff Cody  * to
24046ebdcee2SJeff Cody  *
24056ebdcee2SJeff Cody  * base <- active
24066ebdcee2SJeff Cody  *
240754e26900SJeff Cody  * If backing_file_str is non-NULL, it will be used when modifying top's
240854e26900SJeff Cody  * overlay image metadata.
240954e26900SJeff Cody  *
24106ebdcee2SJeff Cody  * Error conditions:
24116ebdcee2SJeff Cody  *  if active == top, that is considered an error
24126ebdcee2SJeff Cody  *
24136ebdcee2SJeff Cody  */
24146ebdcee2SJeff Cody int bdrv_drop_intermediate(BlockDriverState *active, BlockDriverState *top,
241554e26900SJeff Cody                            BlockDriverState *base, const char *backing_file_str)
24166ebdcee2SJeff Cody {
24176ebdcee2SJeff Cody     BlockDriverState *intermediate;
24186ebdcee2SJeff Cody     BlockDriverState *base_bs = NULL;
24196ebdcee2SJeff Cody     BlockDriverState *new_top_bs = NULL;
24206ebdcee2SJeff Cody     BlkIntermediateStates *intermediate_state, *next;
24216ebdcee2SJeff Cody     int ret = -EIO;
24226ebdcee2SJeff Cody 
24236ebdcee2SJeff Cody     QSIMPLEQ_HEAD(states_to_delete, BlkIntermediateStates) states_to_delete;
24246ebdcee2SJeff Cody     QSIMPLEQ_INIT(&states_to_delete);
24256ebdcee2SJeff Cody 
24266ebdcee2SJeff Cody     if (!top->drv || !base->drv) {
24276ebdcee2SJeff Cody         goto exit;
24286ebdcee2SJeff Cody     }
24296ebdcee2SJeff Cody 
24306ebdcee2SJeff Cody     new_top_bs = bdrv_find_overlay(active, top);
24316ebdcee2SJeff Cody 
24326ebdcee2SJeff Cody     if (new_top_bs == NULL) {
24336ebdcee2SJeff Cody         /* we could not find the image above 'top', this is an error */
24346ebdcee2SJeff Cody         goto exit;
24356ebdcee2SJeff Cody     }
24366ebdcee2SJeff Cody 
24376ebdcee2SJeff Cody     /* special case of new_top_bs->backing_hd already pointing to base - nothing
24386ebdcee2SJeff Cody      * to do, no intermediate images */
24396ebdcee2SJeff Cody     if (new_top_bs->backing_hd == base) {
24406ebdcee2SJeff Cody         ret = 0;
24416ebdcee2SJeff Cody         goto exit;
24426ebdcee2SJeff Cody     }
24436ebdcee2SJeff Cody 
24446ebdcee2SJeff Cody     intermediate = top;
24456ebdcee2SJeff Cody 
24466ebdcee2SJeff Cody     /* now we will go down through the list, and add each BDS we find
24476ebdcee2SJeff Cody      * into our deletion queue, until we hit the 'base'
24486ebdcee2SJeff Cody      */
24496ebdcee2SJeff Cody     while (intermediate) {
24505839e53bSMarkus Armbruster         intermediate_state = g_new0(BlkIntermediateStates, 1);
24516ebdcee2SJeff Cody         intermediate_state->bs = intermediate;
24526ebdcee2SJeff Cody         QSIMPLEQ_INSERT_TAIL(&states_to_delete, intermediate_state, entry);
24536ebdcee2SJeff Cody 
24546ebdcee2SJeff Cody         if (intermediate->backing_hd == base) {
24556ebdcee2SJeff Cody             base_bs = intermediate->backing_hd;
24566ebdcee2SJeff Cody             break;
24576ebdcee2SJeff Cody         }
24586ebdcee2SJeff Cody         intermediate = intermediate->backing_hd;
24596ebdcee2SJeff Cody     }
24606ebdcee2SJeff Cody     if (base_bs == NULL) {
24616ebdcee2SJeff Cody         /* something went wrong, we did not end at the base. safely
24626ebdcee2SJeff Cody          * unravel everything, and exit with error */
24636ebdcee2SJeff Cody         goto exit;
24646ebdcee2SJeff Cody     }
24656ebdcee2SJeff Cody 
24666ebdcee2SJeff Cody     /* success - we can delete the intermediate states, and link top->base */
246754e26900SJeff Cody     backing_file_str = backing_file_str ? backing_file_str : base_bs->filename;
246854e26900SJeff Cody     ret = bdrv_change_backing_file(new_top_bs, backing_file_str,
24696ebdcee2SJeff Cody                                    base_bs->drv ? base_bs->drv->format_name : "");
24706ebdcee2SJeff Cody     if (ret) {
24716ebdcee2SJeff Cody         goto exit;
24726ebdcee2SJeff Cody     }
2473920beae1SFam Zheng     bdrv_set_backing_hd(new_top_bs, base_bs);
24746ebdcee2SJeff Cody 
24756ebdcee2SJeff Cody     QSIMPLEQ_FOREACH_SAFE(intermediate_state, &states_to_delete, entry, next) {
24766ebdcee2SJeff Cody         /* so that bdrv_close() does not recursively close the chain */
2477920beae1SFam Zheng         bdrv_set_backing_hd(intermediate_state->bs, NULL);
24784f6fd349SFam Zheng         bdrv_unref(intermediate_state->bs);
24796ebdcee2SJeff Cody     }
24806ebdcee2SJeff Cody     ret = 0;
24816ebdcee2SJeff Cody 
24826ebdcee2SJeff Cody exit:
24836ebdcee2SJeff Cody     QSIMPLEQ_FOREACH_SAFE(intermediate_state, &states_to_delete, entry, next) {
24846ebdcee2SJeff Cody         g_free(intermediate_state);
24856ebdcee2SJeff Cody     }
24866ebdcee2SJeff Cody     return ret;
24876ebdcee2SJeff Cody }
24886ebdcee2SJeff Cody 
248983f64091Sbellard /**
249083f64091Sbellard  * Truncate file to 'offset' bytes (needed only for file protocols)
249183f64091Sbellard  */
249283f64091Sbellard int bdrv_truncate(BlockDriverState *bs, int64_t offset)
249383f64091Sbellard {
249483f64091Sbellard     BlockDriver *drv = bs->drv;
249551762288SStefan Hajnoczi     int ret;
249683f64091Sbellard     if (!drv)
249719cb3738Sbellard         return -ENOMEDIUM;
249883f64091Sbellard     if (!drv->bdrv_truncate)
249983f64091Sbellard         return -ENOTSUP;
250059f2689dSNaphtali Sprei     if (bs->read_only)
250159f2689dSNaphtali Sprei         return -EACCES;
25029c75e168SJeff Cody 
250351762288SStefan Hajnoczi     ret = drv->bdrv_truncate(bs, offset);
250451762288SStefan Hajnoczi     if (ret == 0) {
250551762288SStefan Hajnoczi         ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS);
2506ce1ffea8SJohn Snow         bdrv_dirty_bitmap_truncate(bs);
2507a7f53e26SMarkus Armbruster         if (bs->blk) {
2508a7f53e26SMarkus Armbruster             blk_dev_resize_cb(bs->blk);
2509a7f53e26SMarkus Armbruster         }
251051762288SStefan Hajnoczi     }
251151762288SStefan Hajnoczi     return ret;
251283f64091Sbellard }
251383f64091Sbellard 
251483f64091Sbellard /**
25154a1d5e1fSFam Zheng  * Length of a allocated file in bytes. Sparse files are counted by actual
25164a1d5e1fSFam Zheng  * allocated space. Return < 0 if error or unknown.
25174a1d5e1fSFam Zheng  */
25184a1d5e1fSFam Zheng int64_t bdrv_get_allocated_file_size(BlockDriverState *bs)
25194a1d5e1fSFam Zheng {
25204a1d5e1fSFam Zheng     BlockDriver *drv = bs->drv;
25214a1d5e1fSFam Zheng     if (!drv) {
25224a1d5e1fSFam Zheng         return -ENOMEDIUM;
25234a1d5e1fSFam Zheng     }
25244a1d5e1fSFam Zheng     if (drv->bdrv_get_allocated_file_size) {
25254a1d5e1fSFam Zheng         return drv->bdrv_get_allocated_file_size(bs);
25264a1d5e1fSFam Zheng     }
25274a1d5e1fSFam Zheng     if (bs->file) {
25284a1d5e1fSFam Zheng         return bdrv_get_allocated_file_size(bs->file);
25294a1d5e1fSFam Zheng     }
25304a1d5e1fSFam Zheng     return -ENOTSUP;
25314a1d5e1fSFam Zheng }
25324a1d5e1fSFam Zheng 
25334a1d5e1fSFam Zheng /**
253465a9bb25SMarkus Armbruster  * Return number of sectors on success, -errno on error.
253583f64091Sbellard  */
253665a9bb25SMarkus Armbruster int64_t bdrv_nb_sectors(BlockDriverState *bs)
253783f64091Sbellard {
253883f64091Sbellard     BlockDriver *drv = bs->drv;
253965a9bb25SMarkus Armbruster 
254083f64091Sbellard     if (!drv)
254119cb3738Sbellard         return -ENOMEDIUM;
254251762288SStefan Hajnoczi 
2543b94a2610SKevin Wolf     if (drv->has_variable_length) {
2544b94a2610SKevin Wolf         int ret = refresh_total_sectors(bs, bs->total_sectors);
2545b94a2610SKevin Wolf         if (ret < 0) {
2546b94a2610SKevin Wolf             return ret;
2547fc01f7e7Sbellard         }
254846a4e4e6SStefan Hajnoczi     }
254965a9bb25SMarkus Armbruster     return bs->total_sectors;
255065a9bb25SMarkus Armbruster }
255165a9bb25SMarkus Armbruster 
255265a9bb25SMarkus Armbruster /**
255365a9bb25SMarkus Armbruster  * Return length in bytes on success, -errno on error.
255465a9bb25SMarkus Armbruster  * The length is always a multiple of BDRV_SECTOR_SIZE.
255565a9bb25SMarkus Armbruster  */
255665a9bb25SMarkus Armbruster int64_t bdrv_getlength(BlockDriverState *bs)
255765a9bb25SMarkus Armbruster {
255865a9bb25SMarkus Armbruster     int64_t ret = bdrv_nb_sectors(bs);
255965a9bb25SMarkus Armbruster 
25604a9c9ea0SFam Zheng     ret = ret > INT64_MAX / BDRV_SECTOR_SIZE ? -EFBIG : ret;
256165a9bb25SMarkus Armbruster     return ret < 0 ? ret : ret * BDRV_SECTOR_SIZE;
256246a4e4e6SStefan Hajnoczi }
2563fc01f7e7Sbellard 
256419cb3738Sbellard /* return 0 as number of sectors if no device present or error */
256596b8f136Sths void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
2566fc01f7e7Sbellard {
256765a9bb25SMarkus Armbruster     int64_t nb_sectors = bdrv_nb_sectors(bs);
256865a9bb25SMarkus Armbruster 
256965a9bb25SMarkus Armbruster     *nb_sectors_ptr = nb_sectors < 0 ? 0 : nb_sectors;
2570fc01f7e7Sbellard }
2571cf98951bSbellard 
2572ff06f5f3SPaolo Bonzini void bdrv_set_on_error(BlockDriverState *bs, BlockdevOnError on_read_error,
2573ff06f5f3SPaolo Bonzini                        BlockdevOnError on_write_error)
2574abd7f68dSMarkus Armbruster {
2575abd7f68dSMarkus Armbruster     bs->on_read_error = on_read_error;
2576abd7f68dSMarkus Armbruster     bs->on_write_error = on_write_error;
2577abd7f68dSMarkus Armbruster }
2578abd7f68dSMarkus Armbruster 
25791ceee0d5SPaolo Bonzini BlockdevOnError bdrv_get_on_error(BlockDriverState *bs, bool is_read)
2580abd7f68dSMarkus Armbruster {
2581abd7f68dSMarkus Armbruster     return is_read ? bs->on_read_error : bs->on_write_error;
2582abd7f68dSMarkus Armbruster }
2583abd7f68dSMarkus Armbruster 
25843e1caa5fSPaolo Bonzini BlockErrorAction bdrv_get_error_action(BlockDriverState *bs, bool is_read, int error)
25853e1caa5fSPaolo Bonzini {
25863e1caa5fSPaolo Bonzini     BlockdevOnError on_err = is_read ? bs->on_read_error : bs->on_write_error;
25873e1caa5fSPaolo Bonzini 
25883e1caa5fSPaolo Bonzini     switch (on_err) {
25893e1caa5fSPaolo Bonzini     case BLOCKDEV_ON_ERROR_ENOSPC:
2590a589569fSWenchao Xia         return (error == ENOSPC) ?
2591a589569fSWenchao Xia                BLOCK_ERROR_ACTION_STOP : BLOCK_ERROR_ACTION_REPORT;
25923e1caa5fSPaolo Bonzini     case BLOCKDEV_ON_ERROR_STOP:
2593a589569fSWenchao Xia         return BLOCK_ERROR_ACTION_STOP;
25943e1caa5fSPaolo Bonzini     case BLOCKDEV_ON_ERROR_REPORT:
2595a589569fSWenchao Xia         return BLOCK_ERROR_ACTION_REPORT;
25963e1caa5fSPaolo Bonzini     case BLOCKDEV_ON_ERROR_IGNORE:
2597a589569fSWenchao Xia         return BLOCK_ERROR_ACTION_IGNORE;
25983e1caa5fSPaolo Bonzini     default:
25993e1caa5fSPaolo Bonzini         abort();
26003e1caa5fSPaolo Bonzini     }
26013e1caa5fSPaolo Bonzini }
26023e1caa5fSPaolo Bonzini 
2603c7c2ff0cSLuiz Capitulino static void send_qmp_error_event(BlockDriverState *bs,
2604c7c2ff0cSLuiz Capitulino                                  BlockErrorAction action,
2605c7c2ff0cSLuiz Capitulino                                  bool is_read, int error)
2606c7c2ff0cSLuiz Capitulino {
2607573742a5SPeter Maydell     IoOperationType optype;
2608c7c2ff0cSLuiz Capitulino 
2609573742a5SPeter Maydell     optype = is_read ? IO_OPERATION_TYPE_READ : IO_OPERATION_TYPE_WRITE;
2610573742a5SPeter Maydell     qapi_event_send_block_io_error(bdrv_get_device_name(bs), optype, action,
2611c7c2ff0cSLuiz Capitulino                                    bdrv_iostatus_is_enabled(bs),
2612624ff573SLuiz Capitulino                                    error == ENOSPC, strerror(error),
2613624ff573SLuiz Capitulino                                    &error_abort);
2614c7c2ff0cSLuiz Capitulino }
2615c7c2ff0cSLuiz Capitulino 
26163e1caa5fSPaolo Bonzini /* This is done by device models because, while the block layer knows
26173e1caa5fSPaolo Bonzini  * about the error, it does not know whether an operation comes from
26183e1caa5fSPaolo Bonzini  * the device or the block layer (from a job, for example).
26193e1caa5fSPaolo Bonzini  */
26203e1caa5fSPaolo Bonzini void bdrv_error_action(BlockDriverState *bs, BlockErrorAction action,
26213e1caa5fSPaolo Bonzini                        bool is_read, int error)
26223e1caa5fSPaolo Bonzini {
26233e1caa5fSPaolo Bonzini     assert(error >= 0);
26242bd3bce8SPaolo Bonzini 
2625a589569fSWenchao Xia     if (action == BLOCK_ERROR_ACTION_STOP) {
26262bd3bce8SPaolo Bonzini         /* First set the iostatus, so that "info block" returns an iostatus
26272bd3bce8SPaolo Bonzini          * that matches the events raised so far (an additional error iostatus
26282bd3bce8SPaolo Bonzini          * is fine, but not a lost one).
26292bd3bce8SPaolo Bonzini          */
26303e1caa5fSPaolo Bonzini         bdrv_iostatus_set_err(bs, error);
26312bd3bce8SPaolo Bonzini 
26322bd3bce8SPaolo Bonzini         /* Then raise the request to stop the VM and the event.
26332bd3bce8SPaolo Bonzini          * qemu_system_vmstop_request_prepare has two effects.  First,
26342bd3bce8SPaolo Bonzini          * it ensures that the STOP event always comes after the
26352bd3bce8SPaolo Bonzini          * BLOCK_IO_ERROR event.  Second, it ensures that even if management
26362bd3bce8SPaolo Bonzini          * can observe the STOP event and do a "cont" before the STOP
26372bd3bce8SPaolo Bonzini          * event is issued, the VM will not stop.  In this case, vm_start()
26382bd3bce8SPaolo Bonzini          * also ensures that the STOP/RESUME pair of events is emitted.
26392bd3bce8SPaolo Bonzini          */
26402bd3bce8SPaolo Bonzini         qemu_system_vmstop_request_prepare();
2641c7c2ff0cSLuiz Capitulino         send_qmp_error_event(bs, action, is_read, error);
26422bd3bce8SPaolo Bonzini         qemu_system_vmstop_request(RUN_STATE_IO_ERROR);
26432bd3bce8SPaolo Bonzini     } else {
2644c7c2ff0cSLuiz Capitulino         send_qmp_error_event(bs, action, is_read, error);
26453e1caa5fSPaolo Bonzini     }
26463e1caa5fSPaolo Bonzini }
26473e1caa5fSPaolo Bonzini 
2648b338082bSbellard int bdrv_is_read_only(BlockDriverState *bs)
2649b338082bSbellard {
2650b338082bSbellard     return bs->read_only;
2651b338082bSbellard }
2652b338082bSbellard 
2653985a03b0Sths int bdrv_is_sg(BlockDriverState *bs)
2654985a03b0Sths {
2655985a03b0Sths     return bs->sg;
2656985a03b0Sths }
2657985a03b0Sths 
2658e900a7b7SChristoph Hellwig int bdrv_enable_write_cache(BlockDriverState *bs)
2659e900a7b7SChristoph Hellwig {
2660e900a7b7SChristoph Hellwig     return bs->enable_write_cache;
2661e900a7b7SChristoph Hellwig }
2662e900a7b7SChristoph Hellwig 
2663425b0148SPaolo Bonzini void bdrv_set_enable_write_cache(BlockDriverState *bs, bool wce)
2664425b0148SPaolo Bonzini {
2665425b0148SPaolo Bonzini     bs->enable_write_cache = wce;
266655b110f2SJeff Cody 
266755b110f2SJeff Cody     /* so a reopen() will preserve wce */
266855b110f2SJeff Cody     if (wce) {
266955b110f2SJeff Cody         bs->open_flags |= BDRV_O_CACHE_WB;
267055b110f2SJeff Cody     } else {
267155b110f2SJeff Cody         bs->open_flags &= ~BDRV_O_CACHE_WB;
267255b110f2SJeff Cody     }
2673425b0148SPaolo Bonzini }
2674425b0148SPaolo Bonzini 
2675ea2384d3Sbellard int bdrv_is_encrypted(BlockDriverState *bs)
2676ea2384d3Sbellard {
2677ea2384d3Sbellard     if (bs->backing_hd && bs->backing_hd->encrypted)
2678ea2384d3Sbellard         return 1;
2679ea2384d3Sbellard     return bs->encrypted;
2680ea2384d3Sbellard }
2681ea2384d3Sbellard 
2682c0f4ce77Saliguori int bdrv_key_required(BlockDriverState *bs)
2683c0f4ce77Saliguori {
2684c0f4ce77Saliguori     BlockDriverState *backing_hd = bs->backing_hd;
2685c0f4ce77Saliguori 
2686c0f4ce77Saliguori     if (backing_hd && backing_hd->encrypted && !backing_hd->valid_key)
2687c0f4ce77Saliguori         return 1;
2688c0f4ce77Saliguori     return (bs->encrypted && !bs->valid_key);
2689c0f4ce77Saliguori }
2690c0f4ce77Saliguori 
2691ea2384d3Sbellard int bdrv_set_key(BlockDriverState *bs, const char *key)
2692ea2384d3Sbellard {
2693ea2384d3Sbellard     int ret;
2694ea2384d3Sbellard     if (bs->backing_hd && bs->backing_hd->encrypted) {
2695ea2384d3Sbellard         ret = bdrv_set_key(bs->backing_hd, key);
2696ea2384d3Sbellard         if (ret < 0)
2697ea2384d3Sbellard             return ret;
2698ea2384d3Sbellard         if (!bs->encrypted)
2699ea2384d3Sbellard             return 0;
2700ea2384d3Sbellard     }
2701fd04a2aeSShahar Havivi     if (!bs->encrypted) {
2702fd04a2aeSShahar Havivi         return -EINVAL;
2703fd04a2aeSShahar Havivi     } else if (!bs->drv || !bs->drv->bdrv_set_key) {
2704fd04a2aeSShahar Havivi         return -ENOMEDIUM;
2705fd04a2aeSShahar Havivi     }
2706c0f4ce77Saliguori     ret = bs->drv->bdrv_set_key(bs, key);
2707bb5fc20fSaliguori     if (ret < 0) {
2708bb5fc20fSaliguori         bs->valid_key = 0;
2709bb5fc20fSaliguori     } else if (!bs->valid_key) {
2710bb5fc20fSaliguori         bs->valid_key = 1;
2711a7f53e26SMarkus Armbruster         if (bs->blk) {
2712bb5fc20fSaliguori             /* call the change callback now, we skipped it on open */
2713a7f53e26SMarkus Armbruster             blk_dev_change_media_cb(bs->blk, true);
2714a7f53e26SMarkus Armbruster         }
2715bb5fc20fSaliguori     }
2716c0f4ce77Saliguori     return ret;
2717ea2384d3Sbellard }
2718ea2384d3Sbellard 
27194d2855a3SMarkus Armbruster /*
27204d2855a3SMarkus Armbruster  * Provide an encryption key for @bs.
27214d2855a3SMarkus Armbruster  * If @key is non-null:
27224d2855a3SMarkus Armbruster  *     If @bs is not encrypted, fail.
27234d2855a3SMarkus Armbruster  *     Else if the key is invalid, fail.
27244d2855a3SMarkus Armbruster  *     Else set @bs's key to @key, replacing the existing key, if any.
27254d2855a3SMarkus Armbruster  * If @key is null:
27264d2855a3SMarkus Armbruster  *     If @bs is encrypted and still lacks a key, fail.
27274d2855a3SMarkus Armbruster  *     Else do nothing.
27284d2855a3SMarkus Armbruster  * On failure, store an error object through @errp if non-null.
27294d2855a3SMarkus Armbruster  */
27304d2855a3SMarkus Armbruster void bdrv_add_key(BlockDriverState *bs, const char *key, Error **errp)
27314d2855a3SMarkus Armbruster {
27324d2855a3SMarkus Armbruster     if (key) {
27334d2855a3SMarkus Armbruster         if (!bdrv_is_encrypted(bs)) {
273481e5f78aSAlberto Garcia             error_setg(errp, "Node '%s' is not encrypted",
273581e5f78aSAlberto Garcia                       bdrv_get_device_or_node_name(bs));
27364d2855a3SMarkus Armbruster         } else if (bdrv_set_key(bs, key) < 0) {
2737c6bd8c70SMarkus Armbruster             error_setg(errp, QERR_INVALID_PASSWORD);
27384d2855a3SMarkus Armbruster         }
27394d2855a3SMarkus Armbruster     } else {
27404d2855a3SMarkus Armbruster         if (bdrv_key_required(bs)) {
2741b1ca6391SMarkus Armbruster             error_set(errp, ERROR_CLASS_DEVICE_ENCRYPTED,
2742b1ca6391SMarkus Armbruster                       "'%s' (%s) is encrypted",
274381e5f78aSAlberto Garcia                       bdrv_get_device_or_node_name(bs),
27444d2855a3SMarkus Armbruster                       bdrv_get_encrypted_filename(bs));
27454d2855a3SMarkus Armbruster         }
27464d2855a3SMarkus Armbruster     }
27474d2855a3SMarkus Armbruster }
27484d2855a3SMarkus Armbruster 
2749f8d6bba1SMarkus Armbruster const char *bdrv_get_format_name(BlockDriverState *bs)
2750ea2384d3Sbellard {
2751f8d6bba1SMarkus Armbruster     return bs->drv ? bs->drv->format_name : NULL;
2752ea2384d3Sbellard }
2753ea2384d3Sbellard 
/* qsort() comparator for an array of C strings (array of 'const char *').
 *
 * qsort() hands the comparator pointers to the array elements, so 'a' and
 * 'b' point at the string pointers and must be dereferenced once before the
 * strings themselves can be compared. */
static int qsort_strcmp(const void *a, const void *b)
{
    const char *const *lhs = a;
    const char *const *rhs = b;

    return strcmp(*lhs, *rhs);
}
2758ada42401SStefan Hajnoczi 
2759ea2384d3Sbellard void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
2760ea2384d3Sbellard                          void *opaque)
2761ea2384d3Sbellard {
2762ea2384d3Sbellard     BlockDriver *drv;
2763e855e4fbSJeff Cody     int count = 0;
2764ada42401SStefan Hajnoczi     int i;
2765e855e4fbSJeff Cody     const char **formats = NULL;
2766ea2384d3Sbellard 
27678a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv, &bdrv_drivers, list) {
2768e855e4fbSJeff Cody         if (drv->format_name) {
2769e855e4fbSJeff Cody             bool found = false;
2770e855e4fbSJeff Cody             int i = count;
2771e855e4fbSJeff Cody             while (formats && i && !found) {
2772e855e4fbSJeff Cody                 found = !strcmp(formats[--i], drv->format_name);
2773e855e4fbSJeff Cody             }
2774e855e4fbSJeff Cody 
2775e855e4fbSJeff Cody             if (!found) {
27765839e53bSMarkus Armbruster                 formats = g_renew(const char *, formats, count + 1);
2777e855e4fbSJeff Cody                 formats[count++] = drv->format_name;
2778ea2384d3Sbellard             }
2779ea2384d3Sbellard         }
2780e855e4fbSJeff Cody     }
2781ada42401SStefan Hajnoczi 
2782ada42401SStefan Hajnoczi     qsort(formats, count, sizeof(formats[0]), qsort_strcmp);
2783ada42401SStefan Hajnoczi 
2784ada42401SStefan Hajnoczi     for (i = 0; i < count; i++) {
2785ada42401SStefan Hajnoczi         it(opaque, formats[i]);
2786ada42401SStefan Hajnoczi     }
2787ada42401SStefan Hajnoczi 
2788e855e4fbSJeff Cody     g_free(formats);
2789e855e4fbSJeff Cody }
2790ea2384d3Sbellard 
2791dc364f4cSBenoît Canet /* This function is to find a node in the bs graph */
2792dc364f4cSBenoît Canet BlockDriverState *bdrv_find_node(const char *node_name)
2793dc364f4cSBenoît Canet {
2794dc364f4cSBenoît Canet     BlockDriverState *bs;
2795dc364f4cSBenoît Canet 
2796dc364f4cSBenoît Canet     assert(node_name);
2797dc364f4cSBenoît Canet 
2798dc364f4cSBenoît Canet     QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2799dc364f4cSBenoît Canet         if (!strcmp(node_name, bs->node_name)) {
2800dc364f4cSBenoît Canet             return bs;
2801dc364f4cSBenoît Canet         }
2802dc364f4cSBenoît Canet     }
2803dc364f4cSBenoît Canet     return NULL;
2804dc364f4cSBenoît Canet }
2805dc364f4cSBenoît Canet 
2806c13163fbSBenoît Canet /* Put this QMP function here so it can access the static graph_bdrv_states. */
2807d5a8ee60SAlberto Garcia BlockDeviceInfoList *bdrv_named_nodes_list(Error **errp)
2808c13163fbSBenoît Canet {
2809c13163fbSBenoît Canet     BlockDeviceInfoList *list, *entry;
2810c13163fbSBenoît Canet     BlockDriverState *bs;
2811c13163fbSBenoît Canet 
2812c13163fbSBenoît Canet     list = NULL;
2813c13163fbSBenoît Canet     QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2814d5a8ee60SAlberto Garcia         BlockDeviceInfo *info = bdrv_block_device_info(bs, errp);
2815d5a8ee60SAlberto Garcia         if (!info) {
2816d5a8ee60SAlberto Garcia             qapi_free_BlockDeviceInfoList(list);
2817d5a8ee60SAlberto Garcia             return NULL;
2818d5a8ee60SAlberto Garcia         }
2819c13163fbSBenoît Canet         entry = g_malloc0(sizeof(*entry));
2820d5a8ee60SAlberto Garcia         entry->value = info;
2821c13163fbSBenoît Canet         entry->next = list;
2822c13163fbSBenoît Canet         list = entry;
2823c13163fbSBenoît Canet     }
2824c13163fbSBenoît Canet 
2825c13163fbSBenoît Canet     return list;
2826c13163fbSBenoît Canet }
2827c13163fbSBenoît Canet 
282812d3ba82SBenoît Canet BlockDriverState *bdrv_lookup_bs(const char *device,
282912d3ba82SBenoît Canet                                  const char *node_name,
283012d3ba82SBenoît Canet                                  Error **errp)
283112d3ba82SBenoît Canet {
28327f06d47eSMarkus Armbruster     BlockBackend *blk;
28337f06d47eSMarkus Armbruster     BlockDriverState *bs;
283412d3ba82SBenoît Canet 
283512d3ba82SBenoît Canet     if (device) {
28367f06d47eSMarkus Armbruster         blk = blk_by_name(device);
283712d3ba82SBenoît Canet 
28387f06d47eSMarkus Armbruster         if (blk) {
28397f06d47eSMarkus Armbruster             return blk_bs(blk);
284012d3ba82SBenoît Canet         }
2841dd67fa50SBenoît Canet     }
284212d3ba82SBenoît Canet 
2843dd67fa50SBenoît Canet     if (node_name) {
284412d3ba82SBenoît Canet         bs = bdrv_find_node(node_name);
284512d3ba82SBenoît Canet 
2846dd67fa50SBenoît Canet         if (bs) {
2847dd67fa50SBenoît Canet             return bs;
2848dd67fa50SBenoît Canet         }
284912d3ba82SBenoît Canet     }
285012d3ba82SBenoît Canet 
2851dd67fa50SBenoît Canet     error_setg(errp, "Cannot find device=%s nor node_name=%s",
2852dd67fa50SBenoît Canet                      device ? device : "",
2853dd67fa50SBenoît Canet                      node_name ? node_name : "");
2854dd67fa50SBenoît Canet     return NULL;
285512d3ba82SBenoît Canet }
285612d3ba82SBenoît Canet 
28575a6684d2SJeff Cody /* If 'base' is in the same chain as 'top', return true. Otherwise,
28585a6684d2SJeff Cody  * return false.  If either argument is NULL, return false. */
28595a6684d2SJeff Cody bool bdrv_chain_contains(BlockDriverState *top, BlockDriverState *base)
28605a6684d2SJeff Cody {
28615a6684d2SJeff Cody     while (top && top != base) {
28625a6684d2SJeff Cody         top = top->backing_hd;
28635a6684d2SJeff Cody     }
28645a6684d2SJeff Cody 
28655a6684d2SJeff Cody     return top != NULL;
28665a6684d2SJeff Cody }
28675a6684d2SJeff Cody 
286804df765aSFam Zheng BlockDriverState *bdrv_next_node(BlockDriverState *bs)
286904df765aSFam Zheng {
287004df765aSFam Zheng     if (!bs) {
287104df765aSFam Zheng         return QTAILQ_FIRST(&graph_bdrv_states);
287204df765aSFam Zheng     }
287304df765aSFam Zheng     return QTAILQ_NEXT(bs, node_list);
287404df765aSFam Zheng }
287504df765aSFam Zheng 
28762f399b0aSMarkus Armbruster BlockDriverState *bdrv_next(BlockDriverState *bs)
28772f399b0aSMarkus Armbruster {
28782f399b0aSMarkus Armbruster     if (!bs) {
28792f399b0aSMarkus Armbruster         return QTAILQ_FIRST(&bdrv_states);
28802f399b0aSMarkus Armbruster     }
2881dc364f4cSBenoît Canet     return QTAILQ_NEXT(bs, device_list);
28822f399b0aSMarkus Armbruster }
28832f399b0aSMarkus Armbruster 
288420a9e77dSFam Zheng const char *bdrv_get_node_name(const BlockDriverState *bs)
288520a9e77dSFam Zheng {
288620a9e77dSFam Zheng     return bs->node_name;
288720a9e77dSFam Zheng }
288820a9e77dSFam Zheng 
28897f06d47eSMarkus Armbruster /* TODO check what callers really want: bs->node_name or blk_name() */
2890bfb197e0SMarkus Armbruster const char *bdrv_get_device_name(const BlockDriverState *bs)
2891ea2384d3Sbellard {
2892bfb197e0SMarkus Armbruster     return bs->blk ? blk_name(bs->blk) : "";
2893ea2384d3Sbellard }
2894ea2384d3Sbellard 
28959b2aa84fSAlberto Garcia /* This can be used to identify nodes that might not have a device
28969b2aa84fSAlberto Garcia  * name associated. Since node and device names live in the same
28979b2aa84fSAlberto Garcia  * namespace, the result is unambiguous. The exception is if both are
28989b2aa84fSAlberto Garcia  * absent, then this returns an empty (non-null) string. */
28999b2aa84fSAlberto Garcia const char *bdrv_get_device_or_node_name(const BlockDriverState *bs)
29009b2aa84fSAlberto Garcia {
29019b2aa84fSAlberto Garcia     return bs->blk ? blk_name(bs->blk) : bs->node_name;
29029b2aa84fSAlberto Garcia }
29039b2aa84fSAlberto Garcia 
2904c8433287SMarkus Armbruster int bdrv_get_flags(BlockDriverState *bs)
2905c8433287SMarkus Armbruster {
2906c8433287SMarkus Armbruster     return bs->open_flags;
2907c8433287SMarkus Armbruster }
2908c8433287SMarkus Armbruster 
29093ac21627SPeter Lieven int bdrv_has_zero_init_1(BlockDriverState *bs)
29103ac21627SPeter Lieven {
29113ac21627SPeter Lieven     return 1;
29123ac21627SPeter Lieven }
29133ac21627SPeter Lieven 
2914f2feebbdSKevin Wolf int bdrv_has_zero_init(BlockDriverState *bs)
2915f2feebbdSKevin Wolf {
2916f2feebbdSKevin Wolf     assert(bs->drv);
2917f2feebbdSKevin Wolf 
291811212d8fSPaolo Bonzini     /* If BS is a copy on write image, it is initialized to
291911212d8fSPaolo Bonzini        the contents of the base image, which may not be zeroes.  */
292011212d8fSPaolo Bonzini     if (bs->backing_hd) {
292111212d8fSPaolo Bonzini         return 0;
292211212d8fSPaolo Bonzini     }
2923336c1c12SKevin Wolf     if (bs->drv->bdrv_has_zero_init) {
2924336c1c12SKevin Wolf         return bs->drv->bdrv_has_zero_init(bs);
2925f2feebbdSKevin Wolf     }
2926f2feebbdSKevin Wolf 
29273ac21627SPeter Lieven     /* safe default */
29283ac21627SPeter Lieven     return 0;
2929f2feebbdSKevin Wolf }
2930f2feebbdSKevin Wolf 
29314ce78691SPeter Lieven bool bdrv_unallocated_blocks_are_zero(BlockDriverState *bs)
29324ce78691SPeter Lieven {
29334ce78691SPeter Lieven     BlockDriverInfo bdi;
29344ce78691SPeter Lieven 
29354ce78691SPeter Lieven     if (bs->backing_hd) {
29364ce78691SPeter Lieven         return false;
29374ce78691SPeter Lieven     }
29384ce78691SPeter Lieven 
29394ce78691SPeter Lieven     if (bdrv_get_info(bs, &bdi) == 0) {
29404ce78691SPeter Lieven         return bdi.unallocated_blocks_are_zero;
29414ce78691SPeter Lieven     }
29424ce78691SPeter Lieven 
29434ce78691SPeter Lieven     return false;
29444ce78691SPeter Lieven }
29454ce78691SPeter Lieven 
29464ce78691SPeter Lieven bool bdrv_can_write_zeroes_with_unmap(BlockDriverState *bs)
29474ce78691SPeter Lieven {
29484ce78691SPeter Lieven     BlockDriverInfo bdi;
29494ce78691SPeter Lieven 
29504ce78691SPeter Lieven     if (bs->backing_hd || !(bs->open_flags & BDRV_O_UNMAP)) {
29514ce78691SPeter Lieven         return false;
29524ce78691SPeter Lieven     }
29534ce78691SPeter Lieven 
29544ce78691SPeter Lieven     if (bdrv_get_info(bs, &bdi) == 0) {
29554ce78691SPeter Lieven         return bdi.can_write_zeroes_with_unmap;
29564ce78691SPeter Lieven     }
29574ce78691SPeter Lieven 
29584ce78691SPeter Lieven     return false;
29594ce78691SPeter Lieven }
29604ce78691SPeter Lieven 
2961045df330Saliguori const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
2962045df330Saliguori {
2963045df330Saliguori     if (bs->backing_hd && bs->backing_hd->encrypted)
2964045df330Saliguori         return bs->backing_file;
2965045df330Saliguori     else if (bs->encrypted)
2966045df330Saliguori         return bs->filename;
2967045df330Saliguori     else
2968045df330Saliguori         return NULL;
2969045df330Saliguori }
2970045df330Saliguori 
297183f64091Sbellard void bdrv_get_backing_filename(BlockDriverState *bs,
297283f64091Sbellard                                char *filename, int filename_size)
297383f64091Sbellard {
297483f64091Sbellard     pstrcpy(filename, filename_size, bs->backing_file);
297583f64091Sbellard }
297683f64091Sbellard 
2977faea38e7Sbellard int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
2978faea38e7Sbellard {
2979faea38e7Sbellard     BlockDriver *drv = bs->drv;
2980faea38e7Sbellard     if (!drv)
298119cb3738Sbellard         return -ENOMEDIUM;
2982faea38e7Sbellard     if (!drv->bdrv_get_info)
2983faea38e7Sbellard         return -ENOTSUP;
2984faea38e7Sbellard     memset(bdi, 0, sizeof(*bdi));
2985faea38e7Sbellard     return drv->bdrv_get_info(bs, bdi);
2986faea38e7Sbellard }
2987faea38e7Sbellard 
2988eae041feSMax Reitz ImageInfoSpecific *bdrv_get_specific_info(BlockDriverState *bs)
2989eae041feSMax Reitz {
2990eae041feSMax Reitz     BlockDriver *drv = bs->drv;
2991eae041feSMax Reitz     if (drv && drv->bdrv_get_specific_info) {
2992eae041feSMax Reitz         return drv->bdrv_get_specific_info(bs);
2993eae041feSMax Reitz     }
2994eae041feSMax Reitz     return NULL;
2995eae041feSMax Reitz }
2996eae041feSMax Reitz 
29978b9b0cc2SKevin Wolf void bdrv_debug_event(BlockDriverState *bs, BlkDebugEvent event)
29988b9b0cc2SKevin Wolf {
2999bf736fe3SKevin Wolf     if (!bs || !bs->drv || !bs->drv->bdrv_debug_event) {
30008b9b0cc2SKevin Wolf         return;
30018b9b0cc2SKevin Wolf     }
30028b9b0cc2SKevin Wolf 
3003bf736fe3SKevin Wolf     bs->drv->bdrv_debug_event(bs, event);
300441c695c7SKevin Wolf }
30058b9b0cc2SKevin Wolf 
300641c695c7SKevin Wolf int bdrv_debug_breakpoint(BlockDriverState *bs, const char *event,
300741c695c7SKevin Wolf                           const char *tag)
300841c695c7SKevin Wolf {
300941c695c7SKevin Wolf     while (bs && bs->drv && !bs->drv->bdrv_debug_breakpoint) {
301041c695c7SKevin Wolf         bs = bs->file;
301141c695c7SKevin Wolf     }
301241c695c7SKevin Wolf 
301341c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_breakpoint) {
301441c695c7SKevin Wolf         return bs->drv->bdrv_debug_breakpoint(bs, event, tag);
301541c695c7SKevin Wolf     }
301641c695c7SKevin Wolf 
301741c695c7SKevin Wolf     return -ENOTSUP;
301841c695c7SKevin Wolf }
301941c695c7SKevin Wolf 
30204cc70e93SFam Zheng int bdrv_debug_remove_breakpoint(BlockDriverState *bs, const char *tag)
30214cc70e93SFam Zheng {
30224cc70e93SFam Zheng     while (bs && bs->drv && !bs->drv->bdrv_debug_remove_breakpoint) {
30234cc70e93SFam Zheng         bs = bs->file;
30244cc70e93SFam Zheng     }
30254cc70e93SFam Zheng 
30264cc70e93SFam Zheng     if (bs && bs->drv && bs->drv->bdrv_debug_remove_breakpoint) {
30274cc70e93SFam Zheng         return bs->drv->bdrv_debug_remove_breakpoint(bs, tag);
30284cc70e93SFam Zheng     }
30294cc70e93SFam Zheng 
30304cc70e93SFam Zheng     return -ENOTSUP;
30314cc70e93SFam Zheng }
30324cc70e93SFam Zheng 
303341c695c7SKevin Wolf int bdrv_debug_resume(BlockDriverState *bs, const char *tag)
303441c695c7SKevin Wolf {
3035938789eaSMax Reitz     while (bs && (!bs->drv || !bs->drv->bdrv_debug_resume)) {
303641c695c7SKevin Wolf         bs = bs->file;
303741c695c7SKevin Wolf     }
303841c695c7SKevin Wolf 
303941c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_resume) {
304041c695c7SKevin Wolf         return bs->drv->bdrv_debug_resume(bs, tag);
304141c695c7SKevin Wolf     }
304241c695c7SKevin Wolf 
304341c695c7SKevin Wolf     return -ENOTSUP;
304441c695c7SKevin Wolf }
304541c695c7SKevin Wolf 
304641c695c7SKevin Wolf bool bdrv_debug_is_suspended(BlockDriverState *bs, const char *tag)
304741c695c7SKevin Wolf {
304841c695c7SKevin Wolf     while (bs && bs->drv && !bs->drv->bdrv_debug_is_suspended) {
304941c695c7SKevin Wolf         bs = bs->file;
305041c695c7SKevin Wolf     }
305141c695c7SKevin Wolf 
305241c695c7SKevin Wolf     if (bs && bs->drv && bs->drv->bdrv_debug_is_suspended) {
305341c695c7SKevin Wolf         return bs->drv->bdrv_debug_is_suspended(bs, tag);
305441c695c7SKevin Wolf     }
305541c695c7SKevin Wolf 
305641c695c7SKevin Wolf     return false;
30578b9b0cc2SKevin Wolf }
30588b9b0cc2SKevin Wolf 
3059199630b6SBlue Swirl int bdrv_is_snapshot(BlockDriverState *bs)
3060199630b6SBlue Swirl {
3061199630b6SBlue Swirl     return !!(bs->open_flags & BDRV_O_SNAPSHOT);
3062199630b6SBlue Swirl }
3063199630b6SBlue Swirl 
3064b1b1d783SJeff Cody /* backing_file can either be relative, or absolute, or a protocol.  If it is
3065b1b1d783SJeff Cody  * relative, it must be relative to the chain.  So, passing in bs->filename
3066b1b1d783SJeff Cody  * from a BDS as backing_file should not be done, as that may be relative to
3067b1b1d783SJeff Cody  * the CWD rather than the chain. */
3068e8a6bb9cSMarcelo Tosatti BlockDriverState *bdrv_find_backing_image(BlockDriverState *bs,
3069e8a6bb9cSMarcelo Tosatti         const char *backing_file)
3070e8a6bb9cSMarcelo Tosatti {
3071b1b1d783SJeff Cody     char *filename_full = NULL;
3072b1b1d783SJeff Cody     char *backing_file_full = NULL;
3073b1b1d783SJeff Cody     char *filename_tmp = NULL;
3074b1b1d783SJeff Cody     int is_protocol = 0;
3075b1b1d783SJeff Cody     BlockDriverState *curr_bs = NULL;
3076b1b1d783SJeff Cody     BlockDriverState *retval = NULL;
3077b1b1d783SJeff Cody 
3078b1b1d783SJeff Cody     if (!bs || !bs->drv || !backing_file) {
3079e8a6bb9cSMarcelo Tosatti         return NULL;
3080e8a6bb9cSMarcelo Tosatti     }
3081e8a6bb9cSMarcelo Tosatti 
3082b1b1d783SJeff Cody     filename_full     = g_malloc(PATH_MAX);
3083b1b1d783SJeff Cody     backing_file_full = g_malloc(PATH_MAX);
3084b1b1d783SJeff Cody     filename_tmp      = g_malloc(PATH_MAX);
3085b1b1d783SJeff Cody 
3086b1b1d783SJeff Cody     is_protocol = path_has_protocol(backing_file);
3087b1b1d783SJeff Cody 
3088b1b1d783SJeff Cody     for (curr_bs = bs; curr_bs->backing_hd; curr_bs = curr_bs->backing_hd) {
3089b1b1d783SJeff Cody 
3090b1b1d783SJeff Cody         /* If either of the filename paths is actually a protocol, then
3091b1b1d783SJeff Cody          * compare unmodified paths; otherwise make paths relative */
3092b1b1d783SJeff Cody         if (is_protocol || path_has_protocol(curr_bs->backing_file)) {
3093b1b1d783SJeff Cody             if (strcmp(backing_file, curr_bs->backing_file) == 0) {
3094b1b1d783SJeff Cody                 retval = curr_bs->backing_hd;
3095b1b1d783SJeff Cody                 break;
3096b1b1d783SJeff Cody             }
3097e8a6bb9cSMarcelo Tosatti         } else {
3098b1b1d783SJeff Cody             /* If not an absolute filename path, make it relative to the current
3099b1b1d783SJeff Cody              * image's filename path */
3100b1b1d783SJeff Cody             path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3101b1b1d783SJeff Cody                          backing_file);
3102b1b1d783SJeff Cody 
3103b1b1d783SJeff Cody             /* We are going to compare absolute pathnames */
3104b1b1d783SJeff Cody             if (!realpath(filename_tmp, filename_full)) {
3105b1b1d783SJeff Cody                 continue;
3106b1b1d783SJeff Cody             }
3107b1b1d783SJeff Cody 
3108b1b1d783SJeff Cody             /* We need to make sure the backing filename we are comparing against
3109b1b1d783SJeff Cody              * is relative to the current image filename (or absolute) */
3110b1b1d783SJeff Cody             path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3111b1b1d783SJeff Cody                          curr_bs->backing_file);
3112b1b1d783SJeff Cody 
3113b1b1d783SJeff Cody             if (!realpath(filename_tmp, backing_file_full)) {
3114b1b1d783SJeff Cody                 continue;
3115b1b1d783SJeff Cody             }
3116b1b1d783SJeff Cody 
3117b1b1d783SJeff Cody             if (strcmp(backing_file_full, filename_full) == 0) {
3118b1b1d783SJeff Cody                 retval = curr_bs->backing_hd;
3119b1b1d783SJeff Cody                 break;
3120b1b1d783SJeff Cody             }
3121e8a6bb9cSMarcelo Tosatti         }
3122e8a6bb9cSMarcelo Tosatti     }
3123e8a6bb9cSMarcelo Tosatti 
3124b1b1d783SJeff Cody     g_free(filename_full);
3125b1b1d783SJeff Cody     g_free(backing_file_full);
3126b1b1d783SJeff Cody     g_free(filename_tmp);
3127b1b1d783SJeff Cody     return retval;
3128e8a6bb9cSMarcelo Tosatti }
3129e8a6bb9cSMarcelo Tosatti 
3130f198fd1cSBenoît Canet int bdrv_get_backing_file_depth(BlockDriverState *bs)
3131f198fd1cSBenoît Canet {
3132f198fd1cSBenoît Canet     if (!bs->drv) {
3133f198fd1cSBenoît Canet         return 0;
3134f198fd1cSBenoît Canet     }
3135f198fd1cSBenoît Canet 
3136f198fd1cSBenoît Canet     if (!bs->backing_hd) {
3137f198fd1cSBenoît Canet         return 0;
3138f198fd1cSBenoît Canet     }
3139f198fd1cSBenoît Canet 
3140f198fd1cSBenoît Canet     return 1 + bdrv_get_backing_file_depth(bs->backing_hd);
3141f198fd1cSBenoît Canet }
3142f198fd1cSBenoît Canet 
3143ea2384d3Sbellard void bdrv_init(void)
3144ea2384d3Sbellard {
31455efa9d5aSAnthony Liguori     module_call_init(MODULE_INIT_BLOCK);
3146ea2384d3Sbellard }
3147ce1a14dcSpbrook 
3148eb852011SMarkus Armbruster void bdrv_init_with_whitelist(void)
3149eb852011SMarkus Armbruster {
3150eb852011SMarkus Armbruster     use_bdrv_whitelist = 1;
3151eb852011SMarkus Armbruster     bdrv_init();
3152eb852011SMarkus Armbruster }
3153eb852011SMarkus Armbruster 
31545a8a30dbSKevin Wolf void bdrv_invalidate_cache(BlockDriverState *bs, Error **errp)
31550f15423cSAnthony Liguori {
31565a8a30dbSKevin Wolf     Error *local_err = NULL;
31575a8a30dbSKevin Wolf     int ret;
31585a8a30dbSKevin Wolf 
31593456a8d1SKevin Wolf     if (!bs->drv)  {
31603456a8d1SKevin Wolf         return;
31610f15423cSAnthony Liguori     }
31623456a8d1SKevin Wolf 
31637ea2d269SAlexey Kardashevskiy     if (!(bs->open_flags & BDRV_O_INCOMING)) {
31647ea2d269SAlexey Kardashevskiy         return;
31657ea2d269SAlexey Kardashevskiy     }
31667ea2d269SAlexey Kardashevskiy     bs->open_flags &= ~BDRV_O_INCOMING;
31677ea2d269SAlexey Kardashevskiy 
31683456a8d1SKevin Wolf     if (bs->drv->bdrv_invalidate_cache) {
31695a8a30dbSKevin Wolf         bs->drv->bdrv_invalidate_cache(bs, &local_err);
31703456a8d1SKevin Wolf     } else if (bs->file) {
31715a8a30dbSKevin Wolf         bdrv_invalidate_cache(bs->file, &local_err);
31725a8a30dbSKevin Wolf     }
31735a8a30dbSKevin Wolf     if (local_err) {
31745a8a30dbSKevin Wolf         error_propagate(errp, local_err);
31755a8a30dbSKevin Wolf         return;
31763456a8d1SKevin Wolf     }
31773456a8d1SKevin Wolf 
31785a8a30dbSKevin Wolf     ret = refresh_total_sectors(bs, bs->total_sectors);
31795a8a30dbSKevin Wolf     if (ret < 0) {
31805a8a30dbSKevin Wolf         error_setg_errno(errp, -ret, "Could not refresh total sector count");
31815a8a30dbSKevin Wolf         return;
31825a8a30dbSKevin Wolf     }
31830f15423cSAnthony Liguori }
31840f15423cSAnthony Liguori 
31855a8a30dbSKevin Wolf void bdrv_invalidate_cache_all(Error **errp)
31860f15423cSAnthony Liguori {
31870f15423cSAnthony Liguori     BlockDriverState *bs;
31885a8a30dbSKevin Wolf     Error *local_err = NULL;
31890f15423cSAnthony Liguori 
3190dc364f4cSBenoît Canet     QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
3191ed78cda3SStefan Hajnoczi         AioContext *aio_context = bdrv_get_aio_context(bs);
3192ed78cda3SStefan Hajnoczi 
3193ed78cda3SStefan Hajnoczi         aio_context_acquire(aio_context);
31945a8a30dbSKevin Wolf         bdrv_invalidate_cache(bs, &local_err);
3195ed78cda3SStefan Hajnoczi         aio_context_release(aio_context);
31965a8a30dbSKevin Wolf         if (local_err) {
31975a8a30dbSKevin Wolf             error_propagate(errp, local_err);
31985a8a30dbSKevin Wolf             return;
31995a8a30dbSKevin Wolf         }
32000f15423cSAnthony Liguori     }
32010f15423cSAnthony Liguori }
32020f15423cSAnthony Liguori 
3203f9f05dc5SKevin Wolf /**************************************************************/
320419cb3738Sbellard /* removable device support */
320519cb3738Sbellard 
320619cb3738Sbellard /**
320719cb3738Sbellard  * Return TRUE if the media is present
320819cb3738Sbellard  */
320919cb3738Sbellard int bdrv_is_inserted(BlockDriverState *bs)
321019cb3738Sbellard {
321119cb3738Sbellard     BlockDriver *drv = bs->drv;
3212a1aff5bfSMarkus Armbruster 
321319cb3738Sbellard     if (!drv)
321419cb3738Sbellard         return 0;
321519cb3738Sbellard     if (!drv->bdrv_is_inserted)
3216a1aff5bfSMarkus Armbruster         return 1;
3217a1aff5bfSMarkus Armbruster     return drv->bdrv_is_inserted(bs);
321819cb3738Sbellard }
321919cb3738Sbellard 
322019cb3738Sbellard /**
32218e49ca46SMarkus Armbruster  * Return whether the media changed since the last call to this
32228e49ca46SMarkus Armbruster  * function, or -ENOTSUP if we don't know.  Most drivers don't know.
322319cb3738Sbellard  */
322419cb3738Sbellard int bdrv_media_changed(BlockDriverState *bs)
322519cb3738Sbellard {
322619cb3738Sbellard     BlockDriver *drv = bs->drv;
322719cb3738Sbellard 
32288e49ca46SMarkus Armbruster     if (drv && drv->bdrv_media_changed) {
32298e49ca46SMarkus Armbruster         return drv->bdrv_media_changed(bs);
32308e49ca46SMarkus Armbruster     }
32318e49ca46SMarkus Armbruster     return -ENOTSUP;
323219cb3738Sbellard }
323319cb3738Sbellard 
323419cb3738Sbellard /**
323519cb3738Sbellard  * If eject_flag is TRUE, eject the media. Otherwise, close the tray
323619cb3738Sbellard  */
3237f36f3949SLuiz Capitulino void bdrv_eject(BlockDriverState *bs, bool eject_flag)
323819cb3738Sbellard {
323919cb3738Sbellard     BlockDriver *drv = bs->drv;
3240bfb197e0SMarkus Armbruster     const char *device_name;
324119cb3738Sbellard 
3242822e1cd1SMarkus Armbruster     if (drv && drv->bdrv_eject) {
3243822e1cd1SMarkus Armbruster         drv->bdrv_eject(bs, eject_flag);
324419cb3738Sbellard     }
32456f382ed2SLuiz Capitulino 
3246bfb197e0SMarkus Armbruster     device_name = bdrv_get_device_name(bs);
3247bfb197e0SMarkus Armbruster     if (device_name[0] != '\0') {
3248bfb197e0SMarkus Armbruster         qapi_event_send_device_tray_moved(device_name,
3249a5ee7bd4SWenchao Xia                                           eject_flag, &error_abort);
32506f382ed2SLuiz Capitulino     }
325119cb3738Sbellard }
325219cb3738Sbellard 
325319cb3738Sbellard /**
325419cb3738Sbellard  * Lock or unlock the media (if it is locked, the user won't be able
325519cb3738Sbellard  * to eject it manually).
325619cb3738Sbellard  */
3257025e849aSMarkus Armbruster void bdrv_lock_medium(BlockDriverState *bs, bool locked)
325819cb3738Sbellard {
325919cb3738Sbellard     BlockDriver *drv = bs->drv;
326019cb3738Sbellard 
3261025e849aSMarkus Armbruster     trace_bdrv_lock_medium(bs, locked);
3262b8c6d095SStefan Hajnoczi 
3263025e849aSMarkus Armbruster     if (drv && drv->bdrv_lock_medium) {
3264025e849aSMarkus Armbruster         drv->bdrv_lock_medium(bs, locked);
326519cb3738Sbellard     }
326619cb3738Sbellard }
3267985a03b0Sths 
32681b7fd729SPaolo Bonzini void bdrv_set_guest_block_size(BlockDriverState *bs, int align)
32697b6f9300SMarkus Armbruster {
32701b7fd729SPaolo Bonzini     bs->guest_block_size = align;
32717b6f9300SMarkus Armbruster }
32727cd1e32aSlirans@il.ibm.com 
32730db6e54aSFam Zheng BdrvDirtyBitmap *bdrv_find_dirty_bitmap(BlockDriverState *bs, const char *name)
32740db6e54aSFam Zheng {
32750db6e54aSFam Zheng     BdrvDirtyBitmap *bm;
32760db6e54aSFam Zheng 
32770db6e54aSFam Zheng     assert(name);
32780db6e54aSFam Zheng     QLIST_FOREACH(bm, &bs->dirty_bitmaps, list) {
32790db6e54aSFam Zheng         if (bm->name && !strcmp(name, bm->name)) {
32800db6e54aSFam Zheng             return bm;
32810db6e54aSFam Zheng         }
32820db6e54aSFam Zheng     }
32830db6e54aSFam Zheng     return NULL;
32840db6e54aSFam Zheng }
32850db6e54aSFam Zheng 
328620dca810SJohn Snow void bdrv_dirty_bitmap_make_anon(BdrvDirtyBitmap *bitmap)
32870db6e54aSFam Zheng {
32889bd2b08fSJohn Snow     assert(!bdrv_dirty_bitmap_frozen(bitmap));
32890db6e54aSFam Zheng     g_free(bitmap->name);
32900db6e54aSFam Zheng     bitmap->name = NULL;
32910db6e54aSFam Zheng }
32920db6e54aSFam Zheng 
32930db6e54aSFam Zheng BdrvDirtyBitmap *bdrv_create_dirty_bitmap(BlockDriverState *bs,
32945fba6c0eSJohn Snow                                           uint32_t granularity,
32950db6e54aSFam Zheng                                           const char *name,
3296b8afb520SFam Zheng                                           Error **errp)
32977cd1e32aSlirans@il.ibm.com {
32987cd1e32aSlirans@il.ibm.com     int64_t bitmap_size;
3299e4654d2dSFam Zheng     BdrvDirtyBitmap *bitmap;
33005fba6c0eSJohn Snow     uint32_t sector_granularity;
3301a55eb92cSJan Kiszka 
330250717e94SPaolo Bonzini     assert((granularity & (granularity - 1)) == 0);
330350717e94SPaolo Bonzini 
33040db6e54aSFam Zheng     if (name && bdrv_find_dirty_bitmap(bs, name)) {
33050db6e54aSFam Zheng         error_setg(errp, "Bitmap already exists: %s", name);
33060db6e54aSFam Zheng         return NULL;
33070db6e54aSFam Zheng     }
33085fba6c0eSJohn Snow     sector_granularity = granularity >> BDRV_SECTOR_BITS;
33095fba6c0eSJohn Snow     assert(sector_granularity);
331057322b78SMarkus Armbruster     bitmap_size = bdrv_nb_sectors(bs);
3311b8afb520SFam Zheng     if (bitmap_size < 0) {
3312b8afb520SFam Zheng         error_setg_errno(errp, -bitmap_size, "could not get length of device");
3313b8afb520SFam Zheng         errno = -bitmap_size;
3314b8afb520SFam Zheng         return NULL;
3315b8afb520SFam Zheng     }
33165839e53bSMarkus Armbruster     bitmap = g_new0(BdrvDirtyBitmap, 1);
33175fba6c0eSJohn Snow     bitmap->bitmap = hbitmap_alloc(bitmap_size, ctz32(sector_granularity));
3318e74e6b78SJohn Snow     bitmap->size = bitmap_size;
33190db6e54aSFam Zheng     bitmap->name = g_strdup(name);
3320b8e6fb75SJohn Snow     bitmap->disabled = false;
3321e4654d2dSFam Zheng     QLIST_INSERT_HEAD(&bs->dirty_bitmaps, bitmap, list);
3322e4654d2dSFam Zheng     return bitmap;
3323e4654d2dSFam Zheng }
3324e4654d2dSFam Zheng 
33259bd2b08fSJohn Snow bool bdrv_dirty_bitmap_frozen(BdrvDirtyBitmap *bitmap)
33269bd2b08fSJohn Snow {
33279bd2b08fSJohn Snow     return bitmap->successor;
33289bd2b08fSJohn Snow }
33299bd2b08fSJohn Snow 
3330b8e6fb75SJohn Snow bool bdrv_dirty_bitmap_enabled(BdrvDirtyBitmap *bitmap)
3331b8e6fb75SJohn Snow {
33329bd2b08fSJohn Snow     return !(bitmap->disabled || bitmap->successor);
33339bd2b08fSJohn Snow }
33349bd2b08fSJohn Snow 
33359abe3bdcSJohn Snow DirtyBitmapStatus bdrv_dirty_bitmap_status(BdrvDirtyBitmap *bitmap)
33369abe3bdcSJohn Snow {
33379abe3bdcSJohn Snow     if (bdrv_dirty_bitmap_frozen(bitmap)) {
33389abe3bdcSJohn Snow         return DIRTY_BITMAP_STATUS_FROZEN;
33399abe3bdcSJohn Snow     } else if (!bdrv_dirty_bitmap_enabled(bitmap)) {
33409abe3bdcSJohn Snow         return DIRTY_BITMAP_STATUS_DISABLED;
33419abe3bdcSJohn Snow     } else {
33429abe3bdcSJohn Snow         return DIRTY_BITMAP_STATUS_ACTIVE;
33439abe3bdcSJohn Snow     }
33449abe3bdcSJohn Snow }
33459abe3bdcSJohn Snow 
33469bd2b08fSJohn Snow /**
33479bd2b08fSJohn Snow  * Create a successor bitmap destined to replace this bitmap after an operation.
33489bd2b08fSJohn Snow  * Requires that the bitmap is not frozen and has no successor.
33499bd2b08fSJohn Snow  */
33509bd2b08fSJohn Snow int bdrv_dirty_bitmap_create_successor(BlockDriverState *bs,
33519bd2b08fSJohn Snow                                        BdrvDirtyBitmap *bitmap, Error **errp)
33529bd2b08fSJohn Snow {
33539bd2b08fSJohn Snow     uint64_t granularity;
33549bd2b08fSJohn Snow     BdrvDirtyBitmap *child;
33559bd2b08fSJohn Snow 
33569bd2b08fSJohn Snow     if (bdrv_dirty_bitmap_frozen(bitmap)) {
33579bd2b08fSJohn Snow         error_setg(errp, "Cannot create a successor for a bitmap that is "
33589bd2b08fSJohn Snow                    "currently frozen");
33599bd2b08fSJohn Snow         return -1;
33609bd2b08fSJohn Snow     }
33619bd2b08fSJohn Snow     assert(!bitmap->successor);
33629bd2b08fSJohn Snow 
33639bd2b08fSJohn Snow     /* Create an anonymous successor */
33649bd2b08fSJohn Snow     granularity = bdrv_dirty_bitmap_granularity(bitmap);
33659bd2b08fSJohn Snow     child = bdrv_create_dirty_bitmap(bs, granularity, NULL, errp);
33669bd2b08fSJohn Snow     if (!child) {
33679bd2b08fSJohn Snow         return -1;
33689bd2b08fSJohn Snow     }
33699bd2b08fSJohn Snow 
33709bd2b08fSJohn Snow     /* Successor will be on or off based on our current state. */
33719bd2b08fSJohn Snow     child->disabled = bitmap->disabled;
33729bd2b08fSJohn Snow 
33739bd2b08fSJohn Snow     /* Install the successor and freeze the parent */
33749bd2b08fSJohn Snow     bitmap->successor = child;
33759bd2b08fSJohn Snow     return 0;
33769bd2b08fSJohn Snow }
33779bd2b08fSJohn Snow 
33789bd2b08fSJohn Snow /**
33799bd2b08fSJohn Snow  * For a bitmap with a successor, yield our name to the successor,
33809bd2b08fSJohn Snow  * delete the old bitmap, and return a handle to the new bitmap.
33819bd2b08fSJohn Snow  */
33829bd2b08fSJohn Snow BdrvDirtyBitmap *bdrv_dirty_bitmap_abdicate(BlockDriverState *bs,
33839bd2b08fSJohn Snow                                             BdrvDirtyBitmap *bitmap,
33849bd2b08fSJohn Snow                                             Error **errp)
33859bd2b08fSJohn Snow {
33869bd2b08fSJohn Snow     char *name;
33879bd2b08fSJohn Snow     BdrvDirtyBitmap *successor = bitmap->successor;
33889bd2b08fSJohn Snow 
33899bd2b08fSJohn Snow     if (successor == NULL) {
33909bd2b08fSJohn Snow         error_setg(errp, "Cannot relinquish control if "
33919bd2b08fSJohn Snow                    "there's no successor present");
33929bd2b08fSJohn Snow         return NULL;
33939bd2b08fSJohn Snow     }
33949bd2b08fSJohn Snow 
33959bd2b08fSJohn Snow     name = bitmap->name;
33969bd2b08fSJohn Snow     bitmap->name = NULL;
33979bd2b08fSJohn Snow     successor->name = name;
33989bd2b08fSJohn Snow     bitmap->successor = NULL;
33999bd2b08fSJohn Snow     bdrv_release_dirty_bitmap(bs, bitmap);
34009bd2b08fSJohn Snow 
34019bd2b08fSJohn Snow     return successor;
34029bd2b08fSJohn Snow }
34039bd2b08fSJohn Snow 
34049bd2b08fSJohn Snow /**
34059bd2b08fSJohn Snow  * In cases of failure where we can no longer safely delete the parent,
34069bd2b08fSJohn Snow  * we may wish to re-join the parent and child/successor.
34079bd2b08fSJohn Snow  * The merged parent will be un-frozen, but not explicitly re-enabled.
34089bd2b08fSJohn Snow  */
34099bd2b08fSJohn Snow BdrvDirtyBitmap *bdrv_reclaim_dirty_bitmap(BlockDriverState *bs,
34109bd2b08fSJohn Snow                                            BdrvDirtyBitmap *parent,
34119bd2b08fSJohn Snow                                            Error **errp)
34129bd2b08fSJohn Snow {
34139bd2b08fSJohn Snow     BdrvDirtyBitmap *successor = parent->successor;
34149bd2b08fSJohn Snow 
34159bd2b08fSJohn Snow     if (!successor) {
34169bd2b08fSJohn Snow         error_setg(errp, "Cannot reclaim a successor when none is present");
34179bd2b08fSJohn Snow         return NULL;
34189bd2b08fSJohn Snow     }
34199bd2b08fSJohn Snow 
34209bd2b08fSJohn Snow     if (!hbitmap_merge(parent->bitmap, successor->bitmap)) {
34219bd2b08fSJohn Snow         error_setg(errp, "Merging of parent and successor bitmap failed");
34229bd2b08fSJohn Snow         return NULL;
34239bd2b08fSJohn Snow     }
34249bd2b08fSJohn Snow     bdrv_release_dirty_bitmap(bs, successor);
34259bd2b08fSJohn Snow     parent->successor = NULL;
34269bd2b08fSJohn Snow 
34279bd2b08fSJohn Snow     return parent;
3428b8e6fb75SJohn Snow }
3429b8e6fb75SJohn Snow 
3430ce1ffea8SJohn Snow /**
3431ce1ffea8SJohn Snow  * Truncates _all_ bitmaps attached to a BDS.
3432ce1ffea8SJohn Snow  */
3433ce1ffea8SJohn Snow static void bdrv_dirty_bitmap_truncate(BlockDriverState *bs)
3434ce1ffea8SJohn Snow {
3435ce1ffea8SJohn Snow     BdrvDirtyBitmap *bitmap;
3436ce1ffea8SJohn Snow     uint64_t size = bdrv_nb_sectors(bs);
3437ce1ffea8SJohn Snow 
3438ce1ffea8SJohn Snow     QLIST_FOREACH(bitmap, &bs->dirty_bitmaps, list) {
343906207b0fSJohn Snow         assert(!bdrv_dirty_bitmap_frozen(bitmap));
3440ce1ffea8SJohn Snow         hbitmap_truncate(bitmap->bitmap, size);
34415270b6a0SJohn Snow         bitmap->size = size;
3442ce1ffea8SJohn Snow     }
3443ce1ffea8SJohn Snow }
3444ce1ffea8SJohn Snow 
3445e4654d2dSFam Zheng void bdrv_release_dirty_bitmap(BlockDriverState *bs, BdrvDirtyBitmap *bitmap)
3446e4654d2dSFam Zheng {
3447e4654d2dSFam Zheng     BdrvDirtyBitmap *bm, *next;
3448e4654d2dSFam Zheng     QLIST_FOREACH_SAFE(bm, &bs->dirty_bitmaps, list, next) {
3449e4654d2dSFam Zheng         if (bm == bitmap) {
34509bd2b08fSJohn Snow             assert(!bdrv_dirty_bitmap_frozen(bm));
3451e4654d2dSFam Zheng             QLIST_REMOVE(bitmap, list);
3452e4654d2dSFam Zheng             hbitmap_free(bitmap->bitmap);
34530db6e54aSFam Zheng             g_free(bitmap->name);
3454e4654d2dSFam Zheng             g_free(bitmap);
3455e4654d2dSFam Zheng             return;
34567cd1e32aSlirans@il.ibm.com         }
34577cd1e32aSlirans@il.ibm.com     }
34587cd1e32aSlirans@il.ibm.com }
34597cd1e32aSlirans@il.ibm.com 
3460b8e6fb75SJohn Snow void bdrv_disable_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3461b8e6fb75SJohn Snow {
34629bd2b08fSJohn Snow     assert(!bdrv_dirty_bitmap_frozen(bitmap));
3463b8e6fb75SJohn Snow     bitmap->disabled = true;
3464b8e6fb75SJohn Snow }
3465b8e6fb75SJohn Snow 
3466b8e6fb75SJohn Snow void bdrv_enable_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3467b8e6fb75SJohn Snow {
34689bd2b08fSJohn Snow     assert(!bdrv_dirty_bitmap_frozen(bitmap));
3469b8e6fb75SJohn Snow     bitmap->disabled = false;
3470b8e6fb75SJohn Snow }
3471b8e6fb75SJohn Snow 
347221b56835SFam Zheng BlockDirtyInfoList *bdrv_query_dirty_bitmaps(BlockDriverState *bs)
347321b56835SFam Zheng {
347421b56835SFam Zheng     BdrvDirtyBitmap *bm;
347521b56835SFam Zheng     BlockDirtyInfoList *list = NULL;
347621b56835SFam Zheng     BlockDirtyInfoList **plist = &list;
347721b56835SFam Zheng 
347821b56835SFam Zheng     QLIST_FOREACH(bm, &bs->dirty_bitmaps, list) {
34795839e53bSMarkus Armbruster         BlockDirtyInfo *info = g_new0(BlockDirtyInfo, 1);
34805839e53bSMarkus Armbruster         BlockDirtyInfoList *entry = g_new0(BlockDirtyInfoList, 1);
348120dca810SJohn Snow         info->count = bdrv_get_dirty_count(bm);
3482592fdd02SJohn Snow         info->granularity = bdrv_dirty_bitmap_granularity(bm);
34830db6e54aSFam Zheng         info->has_name = !!bm->name;
34840db6e54aSFam Zheng         info->name = g_strdup(bm->name);
34859abe3bdcSJohn Snow         info->status = bdrv_dirty_bitmap_status(bm);
348621b56835SFam Zheng         entry->value = info;
348721b56835SFam Zheng         *plist = entry;
348821b56835SFam Zheng         plist = &entry->next;
348921b56835SFam Zheng     }
349021b56835SFam Zheng 
349121b56835SFam Zheng     return list;
349221b56835SFam Zheng }
349321b56835SFam Zheng 
3494e4654d2dSFam Zheng int bdrv_get_dirty(BlockDriverState *bs, BdrvDirtyBitmap *bitmap, int64_t sector)
34957cd1e32aSlirans@il.ibm.com {
3496e4654d2dSFam Zheng     if (bitmap) {
3497e4654d2dSFam Zheng         return hbitmap_get(bitmap->bitmap, sector);
34987cd1e32aSlirans@il.ibm.com     } else {
34997cd1e32aSlirans@il.ibm.com         return 0;
35007cd1e32aSlirans@il.ibm.com     }
35017cd1e32aSlirans@il.ibm.com }
35027cd1e32aSlirans@il.ibm.com 
3503341ebc2fSJohn Snow /**
3504341ebc2fSJohn Snow  * Chooses a default granularity based on the existing cluster size,
3505341ebc2fSJohn Snow  * but clamped between [4K, 64K]. Defaults to 64K in the case that there
3506341ebc2fSJohn Snow  * is no cluster size information available.
3507341ebc2fSJohn Snow  */
3508341ebc2fSJohn Snow uint32_t bdrv_get_default_bitmap_granularity(BlockDriverState *bs)
3509341ebc2fSJohn Snow {
3510341ebc2fSJohn Snow     BlockDriverInfo bdi;
3511341ebc2fSJohn Snow     uint32_t granularity;
3512341ebc2fSJohn Snow 
3513341ebc2fSJohn Snow     if (bdrv_get_info(bs, &bdi) >= 0 && bdi.cluster_size > 0) {
3514341ebc2fSJohn Snow         granularity = MAX(4096, bdi.cluster_size);
3515341ebc2fSJohn Snow         granularity = MIN(65536, granularity);
3516341ebc2fSJohn Snow     } else {
3517341ebc2fSJohn Snow         granularity = 65536;
3518341ebc2fSJohn Snow     }
3519341ebc2fSJohn Snow 
3520341ebc2fSJohn Snow     return granularity;
3521341ebc2fSJohn Snow }
3522341ebc2fSJohn Snow 
3523592fdd02SJohn Snow uint32_t bdrv_dirty_bitmap_granularity(BdrvDirtyBitmap *bitmap)
3524592fdd02SJohn Snow {
3525592fdd02SJohn Snow     return BDRV_SECTOR_SIZE << hbitmap_granularity(bitmap->bitmap);
3526592fdd02SJohn Snow }
3527592fdd02SJohn Snow 
352820dca810SJohn Snow void bdrv_dirty_iter_init(BdrvDirtyBitmap *bitmap, HBitmapIter *hbi)
35291755da16SPaolo Bonzini {
3530e4654d2dSFam Zheng     hbitmap_iter_init(hbi, bitmap->bitmap, 0);
35311755da16SPaolo Bonzini }
35321755da16SPaolo Bonzini 
353320dca810SJohn Snow void bdrv_set_dirty_bitmap(BdrvDirtyBitmap *bitmap,
3534c4237dfaSVladimir Sementsov-Ogievskiy                            int64_t cur_sector, int nr_sectors)
3535c4237dfaSVladimir Sementsov-Ogievskiy {
3536b8e6fb75SJohn Snow     assert(bdrv_dirty_bitmap_enabled(bitmap));
3537c4237dfaSVladimir Sementsov-Ogievskiy     hbitmap_set(bitmap->bitmap, cur_sector, nr_sectors);
3538c4237dfaSVladimir Sementsov-Ogievskiy }
3539c4237dfaSVladimir Sementsov-Ogievskiy 
354020dca810SJohn Snow void bdrv_reset_dirty_bitmap(BdrvDirtyBitmap *bitmap,
3541c4237dfaSVladimir Sementsov-Ogievskiy                              int64_t cur_sector, int nr_sectors)
3542c4237dfaSVladimir Sementsov-Ogievskiy {
3543b8e6fb75SJohn Snow     assert(bdrv_dirty_bitmap_enabled(bitmap));
3544c4237dfaSVladimir Sementsov-Ogievskiy     hbitmap_reset(bitmap->bitmap, cur_sector, nr_sectors);
3545c4237dfaSVladimir Sementsov-Ogievskiy }
3546c4237dfaSVladimir Sementsov-Ogievskiy 
3547e74e6b78SJohn Snow void bdrv_clear_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3548e74e6b78SJohn Snow {
3549e74e6b78SJohn Snow     assert(bdrv_dirty_bitmap_enabled(bitmap));
3550c6a8c328SWen Congyang     hbitmap_reset_all(bitmap->bitmap);
3551e74e6b78SJohn Snow }
3552e74e6b78SJohn Snow 
3553e0c47b6cSStefan Hajnoczi void bdrv_set_dirty(BlockDriverState *bs, int64_t cur_sector,
35541755da16SPaolo Bonzini                     int nr_sectors)
35551755da16SPaolo Bonzini {
3556e4654d2dSFam Zheng     BdrvDirtyBitmap *bitmap;
3557e4654d2dSFam Zheng     QLIST_FOREACH(bitmap, &bs->dirty_bitmaps, list) {
3558b8e6fb75SJohn Snow         if (!bdrv_dirty_bitmap_enabled(bitmap)) {
3559b8e6fb75SJohn Snow             continue;
3560b8e6fb75SJohn Snow         }
3561e4654d2dSFam Zheng         hbitmap_set(bitmap->bitmap, cur_sector, nr_sectors);
3562e4654d2dSFam Zheng     }
35631755da16SPaolo Bonzini }
35641755da16SPaolo Bonzini 
3565d58d8453SJohn Snow /**
3566d58d8453SJohn Snow  * Advance an HBitmapIter to an arbitrary offset.
3567d58d8453SJohn Snow  */
3568d58d8453SJohn Snow void bdrv_set_dirty_iter(HBitmapIter *hbi, int64_t offset)
3569d58d8453SJohn Snow {
3570d58d8453SJohn Snow     assert(hbi->hb);
3571d58d8453SJohn Snow     hbitmap_iter_init(hbi, hbi->hb, offset);
3572d58d8453SJohn Snow }
3573d58d8453SJohn Snow 
357420dca810SJohn Snow int64_t bdrv_get_dirty_count(BdrvDirtyBitmap *bitmap)
3575aaa0eb75SLiran Schour {
3576e4654d2dSFam Zheng     return hbitmap_count(bitmap->bitmap);
3577aaa0eb75SLiran Schour }
3578f88e1a42SJes Sorensen 
35799fcb0251SFam Zheng /* Get a reference to bs */
35809fcb0251SFam Zheng void bdrv_ref(BlockDriverState *bs)
35819fcb0251SFam Zheng {
35829fcb0251SFam Zheng     bs->refcnt++;
35839fcb0251SFam Zheng }
35849fcb0251SFam Zheng 
35859fcb0251SFam Zheng /* Release a previously grabbed reference to bs.
35869fcb0251SFam Zheng  * If after releasing, reference count is zero, the BlockDriverState is
35879fcb0251SFam Zheng  * deleted. */
35889fcb0251SFam Zheng void bdrv_unref(BlockDriverState *bs)
35899fcb0251SFam Zheng {
35909a4d5ca6SJeff Cody     if (!bs) {
35919a4d5ca6SJeff Cody         return;
35929a4d5ca6SJeff Cody     }
35939fcb0251SFam Zheng     assert(bs->refcnt > 0);
35949fcb0251SFam Zheng     if (--bs->refcnt == 0) {
35959fcb0251SFam Zheng         bdrv_delete(bs);
35969fcb0251SFam Zheng     }
35979fcb0251SFam Zheng }
35989fcb0251SFam Zheng 
/*
 * One entry of a per-operation blocker list of a BlockDriverState
 * (bs->op_blockers[op]).
 */
3599fbe40ff7SFam Zheng struct BdrvOpBlocker {
    /* Identifies the blocker: bdrv_op_unblock() removes entries by comparing
     * this pointer, and bdrv_op_is_blocked() reports its message. */
3600fbe40ff7SFam Zheng     Error *reason;
    /* Linkage within the op_blockers list the entry was inserted into. */
3601fbe40ff7SFam Zheng     QLIST_ENTRY(BdrvOpBlocker) list;
3602fbe40ff7SFam Zheng };
3603fbe40ff7SFam Zheng 
3604fbe40ff7SFam Zheng bool bdrv_op_is_blocked(BlockDriverState *bs, BlockOpType op, Error **errp)
3605fbe40ff7SFam Zheng {
3606fbe40ff7SFam Zheng     BdrvOpBlocker *blocker;
3607fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3608fbe40ff7SFam Zheng     if (!QLIST_EMPTY(&bs->op_blockers[op])) {
3609fbe40ff7SFam Zheng         blocker = QLIST_FIRST(&bs->op_blockers[op]);
3610fbe40ff7SFam Zheng         if (errp) {
361181e5f78aSAlberto Garcia             error_setg(errp, "Node '%s' is busy: %s",
361281e5f78aSAlberto Garcia                        bdrv_get_device_or_node_name(bs),
3613bfb197e0SMarkus Armbruster                        error_get_pretty(blocker->reason));
3614fbe40ff7SFam Zheng         }
3615fbe40ff7SFam Zheng         return true;
3616fbe40ff7SFam Zheng     }
3617fbe40ff7SFam Zheng     return false;
3618fbe40ff7SFam Zheng }
3619fbe40ff7SFam Zheng 
3620fbe40ff7SFam Zheng void bdrv_op_block(BlockDriverState *bs, BlockOpType op, Error *reason)
3621fbe40ff7SFam Zheng {
3622fbe40ff7SFam Zheng     BdrvOpBlocker *blocker;
3623fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3624fbe40ff7SFam Zheng 
36255839e53bSMarkus Armbruster     blocker = g_new0(BdrvOpBlocker, 1);
3626fbe40ff7SFam Zheng     blocker->reason = reason;
3627fbe40ff7SFam Zheng     QLIST_INSERT_HEAD(&bs->op_blockers[op], blocker, list);
3628fbe40ff7SFam Zheng }
3629fbe40ff7SFam Zheng 
3630fbe40ff7SFam Zheng void bdrv_op_unblock(BlockDriverState *bs, BlockOpType op, Error *reason)
3631fbe40ff7SFam Zheng {
3632fbe40ff7SFam Zheng     BdrvOpBlocker *blocker, *next;
3633fbe40ff7SFam Zheng     assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3634fbe40ff7SFam Zheng     QLIST_FOREACH_SAFE(blocker, &bs->op_blockers[op], list, next) {
3635fbe40ff7SFam Zheng         if (blocker->reason == reason) {
3636fbe40ff7SFam Zheng             QLIST_REMOVE(blocker, list);
3637fbe40ff7SFam Zheng             g_free(blocker);
3638fbe40ff7SFam Zheng         }
3639fbe40ff7SFam Zheng     }
3640fbe40ff7SFam Zheng }
3641fbe40ff7SFam Zheng 
3642fbe40ff7SFam Zheng void bdrv_op_block_all(BlockDriverState *bs, Error *reason)
3643fbe40ff7SFam Zheng {
3644fbe40ff7SFam Zheng     int i;
3645fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3646fbe40ff7SFam Zheng         bdrv_op_block(bs, i, reason);
3647fbe40ff7SFam Zheng     }
3648fbe40ff7SFam Zheng }
3649fbe40ff7SFam Zheng 
3650fbe40ff7SFam Zheng void bdrv_op_unblock_all(BlockDriverState *bs, Error *reason)
3651fbe40ff7SFam Zheng {
3652fbe40ff7SFam Zheng     int i;
3653fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3654fbe40ff7SFam Zheng         bdrv_op_unblock(bs, i, reason);
3655fbe40ff7SFam Zheng     }
3656fbe40ff7SFam Zheng }
3657fbe40ff7SFam Zheng 
3658fbe40ff7SFam Zheng bool bdrv_op_blocker_is_empty(BlockDriverState *bs)
3659fbe40ff7SFam Zheng {
3660fbe40ff7SFam Zheng     int i;
3661fbe40ff7SFam Zheng 
3662fbe40ff7SFam Zheng     for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3663fbe40ff7SFam Zheng         if (!QLIST_EMPTY(&bs->op_blockers[i])) {
3664fbe40ff7SFam Zheng             return false;
3665fbe40ff7SFam Zheng         }
3666fbe40ff7SFam Zheng     }
3667fbe40ff7SFam Zheng     return true;
3668fbe40ff7SFam Zheng }
3669fbe40ff7SFam Zheng 
367028a7282aSLuiz Capitulino void bdrv_iostatus_enable(BlockDriverState *bs)
367128a7282aSLuiz Capitulino {
3672d6bf279eSLuiz Capitulino     bs->iostatus_enabled = true;
367358e21ef5SLuiz Capitulino     bs->iostatus = BLOCK_DEVICE_IO_STATUS_OK;
367428a7282aSLuiz Capitulino }
367528a7282aSLuiz Capitulino 
367628a7282aSLuiz Capitulino /* The I/O status is only enabled if the drive explicitly
367728a7282aSLuiz Capitulino  * enables it _and_ the VM is configured to stop on errors */
367828a7282aSLuiz Capitulino bool bdrv_iostatus_is_enabled(const BlockDriverState *bs)
367928a7282aSLuiz Capitulino {
3680d6bf279eSLuiz Capitulino     return (bs->iostatus_enabled &&
368192aa5c6dSPaolo Bonzini            (bs->on_write_error == BLOCKDEV_ON_ERROR_ENOSPC ||
368292aa5c6dSPaolo Bonzini             bs->on_write_error == BLOCKDEV_ON_ERROR_STOP   ||
368392aa5c6dSPaolo Bonzini             bs->on_read_error == BLOCKDEV_ON_ERROR_STOP));
368428a7282aSLuiz Capitulino }
368528a7282aSLuiz Capitulino 
368628a7282aSLuiz Capitulino void bdrv_iostatus_disable(BlockDriverState *bs)
368728a7282aSLuiz Capitulino {
3688d6bf279eSLuiz Capitulino     bs->iostatus_enabled = false;
368928a7282aSLuiz Capitulino }
369028a7282aSLuiz Capitulino 
369128a7282aSLuiz Capitulino void bdrv_iostatus_reset(BlockDriverState *bs)
369228a7282aSLuiz Capitulino {
369328a7282aSLuiz Capitulino     if (bdrv_iostatus_is_enabled(bs)) {
369458e21ef5SLuiz Capitulino         bs->iostatus = BLOCK_DEVICE_IO_STATUS_OK;
36953bd293c3SPaolo Bonzini         if (bs->job) {
36963bd293c3SPaolo Bonzini             block_job_iostatus_reset(bs->job);
36973bd293c3SPaolo Bonzini         }
369828a7282aSLuiz Capitulino     }
369928a7282aSLuiz Capitulino }
370028a7282aSLuiz Capitulino 
370128a7282aSLuiz Capitulino void bdrv_iostatus_set_err(BlockDriverState *bs, int error)
370228a7282aSLuiz Capitulino {
37033e1caa5fSPaolo Bonzini     assert(bdrv_iostatus_is_enabled(bs));
37043e1caa5fSPaolo Bonzini     if (bs->iostatus == BLOCK_DEVICE_IO_STATUS_OK) {
370558e21ef5SLuiz Capitulino         bs->iostatus = error == ENOSPC ? BLOCK_DEVICE_IO_STATUS_NOSPACE :
370658e21ef5SLuiz Capitulino                                          BLOCK_DEVICE_IO_STATUS_FAILED;
370728a7282aSLuiz Capitulino     }
370828a7282aSLuiz Capitulino }
370928a7282aSLuiz Capitulino 
3710d92ada22SLuiz Capitulino void bdrv_img_create(const char *filename, const char *fmt,
3711f88e1a42SJes Sorensen                      const char *base_filename, const char *base_fmt,
3712f382d43aSMiroslav Rezanina                      char *options, uint64_t img_size, int flags,
3713f382d43aSMiroslav Rezanina                      Error **errp, bool quiet)
3714f88e1a42SJes Sorensen {
371583d0521aSChunyan Liu     QemuOptsList *create_opts = NULL;
371683d0521aSChunyan Liu     QemuOpts *opts = NULL;
371783d0521aSChunyan Liu     const char *backing_fmt, *backing_file;
371883d0521aSChunyan Liu     int64_t size;
3719f88e1a42SJes Sorensen     BlockDriver *drv, *proto_drv;
372096df67d1SStefan Hajnoczi     BlockDriver *backing_drv = NULL;
3721cc84d90fSMax Reitz     Error *local_err = NULL;
3722f88e1a42SJes Sorensen     int ret = 0;
3723f88e1a42SJes Sorensen 
3724f88e1a42SJes Sorensen     /* Find driver and parse its options */
3725f88e1a42SJes Sorensen     drv = bdrv_find_format(fmt);
3726f88e1a42SJes Sorensen     if (!drv) {
372771c79813SLuiz Capitulino         error_setg(errp, "Unknown file format '%s'", fmt);
3728d92ada22SLuiz Capitulino         return;
3729f88e1a42SJes Sorensen     }
3730f88e1a42SJes Sorensen 
3731b65a5e12SMax Reitz     proto_drv = bdrv_find_protocol(filename, true, errp);
3732f88e1a42SJes Sorensen     if (!proto_drv) {
3733d92ada22SLuiz Capitulino         return;
3734f88e1a42SJes Sorensen     }
3735f88e1a42SJes Sorensen 
3736c6149724SMax Reitz     if (!drv->create_opts) {
3737c6149724SMax Reitz         error_setg(errp, "Format driver '%s' does not support image creation",
3738c6149724SMax Reitz                    drv->format_name);
3739c6149724SMax Reitz         return;
3740c6149724SMax Reitz     }
3741c6149724SMax Reitz 
3742c6149724SMax Reitz     if (!proto_drv->create_opts) {
3743c6149724SMax Reitz         error_setg(errp, "Protocol driver '%s' does not support image creation",
3744c6149724SMax Reitz                    proto_drv->format_name);
3745c6149724SMax Reitz         return;
3746c6149724SMax Reitz     }
3747c6149724SMax Reitz 
3748c282e1fdSChunyan Liu     create_opts = qemu_opts_append(create_opts, drv->create_opts);
3749c282e1fdSChunyan Liu     create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
3750f88e1a42SJes Sorensen 
3751f88e1a42SJes Sorensen     /* Create parameter list with default values */
375283d0521aSChunyan Liu     opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
375339101f25SMarkus Armbruster     qemu_opt_set_number(opts, BLOCK_OPT_SIZE, img_size, &error_abort);
3754f88e1a42SJes Sorensen 
3755f88e1a42SJes Sorensen     /* Parse -o options */
3756f88e1a42SJes Sorensen     if (options) {
3757dc523cd3SMarkus Armbruster         qemu_opts_do_parse(opts, options, NULL, &local_err);
3758dc523cd3SMarkus Armbruster         if (local_err) {
3759dc523cd3SMarkus Armbruster             error_report_err(local_err);
3760dc523cd3SMarkus Armbruster             local_err = NULL;
376183d0521aSChunyan Liu             error_setg(errp, "Invalid options for file format '%s'", fmt);
3762f88e1a42SJes Sorensen             goto out;
3763f88e1a42SJes Sorensen         }
3764f88e1a42SJes Sorensen     }
3765f88e1a42SJes Sorensen 
3766f88e1a42SJes Sorensen     if (base_filename) {
3767f43e47dbSMarkus Armbruster         qemu_opt_set(opts, BLOCK_OPT_BACKING_FILE, base_filename, &local_err);
37686be4194bSMarkus Armbruster         if (local_err) {
376971c79813SLuiz Capitulino             error_setg(errp, "Backing file not supported for file format '%s'",
377071c79813SLuiz Capitulino                        fmt);
3771f88e1a42SJes Sorensen             goto out;
3772f88e1a42SJes Sorensen         }
3773f88e1a42SJes Sorensen     }
3774f88e1a42SJes Sorensen 
3775f88e1a42SJes Sorensen     if (base_fmt) {
3776f43e47dbSMarkus Armbruster         qemu_opt_set(opts, BLOCK_OPT_BACKING_FMT, base_fmt, &local_err);
37776be4194bSMarkus Armbruster         if (local_err) {
377871c79813SLuiz Capitulino             error_setg(errp, "Backing file format not supported for file "
377971c79813SLuiz Capitulino                              "format '%s'", fmt);
3780f88e1a42SJes Sorensen             goto out;
3781f88e1a42SJes Sorensen         }
3782f88e1a42SJes Sorensen     }
3783f88e1a42SJes Sorensen 
378483d0521aSChunyan Liu     backing_file = qemu_opt_get(opts, BLOCK_OPT_BACKING_FILE);
378583d0521aSChunyan Liu     if (backing_file) {
378683d0521aSChunyan Liu         if (!strcmp(filename, backing_file)) {
378771c79813SLuiz Capitulino             error_setg(errp, "Error: Trying to create an image with the "
378871c79813SLuiz Capitulino                              "same filename as the backing file");
3789792da93aSJes Sorensen             goto out;
3790792da93aSJes Sorensen         }
3791792da93aSJes Sorensen     }
3792792da93aSJes Sorensen 
379383d0521aSChunyan Liu     backing_fmt = qemu_opt_get(opts, BLOCK_OPT_BACKING_FMT);
379483d0521aSChunyan Liu     if (backing_fmt) {
379583d0521aSChunyan Liu         backing_drv = bdrv_find_format(backing_fmt);
379696df67d1SStefan Hajnoczi         if (!backing_drv) {
379771c79813SLuiz Capitulino             error_setg(errp, "Unknown backing file format '%s'",
379883d0521aSChunyan Liu                        backing_fmt);
3799f88e1a42SJes Sorensen             goto out;
3800f88e1a42SJes Sorensen         }
3801f88e1a42SJes Sorensen     }
3802f88e1a42SJes Sorensen 
3803f88e1a42SJes Sorensen     // The size for the image must always be specified, with one exception:
3804f88e1a42SJes Sorensen     // If we are using a backing file, we can obtain the size from there
380583d0521aSChunyan Liu     size = qemu_opt_get_size(opts, BLOCK_OPT_SIZE, 0);
380683d0521aSChunyan Liu     if (size == -1) {
380783d0521aSChunyan Liu         if (backing_file) {
380866f6b814SMax Reitz             BlockDriverState *bs;
380929168018SMax Reitz             char *full_backing = g_new0(char, PATH_MAX);
381052bf1e72SMarkus Armbruster             int64_t size;
381163090dacSPaolo Bonzini             int back_flags;
381263090dacSPaolo Bonzini 
381329168018SMax Reitz             bdrv_get_full_backing_filename_from_filename(filename, backing_file,
381429168018SMax Reitz                                                          full_backing, PATH_MAX,
381529168018SMax Reitz                                                          &local_err);
381629168018SMax Reitz             if (local_err) {
381729168018SMax Reitz                 g_free(full_backing);
381829168018SMax Reitz                 goto out;
381929168018SMax Reitz             }
382029168018SMax Reitz 
382163090dacSPaolo Bonzini             /* backing files always opened read-only */
382263090dacSPaolo Bonzini             back_flags =
382363090dacSPaolo Bonzini                 flags & ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
3824f88e1a42SJes Sorensen 
3825f67503e5SMax Reitz             bs = NULL;
382629168018SMax Reitz             ret = bdrv_open(&bs, full_backing, NULL, NULL, back_flags,
3827cc84d90fSMax Reitz                             backing_drv, &local_err);
382829168018SMax Reitz             g_free(full_backing);
3829f88e1a42SJes Sorensen             if (ret < 0) {
3830f88e1a42SJes Sorensen                 goto out;
3831f88e1a42SJes Sorensen             }
383252bf1e72SMarkus Armbruster             size = bdrv_getlength(bs);
383352bf1e72SMarkus Armbruster             if (size < 0) {
383452bf1e72SMarkus Armbruster                 error_setg_errno(errp, -size, "Could not get size of '%s'",
383552bf1e72SMarkus Armbruster                                  backing_file);
383652bf1e72SMarkus Armbruster                 bdrv_unref(bs);
383752bf1e72SMarkus Armbruster                 goto out;
383852bf1e72SMarkus Armbruster             }
3839f88e1a42SJes Sorensen 
384039101f25SMarkus Armbruster             qemu_opt_set_number(opts, BLOCK_OPT_SIZE, size, &error_abort);
384166f6b814SMax Reitz 
384266f6b814SMax Reitz             bdrv_unref(bs);
3843f88e1a42SJes Sorensen         } else {
384471c79813SLuiz Capitulino             error_setg(errp, "Image creation needs a size parameter");
3845f88e1a42SJes Sorensen             goto out;
3846f88e1a42SJes Sorensen         }
3847f88e1a42SJes Sorensen     }
3848f88e1a42SJes Sorensen 
3849f382d43aSMiroslav Rezanina     if (!quiet) {
3850f88e1a42SJes Sorensen         printf("Formatting '%s', fmt=%s", filename, fmt);
385143c5d8f8SFam Zheng         qemu_opts_print(opts, " ");
3852f88e1a42SJes Sorensen         puts("");
3853f382d43aSMiroslav Rezanina     }
385483d0521aSChunyan Liu 
3855c282e1fdSChunyan Liu     ret = bdrv_create(drv, filename, opts, &local_err);
385683d0521aSChunyan Liu 
3857cc84d90fSMax Reitz     if (ret == -EFBIG) {
3858cc84d90fSMax Reitz         /* This is generally a better message than whatever the driver would
3859cc84d90fSMax Reitz          * deliver (especially because of the cluster_size_hint), since that
3860cc84d90fSMax Reitz          * is most probably not much different from "image too large". */
3861f3f4d2c0SKevin Wolf         const char *cluster_size_hint = "";
386283d0521aSChunyan Liu         if (qemu_opt_get_size(opts, BLOCK_OPT_CLUSTER_SIZE, 0)) {
3863f3f4d2c0SKevin Wolf             cluster_size_hint = " (try using a larger cluster size)";
3864f3f4d2c0SKevin Wolf         }
3865cc84d90fSMax Reitz         error_setg(errp, "The image size is too large for file format '%s'"
3866cc84d90fSMax Reitz                    "%s", fmt, cluster_size_hint);
3867cc84d90fSMax Reitz         error_free(local_err);
3868cc84d90fSMax Reitz         local_err = NULL;
3869f88e1a42SJes Sorensen     }
3870f88e1a42SJes Sorensen 
3871f88e1a42SJes Sorensen out:
387283d0521aSChunyan Liu     qemu_opts_del(opts);
387383d0521aSChunyan Liu     qemu_opts_free(create_opts);
387484d18f06SMarkus Armbruster     if (local_err) {
3875cc84d90fSMax Reitz         error_propagate(errp, local_err);
3876cc84d90fSMax Reitz     }
3877f88e1a42SJes Sorensen }
387885d126f3SStefan Hajnoczi 
387985d126f3SStefan Hajnoczi AioContext *bdrv_get_aio_context(BlockDriverState *bs)
388085d126f3SStefan Hajnoczi {
3881dcd04228SStefan Hajnoczi     return bs->aio_context;
3882dcd04228SStefan Hajnoczi }
3883dcd04228SStefan Hajnoczi 
3884dcd04228SStefan Hajnoczi void bdrv_detach_aio_context(BlockDriverState *bs)
3885dcd04228SStefan Hajnoczi {
388633384421SMax Reitz     BdrvAioNotifier *baf;
388733384421SMax Reitz 
3888dcd04228SStefan Hajnoczi     if (!bs->drv) {
3889dcd04228SStefan Hajnoczi         return;
3890dcd04228SStefan Hajnoczi     }
3891dcd04228SStefan Hajnoczi 
389233384421SMax Reitz     QLIST_FOREACH(baf, &bs->aio_notifiers, list) {
389333384421SMax Reitz         baf->detach_aio_context(baf->opaque);
389433384421SMax Reitz     }
389533384421SMax Reitz 
389613af91ebSStefan Hajnoczi     if (bs->io_limits_enabled) {
38970e5b0a2dSBenoît Canet         throttle_timers_detach_aio_context(&bs->throttle_timers);
389813af91ebSStefan Hajnoczi     }
3899dcd04228SStefan Hajnoczi     if (bs->drv->bdrv_detach_aio_context) {
3900dcd04228SStefan Hajnoczi         bs->drv->bdrv_detach_aio_context(bs);
3901dcd04228SStefan Hajnoczi     }
3902dcd04228SStefan Hajnoczi     if (bs->file) {
3903dcd04228SStefan Hajnoczi         bdrv_detach_aio_context(bs->file);
3904dcd04228SStefan Hajnoczi     }
3905dcd04228SStefan Hajnoczi     if (bs->backing_hd) {
3906dcd04228SStefan Hajnoczi         bdrv_detach_aio_context(bs->backing_hd);
3907dcd04228SStefan Hajnoczi     }
3908dcd04228SStefan Hajnoczi 
3909dcd04228SStefan Hajnoczi     bs->aio_context = NULL;
3910dcd04228SStefan Hajnoczi }
3911dcd04228SStefan Hajnoczi 
3912dcd04228SStefan Hajnoczi void bdrv_attach_aio_context(BlockDriverState *bs,
3913dcd04228SStefan Hajnoczi                              AioContext *new_context)
3914dcd04228SStefan Hajnoczi {
391533384421SMax Reitz     BdrvAioNotifier *ban;
391633384421SMax Reitz 
3917dcd04228SStefan Hajnoczi     if (!bs->drv) {
3918dcd04228SStefan Hajnoczi         return;
3919dcd04228SStefan Hajnoczi     }
3920dcd04228SStefan Hajnoczi 
3921dcd04228SStefan Hajnoczi     bs->aio_context = new_context;
3922dcd04228SStefan Hajnoczi 
3923dcd04228SStefan Hajnoczi     if (bs->backing_hd) {
3924dcd04228SStefan Hajnoczi         bdrv_attach_aio_context(bs->backing_hd, new_context);
3925dcd04228SStefan Hajnoczi     }
3926dcd04228SStefan Hajnoczi     if (bs->file) {
3927dcd04228SStefan Hajnoczi         bdrv_attach_aio_context(bs->file, new_context);
3928dcd04228SStefan Hajnoczi     }
3929dcd04228SStefan Hajnoczi     if (bs->drv->bdrv_attach_aio_context) {
3930dcd04228SStefan Hajnoczi         bs->drv->bdrv_attach_aio_context(bs, new_context);
3931dcd04228SStefan Hajnoczi     }
393213af91ebSStefan Hajnoczi     if (bs->io_limits_enabled) {
39330e5b0a2dSBenoît Canet         throttle_timers_attach_aio_context(&bs->throttle_timers, new_context);
393413af91ebSStefan Hajnoczi     }
393533384421SMax Reitz 
393633384421SMax Reitz     QLIST_FOREACH(ban, &bs->aio_notifiers, list) {
393733384421SMax Reitz         ban->attached_aio_context(new_context, ban->opaque);
393833384421SMax Reitz     }
3939dcd04228SStefan Hajnoczi }
3940dcd04228SStefan Hajnoczi 
3941dcd04228SStefan Hajnoczi void bdrv_set_aio_context(BlockDriverState *bs, AioContext *new_context)
3942dcd04228SStefan Hajnoczi {
394353ec73e2SFam Zheng     bdrv_drain(bs); /* ensure there are no in-flight requests */
3944dcd04228SStefan Hajnoczi 
3945dcd04228SStefan Hajnoczi     bdrv_detach_aio_context(bs);
3946dcd04228SStefan Hajnoczi 
3947dcd04228SStefan Hajnoczi     /* This function executes in the old AioContext so acquire the new one in
3948dcd04228SStefan Hajnoczi      * case it runs in a different thread.
3949dcd04228SStefan Hajnoczi      */
3950dcd04228SStefan Hajnoczi     aio_context_acquire(new_context);
3951dcd04228SStefan Hajnoczi     bdrv_attach_aio_context(bs, new_context);
3952dcd04228SStefan Hajnoczi     aio_context_release(new_context);
395385d126f3SStefan Hajnoczi }
3954d616b224SStefan Hajnoczi 
395533384421SMax Reitz void bdrv_add_aio_context_notifier(BlockDriverState *bs,
395633384421SMax Reitz         void (*attached_aio_context)(AioContext *new_context, void *opaque),
395733384421SMax Reitz         void (*detach_aio_context)(void *opaque), void *opaque)
395833384421SMax Reitz {
395933384421SMax Reitz     BdrvAioNotifier *ban = g_new(BdrvAioNotifier, 1);
396033384421SMax Reitz     *ban = (BdrvAioNotifier){
396133384421SMax Reitz         .attached_aio_context = attached_aio_context,
396233384421SMax Reitz         .detach_aio_context   = detach_aio_context,
396333384421SMax Reitz         .opaque               = opaque
396433384421SMax Reitz     };
396533384421SMax Reitz 
396633384421SMax Reitz     QLIST_INSERT_HEAD(&bs->aio_notifiers, ban, list);
396733384421SMax Reitz }
396833384421SMax Reitz 
396933384421SMax Reitz void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
397033384421SMax Reitz                                       void (*attached_aio_context)(AioContext *,
397133384421SMax Reitz                                                                    void *),
397233384421SMax Reitz                                       void (*detach_aio_context)(void *),
397333384421SMax Reitz                                       void *opaque)
397433384421SMax Reitz {
397533384421SMax Reitz     BdrvAioNotifier *ban, *ban_next;
397633384421SMax Reitz 
397733384421SMax Reitz     QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
397833384421SMax Reitz         if (ban->attached_aio_context == attached_aio_context &&
397933384421SMax Reitz             ban->detach_aio_context   == detach_aio_context   &&
398033384421SMax Reitz             ban->opaque               == opaque)
398133384421SMax Reitz         {
398233384421SMax Reitz             QLIST_REMOVE(ban, list);
398333384421SMax Reitz             g_free(ban);
398433384421SMax Reitz 
398533384421SMax Reitz             return;
398633384421SMax Reitz         }
398733384421SMax Reitz     }
398833384421SMax Reitz 
398933384421SMax Reitz     abort();
399033384421SMax Reitz }
399133384421SMax Reitz 
399277485434SMax Reitz int bdrv_amend_options(BlockDriverState *bs, QemuOpts *opts,
399377485434SMax Reitz                        BlockDriverAmendStatusCB *status_cb)
39946f176b48SMax Reitz {
3995c282e1fdSChunyan Liu     if (!bs->drv->bdrv_amend_options) {
39966f176b48SMax Reitz         return -ENOTSUP;
39976f176b48SMax Reitz     }
399877485434SMax Reitz     return bs->drv->bdrv_amend_options(bs, opts, status_cb);
39996f176b48SMax Reitz }
4000f6186f49SBenoît Canet 
4001b5042a36SBenoît Canet /* This function will be called by the bdrv_recurse_is_first_non_filter method
4002b5042a36SBenoît Canet  * of block filter and by bdrv_is_first_non_filter.
4003b5042a36SBenoît Canet  * It is used to test if the given bs is the candidate or recurse more in the
4004b5042a36SBenoît Canet  * node graph.
4005212a5a8fSBenoît Canet  */
4006212a5a8fSBenoît Canet bool bdrv_recurse_is_first_non_filter(BlockDriverState *bs,
4007212a5a8fSBenoît Canet                                       BlockDriverState *candidate)
4008f6186f49SBenoît Canet {
4009b5042a36SBenoît Canet     /* return false if basic checks fails */
4010b5042a36SBenoît Canet     if (!bs || !bs->drv) {
4011b5042a36SBenoît Canet         return false;
4012b5042a36SBenoît Canet     }
4013b5042a36SBenoît Canet 
4014b5042a36SBenoît Canet     /* the code reached a non block filter driver -> check if the bs is
4015b5042a36SBenoît Canet      * the same as the candidate. It's the recursion termination condition.
4016b5042a36SBenoît Canet      */
4017b5042a36SBenoît Canet     if (!bs->drv->is_filter) {
4018b5042a36SBenoît Canet         return bs == candidate;
4019b5042a36SBenoît Canet     }
4020b5042a36SBenoît Canet     /* Down this path the driver is a block filter driver */
4021b5042a36SBenoît Canet 
4022b5042a36SBenoît Canet     /* If the block filter recursion method is defined use it to recurse down
4023b5042a36SBenoît Canet      * the node graph.
4024b5042a36SBenoît Canet      */
4025b5042a36SBenoît Canet     if (bs->drv->bdrv_recurse_is_first_non_filter) {
4026212a5a8fSBenoît Canet         return bs->drv->bdrv_recurse_is_first_non_filter(bs, candidate);
4027212a5a8fSBenoît Canet     }
4028212a5a8fSBenoît Canet 
4029b5042a36SBenoît Canet     /* the driver is a block filter but don't allow to recurse -> return false
4030b5042a36SBenoît Canet      */
4031b5042a36SBenoît Canet     return false;
4032212a5a8fSBenoît Canet }
4033212a5a8fSBenoît Canet 
4034212a5a8fSBenoît Canet /* This function checks if the candidate is the first non filter bs down it's
4035212a5a8fSBenoît Canet  * bs chain. Since we don't have pointers to parents it explore all bs chains
4036212a5a8fSBenoît Canet  * from the top. Some filters can choose not to pass down the recursion.
4037212a5a8fSBenoît Canet  */
4038212a5a8fSBenoît Canet bool bdrv_is_first_non_filter(BlockDriverState *candidate)
4039212a5a8fSBenoît Canet {
4040212a5a8fSBenoît Canet     BlockDriverState *bs;
4041212a5a8fSBenoît Canet 
4042212a5a8fSBenoît Canet     /* walk down the bs forest recursively */
4043212a5a8fSBenoît Canet     QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
4044212a5a8fSBenoît Canet         bool perm;
4045212a5a8fSBenoît Canet 
4046b5042a36SBenoît Canet         /* try to recurse in this top level bs */
4047e6dc8a1fSKevin Wolf         perm = bdrv_recurse_is_first_non_filter(bs, candidate);
4048212a5a8fSBenoît Canet 
4049212a5a8fSBenoît Canet         /* candidate is the first non filter */
4050212a5a8fSBenoît Canet         if (perm) {
4051212a5a8fSBenoît Canet             return true;
4052212a5a8fSBenoît Canet         }
4053212a5a8fSBenoît Canet     }
4054212a5a8fSBenoît Canet 
4055212a5a8fSBenoît Canet     return false;
4056f6186f49SBenoît Canet }
405709158f00SBenoît Canet 
405809158f00SBenoît Canet BlockDriverState *check_to_replace_node(const char *node_name, Error **errp)
405909158f00SBenoît Canet {
406009158f00SBenoît Canet     BlockDriverState *to_replace_bs = bdrv_find_node(node_name);
40615a7e7a0bSStefan Hajnoczi     AioContext *aio_context;
40625a7e7a0bSStefan Hajnoczi 
406309158f00SBenoît Canet     if (!to_replace_bs) {
406409158f00SBenoît Canet         error_setg(errp, "Node name '%s' not found", node_name);
406509158f00SBenoît Canet         return NULL;
406609158f00SBenoît Canet     }
406709158f00SBenoît Canet 
40685a7e7a0bSStefan Hajnoczi     aio_context = bdrv_get_aio_context(to_replace_bs);
40695a7e7a0bSStefan Hajnoczi     aio_context_acquire(aio_context);
40705a7e7a0bSStefan Hajnoczi 
407109158f00SBenoît Canet     if (bdrv_op_is_blocked(to_replace_bs, BLOCK_OP_TYPE_REPLACE, errp)) {
40725a7e7a0bSStefan Hajnoczi         to_replace_bs = NULL;
40735a7e7a0bSStefan Hajnoczi         goto out;
407409158f00SBenoît Canet     }
407509158f00SBenoît Canet 
407609158f00SBenoît Canet     /* We don't want arbitrary node of the BDS chain to be replaced only the top
407709158f00SBenoît Canet      * most non filter in order to prevent data corruption.
407809158f00SBenoît Canet      * Another benefit is that this tests exclude backing files which are
407909158f00SBenoît Canet      * blocked by the backing blockers.
408009158f00SBenoît Canet      */
408109158f00SBenoît Canet     if (!bdrv_is_first_non_filter(to_replace_bs)) {
408209158f00SBenoît Canet         error_setg(errp, "Only top most non filter can be replaced");
40835a7e7a0bSStefan Hajnoczi         to_replace_bs = NULL;
40845a7e7a0bSStefan Hajnoczi         goto out;
408509158f00SBenoît Canet     }
408609158f00SBenoît Canet 
40875a7e7a0bSStefan Hajnoczi out:
40885a7e7a0bSStefan Hajnoczi     aio_context_release(aio_context);
408909158f00SBenoît Canet     return to_replace_bs;
409009158f00SBenoît Canet }
4091448ad91dSMing Lei 
409291af7014SMax Reitz static bool append_open_options(QDict *d, BlockDriverState *bs)
409391af7014SMax Reitz {
409491af7014SMax Reitz     const QDictEntry *entry;
409591af7014SMax Reitz     bool found_any = false;
409691af7014SMax Reitz 
409791af7014SMax Reitz     for (entry = qdict_first(bs->options); entry;
409891af7014SMax Reitz          entry = qdict_next(bs->options, entry))
409991af7014SMax Reitz     {
410091af7014SMax Reitz         /* Only take options for this level and exclude all non-driver-specific
410191af7014SMax Reitz          * options */
410291af7014SMax Reitz         if (!strchr(qdict_entry_key(entry), '.') &&
410391af7014SMax Reitz             strcmp(qdict_entry_key(entry), "node-name"))
410491af7014SMax Reitz         {
410591af7014SMax Reitz             qobject_incref(qdict_entry_value(entry));
410691af7014SMax Reitz             qdict_put_obj(d, qdict_entry_key(entry), qdict_entry_value(entry));
410791af7014SMax Reitz             found_any = true;
410891af7014SMax Reitz         }
410991af7014SMax Reitz     }
411091af7014SMax Reitz 
411191af7014SMax Reitz     return found_any;
411291af7014SMax Reitz }
411391af7014SMax Reitz 
411491af7014SMax Reitz /* Updates the following BDS fields:
411591af7014SMax Reitz  *  - exact_filename: A filename which may be used for opening a block device
411691af7014SMax Reitz  *                    which (mostly) equals the given BDS (even without any
411791af7014SMax Reitz  *                    other options; so reading and writing must return the same
411891af7014SMax Reitz  *                    results, but caching etc. may be different)
411991af7014SMax Reitz  *  - full_open_options: Options which, when given when opening a block device
412091af7014SMax Reitz  *                       (without a filename), result in a BDS (mostly)
412191af7014SMax Reitz  *                       equalling the given one
412291af7014SMax Reitz  *  - filename: If exact_filename is set, it is copied here. Otherwise,
412391af7014SMax Reitz  *              full_open_options is converted to a JSON object, prefixed with
412491af7014SMax Reitz  *              "json:" (for use through the JSON pseudo protocol) and put here.
412591af7014SMax Reitz  */
412691af7014SMax Reitz void bdrv_refresh_filename(BlockDriverState *bs)
412791af7014SMax Reitz {
412891af7014SMax Reitz     BlockDriver *drv = bs->drv;
412991af7014SMax Reitz     QDict *opts;
413091af7014SMax Reitz 
413191af7014SMax Reitz     if (!drv) {
413291af7014SMax Reitz         return;
413391af7014SMax Reitz     }
413491af7014SMax Reitz 
413591af7014SMax Reitz     /* This BDS's file name will most probably depend on its file's name, so
413691af7014SMax Reitz      * refresh that first */
413791af7014SMax Reitz     if (bs->file) {
413891af7014SMax Reitz         bdrv_refresh_filename(bs->file);
413991af7014SMax Reitz     }
414091af7014SMax Reitz 
414191af7014SMax Reitz     if (drv->bdrv_refresh_filename) {
414291af7014SMax Reitz         /* Obsolete information is of no use here, so drop the old file name
414391af7014SMax Reitz          * information before refreshing it */
414491af7014SMax Reitz         bs->exact_filename[0] = '\0';
414591af7014SMax Reitz         if (bs->full_open_options) {
414691af7014SMax Reitz             QDECREF(bs->full_open_options);
414791af7014SMax Reitz             bs->full_open_options = NULL;
414891af7014SMax Reitz         }
414991af7014SMax Reitz 
415091af7014SMax Reitz         drv->bdrv_refresh_filename(bs);
415191af7014SMax Reitz     } else if (bs->file) {
415291af7014SMax Reitz         /* Try to reconstruct valid information from the underlying file */
415391af7014SMax Reitz         bool has_open_options;
415491af7014SMax Reitz 
415591af7014SMax Reitz         bs->exact_filename[0] = '\0';
415691af7014SMax Reitz         if (bs->full_open_options) {
415791af7014SMax Reitz             QDECREF(bs->full_open_options);
415891af7014SMax Reitz             bs->full_open_options = NULL;
415991af7014SMax Reitz         }
416091af7014SMax Reitz 
416191af7014SMax Reitz         opts = qdict_new();
416291af7014SMax Reitz         has_open_options = append_open_options(opts, bs);
416391af7014SMax Reitz 
416491af7014SMax Reitz         /* If no specific options have been given for this BDS, the filename of
416591af7014SMax Reitz          * the underlying file should suffice for this one as well */
416691af7014SMax Reitz         if (bs->file->exact_filename[0] && !has_open_options) {
416791af7014SMax Reitz             strcpy(bs->exact_filename, bs->file->exact_filename);
416891af7014SMax Reitz         }
416991af7014SMax Reitz         /* Reconstructing the full options QDict is simple for most format block
417091af7014SMax Reitz          * drivers, as long as the full options are known for the underlying
417191af7014SMax Reitz          * file BDS. The full options QDict of that file BDS should somehow
417291af7014SMax Reitz          * contain a representation of the filename, therefore the following
417391af7014SMax Reitz          * suffices without querying the (exact_)filename of this BDS. */
417491af7014SMax Reitz         if (bs->file->full_open_options) {
417591af7014SMax Reitz             qdict_put_obj(opts, "driver",
417691af7014SMax Reitz                           QOBJECT(qstring_from_str(drv->format_name)));
417791af7014SMax Reitz             QINCREF(bs->file->full_open_options);
417891af7014SMax Reitz             qdict_put_obj(opts, "file", QOBJECT(bs->file->full_open_options));
417991af7014SMax Reitz 
418091af7014SMax Reitz             bs->full_open_options = opts;
418191af7014SMax Reitz         } else {
418291af7014SMax Reitz             QDECREF(opts);
418391af7014SMax Reitz         }
418491af7014SMax Reitz     } else if (!bs->full_open_options && qdict_size(bs->options)) {
418591af7014SMax Reitz         /* There is no underlying file BDS (at least referenced by BDS.file),
418691af7014SMax Reitz          * so the full options QDict should be equal to the options given
418791af7014SMax Reitz          * specifically for this block device when it was opened (plus the
418891af7014SMax Reitz          * driver specification).
418991af7014SMax Reitz          * Because those options don't change, there is no need to update
419091af7014SMax Reitz          * full_open_options when it's already set. */
419191af7014SMax Reitz 
419291af7014SMax Reitz         opts = qdict_new();
419391af7014SMax Reitz         append_open_options(opts, bs);
419491af7014SMax Reitz         qdict_put_obj(opts, "driver",
419591af7014SMax Reitz                       QOBJECT(qstring_from_str(drv->format_name)));
419691af7014SMax Reitz 
419791af7014SMax Reitz         if (bs->exact_filename[0]) {
419891af7014SMax Reitz             /* This may not work for all block protocol drivers (some may
419991af7014SMax Reitz              * require this filename to be parsed), but we have to find some
420091af7014SMax Reitz              * default solution here, so just include it. If some block driver
420191af7014SMax Reitz              * does not support pure options without any filename at all or
420291af7014SMax Reitz              * needs some special format of the options QDict, it needs to
420391af7014SMax Reitz              * implement the driver-specific bdrv_refresh_filename() function.
420491af7014SMax Reitz              */
420591af7014SMax Reitz             qdict_put_obj(opts, "filename",
420691af7014SMax Reitz                           QOBJECT(qstring_from_str(bs->exact_filename)));
420791af7014SMax Reitz         }
420891af7014SMax Reitz 
420991af7014SMax Reitz         bs->full_open_options = opts;
421091af7014SMax Reitz     }
421191af7014SMax Reitz 
421291af7014SMax Reitz     if (bs->exact_filename[0]) {
421391af7014SMax Reitz         pstrcpy(bs->filename, sizeof(bs->filename), bs->exact_filename);
421491af7014SMax Reitz     } else if (bs->full_open_options) {
421591af7014SMax Reitz         QString *json = qobject_to_json(QOBJECT(bs->full_open_options));
421691af7014SMax Reitz         snprintf(bs->filename, sizeof(bs->filename), "json:%s",
421791af7014SMax Reitz                  qstring_get_str(json));
421891af7014SMax Reitz         QDECREF(json);
421991af7014SMax Reitz     }
422091af7014SMax Reitz }
42215366d0c8SBenoît Canet 
42225366d0c8SBenoît Canet /* This accessor function purpose is to allow the device models to access the
42235366d0c8SBenoît Canet  * BlockAcctStats structure embedded inside a BlockDriverState without being
42245366d0c8SBenoît Canet  * aware of the BlockDriverState structure layout.
42255366d0c8SBenoît Canet  * It will go away when the BlockAcctStats structure will be moved inside
42265366d0c8SBenoît Canet  * the device models.
42275366d0c8SBenoît Canet  */
42285366d0c8SBenoît Canet BlockAcctStats *bdrv_get_stats(BlockDriverState *bs)
42295366d0c8SBenoît Canet {
42305366d0c8SBenoît Canet     return &bs->stats;
42315366d0c8SBenoît Canet }
4232