xref: /openbmc/qemu/block.c (revision c5fbe57111ef59c315a71cd80e8b0af59e36ff21)
/*
 * QEMU System Emulator block driver
 *
 * Copyright (c) 2003 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
243990d09aSblueswir1 #include "config-host.h"
25faf07963Spbrook #include "qemu-common.h"
266d519a5fSStefan Hajnoczi #include "trace.h"
27376253ecSaliguori #include "monitor.h"
28ea2384d3Sbellard #include "block_int.h"
295efa9d5aSAnthony Liguori #include "module.h"
30d15e5465SLuiz Capitulino #include "qemu-objects.h"
3168485420SKevin Wolf #include "qemu-coroutine.h"
32fc01f7e7Sbellard 
3371e72a19SJuan Quintela #ifdef CONFIG_BSD
347674e7bfSbellard #include <sys/types.h>
357674e7bfSbellard #include <sys/stat.h>
367674e7bfSbellard #include <sys/ioctl.h>
3772cf2d4fSBlue Swirl #include <sys/queue.h>
38c5e97233Sblueswir1 #ifndef __DragonFly__
397674e7bfSbellard #include <sys/disk.h>
407674e7bfSbellard #endif
41c5e97233Sblueswir1 #endif
427674e7bfSbellard 
4349dc768dSaliguori #ifdef _WIN32
4449dc768dSaliguori #include <windows.h>
4549dc768dSaliguori #endif
4649dc768dSaliguori 
477d4b4ba5SMarkus Armbruster static void bdrv_dev_change_media_cb(BlockDriverState *bs, bool load);
48f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_readv_em(BlockDriverState *bs,
49f141eafeSaliguori         int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
50c87c0672Saliguori         BlockDriverCompletionFunc *cb, void *opaque);
51f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_writev_em(BlockDriverState *bs,
52f141eafeSaliguori         int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
53ce1a14dcSpbrook         BlockDriverCompletionFunc *cb, void *opaque);
54b2e12bc6SChristoph Hellwig static BlockDriverAIOCB *bdrv_aio_flush_em(BlockDriverState *bs,
55b2e12bc6SChristoph Hellwig         BlockDriverCompletionFunc *cb, void *opaque);
56016f5cf6SAlexander Graf static BlockDriverAIOCB *bdrv_aio_noop_em(BlockDriverState *bs,
57016f5cf6SAlexander Graf         BlockDriverCompletionFunc *cb, void *opaque);
5883f64091Sbellard static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num,
5983f64091Sbellard                         uint8_t *buf, int nb_sectors);
6083f64091Sbellard static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num,
6183f64091Sbellard                          const uint8_t *buf, int nb_sectors);
6268485420SKevin Wolf static BlockDriverAIOCB *bdrv_co_aio_readv_em(BlockDriverState *bs,
6368485420SKevin Wolf         int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
6468485420SKevin Wolf         BlockDriverCompletionFunc *cb, void *opaque);
6568485420SKevin Wolf static BlockDriverAIOCB *bdrv_co_aio_writev_em(BlockDriverState *bs,
6668485420SKevin Wolf         int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
6768485420SKevin Wolf         BlockDriverCompletionFunc *cb, void *opaque);
68f9f05dc5SKevin Wolf static int coroutine_fn bdrv_co_readv_em(BlockDriverState *bs,
69f9f05dc5SKevin Wolf                                          int64_t sector_num, int nb_sectors,
70f9f05dc5SKevin Wolf                                          QEMUIOVector *iov);
71f9f05dc5SKevin Wolf static int coroutine_fn bdrv_co_writev_em(BlockDriverState *bs,
72f9f05dc5SKevin Wolf                                          int64_t sector_num, int nb_sectors,
73f9f05dc5SKevin Wolf                                          QEMUIOVector *iov);
74e7a8a783SKevin Wolf static int coroutine_fn bdrv_co_flush_em(BlockDriverState *bs);
75*c5fbe571SStefan Hajnoczi static int coroutine_fn bdrv_co_do_readv(BlockDriverState *bs,
76*c5fbe571SStefan Hajnoczi     int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
77ec530c81Sbellard 
781b7bdbc1SStefan Hajnoczi static QTAILQ_HEAD(, BlockDriverState) bdrv_states =
791b7bdbc1SStefan Hajnoczi     QTAILQ_HEAD_INITIALIZER(bdrv_states);
807ee930d0Sblueswir1 
818a22f02aSStefan Hajnoczi static QLIST_HEAD(, BlockDriver) bdrv_drivers =
828a22f02aSStefan Hajnoczi     QLIST_HEAD_INITIALIZER(bdrv_drivers);
83ea2384d3Sbellard 
84f9092b10SMarkus Armbruster /* The device to use for VM snapshots */
85f9092b10SMarkus Armbruster static BlockDriverState *bs_snapshots;
86f9092b10SMarkus Armbruster 
87eb852011SMarkus Armbruster /* If non-zero, use only whitelisted block drivers */
88eb852011SMarkus Armbruster static int use_bdrv_whitelist;
89eb852011SMarkus Armbruster 
#ifdef _WIN32
/*
 * Return non-zero if filename begins with an ASCII letter immediately
 * followed by ':' (e.g. "c:" or "D:\dir").
 */
static int is_windows_drive_prefix(const char *filename)
{
    return (((filename[0] >= 'a' && filename[0] <= 'z') ||
             (filename[0] >= 'A' && filename[0] <= 'Z')) &&
            filename[1] == ':');
}

/*
 * Return 1 if filename names a whole drive or a device path:
 *  - exactly a drive letter and a colon ("d:"), or
 *  - a name starting with "\\.\" or "//./".
 * Return 0 otherwise.
 */
int is_windows_drive(const char *filename)
{
    if (is_windows_drive_prefix(filename) &&
        filename[2] == '\0') {
        return 1;
    }
    if (strstart(filename, "\\\\.\\", NULL) ||
        strstart(filename, "//./", NULL)) {
        return 1;
    }
    return 0;
}
#endif
1099e0b22f4SStefan Hajnoczi 
/*
 * Check whether the path carries a "<protocol>:" prefix.
 *
 * The test is simply whether the path contains a ':' anywhere. On Windows,
 * drive names ("c:", "c:\dir") and device paths ("\\.\..." or "//./...")
 * are excluded first so that they are not mistaken for protocols.
 *
 * Returns 1 if a ':' is present (and the path is not a Windows drive),
 * 0 otherwise.
 */
static int path_has_protocol(const char *path)
{
#ifdef _WIN32
    if (is_windows_drive(path) ||
        is_windows_drive_prefix(path)) {
        return 0;
    }
#endif

    return strchr(path, ':') != NULL;
}
1229e0b22f4SStefan Hajnoczi 
/*
 * Return non-zero if path is absolute.
 *
 * Everything up to and including the first ':' in the path (if any) is
 * skipped; the path is absolute when the next character is '/' (or also
 * '\' on Windows). On Windows a path that itself starts with '/' or '\'
 * is always treated as absolute.
 */
int path_is_absolute(const char *path)
{
    const char *p;

#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (*path == '/' || *path == '\\') {
        return 1;
    }
#endif
    /* Look at the character following the first ':' if there is one */
    p = strchr(path, ':');
    if (p) {
        p++;
    } else {
        p = path;
    }
#ifdef _WIN32
    return (*p == '/' || *p == '\\');
#else
    return (*p == '/');
#endif
}
14283f64091Sbellard 
/*
 * If filename is absolute, just copy it to dest. Otherwise, build a
 * path to it by considering it is relative to base_path. URL are
 * supported.
 *
 * dest       output buffer; left untouched when dest_size <= 0
 * dest_size  size of dest in bytes; the result is truncated to fit
 * base_path  path whose leading part (up to the last directory separator,
 *            or up to the first ':' if that comes later) is kept
 * filename   name to append to that leading part
 */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *p, *p1;
    int len;

    if (dest_size <= 0) {
        return;
    }
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    /* p: just past the first ':' of base_path, or its start */
    p = strchr(base_path, ':');
    if (p) {
        p++;
    } else {
        p = base_path;
    }

    /* p1: just past the last directory separator, or the start */
    p1 = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *p2;
        p2 = strrchr(base_path, '\\');
        /* Only compare the two pointers when both are valid */
        if (p2 && (!p1 || p2 > p1)) {
            p1 = p2;
        }
    }
#endif
    if (p1) {
        p1++;
    } else {
        p1 = base_path;
    }

    /* Keep whichever prefix of base_path is longer */
    if (p1 > p) {
        p = p1;
    }
    len = p - base_path;
    if (len > dest_size - 1) {
        len = dest_size - 1;
    }
    memcpy(dest, base_path, len);
    dest[len] = '\0';
    pstrcat(dest, dest_size, filename);
}
18683f64091Sbellard 
1875efa9d5aSAnthony Liguori void bdrv_register(BlockDriver *bdrv)
188ea2384d3Sbellard {
18968485420SKevin Wolf     if (bdrv->bdrv_co_readv) {
19068485420SKevin Wolf         /* Emulate AIO by coroutines, and sync by AIO */
19168485420SKevin Wolf         bdrv->bdrv_aio_readv = bdrv_co_aio_readv_em;
19268485420SKevin Wolf         bdrv->bdrv_aio_writev = bdrv_co_aio_writev_em;
19368485420SKevin Wolf         bdrv->bdrv_read = bdrv_read_em;
19468485420SKevin Wolf         bdrv->bdrv_write = bdrv_write_em;
195f9f05dc5SKevin Wolf      } else {
196f9f05dc5SKevin Wolf         bdrv->bdrv_co_readv = bdrv_co_readv_em;
197f9f05dc5SKevin Wolf         bdrv->bdrv_co_writev = bdrv_co_writev_em;
198f9f05dc5SKevin Wolf 
199f9f05dc5SKevin Wolf         if (!bdrv->bdrv_aio_readv) {
20083f64091Sbellard             /* add AIO emulation layer */
201f141eafeSaliguori             bdrv->bdrv_aio_readv = bdrv_aio_readv_em;
202f141eafeSaliguori             bdrv->bdrv_aio_writev = bdrv_aio_writev_em;
203eda578e5Saliguori         } else if (!bdrv->bdrv_read) {
20483f64091Sbellard             /* add synchronous IO emulation layer */
20583f64091Sbellard             bdrv->bdrv_read = bdrv_read_em;
20683f64091Sbellard             bdrv->bdrv_write = bdrv_write_em;
20783f64091Sbellard         }
208f9f05dc5SKevin Wolf     }
209b2e12bc6SChristoph Hellwig 
210b2e12bc6SChristoph Hellwig     if (!bdrv->bdrv_aio_flush)
211b2e12bc6SChristoph Hellwig         bdrv->bdrv_aio_flush = bdrv_aio_flush_em;
212b2e12bc6SChristoph Hellwig 
2138a22f02aSStefan Hajnoczi     QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list);
214ea2384d3Sbellard }
215b338082bSbellard 
216b338082bSbellard /* create a new block device (by default it is empty) */
217b338082bSbellard BlockDriverState *bdrv_new(const char *device_name)
218fc01f7e7Sbellard {
2191b7bdbc1SStefan Hajnoczi     BlockDriverState *bs;
220b338082bSbellard 
2217267c094SAnthony Liguori     bs = g_malloc0(sizeof(BlockDriverState));
222b338082bSbellard     pstrcpy(bs->device_name, sizeof(bs->device_name), device_name);
223ea2384d3Sbellard     if (device_name[0] != '\0') {
2241b7bdbc1SStefan Hajnoczi         QTAILQ_INSERT_TAIL(&bdrv_states, bs, list);
225ea2384d3Sbellard     }
22628a7282aSLuiz Capitulino     bdrv_iostatus_disable(bs);
227b338082bSbellard     return bs;
228b338082bSbellard }
229b338082bSbellard 
230ea2384d3Sbellard BlockDriver *bdrv_find_format(const char *format_name)
231ea2384d3Sbellard {
232ea2384d3Sbellard     BlockDriver *drv1;
2338a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
2348a22f02aSStefan Hajnoczi         if (!strcmp(drv1->format_name, format_name)) {
235ea2384d3Sbellard             return drv1;
236ea2384d3Sbellard         }
2378a22f02aSStefan Hajnoczi     }
238ea2384d3Sbellard     return NULL;
239ea2384d3Sbellard }
240ea2384d3Sbellard 
241eb852011SMarkus Armbruster static int bdrv_is_whitelisted(BlockDriver *drv)
242eb852011SMarkus Armbruster {
243eb852011SMarkus Armbruster     static const char *whitelist[] = {
244eb852011SMarkus Armbruster         CONFIG_BDRV_WHITELIST
245eb852011SMarkus Armbruster     };
246eb852011SMarkus Armbruster     const char **p;
247eb852011SMarkus Armbruster 
248eb852011SMarkus Armbruster     if (!whitelist[0])
249eb852011SMarkus Armbruster         return 1;               /* no whitelist, anything goes */
250eb852011SMarkus Armbruster 
251eb852011SMarkus Armbruster     for (p = whitelist; *p; p++) {
252eb852011SMarkus Armbruster         if (!strcmp(drv->format_name, *p)) {
253eb852011SMarkus Armbruster             return 1;
254eb852011SMarkus Armbruster         }
255eb852011SMarkus Armbruster     }
256eb852011SMarkus Armbruster     return 0;
257eb852011SMarkus Armbruster }
258eb852011SMarkus Armbruster 
259eb852011SMarkus Armbruster BlockDriver *bdrv_find_whitelisted_format(const char *format_name)
260eb852011SMarkus Armbruster {
261eb852011SMarkus Armbruster     BlockDriver *drv = bdrv_find_format(format_name);
262eb852011SMarkus Armbruster     return drv && bdrv_is_whitelisted(drv) ? drv : NULL;
263eb852011SMarkus Armbruster }
264eb852011SMarkus Armbruster 
2650e7e1989SKevin Wolf int bdrv_create(BlockDriver *drv, const char* filename,
2660e7e1989SKevin Wolf     QEMUOptionParameter *options)
267ea2384d3Sbellard {
268ea2384d3Sbellard     if (!drv->bdrv_create)
269ea2384d3Sbellard         return -ENOTSUP;
2700e7e1989SKevin Wolf 
2710e7e1989SKevin Wolf     return drv->bdrv_create(filename, options);
272ea2384d3Sbellard }
273ea2384d3Sbellard 
27484a12e66SChristoph Hellwig int bdrv_create_file(const char* filename, QEMUOptionParameter *options)
27584a12e66SChristoph Hellwig {
27684a12e66SChristoph Hellwig     BlockDriver *drv;
27784a12e66SChristoph Hellwig 
278b50cbabcSMORITA Kazutaka     drv = bdrv_find_protocol(filename);
27984a12e66SChristoph Hellwig     if (drv == NULL) {
28016905d71SStefan Hajnoczi         return -ENOENT;
28184a12e66SChristoph Hellwig     }
28284a12e66SChristoph Hellwig 
28384a12e66SChristoph Hellwig     return bdrv_create(drv, filename, options);
28484a12e66SChristoph Hellwig }
28584a12e66SChristoph Hellwig 
#ifdef _WIN32
/*
 * Store the name of a newly created temporary file in filename.
 *
 * GetTempFileName() is not told the buffer size and may write up to
 * MAX_PATH characters, so the caller's buffer must be at least that large.
 * The results of the Win32 calls are not checked; this function has no way
 * to report failure.
 */
void get_tmp_filename(char *filename, int size)
{
    char temp_dir[MAX_PATH];

    /* Guard against overflowing a buffer smaller than the API requires */
    assert(size >= MAX_PATH);
    GetTempPath(MAX_PATH, temp_dir);
    GetTempFileName(temp_dir, "qem", 0, filename);
}
#else
/*
 * Store the name of a newly created temporary file in filename.
 *
 * The file is created by mkstemp() under $TMPDIR (or /tmp when TMPDIR is
 * unset) and its descriptor is closed again right away; only the name is
 * handed back. The name is truncated to size bytes. This function has no
 * way to report failure.
 */
void get_tmp_filename(char *filename, int size)
{
    int fd;
    const char *tmpdir;

    /* XXX: race condition possible */
    tmpdir = getenv("TMPDIR");
    if (!tmpdir) {
        tmpdir = "/tmp";
    }
    snprintf(filename, size, "%s/vl.XXXXXX", tmpdir);
    fd = mkstemp(filename);
    /* mkstemp() returns -1 on failure; do not pass that to close() */
    if (fd >= 0) {
        close(fd);
    }
}
#endif
308ea2384d3Sbellard 
309f3a5d3f8SChristoph Hellwig /*
310f3a5d3f8SChristoph Hellwig  * Detect host devices. By convention, /dev/cdrom[N] is always
311f3a5d3f8SChristoph Hellwig  * recognized as a host CDROM.
312f3a5d3f8SChristoph Hellwig  */
313f3a5d3f8SChristoph Hellwig static BlockDriver *find_hdev_driver(const char *filename)
314f3a5d3f8SChristoph Hellwig {
315508c7cb3SChristoph Hellwig     int score_max = 0, score;
316508c7cb3SChristoph Hellwig     BlockDriver *drv = NULL, *d;
317f3a5d3f8SChristoph Hellwig 
3188a22f02aSStefan Hajnoczi     QLIST_FOREACH(d, &bdrv_drivers, list) {
319508c7cb3SChristoph Hellwig         if (d->bdrv_probe_device) {
320508c7cb3SChristoph Hellwig             score = d->bdrv_probe_device(filename);
321508c7cb3SChristoph Hellwig             if (score > score_max) {
322508c7cb3SChristoph Hellwig                 score_max = score;
323508c7cb3SChristoph Hellwig                 drv = d;
324f3a5d3f8SChristoph Hellwig             }
325508c7cb3SChristoph Hellwig         }
326f3a5d3f8SChristoph Hellwig     }
327f3a5d3f8SChristoph Hellwig 
328508c7cb3SChristoph Hellwig     return drv;
329f3a5d3f8SChristoph Hellwig }
330f3a5d3f8SChristoph Hellwig 
331b50cbabcSMORITA Kazutaka BlockDriver *bdrv_find_protocol(const char *filename)
33284a12e66SChristoph Hellwig {
33384a12e66SChristoph Hellwig     BlockDriver *drv1;
33484a12e66SChristoph Hellwig     char protocol[128];
33584a12e66SChristoph Hellwig     int len;
33684a12e66SChristoph Hellwig     const char *p;
33784a12e66SChristoph Hellwig 
33866f82ceeSKevin Wolf     /* TODO Drivers without bdrv_file_open must be specified explicitly */
33966f82ceeSKevin Wolf 
34039508e7aSChristoph Hellwig     /*
34139508e7aSChristoph Hellwig      * XXX(hch): we really should not let host device detection
34239508e7aSChristoph Hellwig      * override an explicit protocol specification, but moving this
34339508e7aSChristoph Hellwig      * later breaks access to device names with colons in them.
34439508e7aSChristoph Hellwig      * Thanks to the brain-dead persistent naming schemes on udev-
34539508e7aSChristoph Hellwig      * based Linux systems those actually are quite common.
34639508e7aSChristoph Hellwig      */
34784a12e66SChristoph Hellwig     drv1 = find_hdev_driver(filename);
34839508e7aSChristoph Hellwig     if (drv1) {
34984a12e66SChristoph Hellwig         return drv1;
35084a12e66SChristoph Hellwig     }
35139508e7aSChristoph Hellwig 
3529e0b22f4SStefan Hajnoczi     if (!path_has_protocol(filename)) {
35339508e7aSChristoph Hellwig         return bdrv_find_format("file");
35439508e7aSChristoph Hellwig     }
3559e0b22f4SStefan Hajnoczi     p = strchr(filename, ':');
3569e0b22f4SStefan Hajnoczi     assert(p != NULL);
35784a12e66SChristoph Hellwig     len = p - filename;
35884a12e66SChristoph Hellwig     if (len > sizeof(protocol) - 1)
35984a12e66SChristoph Hellwig         len = sizeof(protocol) - 1;
36084a12e66SChristoph Hellwig     memcpy(protocol, filename, len);
36184a12e66SChristoph Hellwig     protocol[len] = '\0';
36284a12e66SChristoph Hellwig     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
36384a12e66SChristoph Hellwig         if (drv1->protocol_name &&
36484a12e66SChristoph Hellwig             !strcmp(drv1->protocol_name, protocol)) {
36584a12e66SChristoph Hellwig             return drv1;
36684a12e66SChristoph Hellwig         }
36784a12e66SChristoph Hellwig     }
36884a12e66SChristoph Hellwig     return NULL;
36984a12e66SChristoph Hellwig }
37084a12e66SChristoph Hellwig 
371c98ac35dSStefan Weil static int find_image_format(const char *filename, BlockDriver **pdrv)
372ea2384d3Sbellard {
37383f64091Sbellard     int ret, score, score_max;
374ea2384d3Sbellard     BlockDriver *drv1, *drv;
37583f64091Sbellard     uint8_t buf[2048];
37683f64091Sbellard     BlockDriverState *bs;
377ea2384d3Sbellard 
378f5edb014SNaphtali Sprei     ret = bdrv_file_open(&bs, filename, 0);
379c98ac35dSStefan Weil     if (ret < 0) {
380c98ac35dSStefan Weil         *pdrv = NULL;
381c98ac35dSStefan Weil         return ret;
382c98ac35dSStefan Weil     }
383f8ea0b00SNicholas Bellinger 
38408a00559SKevin Wolf     /* Return the raw BlockDriver * to scsi-generic devices or empty drives */
38508a00559SKevin Wolf     if (bs->sg || !bdrv_is_inserted(bs)) {
3861a396859SNicholas A. Bellinger         bdrv_delete(bs);
387c98ac35dSStefan Weil         drv = bdrv_find_format("raw");
388c98ac35dSStefan Weil         if (!drv) {
389c98ac35dSStefan Weil             ret = -ENOENT;
390c98ac35dSStefan Weil         }
391c98ac35dSStefan Weil         *pdrv = drv;
392c98ac35dSStefan Weil         return ret;
3931a396859SNicholas A. Bellinger     }
394f8ea0b00SNicholas Bellinger 
39583f64091Sbellard     ret = bdrv_pread(bs, 0, buf, sizeof(buf));
39683f64091Sbellard     bdrv_delete(bs);
397ea2384d3Sbellard     if (ret < 0) {
398c98ac35dSStefan Weil         *pdrv = NULL;
399c98ac35dSStefan Weil         return ret;
400ea2384d3Sbellard     }
401ea2384d3Sbellard 
402ea2384d3Sbellard     score_max = 0;
40384a12e66SChristoph Hellwig     drv = NULL;
4048a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv1, &bdrv_drivers, list) {
40583f64091Sbellard         if (drv1->bdrv_probe) {
406ea2384d3Sbellard             score = drv1->bdrv_probe(buf, ret, filename);
407ea2384d3Sbellard             if (score > score_max) {
408ea2384d3Sbellard                 score_max = score;
409ea2384d3Sbellard                 drv = drv1;
410ea2384d3Sbellard             }
411ea2384d3Sbellard         }
41283f64091Sbellard     }
413c98ac35dSStefan Weil     if (!drv) {
414c98ac35dSStefan Weil         ret = -ENOENT;
415c98ac35dSStefan Weil     }
416c98ac35dSStefan Weil     *pdrv = drv;
417c98ac35dSStefan Weil     return ret;
418ea2384d3Sbellard }
419ea2384d3Sbellard 
42051762288SStefan Hajnoczi /**
42151762288SStefan Hajnoczi  * Set the current 'total_sectors' value
42251762288SStefan Hajnoczi  */
42351762288SStefan Hajnoczi static int refresh_total_sectors(BlockDriverState *bs, int64_t hint)
42451762288SStefan Hajnoczi {
42551762288SStefan Hajnoczi     BlockDriver *drv = bs->drv;
42651762288SStefan Hajnoczi 
427396759adSNicholas Bellinger     /* Do not attempt drv->bdrv_getlength() on scsi-generic devices */
428396759adSNicholas Bellinger     if (bs->sg)
429396759adSNicholas Bellinger         return 0;
430396759adSNicholas Bellinger 
43151762288SStefan Hajnoczi     /* query actual device if possible, otherwise just trust the hint */
43251762288SStefan Hajnoczi     if (drv->bdrv_getlength) {
43351762288SStefan Hajnoczi         int64_t length = drv->bdrv_getlength(bs);
43451762288SStefan Hajnoczi         if (length < 0) {
43551762288SStefan Hajnoczi             return length;
43651762288SStefan Hajnoczi         }
43751762288SStefan Hajnoczi         hint = length >> BDRV_SECTOR_BITS;
43851762288SStefan Hajnoczi     }
43951762288SStefan Hajnoczi 
44051762288SStefan Hajnoczi     bs->total_sectors = hint;
44151762288SStefan Hajnoczi     return 0;
44251762288SStefan Hajnoczi }
44351762288SStefan Hajnoczi 
444c3993cdcSStefan Hajnoczi /**
445c3993cdcSStefan Hajnoczi  * Set open flags for a given cache mode
446c3993cdcSStefan Hajnoczi  *
447c3993cdcSStefan Hajnoczi  * Return 0 on success, -1 if the cache mode was invalid.
448c3993cdcSStefan Hajnoczi  */
449c3993cdcSStefan Hajnoczi int bdrv_parse_cache_flags(const char *mode, int *flags)
450c3993cdcSStefan Hajnoczi {
451c3993cdcSStefan Hajnoczi     *flags &= ~BDRV_O_CACHE_MASK;
452c3993cdcSStefan Hajnoczi 
453c3993cdcSStefan Hajnoczi     if (!strcmp(mode, "off") || !strcmp(mode, "none")) {
454c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_NOCACHE | BDRV_O_CACHE_WB;
45592196b2fSStefan Hajnoczi     } else if (!strcmp(mode, "directsync")) {
45692196b2fSStefan Hajnoczi         *flags |= BDRV_O_NOCACHE;
457c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "writeback")) {
458c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_CACHE_WB;
459c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "unsafe")) {
460c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_CACHE_WB;
461c3993cdcSStefan Hajnoczi         *flags |= BDRV_O_NO_FLUSH;
462c3993cdcSStefan Hajnoczi     } else if (!strcmp(mode, "writethrough")) {
463c3993cdcSStefan Hajnoczi         /* this is the default */
464c3993cdcSStefan Hajnoczi     } else {
465c3993cdcSStefan Hajnoczi         return -1;
466c3993cdcSStefan Hajnoczi     }
467c3993cdcSStefan Hajnoczi 
468c3993cdcSStefan Hajnoczi     return 0;
469c3993cdcSStefan Hajnoczi }
470c3993cdcSStefan Hajnoczi 
471b6ce07aaSKevin Wolf /*
47257915332SKevin Wolf  * Common part for opening disk images and files
47357915332SKevin Wolf  */
47457915332SKevin Wolf static int bdrv_open_common(BlockDriverState *bs, const char *filename,
47557915332SKevin Wolf     int flags, BlockDriver *drv)
47657915332SKevin Wolf {
47757915332SKevin Wolf     int ret, open_flags;
47857915332SKevin Wolf 
47957915332SKevin Wolf     assert(drv != NULL);
48057915332SKevin Wolf 
48128dcee10SStefan Hajnoczi     trace_bdrv_open_common(bs, filename, flags, drv->format_name);
48228dcee10SStefan Hajnoczi 
48366f82ceeSKevin Wolf     bs->file = NULL;
48451762288SStefan Hajnoczi     bs->total_sectors = 0;
48557915332SKevin Wolf     bs->encrypted = 0;
48657915332SKevin Wolf     bs->valid_key = 0;
48757915332SKevin Wolf     bs->open_flags = flags;
48857915332SKevin Wolf     bs->buffer_alignment = 512;
48957915332SKevin Wolf 
49057915332SKevin Wolf     pstrcpy(bs->filename, sizeof(bs->filename), filename);
49157915332SKevin Wolf 
49257915332SKevin Wolf     if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv)) {
49357915332SKevin Wolf         return -ENOTSUP;
49457915332SKevin Wolf     }
49557915332SKevin Wolf 
49657915332SKevin Wolf     bs->drv = drv;
4977267c094SAnthony Liguori     bs->opaque = g_malloc0(drv->instance_size);
49857915332SKevin Wolf 
499a6599793SChristoph Hellwig     if (flags & BDRV_O_CACHE_WB)
50057915332SKevin Wolf         bs->enable_write_cache = 1;
50157915332SKevin Wolf 
50257915332SKevin Wolf     /*
50357915332SKevin Wolf      * Clear flags that are internal to the block layer before opening the
50457915332SKevin Wolf      * image.
50557915332SKevin Wolf      */
50657915332SKevin Wolf     open_flags = flags & ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
50757915332SKevin Wolf 
50857915332SKevin Wolf     /*
509ebabb67aSStefan Weil      * Snapshots should be writable.
51057915332SKevin Wolf      */
51157915332SKevin Wolf     if (bs->is_temporary) {
51257915332SKevin Wolf         open_flags |= BDRV_O_RDWR;
51357915332SKevin Wolf     }
51457915332SKevin Wolf 
51566f82ceeSKevin Wolf     /* Open the image, either directly or using a protocol */
51666f82ceeSKevin Wolf     if (drv->bdrv_file_open) {
51766f82ceeSKevin Wolf         ret = drv->bdrv_file_open(bs, filename, open_flags);
51866f82ceeSKevin Wolf     } else {
51966f82ceeSKevin Wolf         ret = bdrv_file_open(&bs->file, filename, open_flags);
52066f82ceeSKevin Wolf         if (ret >= 0) {
52166f82ceeSKevin Wolf             ret = drv->bdrv_open(bs, open_flags);
52266f82ceeSKevin Wolf         }
52366f82ceeSKevin Wolf     }
52466f82ceeSKevin Wolf 
52557915332SKevin Wolf     if (ret < 0) {
52657915332SKevin Wolf         goto free_and_fail;
52757915332SKevin Wolf     }
52857915332SKevin Wolf 
52957915332SKevin Wolf     bs->keep_read_only = bs->read_only = !(open_flags & BDRV_O_RDWR);
53051762288SStefan Hajnoczi 
53151762288SStefan Hajnoczi     ret = refresh_total_sectors(bs, bs->total_sectors);
53251762288SStefan Hajnoczi     if (ret < 0) {
53351762288SStefan Hajnoczi         goto free_and_fail;
53457915332SKevin Wolf     }
53551762288SStefan Hajnoczi 
53657915332SKevin Wolf #ifndef _WIN32
53757915332SKevin Wolf     if (bs->is_temporary) {
53857915332SKevin Wolf         unlink(filename);
53957915332SKevin Wolf     }
54057915332SKevin Wolf #endif
54157915332SKevin Wolf     return 0;
54257915332SKevin Wolf 
54357915332SKevin Wolf free_and_fail:
54466f82ceeSKevin Wolf     if (bs->file) {
54566f82ceeSKevin Wolf         bdrv_delete(bs->file);
54666f82ceeSKevin Wolf         bs->file = NULL;
54766f82ceeSKevin Wolf     }
5487267c094SAnthony Liguori     g_free(bs->opaque);
54957915332SKevin Wolf     bs->opaque = NULL;
55057915332SKevin Wolf     bs->drv = NULL;
55157915332SKevin Wolf     return ret;
55257915332SKevin Wolf }
55357915332SKevin Wolf 
55457915332SKevin Wolf /*
555b6ce07aaSKevin Wolf  * Opens a file using a protocol (file, host_device, nbd, ...)
556b6ce07aaSKevin Wolf  */
55783f64091Sbellard int bdrv_file_open(BlockDriverState **pbs, const char *filename, int flags)
558b338082bSbellard {
55983f64091Sbellard     BlockDriverState *bs;
5606db95603SChristoph Hellwig     BlockDriver *drv;
56183f64091Sbellard     int ret;
5623b0d4f61Sbellard 
563b50cbabcSMORITA Kazutaka     drv = bdrv_find_protocol(filename);
5646db95603SChristoph Hellwig     if (!drv) {
5656db95603SChristoph Hellwig         return -ENOENT;
5666db95603SChristoph Hellwig     }
5676db95603SChristoph Hellwig 
56883f64091Sbellard     bs = bdrv_new("");
569b6ce07aaSKevin Wolf     ret = bdrv_open_common(bs, filename, flags, drv);
57083f64091Sbellard     if (ret < 0) {
57183f64091Sbellard         bdrv_delete(bs);
57283f64091Sbellard         return ret;
5733b0d4f61Sbellard     }
57471d0770cSaliguori     bs->growable = 1;
57583f64091Sbellard     *pbs = bs;
57683f64091Sbellard     return 0;
5773b0d4f61Sbellard }
5783b0d4f61Sbellard 
579b6ce07aaSKevin Wolf /*
580b6ce07aaSKevin Wolf  * Opens a disk image (raw, qcow2, vmdk, ...)
581b6ce07aaSKevin Wolf  */
582d6e9098eSKevin Wolf int bdrv_open(BlockDriverState *bs, const char *filename, int flags,
583ea2384d3Sbellard               BlockDriver *drv)
584ea2384d3Sbellard {
585b6ce07aaSKevin Wolf     int ret;
58633e3963eSbellard 
58783f64091Sbellard     if (flags & BDRV_O_SNAPSHOT) {
588ea2384d3Sbellard         BlockDriverState *bs1;
589ea2384d3Sbellard         int64_t total_size;
5907c96d46eSaliguori         int is_protocol = 0;
59191a073a9SKevin Wolf         BlockDriver *bdrv_qcow2;
59291a073a9SKevin Wolf         QEMUOptionParameter *options;
593b6ce07aaSKevin Wolf         char tmp_filename[PATH_MAX];
594b6ce07aaSKevin Wolf         char backing_filename[PATH_MAX];
59533e3963eSbellard 
596ea2384d3Sbellard         /* if snapshot, we create a temporary backing file and open it
597ea2384d3Sbellard            instead of opening 'filename' directly */
598ea2384d3Sbellard 
599ea2384d3Sbellard         /* if there is a backing file, use it */
600ea2384d3Sbellard         bs1 = bdrv_new("");
601d6e9098eSKevin Wolf         ret = bdrv_open(bs1, filename, 0, drv);
60251d7c00cSaliguori         if (ret < 0) {
603ea2384d3Sbellard             bdrv_delete(bs1);
60451d7c00cSaliguori             return ret;
605ea2384d3Sbellard         }
6063e82990bSJes Sorensen         total_size = bdrv_getlength(bs1) & BDRV_SECTOR_MASK;
6077c96d46eSaliguori 
6087c96d46eSaliguori         if (bs1->drv && bs1->drv->protocol_name)
6097c96d46eSaliguori             is_protocol = 1;
6107c96d46eSaliguori 
611ea2384d3Sbellard         bdrv_delete(bs1);
612ea2384d3Sbellard 
613ea2384d3Sbellard         get_tmp_filename(tmp_filename, sizeof(tmp_filename));
6147c96d46eSaliguori 
6157c96d46eSaliguori         /* Real path is meaningless for protocols */
6167c96d46eSaliguori         if (is_protocol)
6177c96d46eSaliguori             snprintf(backing_filename, sizeof(backing_filename),
6187c96d46eSaliguori                      "%s", filename);
619114cdfa9SKirill A. Shutemov         else if (!realpath(filename, backing_filename))
620114cdfa9SKirill A. Shutemov             return -errno;
6217c96d46eSaliguori 
62291a073a9SKevin Wolf         bdrv_qcow2 = bdrv_find_format("qcow2");
62391a073a9SKevin Wolf         options = parse_option_parameters("", bdrv_qcow2->create_options, NULL);
62491a073a9SKevin Wolf 
6253e82990bSJes Sorensen         set_option_parameter_int(options, BLOCK_OPT_SIZE, total_size);
62691a073a9SKevin Wolf         set_option_parameter(options, BLOCK_OPT_BACKING_FILE, backing_filename);
62791a073a9SKevin Wolf         if (drv) {
62891a073a9SKevin Wolf             set_option_parameter(options, BLOCK_OPT_BACKING_FMT,
62991a073a9SKevin Wolf                 drv->format_name);
63091a073a9SKevin Wolf         }
63191a073a9SKevin Wolf 
63291a073a9SKevin Wolf         ret = bdrv_create(bdrv_qcow2, tmp_filename, options);
633d748768cSJan Kiszka         free_option_parameters(options);
63451d7c00cSaliguori         if (ret < 0) {
63551d7c00cSaliguori             return ret;
636ea2384d3Sbellard         }
63791a073a9SKevin Wolf 
638ea2384d3Sbellard         filename = tmp_filename;
63991a073a9SKevin Wolf         drv = bdrv_qcow2;
640ea2384d3Sbellard         bs->is_temporary = 1;
641ea2384d3Sbellard     }
642ea2384d3Sbellard 
643b6ce07aaSKevin Wolf     /* Find the right image format driver */
6446db95603SChristoph Hellwig     if (!drv) {
645c98ac35dSStefan Weil         ret = find_image_format(filename, &drv);
646ea2384d3Sbellard     }
6476987307cSChristoph Hellwig 
64851d7c00cSaliguori     if (!drv) {
64951d7c00cSaliguori         goto unlink_and_fail;
65083f64091Sbellard     }
651b6ce07aaSKevin Wolf 
652b6ce07aaSKevin Wolf     /* Open the image */
653b6ce07aaSKevin Wolf     ret = bdrv_open_common(bs, filename, flags, drv);
654b6ce07aaSKevin Wolf     if (ret < 0) {
6556987307cSChristoph Hellwig         goto unlink_and_fail;
6566987307cSChristoph Hellwig     }
6576987307cSChristoph Hellwig 
658b6ce07aaSKevin Wolf     /* If there is a backing file, use it */
659b6ce07aaSKevin Wolf     if ((flags & BDRV_O_NO_BACKING) == 0 && bs->backing_file[0] != '\0') {
660b6ce07aaSKevin Wolf         char backing_filename[PATH_MAX];
661b6ce07aaSKevin Wolf         int back_flags;
662b6ce07aaSKevin Wolf         BlockDriver *back_drv = NULL;
663b6ce07aaSKevin Wolf 
664b6ce07aaSKevin Wolf         bs->backing_hd = bdrv_new("");
665df2dbb4aSStefan Hajnoczi 
666df2dbb4aSStefan Hajnoczi         if (path_has_protocol(bs->backing_file)) {
667df2dbb4aSStefan Hajnoczi             pstrcpy(backing_filename, sizeof(backing_filename),
668df2dbb4aSStefan Hajnoczi                     bs->backing_file);
669df2dbb4aSStefan Hajnoczi         } else {
670b6ce07aaSKevin Wolf             path_combine(backing_filename, sizeof(backing_filename),
671b6ce07aaSKevin Wolf                          filename, bs->backing_file);
672df2dbb4aSStefan Hajnoczi         }
673df2dbb4aSStefan Hajnoczi 
674df2dbb4aSStefan Hajnoczi         if (bs->backing_format[0] != '\0') {
675b6ce07aaSKevin Wolf             back_drv = bdrv_find_format(bs->backing_format);
676df2dbb4aSStefan Hajnoczi         }
677b6ce07aaSKevin Wolf 
678b6ce07aaSKevin Wolf         /* backing files always opened read-only */
679b6ce07aaSKevin Wolf         back_flags =
680b6ce07aaSKevin Wolf             flags & ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
681b6ce07aaSKevin Wolf 
682b6ce07aaSKevin Wolf         ret = bdrv_open(bs->backing_hd, backing_filename, back_flags, back_drv);
683b6ce07aaSKevin Wolf         if (ret < 0) {
684b6ce07aaSKevin Wolf             bdrv_close(bs);
685b6ce07aaSKevin Wolf             return ret;
686b6ce07aaSKevin Wolf         }
687b6ce07aaSKevin Wolf         if (bs->is_temporary) {
688b6ce07aaSKevin Wolf             bs->backing_hd->keep_read_only = !(flags & BDRV_O_RDWR);
689b6ce07aaSKevin Wolf         } else {
690b6ce07aaSKevin Wolf             /* base image inherits from "parent" */
691b6ce07aaSKevin Wolf             bs->backing_hd->keep_read_only = bs->keep_read_only;
692b6ce07aaSKevin Wolf         }
693b6ce07aaSKevin Wolf     }
694b6ce07aaSKevin Wolf 
695b6ce07aaSKevin Wolf     if (!bdrv_key_required(bs)) {
6967d4b4ba5SMarkus Armbruster         bdrv_dev_change_media_cb(bs, true);
697b6ce07aaSKevin Wolf     }
698b6ce07aaSKevin Wolf 
699b6ce07aaSKevin Wolf     return 0;
700b6ce07aaSKevin Wolf 
701b6ce07aaSKevin Wolf unlink_and_fail:
702b6ce07aaSKevin Wolf     if (bs->is_temporary) {
703b6ce07aaSKevin Wolf         unlink(filename);
704b6ce07aaSKevin Wolf     }
705b6ce07aaSKevin Wolf     return ret;
706b6ce07aaSKevin Wolf }
707b6ce07aaSKevin Wolf 
708fc01f7e7Sbellard void bdrv_close(BlockDriverState *bs)
709fc01f7e7Sbellard {
71019cb3738Sbellard     if (bs->drv) {
711f9092b10SMarkus Armbruster         if (bs == bs_snapshots) {
712f9092b10SMarkus Armbruster             bs_snapshots = NULL;
713f9092b10SMarkus Armbruster         }
714557df6acSStefan Hajnoczi         if (bs->backing_hd) {
715ea2384d3Sbellard             bdrv_delete(bs->backing_hd);
716557df6acSStefan Hajnoczi             bs->backing_hd = NULL;
717557df6acSStefan Hajnoczi         }
718ea2384d3Sbellard         bs->drv->bdrv_close(bs);
7197267c094SAnthony Liguori         g_free(bs->opaque);
720ea2384d3Sbellard #ifdef _WIN32
721ea2384d3Sbellard         if (bs->is_temporary) {
722ea2384d3Sbellard             unlink(bs->filename);
723ea2384d3Sbellard         }
72467b915a5Sbellard #endif
725ea2384d3Sbellard         bs->opaque = NULL;
726ea2384d3Sbellard         bs->drv = NULL;
727b338082bSbellard 
72866f82ceeSKevin Wolf         if (bs->file != NULL) {
72966f82ceeSKevin Wolf             bdrv_close(bs->file);
73066f82ceeSKevin Wolf         }
73166f82ceeSKevin Wolf 
7327d4b4ba5SMarkus Armbruster         bdrv_dev_change_media_cb(bs, false);
733b338082bSbellard     }
734b338082bSbellard }
735b338082bSbellard 
7362bc93fedSMORITA Kazutaka void bdrv_close_all(void)
7372bc93fedSMORITA Kazutaka {
7382bc93fedSMORITA Kazutaka     BlockDriverState *bs;
7392bc93fedSMORITA Kazutaka 
7402bc93fedSMORITA Kazutaka     QTAILQ_FOREACH(bs, &bdrv_states, list) {
7412bc93fedSMORITA Kazutaka         bdrv_close(bs);
7422bc93fedSMORITA Kazutaka     }
7432bc93fedSMORITA Kazutaka }
7442bc93fedSMORITA Kazutaka 
745d22b2f41SRyan Harper /* make a BlockDriverState anonymous by removing from bdrv_state list.
746d22b2f41SRyan Harper    Also, NULL terminate the device_name to prevent double remove */
747d22b2f41SRyan Harper void bdrv_make_anon(BlockDriverState *bs)
748d22b2f41SRyan Harper {
749d22b2f41SRyan Harper     if (bs->device_name[0] != '\0') {
750d22b2f41SRyan Harper         QTAILQ_REMOVE(&bdrv_states, bs, list);
751d22b2f41SRyan Harper     }
752d22b2f41SRyan Harper     bs->device_name[0] = '\0';
753d22b2f41SRyan Harper }
754d22b2f41SRyan Harper 
755b338082bSbellard void bdrv_delete(BlockDriverState *bs)
756b338082bSbellard {
757fa879d62SMarkus Armbruster     assert(!bs->dev);
75818846deeSMarkus Armbruster 
7591b7bdbc1SStefan Hajnoczi     /* remove from list, if necessary */
760d22b2f41SRyan Harper     bdrv_make_anon(bs);
76134c6f050Saurel32 
762b338082bSbellard     bdrv_close(bs);
76366f82ceeSKevin Wolf     if (bs->file != NULL) {
76466f82ceeSKevin Wolf         bdrv_delete(bs->file);
76566f82ceeSKevin Wolf     }
76666f82ceeSKevin Wolf 
767f9092b10SMarkus Armbruster     assert(bs != bs_snapshots);
7687267c094SAnthony Liguori     g_free(bs);
769fc01f7e7Sbellard }
770fc01f7e7Sbellard 
771fa879d62SMarkus Armbruster int bdrv_attach_dev(BlockDriverState *bs, void *dev)
772fa879d62SMarkus Armbruster /* TODO change to DeviceState *dev when all users are qdevified */
77318846deeSMarkus Armbruster {
774fa879d62SMarkus Armbruster     if (bs->dev) {
77518846deeSMarkus Armbruster         return -EBUSY;
77618846deeSMarkus Armbruster     }
777fa879d62SMarkus Armbruster     bs->dev = dev;
77828a7282aSLuiz Capitulino     bdrv_iostatus_reset(bs);
77918846deeSMarkus Armbruster     return 0;
78018846deeSMarkus Armbruster }
78118846deeSMarkus Armbruster 
782fa879d62SMarkus Armbruster /* TODO qdevified devices don't use this, remove when devices are qdevified */
783fa879d62SMarkus Armbruster void bdrv_attach_dev_nofail(BlockDriverState *bs, void *dev)
78418846deeSMarkus Armbruster {
785fa879d62SMarkus Armbruster     if (bdrv_attach_dev(bs, dev) < 0) {
786fa879d62SMarkus Armbruster         abort();
787fa879d62SMarkus Armbruster     }
788fa879d62SMarkus Armbruster }
789fa879d62SMarkus Armbruster 
790fa879d62SMarkus Armbruster void bdrv_detach_dev(BlockDriverState *bs, void *dev)
791fa879d62SMarkus Armbruster /* TODO change to DeviceState *dev when all users are qdevified */
792fa879d62SMarkus Armbruster {
793fa879d62SMarkus Armbruster     assert(bs->dev == dev);
794fa879d62SMarkus Armbruster     bs->dev = NULL;
7950e49de52SMarkus Armbruster     bs->dev_ops = NULL;
7960e49de52SMarkus Armbruster     bs->dev_opaque = NULL;
79729e05f20SMarkus Armbruster     bs->buffer_alignment = 512;
79818846deeSMarkus Armbruster }
79918846deeSMarkus Armbruster 
800fa879d62SMarkus Armbruster /* TODO change to return DeviceState * when all users are qdevified */
801fa879d62SMarkus Armbruster void *bdrv_get_attached_dev(BlockDriverState *bs)
80218846deeSMarkus Armbruster {
803fa879d62SMarkus Armbruster     return bs->dev;
80418846deeSMarkus Armbruster }
80518846deeSMarkus Armbruster 
8060e49de52SMarkus Armbruster void bdrv_set_dev_ops(BlockDriverState *bs, const BlockDevOps *ops,
8070e49de52SMarkus Armbruster                       void *opaque)
8080e49de52SMarkus Armbruster {
8090e49de52SMarkus Armbruster     bs->dev_ops = ops;
8100e49de52SMarkus Armbruster     bs->dev_opaque = opaque;
8112c6942faSMarkus Armbruster     if (bdrv_dev_has_removable_media(bs) && bs == bs_snapshots) {
8122c6942faSMarkus Armbruster         bs_snapshots = NULL;
8132c6942faSMarkus Armbruster     }
8140e49de52SMarkus Armbruster }
8150e49de52SMarkus Armbruster 
8167d4b4ba5SMarkus Armbruster static void bdrv_dev_change_media_cb(BlockDriverState *bs, bool load)
8170e49de52SMarkus Armbruster {
818145feb17SMarkus Armbruster     if (bs->dev_ops && bs->dev_ops->change_media_cb) {
8197d4b4ba5SMarkus Armbruster         bs->dev_ops->change_media_cb(bs->dev_opaque, load);
820145feb17SMarkus Armbruster     }
821145feb17SMarkus Armbruster }
822145feb17SMarkus Armbruster 
8232c6942faSMarkus Armbruster bool bdrv_dev_has_removable_media(BlockDriverState *bs)
8242c6942faSMarkus Armbruster {
8252c6942faSMarkus Armbruster     return !bs->dev || (bs->dev_ops && bs->dev_ops->change_media_cb);
8262c6942faSMarkus Armbruster }
8272c6942faSMarkus Armbruster 
828e4def80bSMarkus Armbruster bool bdrv_dev_is_tray_open(BlockDriverState *bs)
829e4def80bSMarkus Armbruster {
830e4def80bSMarkus Armbruster     if (bs->dev_ops && bs->dev_ops->is_tray_open) {
831e4def80bSMarkus Armbruster         return bs->dev_ops->is_tray_open(bs->dev_opaque);
832e4def80bSMarkus Armbruster     }
833e4def80bSMarkus Armbruster     return false;
834e4def80bSMarkus Armbruster }
835e4def80bSMarkus Armbruster 
836145feb17SMarkus Armbruster static void bdrv_dev_resize_cb(BlockDriverState *bs)
837145feb17SMarkus Armbruster {
838145feb17SMarkus Armbruster     if (bs->dev_ops && bs->dev_ops->resize_cb) {
839145feb17SMarkus Armbruster         bs->dev_ops->resize_cb(bs->dev_opaque);
8400e49de52SMarkus Armbruster     }
8410e49de52SMarkus Armbruster }
8420e49de52SMarkus Armbruster 
843f107639aSMarkus Armbruster bool bdrv_dev_is_medium_locked(BlockDriverState *bs)
844f107639aSMarkus Armbruster {
845f107639aSMarkus Armbruster     if (bs->dev_ops && bs->dev_ops->is_medium_locked) {
846f107639aSMarkus Armbruster         return bs->dev_ops->is_medium_locked(bs->dev_opaque);
847f107639aSMarkus Armbruster     }
848f107639aSMarkus Armbruster     return false;
849f107639aSMarkus Armbruster }
850f107639aSMarkus Armbruster 
851e97fc193Saliguori /*
852e97fc193Saliguori  * Run consistency checks on an image
853e97fc193Saliguori  *
854e076f338SKevin Wolf  * Returns 0 if the check could be completed (it doesn't mean that the image is
855a1c7273bSStefan Weil  * free of errors) or -errno when an internal error occurred. The results of the
856e076f338SKevin Wolf  * check are stored in res.
857e97fc193Saliguori  */
858e076f338SKevin Wolf int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res)
859e97fc193Saliguori {
860e97fc193Saliguori     if (bs->drv->bdrv_check == NULL) {
861e97fc193Saliguori         return -ENOTSUP;
862e97fc193Saliguori     }
863e97fc193Saliguori 
864e076f338SKevin Wolf     memset(res, 0, sizeof(*res));
8659ac228e0SKevin Wolf     return bs->drv->bdrv_check(bs, res);
866e97fc193Saliguori }
867e97fc193Saliguori 
8688a426614SKevin Wolf #define COMMIT_BUF_SECTORS 2048
8698a426614SKevin Wolf 
87033e3963eSbellard /* commit COW file into the raw image */
87133e3963eSbellard int bdrv_commit(BlockDriverState *bs)
87233e3963eSbellard {
87319cb3738Sbellard     BlockDriver *drv = bs->drv;
874ee181196SKevin Wolf     BlockDriver *backing_drv;
8758a426614SKevin Wolf     int64_t sector, total_sectors;
8768a426614SKevin Wolf     int n, ro, open_flags;
8774dca4b63SNaphtali Sprei     int ret = 0, rw_ret = 0;
8788a426614SKevin Wolf     uint8_t *buf;
8794dca4b63SNaphtali Sprei     char filename[1024];
8804dca4b63SNaphtali Sprei     BlockDriverState *bs_rw, *bs_ro;
88133e3963eSbellard 
88219cb3738Sbellard     if (!drv)
88319cb3738Sbellard         return -ENOMEDIUM;
88433e3963eSbellard 
8854dca4b63SNaphtali Sprei     if (!bs->backing_hd) {
8864dca4b63SNaphtali Sprei         return -ENOTSUP;
8874dca4b63SNaphtali Sprei     }
8884dca4b63SNaphtali Sprei 
8894dca4b63SNaphtali Sprei     if (bs->backing_hd->keep_read_only) {
890ea2384d3Sbellard         return -EACCES;
89133e3963eSbellard     }
89233e3963eSbellard 
893ee181196SKevin Wolf     backing_drv = bs->backing_hd->drv;
8944dca4b63SNaphtali Sprei     ro = bs->backing_hd->read_only;
8954dca4b63SNaphtali Sprei     strncpy(filename, bs->backing_hd->filename, sizeof(filename));
8964dca4b63SNaphtali Sprei     open_flags =  bs->backing_hd->open_flags;
8974dca4b63SNaphtali Sprei 
8984dca4b63SNaphtali Sprei     if (ro) {
8994dca4b63SNaphtali Sprei         /* re-open as RW */
9004dca4b63SNaphtali Sprei         bdrv_delete(bs->backing_hd);
9014dca4b63SNaphtali Sprei         bs->backing_hd = NULL;
9024dca4b63SNaphtali Sprei         bs_rw = bdrv_new("");
903ee181196SKevin Wolf         rw_ret = bdrv_open(bs_rw, filename, open_flags | BDRV_O_RDWR,
904ee181196SKevin Wolf             backing_drv);
9054dca4b63SNaphtali Sprei         if (rw_ret < 0) {
9064dca4b63SNaphtali Sprei             bdrv_delete(bs_rw);
9074dca4b63SNaphtali Sprei             /* try to re-open read-only */
9084dca4b63SNaphtali Sprei             bs_ro = bdrv_new("");
909ee181196SKevin Wolf             ret = bdrv_open(bs_ro, filename, open_flags & ~BDRV_O_RDWR,
910ee181196SKevin Wolf                 backing_drv);
9114dca4b63SNaphtali Sprei             if (ret < 0) {
9124dca4b63SNaphtali Sprei                 bdrv_delete(bs_ro);
9134dca4b63SNaphtali Sprei                 /* drive not functional anymore */
9144dca4b63SNaphtali Sprei                 bs->drv = NULL;
9154dca4b63SNaphtali Sprei                 return ret;
9164dca4b63SNaphtali Sprei             }
9174dca4b63SNaphtali Sprei             bs->backing_hd = bs_ro;
9184dca4b63SNaphtali Sprei             return rw_ret;
9194dca4b63SNaphtali Sprei         }
9204dca4b63SNaphtali Sprei         bs->backing_hd = bs_rw;
921ea2384d3Sbellard     }
922ea2384d3Sbellard 
9236ea44308SJan Kiszka     total_sectors = bdrv_getlength(bs) >> BDRV_SECTOR_BITS;
9247267c094SAnthony Liguori     buf = g_malloc(COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE);
9258a426614SKevin Wolf 
9268a426614SKevin Wolf     for (sector = 0; sector < total_sectors; sector += n) {
9278a426614SKevin Wolf         if (drv->bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n)) {
9288a426614SKevin Wolf 
9298a426614SKevin Wolf             if (bdrv_read(bs, sector, buf, n) != 0) {
9304dca4b63SNaphtali Sprei                 ret = -EIO;
9314dca4b63SNaphtali Sprei                 goto ro_cleanup;
93233e3963eSbellard             }
93333e3963eSbellard 
9348a426614SKevin Wolf             if (bdrv_write(bs->backing_hd, sector, buf, n) != 0) {
9354dca4b63SNaphtali Sprei                 ret = -EIO;
9364dca4b63SNaphtali Sprei                 goto ro_cleanup;
93733e3963eSbellard             }
93833e3963eSbellard         }
93933e3963eSbellard     }
94095389c86Sbellard 
9411d44952fSChristoph Hellwig     if (drv->bdrv_make_empty) {
9421d44952fSChristoph Hellwig         ret = drv->bdrv_make_empty(bs);
9431d44952fSChristoph Hellwig         bdrv_flush(bs);
9441d44952fSChristoph Hellwig     }
94595389c86Sbellard 
9463f5075aeSChristoph Hellwig     /*
9473f5075aeSChristoph Hellwig      * Make sure all data we wrote to the backing device is actually
9483f5075aeSChristoph Hellwig      * stable on disk.
9493f5075aeSChristoph Hellwig      */
9503f5075aeSChristoph Hellwig     if (bs->backing_hd)
9513f5075aeSChristoph Hellwig         bdrv_flush(bs->backing_hd);
9524dca4b63SNaphtali Sprei 
9534dca4b63SNaphtali Sprei ro_cleanup:
9547267c094SAnthony Liguori     g_free(buf);
9554dca4b63SNaphtali Sprei 
9564dca4b63SNaphtali Sprei     if (ro) {
9574dca4b63SNaphtali Sprei         /* re-open as RO */
9584dca4b63SNaphtali Sprei         bdrv_delete(bs->backing_hd);
9594dca4b63SNaphtali Sprei         bs->backing_hd = NULL;
9604dca4b63SNaphtali Sprei         bs_ro = bdrv_new("");
961ee181196SKevin Wolf         ret = bdrv_open(bs_ro, filename, open_flags & ~BDRV_O_RDWR,
962ee181196SKevin Wolf             backing_drv);
9634dca4b63SNaphtali Sprei         if (ret < 0) {
9644dca4b63SNaphtali Sprei             bdrv_delete(bs_ro);
9654dca4b63SNaphtali Sprei             /* drive not functional anymore */
9664dca4b63SNaphtali Sprei             bs->drv = NULL;
9674dca4b63SNaphtali Sprei             return ret;
9684dca4b63SNaphtali Sprei         }
9694dca4b63SNaphtali Sprei         bs->backing_hd = bs_ro;
9704dca4b63SNaphtali Sprei         bs->backing_hd->keep_read_only = 0;
9714dca4b63SNaphtali Sprei     }
9724dca4b63SNaphtali Sprei 
9731d44952fSChristoph Hellwig     return ret;
97433e3963eSbellard }
97533e3963eSbellard 
9766ab4b5abSMarkus Armbruster void bdrv_commit_all(void)
9776ab4b5abSMarkus Armbruster {
9786ab4b5abSMarkus Armbruster     BlockDriverState *bs;
9796ab4b5abSMarkus Armbruster 
9806ab4b5abSMarkus Armbruster     QTAILQ_FOREACH(bs, &bdrv_states, list) {
9816ab4b5abSMarkus Armbruster         bdrv_commit(bs);
9826ab4b5abSMarkus Armbruster     }
9836ab4b5abSMarkus Armbruster }
9846ab4b5abSMarkus Armbruster 
985756e6736SKevin Wolf /*
986756e6736SKevin Wolf  * Return values:
987756e6736SKevin Wolf  * 0        - success
988756e6736SKevin Wolf  * -EINVAL  - backing format specified, but no file
989756e6736SKevin Wolf  * -ENOSPC  - can't update the backing file because no space is left in the
990756e6736SKevin Wolf  *            image file header
991756e6736SKevin Wolf  * -ENOTSUP - format driver doesn't support changing the backing file
992756e6736SKevin Wolf  */
993756e6736SKevin Wolf int bdrv_change_backing_file(BlockDriverState *bs,
994756e6736SKevin Wolf     const char *backing_file, const char *backing_fmt)
995756e6736SKevin Wolf {
996756e6736SKevin Wolf     BlockDriver *drv = bs->drv;
997756e6736SKevin Wolf 
998756e6736SKevin Wolf     if (drv->bdrv_change_backing_file != NULL) {
999756e6736SKevin Wolf         return drv->bdrv_change_backing_file(bs, backing_file, backing_fmt);
1000756e6736SKevin Wolf     } else {
1001756e6736SKevin Wolf         return -ENOTSUP;
1002756e6736SKevin Wolf     }
1003756e6736SKevin Wolf }
1004756e6736SKevin Wolf 
100571d0770cSaliguori static int bdrv_check_byte_request(BlockDriverState *bs, int64_t offset,
100671d0770cSaliguori                                    size_t size)
100771d0770cSaliguori {
100871d0770cSaliguori     int64_t len;
100971d0770cSaliguori 
101071d0770cSaliguori     if (!bdrv_is_inserted(bs))
101171d0770cSaliguori         return -ENOMEDIUM;
101271d0770cSaliguori 
101371d0770cSaliguori     if (bs->growable)
101471d0770cSaliguori         return 0;
101571d0770cSaliguori 
101671d0770cSaliguori     len = bdrv_getlength(bs);
101771d0770cSaliguori 
1018fbb7b4e0SKevin Wolf     if (offset < 0)
1019fbb7b4e0SKevin Wolf         return -EIO;
1020fbb7b4e0SKevin Wolf 
1021fbb7b4e0SKevin Wolf     if ((offset > len) || (len - offset < size))
102271d0770cSaliguori         return -EIO;
102371d0770cSaliguori 
102471d0770cSaliguori     return 0;
102571d0770cSaliguori }
102671d0770cSaliguori 
102771d0770cSaliguori static int bdrv_check_request(BlockDriverState *bs, int64_t sector_num,
102871d0770cSaliguori                               int nb_sectors)
102971d0770cSaliguori {
1030eb5a3165SJes Sorensen     return bdrv_check_byte_request(bs, sector_num * BDRV_SECTOR_SIZE,
1031eb5a3165SJes Sorensen                                    nb_sectors * BDRV_SECTOR_SIZE);
103271d0770cSaliguori }
103371d0770cSaliguori 
1034e7a8a783SKevin Wolf static inline bool bdrv_has_async_rw(BlockDriver *drv)
1035e7a8a783SKevin Wolf {
1036e7a8a783SKevin Wolf     return drv->bdrv_co_readv != bdrv_co_readv_em
1037e7a8a783SKevin Wolf         || drv->bdrv_aio_readv != bdrv_aio_readv_em;
1038e7a8a783SKevin Wolf }
1039e7a8a783SKevin Wolf 
1040e7a8a783SKevin Wolf static inline bool bdrv_has_async_flush(BlockDriver *drv)
1041e7a8a783SKevin Wolf {
1042e7a8a783SKevin Wolf     return drv->bdrv_aio_flush != bdrv_aio_flush_em;
1043e7a8a783SKevin Wolf }
1044e7a8a783SKevin Wolf 
104519cb3738Sbellard /* return < 0 if error. See bdrv_write() for the return codes */
1046fc01f7e7Sbellard int bdrv_read(BlockDriverState *bs, int64_t sector_num,
1047fc01f7e7Sbellard               uint8_t *buf, int nb_sectors)
1048fc01f7e7Sbellard {
1049ea2384d3Sbellard     BlockDriver *drv = bs->drv;
1050fc01f7e7Sbellard 
105119cb3738Sbellard     if (!drv)
105219cb3738Sbellard         return -ENOMEDIUM;
1053e7a8a783SKevin Wolf 
1054e7a8a783SKevin Wolf     if (bdrv_has_async_rw(drv) && qemu_in_coroutine()) {
1055e7a8a783SKevin Wolf         QEMUIOVector qiov;
1056e7a8a783SKevin Wolf         struct iovec iov = {
1057e7a8a783SKevin Wolf             .iov_base = (void *)buf,
1058e7a8a783SKevin Wolf             .iov_len = nb_sectors * BDRV_SECTOR_SIZE,
1059e7a8a783SKevin Wolf         };
1060e7a8a783SKevin Wolf 
1061e7a8a783SKevin Wolf         qemu_iovec_init_external(&qiov, &iov, 1);
1062e7a8a783SKevin Wolf         return bdrv_co_readv(bs, sector_num, nb_sectors, &qiov);
1063e7a8a783SKevin Wolf     }
1064e7a8a783SKevin Wolf 
106571d0770cSaliguori     if (bdrv_check_request(bs, sector_num, nb_sectors))
106671d0770cSaliguori         return -EIO;
1067b338082bSbellard 
106883f64091Sbellard     return drv->bdrv_read(bs, sector_num, buf, nb_sectors);
106983f64091Sbellard }
1070fc01f7e7Sbellard 
10717cd1e32aSlirans@il.ibm.com static void set_dirty_bitmap(BlockDriverState *bs, int64_t sector_num,
10727cd1e32aSlirans@il.ibm.com                              int nb_sectors, int dirty)
10737cd1e32aSlirans@il.ibm.com {
10747cd1e32aSlirans@il.ibm.com     int64_t start, end;
1075c6d22830SJan Kiszka     unsigned long val, idx, bit;
1076a55eb92cSJan Kiszka 
10776ea44308SJan Kiszka     start = sector_num / BDRV_SECTORS_PER_DIRTY_CHUNK;
1078c6d22830SJan Kiszka     end = (sector_num + nb_sectors - 1) / BDRV_SECTORS_PER_DIRTY_CHUNK;
10797cd1e32aSlirans@il.ibm.com 
10807cd1e32aSlirans@il.ibm.com     for (; start <= end; start++) {
1081c6d22830SJan Kiszka         idx = start / (sizeof(unsigned long) * 8);
1082c6d22830SJan Kiszka         bit = start % (sizeof(unsigned long) * 8);
1083c6d22830SJan Kiszka         val = bs->dirty_bitmap[idx];
1084c6d22830SJan Kiszka         if (dirty) {
10856d59fec1SMarcelo Tosatti             if (!(val & (1UL << bit))) {
1086aaa0eb75SLiran Schour                 bs->dirty_count++;
10876d59fec1SMarcelo Tosatti                 val |= 1UL << bit;
1088aaa0eb75SLiran Schour             }
1089c6d22830SJan Kiszka         } else {
10906d59fec1SMarcelo Tosatti             if (val & (1UL << bit)) {
1091aaa0eb75SLiran Schour                 bs->dirty_count--;
10926d59fec1SMarcelo Tosatti                 val &= ~(1UL << bit);
1093c6d22830SJan Kiszka             }
1094aaa0eb75SLiran Schour         }
1095c6d22830SJan Kiszka         bs->dirty_bitmap[idx] = val;
10967cd1e32aSlirans@il.ibm.com     }
10977cd1e32aSlirans@il.ibm.com }
10987cd1e32aSlirans@il.ibm.com 
109919cb3738Sbellard /* Return < 0 if error. Important errors are:
110019cb3738Sbellard   -EIO         generic I/O error (may happen for all errors)
110119cb3738Sbellard   -ENOMEDIUM   No media inserted.
110219cb3738Sbellard   -EINVAL      Invalid sector number or nb_sectors
110319cb3738Sbellard   -EACCES      Trying to write a read-only device
110419cb3738Sbellard */
1105fc01f7e7Sbellard int bdrv_write(BlockDriverState *bs, int64_t sector_num,
1106fc01f7e7Sbellard                const uint8_t *buf, int nb_sectors)
1107fc01f7e7Sbellard {
110883f64091Sbellard     BlockDriver *drv = bs->drv;
1109e7a8a783SKevin Wolf 
111019cb3738Sbellard     if (!bs->drv)
111119cb3738Sbellard         return -ENOMEDIUM;
1112e7a8a783SKevin Wolf 
1113e7a8a783SKevin Wolf     if (bdrv_has_async_rw(drv) && qemu_in_coroutine()) {
1114e7a8a783SKevin Wolf         QEMUIOVector qiov;
1115e7a8a783SKevin Wolf         struct iovec iov = {
1116e7a8a783SKevin Wolf             .iov_base = (void *)buf,
1117e7a8a783SKevin Wolf             .iov_len = nb_sectors * BDRV_SECTOR_SIZE,
1118e7a8a783SKevin Wolf         };
1119e7a8a783SKevin Wolf 
1120e7a8a783SKevin Wolf         qemu_iovec_init_external(&qiov, &iov, 1);
1121e7a8a783SKevin Wolf         return bdrv_co_writev(bs, sector_num, nb_sectors, &qiov);
1122e7a8a783SKevin Wolf     }
1123e7a8a783SKevin Wolf 
11240849bf08Sbellard     if (bs->read_only)
112519cb3738Sbellard         return -EACCES;
112671d0770cSaliguori     if (bdrv_check_request(bs, sector_num, nb_sectors))
112771d0770cSaliguori         return -EIO;
112871d0770cSaliguori 
1129c6d22830SJan Kiszka     if (bs->dirty_bitmap) {
11307cd1e32aSlirans@il.ibm.com         set_dirty_bitmap(bs, sector_num, nb_sectors, 1);
11317cd1e32aSlirans@il.ibm.com     }
11327cd1e32aSlirans@il.ibm.com 
1133294cc35fSKevin Wolf     if (bs->wr_highest_sector < sector_num + nb_sectors - 1) {
1134294cc35fSKevin Wolf         bs->wr_highest_sector = sector_num + nb_sectors - 1;
1135294cc35fSKevin Wolf     }
1136294cc35fSKevin Wolf 
113783f64091Sbellard     return drv->bdrv_write(bs, sector_num, buf, nb_sectors);
113883f64091Sbellard }
113983f64091Sbellard 
1140eda578e5Saliguori int bdrv_pread(BlockDriverState *bs, int64_t offset,
1141eda578e5Saliguori                void *buf, int count1)
114283f64091Sbellard {
11436ea44308SJan Kiszka     uint8_t tmp_buf[BDRV_SECTOR_SIZE];
114483f64091Sbellard     int len, nb_sectors, count;
114583f64091Sbellard     int64_t sector_num;
11469a8c4cceSKevin Wolf     int ret;
114783f64091Sbellard 
114883f64091Sbellard     count = count1;
114983f64091Sbellard     /* first read to align to sector start */
11506ea44308SJan Kiszka     len = (BDRV_SECTOR_SIZE - offset) & (BDRV_SECTOR_SIZE - 1);
115183f64091Sbellard     if (len > count)
115283f64091Sbellard         len = count;
11536ea44308SJan Kiszka     sector_num = offset >> BDRV_SECTOR_BITS;
115483f64091Sbellard     if (len > 0) {
11559a8c4cceSKevin Wolf         if ((ret = bdrv_read(bs, sector_num, tmp_buf, 1)) < 0)
11569a8c4cceSKevin Wolf             return ret;
11576ea44308SJan Kiszka         memcpy(buf, tmp_buf + (offset & (BDRV_SECTOR_SIZE - 1)), len);
115883f64091Sbellard         count -= len;
115983f64091Sbellard         if (count == 0)
116083f64091Sbellard             return count1;
116183f64091Sbellard         sector_num++;
116283f64091Sbellard         buf += len;
116383f64091Sbellard     }
116483f64091Sbellard 
116583f64091Sbellard     /* read the sectors "in place" */
11666ea44308SJan Kiszka     nb_sectors = count >> BDRV_SECTOR_BITS;
116783f64091Sbellard     if (nb_sectors > 0) {
11689a8c4cceSKevin Wolf         if ((ret = bdrv_read(bs, sector_num, buf, nb_sectors)) < 0)
11699a8c4cceSKevin Wolf             return ret;
117083f64091Sbellard         sector_num += nb_sectors;
11716ea44308SJan Kiszka         len = nb_sectors << BDRV_SECTOR_BITS;
117283f64091Sbellard         buf += len;
117383f64091Sbellard         count -= len;
117483f64091Sbellard     }
117583f64091Sbellard 
117683f64091Sbellard     /* add data from the last sector */
117783f64091Sbellard     if (count > 0) {
11789a8c4cceSKevin Wolf         if ((ret = bdrv_read(bs, sector_num, tmp_buf, 1)) < 0)
11799a8c4cceSKevin Wolf             return ret;
118083f64091Sbellard         memcpy(buf, tmp_buf, count);
118183f64091Sbellard     }
118283f64091Sbellard     return count1;
118383f64091Sbellard }
118483f64091Sbellard 
1185eda578e5Saliguori int bdrv_pwrite(BlockDriverState *bs, int64_t offset,
1186eda578e5Saliguori                 const void *buf, int count1)
118783f64091Sbellard {
11886ea44308SJan Kiszka     uint8_t tmp_buf[BDRV_SECTOR_SIZE];
118983f64091Sbellard     int len, nb_sectors, count;
119083f64091Sbellard     int64_t sector_num;
11919a8c4cceSKevin Wolf     int ret;
119283f64091Sbellard 
119383f64091Sbellard     count = count1;
119483f64091Sbellard     /* first write to align to sector start */
11956ea44308SJan Kiszka     len = (BDRV_SECTOR_SIZE - offset) & (BDRV_SECTOR_SIZE - 1);
119683f64091Sbellard     if (len > count)
119783f64091Sbellard         len = count;
11986ea44308SJan Kiszka     sector_num = offset >> BDRV_SECTOR_BITS;
119983f64091Sbellard     if (len > 0) {
12009a8c4cceSKevin Wolf         if ((ret = bdrv_read(bs, sector_num, tmp_buf, 1)) < 0)
12019a8c4cceSKevin Wolf             return ret;
12026ea44308SJan Kiszka         memcpy(tmp_buf + (offset & (BDRV_SECTOR_SIZE - 1)), buf, len);
12039a8c4cceSKevin Wolf         if ((ret = bdrv_write(bs, sector_num, tmp_buf, 1)) < 0)
12049a8c4cceSKevin Wolf             return ret;
120583f64091Sbellard         count -= len;
120683f64091Sbellard         if (count == 0)
120783f64091Sbellard             return count1;
120883f64091Sbellard         sector_num++;
120983f64091Sbellard         buf += len;
121083f64091Sbellard     }
121183f64091Sbellard 
121283f64091Sbellard     /* write the sectors "in place" */
12136ea44308SJan Kiszka     nb_sectors = count >> BDRV_SECTOR_BITS;
121483f64091Sbellard     if (nb_sectors > 0) {
12159a8c4cceSKevin Wolf         if ((ret = bdrv_write(bs, sector_num, buf, nb_sectors)) < 0)
12169a8c4cceSKevin Wolf             return ret;
121783f64091Sbellard         sector_num += nb_sectors;
12186ea44308SJan Kiszka         len = nb_sectors << BDRV_SECTOR_BITS;
121983f64091Sbellard         buf += len;
122083f64091Sbellard         count -= len;
122183f64091Sbellard     }
122283f64091Sbellard 
122383f64091Sbellard     /* add data from the last sector */
122483f64091Sbellard     if (count > 0) {
12259a8c4cceSKevin Wolf         if ((ret = bdrv_read(bs, sector_num, tmp_buf, 1)) < 0)
12269a8c4cceSKevin Wolf             return ret;
122783f64091Sbellard         memcpy(tmp_buf, buf, count);
12289a8c4cceSKevin Wolf         if ((ret = bdrv_write(bs, sector_num, tmp_buf, 1)) < 0)
12299a8c4cceSKevin Wolf             return ret;
123083f64091Sbellard     }
123183f64091Sbellard     return count1;
123283f64091Sbellard }
123383f64091Sbellard 
1234f08145feSKevin Wolf /*
1235f08145feSKevin Wolf  * Writes to the file and ensures that no writes are reordered across this
1236f08145feSKevin Wolf  * request (acts as a barrier)
1237f08145feSKevin Wolf  *
1238f08145feSKevin Wolf  * Returns 0 on success, -errno in error cases.
1239f08145feSKevin Wolf  */
1240f08145feSKevin Wolf int bdrv_pwrite_sync(BlockDriverState *bs, int64_t offset,
1241f08145feSKevin Wolf     const void *buf, int count)
1242f08145feSKevin Wolf {
1243f08145feSKevin Wolf     int ret;
1244f08145feSKevin Wolf 
1245f08145feSKevin Wolf     ret = bdrv_pwrite(bs, offset, buf, count);
1246f08145feSKevin Wolf     if (ret < 0) {
1247f08145feSKevin Wolf         return ret;
1248f08145feSKevin Wolf     }
1249f08145feSKevin Wolf 
125092196b2fSStefan Hajnoczi     /* No flush needed for cache modes that use O_DSYNC */
125192196b2fSStefan Hajnoczi     if ((bs->open_flags & BDRV_O_CACHE_WB) != 0) {
1252f08145feSKevin Wolf         bdrv_flush(bs);
1253f08145feSKevin Wolf     }
1254f08145feSKevin Wolf 
1255f08145feSKevin Wolf     return 0;
1256f08145feSKevin Wolf }
1257f08145feSKevin Wolf 
1258*c5fbe571SStefan Hajnoczi /*
1259*c5fbe571SStefan Hajnoczi  * Handle a read request in coroutine context
1260*c5fbe571SStefan Hajnoczi  */
1261*c5fbe571SStefan Hajnoczi static int coroutine_fn bdrv_co_do_readv(BlockDriverState *bs,
1262*c5fbe571SStefan Hajnoczi     int64_t sector_num, int nb_sectors, QEMUIOVector *qiov)
1263da1fa91dSKevin Wolf {
1264da1fa91dSKevin Wolf     BlockDriver *drv = bs->drv;
1265da1fa91dSKevin Wolf 
1266da1fa91dSKevin Wolf     if (!drv) {
1267da1fa91dSKevin Wolf         return -ENOMEDIUM;
1268da1fa91dSKevin Wolf     }
1269da1fa91dSKevin Wolf     if (bdrv_check_request(bs, sector_num, nb_sectors)) {
1270da1fa91dSKevin Wolf         return -EIO;
1271da1fa91dSKevin Wolf     }
1272da1fa91dSKevin Wolf 
1273da1fa91dSKevin Wolf     return drv->bdrv_co_readv(bs, sector_num, nb_sectors, qiov);
1274da1fa91dSKevin Wolf }
1275da1fa91dSKevin Wolf 
1276*c5fbe571SStefan Hajnoczi int coroutine_fn bdrv_co_readv(BlockDriverState *bs, int64_t sector_num,
1277da1fa91dSKevin Wolf     int nb_sectors, QEMUIOVector *qiov)
1278da1fa91dSKevin Wolf {
1279*c5fbe571SStefan Hajnoczi     trace_bdrv_co_readv(bs, sector_num, nb_sectors);
1280da1fa91dSKevin Wolf 
1281*c5fbe571SStefan Hajnoczi     return bdrv_co_do_readv(bs, sector_num, nb_sectors, qiov);
1282*c5fbe571SStefan Hajnoczi }
1283*c5fbe571SStefan Hajnoczi 
1284*c5fbe571SStefan Hajnoczi /*
1285*c5fbe571SStefan Hajnoczi  * Handle a write request in coroutine context
1286*c5fbe571SStefan Hajnoczi  */
1287*c5fbe571SStefan Hajnoczi static int coroutine_fn bdrv_co_do_writev(BlockDriverState *bs,
1288*c5fbe571SStefan Hajnoczi     int64_t sector_num, int nb_sectors, QEMUIOVector *qiov)
1289*c5fbe571SStefan Hajnoczi {
1290*c5fbe571SStefan Hajnoczi     BlockDriver *drv = bs->drv;
1291da1fa91dSKevin Wolf 
1292da1fa91dSKevin Wolf     if (!bs->drv) {
1293da1fa91dSKevin Wolf         return -ENOMEDIUM;
1294da1fa91dSKevin Wolf     }
1295da1fa91dSKevin Wolf     if (bs->read_only) {
1296da1fa91dSKevin Wolf         return -EACCES;
1297da1fa91dSKevin Wolf     }
1298da1fa91dSKevin Wolf     if (bdrv_check_request(bs, sector_num, nb_sectors)) {
1299da1fa91dSKevin Wolf         return -EIO;
1300da1fa91dSKevin Wolf     }
1301da1fa91dSKevin Wolf 
1302da1fa91dSKevin Wolf     if (bs->dirty_bitmap) {
1303da1fa91dSKevin Wolf         set_dirty_bitmap(bs, sector_num, nb_sectors, 1);
1304da1fa91dSKevin Wolf     }
1305da1fa91dSKevin Wolf 
1306da1fa91dSKevin Wolf     if (bs->wr_highest_sector < sector_num + nb_sectors - 1) {
1307da1fa91dSKevin Wolf         bs->wr_highest_sector = sector_num + nb_sectors - 1;
1308da1fa91dSKevin Wolf     }
1309da1fa91dSKevin Wolf 
1310da1fa91dSKevin Wolf     return drv->bdrv_co_writev(bs, sector_num, nb_sectors, qiov);
1311da1fa91dSKevin Wolf }
1312da1fa91dSKevin Wolf 
1313*c5fbe571SStefan Hajnoczi int coroutine_fn bdrv_co_writev(BlockDriverState *bs, int64_t sector_num,
1314*c5fbe571SStefan Hajnoczi     int nb_sectors, QEMUIOVector *qiov)
1315*c5fbe571SStefan Hajnoczi {
1316*c5fbe571SStefan Hajnoczi     trace_bdrv_co_writev(bs, sector_num, nb_sectors);
1317*c5fbe571SStefan Hajnoczi 
1318*c5fbe571SStefan Hajnoczi     return bdrv_co_do_writev(bs, sector_num, nb_sectors, qiov);
1319*c5fbe571SStefan Hajnoczi }
1320*c5fbe571SStefan Hajnoczi 
132183f64091Sbellard /**
132283f64091Sbellard  * Truncate file to 'offset' bytes (needed only for file protocols)
132383f64091Sbellard  */
132483f64091Sbellard int bdrv_truncate(BlockDriverState *bs, int64_t offset)
132583f64091Sbellard {
132683f64091Sbellard     BlockDriver *drv = bs->drv;
132751762288SStefan Hajnoczi     int ret;
132883f64091Sbellard     if (!drv)
132919cb3738Sbellard         return -ENOMEDIUM;
133083f64091Sbellard     if (!drv->bdrv_truncate)
133183f64091Sbellard         return -ENOTSUP;
133259f2689dSNaphtali Sprei     if (bs->read_only)
133359f2689dSNaphtali Sprei         return -EACCES;
13348591675fSMarcelo Tosatti     if (bdrv_in_use(bs))
13358591675fSMarcelo Tosatti         return -EBUSY;
133651762288SStefan Hajnoczi     ret = drv->bdrv_truncate(bs, offset);
133751762288SStefan Hajnoczi     if (ret == 0) {
133851762288SStefan Hajnoczi         ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS);
1339145feb17SMarkus Armbruster         bdrv_dev_resize_cb(bs);
134051762288SStefan Hajnoczi     }
134151762288SStefan Hajnoczi     return ret;
134283f64091Sbellard }
134383f64091Sbellard 
134483f64091Sbellard /**
13454a1d5e1fSFam Zheng  * Length of a allocated file in bytes. Sparse files are counted by actual
13464a1d5e1fSFam Zheng  * allocated space. Return < 0 if error or unknown.
13474a1d5e1fSFam Zheng  */
13484a1d5e1fSFam Zheng int64_t bdrv_get_allocated_file_size(BlockDriverState *bs)
13494a1d5e1fSFam Zheng {
13504a1d5e1fSFam Zheng     BlockDriver *drv = bs->drv;
13514a1d5e1fSFam Zheng     if (!drv) {
13524a1d5e1fSFam Zheng         return -ENOMEDIUM;
13534a1d5e1fSFam Zheng     }
13544a1d5e1fSFam Zheng     if (drv->bdrv_get_allocated_file_size) {
13554a1d5e1fSFam Zheng         return drv->bdrv_get_allocated_file_size(bs);
13564a1d5e1fSFam Zheng     }
13574a1d5e1fSFam Zheng     if (bs->file) {
13584a1d5e1fSFam Zheng         return bdrv_get_allocated_file_size(bs->file);
13594a1d5e1fSFam Zheng     }
13604a1d5e1fSFam Zheng     return -ENOTSUP;
13614a1d5e1fSFam Zheng }
13624a1d5e1fSFam Zheng 
13634a1d5e1fSFam Zheng /**
136483f64091Sbellard  * Length of a file in bytes. Return < 0 if error or unknown.
136583f64091Sbellard  */
136683f64091Sbellard int64_t bdrv_getlength(BlockDriverState *bs)
136783f64091Sbellard {
136883f64091Sbellard     BlockDriver *drv = bs->drv;
136983f64091Sbellard     if (!drv)
137019cb3738Sbellard         return -ENOMEDIUM;
137151762288SStefan Hajnoczi 
13722c6942faSMarkus Armbruster     if (bs->growable || bdrv_dev_has_removable_media(bs)) {
137346a4e4e6SStefan Hajnoczi         if (drv->bdrv_getlength) {
137483f64091Sbellard             return drv->bdrv_getlength(bs);
1375fc01f7e7Sbellard         }
137646a4e4e6SStefan Hajnoczi     }
137746a4e4e6SStefan Hajnoczi     return bs->total_sectors * BDRV_SECTOR_SIZE;
137846a4e4e6SStefan Hajnoczi }
1379fc01f7e7Sbellard 
138019cb3738Sbellard /* return 0 as number of sectors if no device present or error */
138196b8f136Sths void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
1382fc01f7e7Sbellard {
138319cb3738Sbellard     int64_t length;
138419cb3738Sbellard     length = bdrv_getlength(bs);
138519cb3738Sbellard     if (length < 0)
138619cb3738Sbellard         length = 0;
138719cb3738Sbellard     else
13886ea44308SJan Kiszka         length = length >> BDRV_SECTOR_BITS;
138919cb3738Sbellard     *nb_sectors_ptr = length;
1390fc01f7e7Sbellard }
1391cf98951bSbellard 
/*
 * One packed 16-byte partition entry, as read from the MSDOS partition table
 * by guess_disk_lchs(). The 32-bit fields are converted with le32_to_cpu()
 * before use there.
 */
struct partition {
    uint8_t boot_ind;       /* 0x80 - active */
    uint8_t head;           /* starting head */
    uint8_t sector;         /* starting sector */
    uint8_t cyl;            /* starting cylinder */
    uint8_t sys_ind;        /* partition type */
    uint8_t end_head;       /* end head */
    uint8_t end_sector;     /* end sector */
    uint8_t end_cyl;        /* end cylinder */
    uint32_t start_sect;    /* starting sector counting from 0 */
    uint32_t nr_sects;      /* number of sectors in partition */
} QEMU_PACKED;
1404f3d54fc4Saliguori 
1405f3d54fc4Saliguori /* try to guess the disk logical geometry from the MSDOS partition table. Return 0 if OK, -1 if could not guess */
1406f3d54fc4Saliguori static int guess_disk_lchs(BlockDriverState *bs,
1407f3d54fc4Saliguori                            int *pcylinders, int *pheads, int *psectors)
1408f3d54fc4Saliguori {
1409eb5a3165SJes Sorensen     uint8_t buf[BDRV_SECTOR_SIZE];
1410f3d54fc4Saliguori     int ret, i, heads, sectors, cylinders;
1411f3d54fc4Saliguori     struct partition *p;
1412f3d54fc4Saliguori     uint32_t nr_sects;
1413a38131b6Sblueswir1     uint64_t nb_sectors;
1414f3d54fc4Saliguori 
1415f3d54fc4Saliguori     bdrv_get_geometry(bs, &nb_sectors);
1416f3d54fc4Saliguori 
1417f3d54fc4Saliguori     ret = bdrv_read(bs, 0, buf, 1);
1418f3d54fc4Saliguori     if (ret < 0)
1419f3d54fc4Saliguori         return -1;
1420f3d54fc4Saliguori     /* test msdos magic */
1421f3d54fc4Saliguori     if (buf[510] != 0x55 || buf[511] != 0xaa)
1422f3d54fc4Saliguori         return -1;
1423f3d54fc4Saliguori     for(i = 0; i < 4; i++) {
1424f3d54fc4Saliguori         p = ((struct partition *)(buf + 0x1be)) + i;
1425f3d54fc4Saliguori         nr_sects = le32_to_cpu(p->nr_sects);
1426f3d54fc4Saliguori         if (nr_sects && p->end_head) {
1427f3d54fc4Saliguori             /* We make the assumption that the partition terminates on
1428f3d54fc4Saliguori                a cylinder boundary */
1429f3d54fc4Saliguori             heads = p->end_head + 1;
1430f3d54fc4Saliguori             sectors = p->end_sector & 63;
1431f3d54fc4Saliguori             if (sectors == 0)
1432f3d54fc4Saliguori                 continue;
1433f3d54fc4Saliguori             cylinders = nb_sectors / (heads * sectors);
1434f3d54fc4Saliguori             if (cylinders < 1 || cylinders > 16383)
1435f3d54fc4Saliguori                 continue;
1436f3d54fc4Saliguori             *pheads = heads;
1437f3d54fc4Saliguori             *psectors = sectors;
1438f3d54fc4Saliguori             *pcylinders = cylinders;
1439f3d54fc4Saliguori #if 0
1440f3d54fc4Saliguori             printf("guessed geometry: LCHS=%d %d %d\n",
1441f3d54fc4Saliguori                    cylinders, heads, sectors);
1442f3d54fc4Saliguori #endif
1443f3d54fc4Saliguori             return 0;
1444f3d54fc4Saliguori         }
1445f3d54fc4Saliguori     }
1446f3d54fc4Saliguori     return -1;
1447f3d54fc4Saliguori }
1448f3d54fc4Saliguori 
1449f3d54fc4Saliguori void bdrv_guess_geometry(BlockDriverState *bs, int *pcyls, int *pheads, int *psecs)
1450f3d54fc4Saliguori {
1451f3d54fc4Saliguori     int translation, lba_detected = 0;
1452f3d54fc4Saliguori     int cylinders, heads, secs;
1453a38131b6Sblueswir1     uint64_t nb_sectors;
1454f3d54fc4Saliguori 
1455f3d54fc4Saliguori     /* if a geometry hint is available, use it */
1456f3d54fc4Saliguori     bdrv_get_geometry(bs, &nb_sectors);
1457f3d54fc4Saliguori     bdrv_get_geometry_hint(bs, &cylinders, &heads, &secs);
1458f3d54fc4Saliguori     translation = bdrv_get_translation_hint(bs);
1459f3d54fc4Saliguori     if (cylinders != 0) {
1460f3d54fc4Saliguori         *pcyls = cylinders;
1461f3d54fc4Saliguori         *pheads = heads;
1462f3d54fc4Saliguori         *psecs = secs;
1463f3d54fc4Saliguori     } else {
1464f3d54fc4Saliguori         if (guess_disk_lchs(bs, &cylinders, &heads, &secs) == 0) {
1465f3d54fc4Saliguori             if (heads > 16) {
1466f3d54fc4Saliguori                 /* if heads > 16, it means that a BIOS LBA
1467f3d54fc4Saliguori                    translation was active, so the default
1468f3d54fc4Saliguori                    hardware geometry is OK */
1469f3d54fc4Saliguori                 lba_detected = 1;
1470f3d54fc4Saliguori                 goto default_geometry;
1471f3d54fc4Saliguori             } else {
1472f3d54fc4Saliguori                 *pcyls = cylinders;
1473f3d54fc4Saliguori                 *pheads = heads;
1474f3d54fc4Saliguori                 *psecs = secs;
1475f3d54fc4Saliguori                 /* disable any translation to be in sync with
1476f3d54fc4Saliguori                    the logical geometry */
1477f3d54fc4Saliguori                 if (translation == BIOS_ATA_TRANSLATION_AUTO) {
1478f3d54fc4Saliguori                     bdrv_set_translation_hint(bs,
1479f3d54fc4Saliguori                                               BIOS_ATA_TRANSLATION_NONE);
1480f3d54fc4Saliguori                 }
1481f3d54fc4Saliguori             }
1482f3d54fc4Saliguori         } else {
1483f3d54fc4Saliguori         default_geometry:
1484f3d54fc4Saliguori             /* if no geometry, use a standard physical disk geometry */
1485f3d54fc4Saliguori             cylinders = nb_sectors / (16 * 63);
1486f3d54fc4Saliguori 
1487f3d54fc4Saliguori             if (cylinders > 16383)
1488f3d54fc4Saliguori                 cylinders = 16383;
1489f3d54fc4Saliguori             else if (cylinders < 2)
1490f3d54fc4Saliguori                 cylinders = 2;
1491f3d54fc4Saliguori             *pcyls = cylinders;
1492f3d54fc4Saliguori             *pheads = 16;
1493f3d54fc4Saliguori             *psecs = 63;
1494f3d54fc4Saliguori             if ((lba_detected == 1) && (translation == BIOS_ATA_TRANSLATION_AUTO)) {
1495f3d54fc4Saliguori                 if ((*pcyls * *pheads) <= 131072) {
1496f3d54fc4Saliguori                     bdrv_set_translation_hint(bs,
1497f3d54fc4Saliguori                                               BIOS_ATA_TRANSLATION_LARGE);
1498f3d54fc4Saliguori                 } else {
1499f3d54fc4Saliguori                     bdrv_set_translation_hint(bs,
1500f3d54fc4Saliguori                                               BIOS_ATA_TRANSLATION_LBA);
1501f3d54fc4Saliguori                 }
1502f3d54fc4Saliguori             }
1503f3d54fc4Saliguori         }
1504f3d54fc4Saliguori         bdrv_set_geometry_hint(bs, *pcyls, *pheads, *psecs);
1505f3d54fc4Saliguori     }
1506f3d54fc4Saliguori }
1507f3d54fc4Saliguori 
1508b338082bSbellard void bdrv_set_geometry_hint(BlockDriverState *bs,
1509b338082bSbellard                             int cyls, int heads, int secs)
1510b338082bSbellard {
1511b338082bSbellard     bs->cyls = cyls;
1512b338082bSbellard     bs->heads = heads;
1513b338082bSbellard     bs->secs = secs;
1514b338082bSbellard }
1515b338082bSbellard 
151646d4767dSbellard void bdrv_set_translation_hint(BlockDriverState *bs, int translation)
151746d4767dSbellard {
151846d4767dSbellard     bs->translation = translation;
151946d4767dSbellard }
152046d4767dSbellard 
1521b338082bSbellard void bdrv_get_geometry_hint(BlockDriverState *bs,
1522b338082bSbellard                             int *pcyls, int *pheads, int *psecs)
1523b338082bSbellard {
1524b338082bSbellard     *pcyls = bs->cyls;
1525b338082bSbellard     *pheads = bs->heads;
1526b338082bSbellard     *psecs = bs->secs;
1527b338082bSbellard }
1528b338082bSbellard 
15295bbdbb46SBlue Swirl /* Recognize floppy formats */
15305bbdbb46SBlue Swirl typedef struct FDFormat {
15315bbdbb46SBlue Swirl     FDriveType drive;
15325bbdbb46SBlue Swirl     uint8_t last_sect;
15335bbdbb46SBlue Swirl     uint8_t max_track;
15345bbdbb46SBlue Swirl     uint8_t max_head;
15355bbdbb46SBlue Swirl } FDFormat;
15365bbdbb46SBlue Swirl 
15375bbdbb46SBlue Swirl static const FDFormat fd_formats[] = {
15385bbdbb46SBlue Swirl     /* First entry is default format */
15395bbdbb46SBlue Swirl     /* 1.44 MB 3"1/2 floppy disks */
15405bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 18, 80, 1, },
15415bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 20, 80, 1, },
15425bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 21, 80, 1, },
15435bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 21, 82, 1, },
15445bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 21, 83, 1, },
15455bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 22, 80, 1, },
15465bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 23, 80, 1, },
15475bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 24, 80, 1, },
15485bbdbb46SBlue Swirl     /* 2.88 MB 3"1/2 floppy disks */
15495bbdbb46SBlue Swirl     { FDRIVE_DRV_288, 36, 80, 1, },
15505bbdbb46SBlue Swirl     { FDRIVE_DRV_288, 39, 80, 1, },
15515bbdbb46SBlue Swirl     { FDRIVE_DRV_288, 40, 80, 1, },
15525bbdbb46SBlue Swirl     { FDRIVE_DRV_288, 44, 80, 1, },
15535bbdbb46SBlue Swirl     { FDRIVE_DRV_288, 48, 80, 1, },
15545bbdbb46SBlue Swirl     /* 720 kB 3"1/2 floppy disks */
15555bbdbb46SBlue Swirl     { FDRIVE_DRV_144,  9, 80, 1, },
15565bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 10, 80, 1, },
15575bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 10, 82, 1, },
15585bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 10, 83, 1, },
15595bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 13, 80, 1, },
15605bbdbb46SBlue Swirl     { FDRIVE_DRV_144, 14, 80, 1, },
15615bbdbb46SBlue Swirl     /* 1.2 MB 5"1/4 floppy disks */
15625bbdbb46SBlue Swirl     { FDRIVE_DRV_120, 15, 80, 1, },
15635bbdbb46SBlue Swirl     { FDRIVE_DRV_120, 18, 80, 1, },
15645bbdbb46SBlue Swirl     { FDRIVE_DRV_120, 18, 82, 1, },
15655bbdbb46SBlue Swirl     { FDRIVE_DRV_120, 18, 83, 1, },
15665bbdbb46SBlue Swirl     { FDRIVE_DRV_120, 20, 80, 1, },
15675bbdbb46SBlue Swirl     /* 720 kB 5"1/4 floppy disks */
15685bbdbb46SBlue Swirl     { FDRIVE_DRV_120,  9, 80, 1, },
15695bbdbb46SBlue Swirl     { FDRIVE_DRV_120, 11, 80, 1, },
15705bbdbb46SBlue Swirl     /* 360 kB 5"1/4 floppy disks */
15715bbdbb46SBlue Swirl     { FDRIVE_DRV_120,  9, 40, 1, },
15725bbdbb46SBlue Swirl     { FDRIVE_DRV_120,  9, 40, 0, },
15735bbdbb46SBlue Swirl     { FDRIVE_DRV_120, 10, 41, 1, },
15745bbdbb46SBlue Swirl     { FDRIVE_DRV_120, 10, 42, 1, },
15755bbdbb46SBlue Swirl     /* 320 kB 5"1/4 floppy disks */
15765bbdbb46SBlue Swirl     { FDRIVE_DRV_120,  8, 40, 1, },
15775bbdbb46SBlue Swirl     { FDRIVE_DRV_120,  8, 40, 0, },
15785bbdbb46SBlue Swirl     /* 360 kB must match 5"1/4 better than 3"1/2... */
15795bbdbb46SBlue Swirl     { FDRIVE_DRV_144,  9, 80, 0, },
15805bbdbb46SBlue Swirl     /* end */
15815bbdbb46SBlue Swirl     { FDRIVE_DRV_NONE, -1, -1, 0, },
15825bbdbb46SBlue Swirl };
15835bbdbb46SBlue Swirl 
15845bbdbb46SBlue Swirl void bdrv_get_floppy_geometry_hint(BlockDriverState *bs, int *nb_heads,
15855bbdbb46SBlue Swirl                                    int *max_track, int *last_sect,
15865bbdbb46SBlue Swirl                                    FDriveType drive_in, FDriveType *drive)
15875bbdbb46SBlue Swirl {
15885bbdbb46SBlue Swirl     const FDFormat *parse;
15895bbdbb46SBlue Swirl     uint64_t nb_sectors, size;
15905bbdbb46SBlue Swirl     int i, first_match, match;
15915bbdbb46SBlue Swirl 
15925bbdbb46SBlue Swirl     bdrv_get_geometry_hint(bs, nb_heads, max_track, last_sect);
15935bbdbb46SBlue Swirl     if (*nb_heads != 0 && *max_track != 0 && *last_sect != 0) {
15945bbdbb46SBlue Swirl         /* User defined disk */
15955bbdbb46SBlue Swirl     } else {
15965bbdbb46SBlue Swirl         bdrv_get_geometry(bs, &nb_sectors);
15975bbdbb46SBlue Swirl         match = -1;
15985bbdbb46SBlue Swirl         first_match = -1;
15995bbdbb46SBlue Swirl         for (i = 0; ; i++) {
16005bbdbb46SBlue Swirl             parse = &fd_formats[i];
16015bbdbb46SBlue Swirl             if (parse->drive == FDRIVE_DRV_NONE) {
16025bbdbb46SBlue Swirl                 break;
16035bbdbb46SBlue Swirl             }
16045bbdbb46SBlue Swirl             if (drive_in == parse->drive ||
16055bbdbb46SBlue Swirl                 drive_in == FDRIVE_DRV_NONE) {
16065bbdbb46SBlue Swirl                 size = (parse->max_head + 1) * parse->max_track *
16075bbdbb46SBlue Swirl                     parse->last_sect;
16085bbdbb46SBlue Swirl                 if (nb_sectors == size) {
16095bbdbb46SBlue Swirl                     match = i;
16105bbdbb46SBlue Swirl                     break;
16115bbdbb46SBlue Swirl                 }
16125bbdbb46SBlue Swirl                 if (first_match == -1) {
16135bbdbb46SBlue Swirl                     first_match = i;
16145bbdbb46SBlue Swirl                 }
16155bbdbb46SBlue Swirl             }
16165bbdbb46SBlue Swirl         }
16175bbdbb46SBlue Swirl         if (match == -1) {
16185bbdbb46SBlue Swirl             if (first_match == -1) {
16195bbdbb46SBlue Swirl                 match = 1;
16205bbdbb46SBlue Swirl             } else {
16215bbdbb46SBlue Swirl                 match = first_match;
16225bbdbb46SBlue Swirl             }
16235bbdbb46SBlue Swirl             parse = &fd_formats[match];
16245bbdbb46SBlue Swirl         }
16255bbdbb46SBlue Swirl         *nb_heads = parse->max_head + 1;
16265bbdbb46SBlue Swirl         *max_track = parse->max_track;
16275bbdbb46SBlue Swirl         *last_sect = parse->last_sect;
16285bbdbb46SBlue Swirl         *drive = parse->drive;
16295bbdbb46SBlue Swirl     }
16305bbdbb46SBlue Swirl }
16315bbdbb46SBlue Swirl 
163246d4767dSbellard int bdrv_get_translation_hint(BlockDriverState *bs)
163346d4767dSbellard {
163446d4767dSbellard     return bs->translation;
163546d4767dSbellard }
163646d4767dSbellard 
1637abd7f68dSMarkus Armbruster void bdrv_set_on_error(BlockDriverState *bs, BlockErrorAction on_read_error,
1638abd7f68dSMarkus Armbruster                        BlockErrorAction on_write_error)
1639abd7f68dSMarkus Armbruster {
1640abd7f68dSMarkus Armbruster     bs->on_read_error = on_read_error;
1641abd7f68dSMarkus Armbruster     bs->on_write_error = on_write_error;
1642abd7f68dSMarkus Armbruster }
1643abd7f68dSMarkus Armbruster 
1644abd7f68dSMarkus Armbruster BlockErrorAction bdrv_get_on_error(BlockDriverState *bs, int is_read)
1645abd7f68dSMarkus Armbruster {
1646abd7f68dSMarkus Armbruster     return is_read ? bs->on_read_error : bs->on_write_error;
1647abd7f68dSMarkus Armbruster }
1648abd7f68dSMarkus Armbruster 
1649b338082bSbellard int bdrv_is_read_only(BlockDriverState *bs)
1650b338082bSbellard {
1651b338082bSbellard     return bs->read_only;
1652b338082bSbellard }
1653b338082bSbellard 
1654985a03b0Sths int bdrv_is_sg(BlockDriverState *bs)
1655985a03b0Sths {
1656985a03b0Sths     return bs->sg;
1657985a03b0Sths }
1658985a03b0Sths 
1659e900a7b7SChristoph Hellwig int bdrv_enable_write_cache(BlockDriverState *bs)
1660e900a7b7SChristoph Hellwig {
1661e900a7b7SChristoph Hellwig     return bs->enable_write_cache;
1662e900a7b7SChristoph Hellwig }
1663e900a7b7SChristoph Hellwig 
1664ea2384d3Sbellard int bdrv_is_encrypted(BlockDriverState *bs)
1665ea2384d3Sbellard {
1666ea2384d3Sbellard     if (bs->backing_hd && bs->backing_hd->encrypted)
1667ea2384d3Sbellard         return 1;
1668ea2384d3Sbellard     return bs->encrypted;
1669ea2384d3Sbellard }
1670ea2384d3Sbellard 
1671c0f4ce77Saliguori int bdrv_key_required(BlockDriverState *bs)
1672c0f4ce77Saliguori {
1673c0f4ce77Saliguori     BlockDriverState *backing_hd = bs->backing_hd;
1674c0f4ce77Saliguori 
1675c0f4ce77Saliguori     if (backing_hd && backing_hd->encrypted && !backing_hd->valid_key)
1676c0f4ce77Saliguori         return 1;
1677c0f4ce77Saliguori     return (bs->encrypted && !bs->valid_key);
1678c0f4ce77Saliguori }
1679c0f4ce77Saliguori 
1680ea2384d3Sbellard int bdrv_set_key(BlockDriverState *bs, const char *key)
1681ea2384d3Sbellard {
1682ea2384d3Sbellard     int ret;
1683ea2384d3Sbellard     if (bs->backing_hd && bs->backing_hd->encrypted) {
1684ea2384d3Sbellard         ret = bdrv_set_key(bs->backing_hd, key);
1685ea2384d3Sbellard         if (ret < 0)
1686ea2384d3Sbellard             return ret;
1687ea2384d3Sbellard         if (!bs->encrypted)
1688ea2384d3Sbellard             return 0;
1689ea2384d3Sbellard     }
1690fd04a2aeSShahar Havivi     if (!bs->encrypted) {
1691fd04a2aeSShahar Havivi         return -EINVAL;
1692fd04a2aeSShahar Havivi     } else if (!bs->drv || !bs->drv->bdrv_set_key) {
1693fd04a2aeSShahar Havivi         return -ENOMEDIUM;
1694fd04a2aeSShahar Havivi     }
1695c0f4ce77Saliguori     ret = bs->drv->bdrv_set_key(bs, key);
1696bb5fc20fSaliguori     if (ret < 0) {
1697bb5fc20fSaliguori         bs->valid_key = 0;
1698bb5fc20fSaliguori     } else if (!bs->valid_key) {
1699bb5fc20fSaliguori         bs->valid_key = 1;
1700bb5fc20fSaliguori         /* call the change callback now, we skipped it on open */
17017d4b4ba5SMarkus Armbruster         bdrv_dev_change_media_cb(bs, true);
1702bb5fc20fSaliguori     }
1703c0f4ce77Saliguori     return ret;
1704ea2384d3Sbellard }
1705ea2384d3Sbellard 
1706ea2384d3Sbellard void bdrv_get_format(BlockDriverState *bs, char *buf, int buf_size)
1707ea2384d3Sbellard {
170819cb3738Sbellard     if (!bs->drv) {
1709ea2384d3Sbellard         buf[0] = '\0';
1710ea2384d3Sbellard     } else {
1711ea2384d3Sbellard         pstrcpy(buf, buf_size, bs->drv->format_name);
1712ea2384d3Sbellard     }
1713ea2384d3Sbellard }
1714ea2384d3Sbellard 
1715ea2384d3Sbellard void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
1716ea2384d3Sbellard                          void *opaque)
1717ea2384d3Sbellard {
1718ea2384d3Sbellard     BlockDriver *drv;
1719ea2384d3Sbellard 
17208a22f02aSStefan Hajnoczi     QLIST_FOREACH(drv, &bdrv_drivers, list) {
1721ea2384d3Sbellard         it(opaque, drv->format_name);
1722ea2384d3Sbellard     }
1723ea2384d3Sbellard }
1724ea2384d3Sbellard 
1725b338082bSbellard BlockDriverState *bdrv_find(const char *name)
1726b338082bSbellard {
1727b338082bSbellard     BlockDriverState *bs;
1728b338082bSbellard 
17291b7bdbc1SStefan Hajnoczi     QTAILQ_FOREACH(bs, &bdrv_states, list) {
17301b7bdbc1SStefan Hajnoczi         if (!strcmp(name, bs->device_name)) {
1731b338082bSbellard             return bs;
1732b338082bSbellard         }
17331b7bdbc1SStefan Hajnoczi     }
1734b338082bSbellard     return NULL;
1735b338082bSbellard }
1736b338082bSbellard 
17372f399b0aSMarkus Armbruster BlockDriverState *bdrv_next(BlockDriverState *bs)
17382f399b0aSMarkus Armbruster {
17392f399b0aSMarkus Armbruster     if (!bs) {
17402f399b0aSMarkus Armbruster         return QTAILQ_FIRST(&bdrv_states);
17412f399b0aSMarkus Armbruster     }
17422f399b0aSMarkus Armbruster     return QTAILQ_NEXT(bs, list);
17432f399b0aSMarkus Armbruster }
17442f399b0aSMarkus Armbruster 
174551de9760Saliguori void bdrv_iterate(void (*it)(void *opaque, BlockDriverState *bs), void *opaque)
174681d0912dSbellard {
174781d0912dSbellard     BlockDriverState *bs;
174881d0912dSbellard 
17491b7bdbc1SStefan Hajnoczi     QTAILQ_FOREACH(bs, &bdrv_states, list) {
175051de9760Saliguori         it(opaque, bs);
175181d0912dSbellard     }
175281d0912dSbellard }
175381d0912dSbellard 
1754ea2384d3Sbellard const char *bdrv_get_device_name(BlockDriverState *bs)
1755ea2384d3Sbellard {
1756ea2384d3Sbellard     return bs->device_name;
1757ea2384d3Sbellard }
1758ea2384d3Sbellard 
1759205ef796SKevin Wolf int bdrv_flush(BlockDriverState *bs)
17607a6cba61Spbrook {
1761016f5cf6SAlexander Graf     if (bs->open_flags & BDRV_O_NO_FLUSH) {
1762205ef796SKevin Wolf         return 0;
1763016f5cf6SAlexander Graf     }
1764016f5cf6SAlexander Graf 
1765e7a8a783SKevin Wolf     if (bs->drv && bdrv_has_async_flush(bs->drv) && qemu_in_coroutine()) {
1766e7a8a783SKevin Wolf         return bdrv_co_flush_em(bs);
1767e7a8a783SKevin Wolf     }
1768e7a8a783SKevin Wolf 
1769205ef796SKevin Wolf     if (bs->drv && bs->drv->bdrv_flush) {
1770205ef796SKevin Wolf         return bs->drv->bdrv_flush(bs);
1771205ef796SKevin Wolf     }
1772205ef796SKevin Wolf 
1773205ef796SKevin Wolf     /*
1774205ef796SKevin Wolf      * Some block drivers always operate in either writethrough or unsafe mode
1775205ef796SKevin Wolf      * and don't support bdrv_flush therefore. Usually qemu doesn't know how
1776205ef796SKevin Wolf      * the server works (because the behaviour is hardcoded or depends on
1777205ef796SKevin Wolf      * server-side configuration), so we can't ensure that everything is safe
1778205ef796SKevin Wolf      * on disk. Returning an error doesn't work because that would break guests
1779205ef796SKevin Wolf      * even if the server operates in writethrough mode.
1780205ef796SKevin Wolf      *
1781205ef796SKevin Wolf      * Let's hope the user knows what he's doing.
1782205ef796SKevin Wolf      */
1783205ef796SKevin Wolf     return 0;
17847a6cba61Spbrook }
17857a6cba61Spbrook 
1786c6ca28d6Saliguori void bdrv_flush_all(void)
1787c6ca28d6Saliguori {
1788c6ca28d6Saliguori     BlockDriverState *bs;
1789c6ca28d6Saliguori 
17901b7bdbc1SStefan Hajnoczi     QTAILQ_FOREACH(bs, &bdrv_states, list) {
1791c602a489SMarkus Armbruster         if (!bdrv_is_read_only(bs) && bdrv_is_inserted(bs)) {
1792c6ca28d6Saliguori             bdrv_flush(bs);
1793c6ca28d6Saliguori         }
17941b7bdbc1SStefan Hajnoczi     }
17951b7bdbc1SStefan Hajnoczi }
1796c6ca28d6Saliguori 
1797f2feebbdSKevin Wolf int bdrv_has_zero_init(BlockDriverState *bs)
1798f2feebbdSKevin Wolf {
1799f2feebbdSKevin Wolf     assert(bs->drv);
1800f2feebbdSKevin Wolf 
1801336c1c12SKevin Wolf     if (bs->drv->bdrv_has_zero_init) {
1802336c1c12SKevin Wolf         return bs->drv->bdrv_has_zero_init(bs);
1803f2feebbdSKevin Wolf     }
1804f2feebbdSKevin Wolf 
1805f2feebbdSKevin Wolf     return 1;
1806f2feebbdSKevin Wolf }
1807f2feebbdSKevin Wolf 
1808bb8bf76fSChristoph Hellwig int bdrv_discard(BlockDriverState *bs, int64_t sector_num, int nb_sectors)
1809bb8bf76fSChristoph Hellwig {
1810bb8bf76fSChristoph Hellwig     if (!bs->drv) {
1811bb8bf76fSChristoph Hellwig         return -ENOMEDIUM;
1812bb8bf76fSChristoph Hellwig     }
1813bb8bf76fSChristoph Hellwig     if (!bs->drv->bdrv_discard) {
1814bb8bf76fSChristoph Hellwig         return 0;
1815bb8bf76fSChristoph Hellwig     }
1816bb8bf76fSChristoph Hellwig     return bs->drv->bdrv_discard(bs, sector_num, nb_sectors);
1817bb8bf76fSChristoph Hellwig }
1818bb8bf76fSChristoph Hellwig 
1819f58c7b35Sths /*
1820f58c7b35Sths  * Returns true iff the specified sector is present in the disk image. Drivers
1821f58c7b35Sths  * not implementing the functionality are assumed to not support backing files,
1822f58c7b35Sths  * hence all their sectors are reported as allocated.
1823f58c7b35Sths  *
1824f58c7b35Sths  * 'pnum' is set to the number of sectors (including and immediately following
1825f58c7b35Sths  * the specified sector) that are known to be in the same
1826f58c7b35Sths  * allocated/unallocated state.
1827f58c7b35Sths  *
1828f58c7b35Sths  * 'nb_sectors' is the max value 'pnum' should be set to.
1829f58c7b35Sths  */
1830f58c7b35Sths int bdrv_is_allocated(BlockDriverState *bs, int64_t sector_num, int nb_sectors,
1831f58c7b35Sths 	int *pnum)
1832f58c7b35Sths {
1833f58c7b35Sths     int64_t n;
1834f58c7b35Sths     if (!bs->drv->bdrv_is_allocated) {
1835f58c7b35Sths         if (sector_num >= bs->total_sectors) {
1836f58c7b35Sths             *pnum = 0;
1837f58c7b35Sths             return 0;
1838f58c7b35Sths         }
1839f58c7b35Sths         n = bs->total_sectors - sector_num;
1840f58c7b35Sths         *pnum = (n < nb_sectors) ? (n) : (nb_sectors);
1841f58c7b35Sths         return 1;
1842f58c7b35Sths     }
1843f58c7b35Sths     return bs->drv->bdrv_is_allocated(bs, sector_num, nb_sectors, pnum);
1844f58c7b35Sths }
1845f58c7b35Sths 
18462582bfedSLuiz Capitulino void bdrv_mon_event(const BlockDriverState *bdrv,
18472582bfedSLuiz Capitulino                     BlockMonEventAction action, int is_read)
18482582bfedSLuiz Capitulino {
18492582bfedSLuiz Capitulino     QObject *data;
18502582bfedSLuiz Capitulino     const char *action_str;
18512582bfedSLuiz Capitulino 
18522582bfedSLuiz Capitulino     switch (action) {
18532582bfedSLuiz Capitulino     case BDRV_ACTION_REPORT:
18542582bfedSLuiz Capitulino         action_str = "report";
18552582bfedSLuiz Capitulino         break;
18562582bfedSLuiz Capitulino     case BDRV_ACTION_IGNORE:
18572582bfedSLuiz Capitulino         action_str = "ignore";
18582582bfedSLuiz Capitulino         break;
18592582bfedSLuiz Capitulino     case BDRV_ACTION_STOP:
18602582bfedSLuiz Capitulino         action_str = "stop";
18612582bfedSLuiz Capitulino         break;
18622582bfedSLuiz Capitulino     default:
18632582bfedSLuiz Capitulino         abort();
18642582bfedSLuiz Capitulino     }
18652582bfedSLuiz Capitulino 
18662582bfedSLuiz Capitulino     data = qobject_from_jsonf("{ 'device': %s, 'action': %s, 'operation': %s }",
18672582bfedSLuiz Capitulino                               bdrv->device_name,
18682582bfedSLuiz Capitulino                               action_str,
18692582bfedSLuiz Capitulino                               is_read ? "read" : "write");
18702582bfedSLuiz Capitulino     monitor_protocol_event(QEVENT_BLOCK_IO_ERROR, data);
18712582bfedSLuiz Capitulino 
18722582bfedSLuiz Capitulino     qobject_decref(data);
18732582bfedSLuiz Capitulino }
18742582bfedSLuiz Capitulino 
1875d15e5465SLuiz Capitulino static void bdrv_print_dict(QObject *obj, void *opaque)
1876b338082bSbellard {
1877d15e5465SLuiz Capitulino     QDict *bs_dict;
1878d15e5465SLuiz Capitulino     Monitor *mon = opaque;
1879b338082bSbellard 
1880d15e5465SLuiz Capitulino     bs_dict = qobject_to_qdict(obj);
1881d15e5465SLuiz Capitulino 
1882d8aeeb31SMarkus Armbruster     monitor_printf(mon, "%s: removable=%d",
1883d15e5465SLuiz Capitulino                         qdict_get_str(bs_dict, "device"),
1884d15e5465SLuiz Capitulino                         qdict_get_bool(bs_dict, "removable"));
1885d15e5465SLuiz Capitulino 
1886d15e5465SLuiz Capitulino     if (qdict_get_bool(bs_dict, "removable")) {
1887d15e5465SLuiz Capitulino         monitor_printf(mon, " locked=%d", qdict_get_bool(bs_dict, "locked"));
1888e4def80bSMarkus Armbruster         monitor_printf(mon, " tray-open=%d",
1889e4def80bSMarkus Armbruster                        qdict_get_bool(bs_dict, "tray-open"));
1890b338082bSbellard     }
1891d2078cc2SLuiz Capitulino 
1892d2078cc2SLuiz Capitulino     if (qdict_haskey(bs_dict, "io-status")) {
1893d2078cc2SLuiz Capitulino         monitor_printf(mon, " io-status=%s", qdict_get_str(bs_dict, "io-status"));
1894d2078cc2SLuiz Capitulino     }
1895d2078cc2SLuiz Capitulino 
1896d15e5465SLuiz Capitulino     if (qdict_haskey(bs_dict, "inserted")) {
1897d15e5465SLuiz Capitulino         QDict *qdict = qobject_to_qdict(qdict_get(bs_dict, "inserted"));
1898d15e5465SLuiz Capitulino 
1899376253ecSaliguori         monitor_printf(mon, " file=");
1900d15e5465SLuiz Capitulino         monitor_print_filename(mon, qdict_get_str(qdict, "file"));
1901d15e5465SLuiz Capitulino         if (qdict_haskey(qdict, "backing_file")) {
1902376253ecSaliguori             monitor_printf(mon, " backing_file=");
1903d15e5465SLuiz Capitulino             monitor_print_filename(mon, qdict_get_str(qdict, "backing_file"));
1904fef30743Sths         }
1905d15e5465SLuiz Capitulino         monitor_printf(mon, " ro=%d drv=%s encrypted=%d",
1906d15e5465SLuiz Capitulino                             qdict_get_bool(qdict, "ro"),
1907d15e5465SLuiz Capitulino                             qdict_get_str(qdict, "drv"),
1908d15e5465SLuiz Capitulino                             qdict_get_bool(qdict, "encrypted"));
1909b338082bSbellard     } else {
1910376253ecSaliguori         monitor_printf(mon, " [not inserted]");
1911b338082bSbellard     }
1912d15e5465SLuiz Capitulino 
1913376253ecSaliguori     monitor_printf(mon, "\n");
1914b338082bSbellard }
1915d15e5465SLuiz Capitulino 
1916d15e5465SLuiz Capitulino void bdrv_info_print(Monitor *mon, const QObject *data)
1917d15e5465SLuiz Capitulino {
1918d15e5465SLuiz Capitulino     qlist_iter(qobject_to_qlist(data), bdrv_print_dict, mon);
1919d15e5465SLuiz Capitulino }
1920d15e5465SLuiz Capitulino 
/*
 * Strings reported under the "io-status" key, indexed by the BDRV_IOS_*
 * value stored in BlockDriverState.iostatus.
 */
static const char *const io_status_name[BDRV_IOS_MAX] = {
    [BDRV_IOS_OK] = "ok",
    [BDRV_IOS_FAILED] = "failed",
    [BDRV_IOS_ENOSPC] = "nospace",
};
1926f04ef601SLuiz Capitulino 
1927d15e5465SLuiz Capitulino void bdrv_info(Monitor *mon, QObject **ret_data)
1928d15e5465SLuiz Capitulino {
1929d15e5465SLuiz Capitulino     QList *bs_list;
1930d15e5465SLuiz Capitulino     BlockDriverState *bs;
1931d15e5465SLuiz Capitulino 
1932d15e5465SLuiz Capitulino     bs_list = qlist_new();
1933d15e5465SLuiz Capitulino 
19341b7bdbc1SStefan Hajnoczi     QTAILQ_FOREACH(bs, &bdrv_states, list) {
1935d15e5465SLuiz Capitulino         QObject *bs_obj;
1936e4def80bSMarkus Armbruster         QDict *bs_dict;
1937d15e5465SLuiz Capitulino 
1938d8aeeb31SMarkus Armbruster         bs_obj = qobject_from_jsonf("{ 'device': %s, 'type': 'unknown', "
1939d15e5465SLuiz Capitulino                                     "'removable': %i, 'locked': %i }",
19402c6942faSMarkus Armbruster                                     bs->device_name,
19412c6942faSMarkus Armbruster                                     bdrv_dev_has_removable_media(bs),
1942f107639aSMarkus Armbruster                                     bdrv_dev_is_medium_locked(bs));
1943e4def80bSMarkus Armbruster         bs_dict = qobject_to_qdict(bs_obj);
1944d15e5465SLuiz Capitulino 
1945e4def80bSMarkus Armbruster         if (bdrv_dev_has_removable_media(bs)) {
1946e4def80bSMarkus Armbruster             qdict_put(bs_dict, "tray-open",
1947e4def80bSMarkus Armbruster                       qbool_from_int(bdrv_dev_is_tray_open(bs)));
1948e4def80bSMarkus Armbruster         }
1949f04ef601SLuiz Capitulino 
1950f04ef601SLuiz Capitulino         if (bdrv_iostatus_is_enabled(bs)) {
1951f04ef601SLuiz Capitulino             qdict_put(bs_dict, "io-status",
1952f04ef601SLuiz Capitulino                       qstring_from_str(io_status_name[bs->iostatus]));
1953f04ef601SLuiz Capitulino         }
1954f04ef601SLuiz Capitulino 
1955d15e5465SLuiz Capitulino         if (bs->drv) {
1956d15e5465SLuiz Capitulino             QObject *obj;
1957d15e5465SLuiz Capitulino 
1958d15e5465SLuiz Capitulino             obj = qobject_from_jsonf("{ 'file': %s, 'ro': %i, 'drv': %s, "
1959d15e5465SLuiz Capitulino                                      "'encrypted': %i }",
1960d15e5465SLuiz Capitulino                                      bs->filename, bs->read_only,
1961d15e5465SLuiz Capitulino                                      bs->drv->format_name,
1962d15e5465SLuiz Capitulino                                      bdrv_is_encrypted(bs));
1963d15e5465SLuiz Capitulino             if (bs->backing_file[0] != '\0') {
1964d15e5465SLuiz Capitulino                 QDict *qdict = qobject_to_qdict(obj);
1965d15e5465SLuiz Capitulino                 qdict_put(qdict, "backing_file",
1966d15e5465SLuiz Capitulino                           qstring_from_str(bs->backing_file));
1967d15e5465SLuiz Capitulino             }
1968d15e5465SLuiz Capitulino 
1969d15e5465SLuiz Capitulino             qdict_put_obj(bs_dict, "inserted", obj);
1970d15e5465SLuiz Capitulino         }
1971d15e5465SLuiz Capitulino         qlist_append_obj(bs_list, bs_obj);
1972d15e5465SLuiz Capitulino     }
1973d15e5465SLuiz Capitulino 
1974d15e5465SLuiz Capitulino     *ret_data = QOBJECT(bs_list);
1975b338082bSbellard }
1976a36e69ddSths 
1977218a536aSLuiz Capitulino static void bdrv_stats_iter(QObject *data, void *opaque)
1978a36e69ddSths {
1979218a536aSLuiz Capitulino     QDict *qdict;
1980218a536aSLuiz Capitulino     Monitor *mon = opaque;
1981218a536aSLuiz Capitulino 
1982218a536aSLuiz Capitulino     qdict = qobject_to_qdict(data);
1983218a536aSLuiz Capitulino     monitor_printf(mon, "%s:", qdict_get_str(qdict, "device"));
1984218a536aSLuiz Capitulino 
1985218a536aSLuiz Capitulino     qdict = qobject_to_qdict(qdict_get(qdict, "stats"));
1986218a536aSLuiz Capitulino     monitor_printf(mon, " rd_bytes=%" PRId64
1987218a536aSLuiz Capitulino                         " wr_bytes=%" PRId64
1988218a536aSLuiz Capitulino                         " rd_operations=%" PRId64
1989218a536aSLuiz Capitulino                         " wr_operations=%" PRId64
1990e8045d67SChristoph Hellwig                         " flush_operations=%" PRId64
1991c488c7f6SChristoph Hellwig                         " wr_total_time_ns=%" PRId64
1992c488c7f6SChristoph Hellwig                         " rd_total_time_ns=%" PRId64
1993c488c7f6SChristoph Hellwig                         " flush_total_time_ns=%" PRId64
1994218a536aSLuiz Capitulino                         "\n",
1995218a536aSLuiz Capitulino                         qdict_get_int(qdict, "rd_bytes"),
1996218a536aSLuiz Capitulino                         qdict_get_int(qdict, "wr_bytes"),
1997218a536aSLuiz Capitulino                         qdict_get_int(qdict, "rd_operations"),
1998e8045d67SChristoph Hellwig                         qdict_get_int(qdict, "wr_operations"),
1999c488c7f6SChristoph Hellwig                         qdict_get_int(qdict, "flush_operations"),
2000c488c7f6SChristoph Hellwig                         qdict_get_int(qdict, "wr_total_time_ns"),
2001c488c7f6SChristoph Hellwig                         qdict_get_int(qdict, "rd_total_time_ns"),
2002c488c7f6SChristoph Hellwig                         qdict_get_int(qdict, "flush_total_time_ns"));
2003218a536aSLuiz Capitulino }
2004218a536aSLuiz Capitulino 
2005218a536aSLuiz Capitulino void bdrv_stats_print(Monitor *mon, const QObject *data)
2006218a536aSLuiz Capitulino {
2007218a536aSLuiz Capitulino     qlist_iter(qobject_to_qlist(data), bdrv_stats_iter, mon);
2008218a536aSLuiz Capitulino }
2009218a536aSLuiz Capitulino 
2010294cc35fSKevin Wolf static QObject* bdrv_info_stats_bs(BlockDriverState *bs)
2011294cc35fSKevin Wolf {
2012294cc35fSKevin Wolf     QObject *res;
2013294cc35fSKevin Wolf     QDict *dict;
2014294cc35fSKevin Wolf 
2015294cc35fSKevin Wolf     res = qobject_from_jsonf("{ 'stats': {"
2016294cc35fSKevin Wolf                              "'rd_bytes': %" PRId64 ","
2017294cc35fSKevin Wolf                              "'wr_bytes': %" PRId64 ","
2018294cc35fSKevin Wolf                              "'rd_operations': %" PRId64 ","
2019294cc35fSKevin Wolf                              "'wr_operations': %" PRId64 ","
2020e8045d67SChristoph Hellwig                              "'wr_highest_offset': %" PRId64 ","
2021c488c7f6SChristoph Hellwig                              "'flush_operations': %" PRId64 ","
2022c488c7f6SChristoph Hellwig                              "'wr_total_time_ns': %" PRId64 ","
2023c488c7f6SChristoph Hellwig                              "'rd_total_time_ns': %" PRId64 ","
2024c488c7f6SChristoph Hellwig                              "'flush_total_time_ns': %" PRId64
2025294cc35fSKevin Wolf                              "} }",
2026a597e79cSChristoph Hellwig                              bs->nr_bytes[BDRV_ACCT_READ],
2027a597e79cSChristoph Hellwig                              bs->nr_bytes[BDRV_ACCT_WRITE],
2028a597e79cSChristoph Hellwig                              bs->nr_ops[BDRV_ACCT_READ],
2029a597e79cSChristoph Hellwig                              bs->nr_ops[BDRV_ACCT_WRITE],
20305ffbbc67SBlue Swirl                              bs->wr_highest_sector *
2031e8045d67SChristoph Hellwig                              (uint64_t)BDRV_SECTOR_SIZE,
2032c488c7f6SChristoph Hellwig                              bs->nr_ops[BDRV_ACCT_FLUSH],
2033c488c7f6SChristoph Hellwig                              bs->total_time_ns[BDRV_ACCT_WRITE],
2034c488c7f6SChristoph Hellwig                              bs->total_time_ns[BDRV_ACCT_READ],
2035c488c7f6SChristoph Hellwig                              bs->total_time_ns[BDRV_ACCT_FLUSH]);
2036294cc35fSKevin Wolf     dict  = qobject_to_qdict(res);
2037294cc35fSKevin Wolf 
2038294cc35fSKevin Wolf     if (*bs->device_name) {
2039294cc35fSKevin Wolf         qdict_put(dict, "device", qstring_from_str(bs->device_name));
2040294cc35fSKevin Wolf     }
2041294cc35fSKevin Wolf 
2042294cc35fSKevin Wolf     if (bs->file) {
2043294cc35fSKevin Wolf         QObject *parent = bdrv_info_stats_bs(bs->file);
2044294cc35fSKevin Wolf         qdict_put_obj(dict, "parent", parent);
2045294cc35fSKevin Wolf     }
2046294cc35fSKevin Wolf 
2047294cc35fSKevin Wolf     return res;
2048294cc35fSKevin Wolf }
2049294cc35fSKevin Wolf 
2050218a536aSLuiz Capitulino void bdrv_info_stats(Monitor *mon, QObject **ret_data)
2051218a536aSLuiz Capitulino {
2052218a536aSLuiz Capitulino     QObject *obj;
2053218a536aSLuiz Capitulino     QList *devices;
2054a36e69ddSths     BlockDriverState *bs;
2055a36e69ddSths 
2056218a536aSLuiz Capitulino     devices = qlist_new();
2057218a536aSLuiz Capitulino 
20581b7bdbc1SStefan Hajnoczi     QTAILQ_FOREACH(bs, &bdrv_states, list) {
2059294cc35fSKevin Wolf         obj = bdrv_info_stats_bs(bs);
2060218a536aSLuiz Capitulino         qlist_append_obj(devices, obj);
2061a36e69ddSths     }
2062218a536aSLuiz Capitulino 
2063218a536aSLuiz Capitulino     *ret_data = QOBJECT(devices);
2064a36e69ddSths }
2065ea2384d3Sbellard 
2066045df330Saliguori const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
2067045df330Saliguori {
2068045df330Saliguori     if (bs->backing_hd && bs->backing_hd->encrypted)
2069045df330Saliguori         return bs->backing_file;
2070045df330Saliguori     else if (bs->encrypted)
2071045df330Saliguori         return bs->filename;
2072045df330Saliguori     else
2073045df330Saliguori         return NULL;
2074045df330Saliguori }
2075045df330Saliguori 
207683f64091Sbellard void bdrv_get_backing_filename(BlockDriverState *bs,
207783f64091Sbellard                                char *filename, int filename_size)
207883f64091Sbellard {
2079b783e409SKevin Wolf     if (!bs->backing_file) {
208083f64091Sbellard         pstrcpy(filename, filename_size, "");
208183f64091Sbellard     } else {
208283f64091Sbellard         pstrcpy(filename, filename_size, bs->backing_file);
208383f64091Sbellard     }
208483f64091Sbellard }
208583f64091Sbellard 
2086faea38e7Sbellard int bdrv_write_compressed(BlockDriverState *bs, int64_t sector_num,
2087faea38e7Sbellard                           const uint8_t *buf, int nb_sectors)
2088faea38e7Sbellard {
2089faea38e7Sbellard     BlockDriver *drv = bs->drv;
2090faea38e7Sbellard     if (!drv)
209119cb3738Sbellard         return -ENOMEDIUM;
2092faea38e7Sbellard     if (!drv->bdrv_write_compressed)
2093faea38e7Sbellard         return -ENOTSUP;
2094fbb7b4e0SKevin Wolf     if (bdrv_check_request(bs, sector_num, nb_sectors))
2095fbb7b4e0SKevin Wolf         return -EIO;
20967cd1e32aSlirans@il.ibm.com 
2097c6d22830SJan Kiszka     if (bs->dirty_bitmap) {
20987cd1e32aSlirans@il.ibm.com         set_dirty_bitmap(bs, sector_num, nb_sectors, 1);
20997cd1e32aSlirans@il.ibm.com     }
21007cd1e32aSlirans@il.ibm.com 
2101faea38e7Sbellard     return drv->bdrv_write_compressed(bs, sector_num, buf, nb_sectors);
2102faea38e7Sbellard }
2103faea38e7Sbellard 
2104faea38e7Sbellard int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
2105faea38e7Sbellard {
2106faea38e7Sbellard     BlockDriver *drv = bs->drv;
2107faea38e7Sbellard     if (!drv)
210819cb3738Sbellard         return -ENOMEDIUM;
2109faea38e7Sbellard     if (!drv->bdrv_get_info)
2110faea38e7Sbellard         return -ENOTSUP;
2111faea38e7Sbellard     memset(bdi, 0, sizeof(*bdi));
2112faea38e7Sbellard     return drv->bdrv_get_info(bs, bdi);
2113faea38e7Sbellard }
2114faea38e7Sbellard 
211545566e9cSChristoph Hellwig int bdrv_save_vmstate(BlockDriverState *bs, const uint8_t *buf,
211645566e9cSChristoph Hellwig                       int64_t pos, int size)
2117178e08a5Saliguori {
2118178e08a5Saliguori     BlockDriver *drv = bs->drv;
2119178e08a5Saliguori     if (!drv)
2120178e08a5Saliguori         return -ENOMEDIUM;
21217cdb1f6dSMORITA Kazutaka     if (drv->bdrv_save_vmstate)
212245566e9cSChristoph Hellwig         return drv->bdrv_save_vmstate(bs, buf, pos, size);
21237cdb1f6dSMORITA Kazutaka     if (bs->file)
21247cdb1f6dSMORITA Kazutaka         return bdrv_save_vmstate(bs->file, buf, pos, size);
21257cdb1f6dSMORITA Kazutaka     return -ENOTSUP;
2126178e08a5Saliguori }
2127178e08a5Saliguori 
212845566e9cSChristoph Hellwig int bdrv_load_vmstate(BlockDriverState *bs, uint8_t *buf,
212945566e9cSChristoph Hellwig                       int64_t pos, int size)
2130178e08a5Saliguori {
2131178e08a5Saliguori     BlockDriver *drv = bs->drv;
2132178e08a5Saliguori     if (!drv)
2133178e08a5Saliguori         return -ENOMEDIUM;
21347cdb1f6dSMORITA Kazutaka     if (drv->bdrv_load_vmstate)
213545566e9cSChristoph Hellwig         return drv->bdrv_load_vmstate(bs, buf, pos, size);
21367cdb1f6dSMORITA Kazutaka     if (bs->file)
21377cdb1f6dSMORITA Kazutaka         return bdrv_load_vmstate(bs->file, buf, pos, size);
21387cdb1f6dSMORITA Kazutaka     return -ENOTSUP;
2139178e08a5Saliguori }
2140178e08a5Saliguori 
21418b9b0cc2SKevin Wolf void bdrv_debug_event(BlockDriverState *bs, BlkDebugEvent event)
21428b9b0cc2SKevin Wolf {
21438b9b0cc2SKevin Wolf     BlockDriver *drv = bs->drv;
21448b9b0cc2SKevin Wolf 
21458b9b0cc2SKevin Wolf     if (!drv || !drv->bdrv_debug_event) {
21468b9b0cc2SKevin Wolf         return;
21478b9b0cc2SKevin Wolf     }
21488b9b0cc2SKevin Wolf 
21498b9b0cc2SKevin Wolf     return drv->bdrv_debug_event(bs, event);
21508b9b0cc2SKevin Wolf 
21518b9b0cc2SKevin Wolf }
21528b9b0cc2SKevin Wolf 
2153faea38e7Sbellard /**************************************************************/
2154faea38e7Sbellard /* handling of snapshots */
2155faea38e7Sbellard 
2156feeee5acSMiguel Di Ciurcio Filho int bdrv_can_snapshot(BlockDriverState *bs)
2157feeee5acSMiguel Di Ciurcio Filho {
2158feeee5acSMiguel Di Ciurcio Filho     BlockDriver *drv = bs->drv;
215907b70bfbSMarkus Armbruster     if (!drv || !bdrv_is_inserted(bs) || bdrv_is_read_only(bs)) {
2160feeee5acSMiguel Di Ciurcio Filho         return 0;
2161feeee5acSMiguel Di Ciurcio Filho     }
2162feeee5acSMiguel Di Ciurcio Filho 
2163feeee5acSMiguel Di Ciurcio Filho     if (!drv->bdrv_snapshot_create) {
2164feeee5acSMiguel Di Ciurcio Filho         if (bs->file != NULL) {
2165feeee5acSMiguel Di Ciurcio Filho             return bdrv_can_snapshot(bs->file);
2166feeee5acSMiguel Di Ciurcio Filho         }
2167feeee5acSMiguel Di Ciurcio Filho         return 0;
2168feeee5acSMiguel Di Ciurcio Filho     }
2169feeee5acSMiguel Di Ciurcio Filho 
2170feeee5acSMiguel Di Ciurcio Filho     return 1;
2171feeee5acSMiguel Di Ciurcio Filho }
2172feeee5acSMiguel Di Ciurcio Filho 
2173199630b6SBlue Swirl int bdrv_is_snapshot(BlockDriverState *bs)
2174199630b6SBlue Swirl {
2175199630b6SBlue Swirl     return !!(bs->open_flags & BDRV_O_SNAPSHOT);
2176199630b6SBlue Swirl }
2177199630b6SBlue Swirl 
2178f9092b10SMarkus Armbruster BlockDriverState *bdrv_snapshots(void)
2179f9092b10SMarkus Armbruster {
2180f9092b10SMarkus Armbruster     BlockDriverState *bs;
2181f9092b10SMarkus Armbruster 
21823ac906f7SMarkus Armbruster     if (bs_snapshots) {
2183f9092b10SMarkus Armbruster         return bs_snapshots;
21843ac906f7SMarkus Armbruster     }
2185f9092b10SMarkus Armbruster 
2186f9092b10SMarkus Armbruster     bs = NULL;
2187f9092b10SMarkus Armbruster     while ((bs = bdrv_next(bs))) {
2188f9092b10SMarkus Armbruster         if (bdrv_can_snapshot(bs)) {
21893ac906f7SMarkus Armbruster             bs_snapshots = bs;
21903ac906f7SMarkus Armbruster             return bs;
2191f9092b10SMarkus Armbruster         }
2192f9092b10SMarkus Armbruster     }
2193f9092b10SMarkus Armbruster     return NULL;
2194f9092b10SMarkus Armbruster }
2195f9092b10SMarkus Armbruster 
2196faea38e7Sbellard int bdrv_snapshot_create(BlockDriverState *bs,
2197faea38e7Sbellard                          QEMUSnapshotInfo *sn_info)
2198faea38e7Sbellard {
2199faea38e7Sbellard     BlockDriver *drv = bs->drv;
2200faea38e7Sbellard     if (!drv)
220119cb3738Sbellard         return -ENOMEDIUM;
22027cdb1f6dSMORITA Kazutaka     if (drv->bdrv_snapshot_create)
2203faea38e7Sbellard         return drv->bdrv_snapshot_create(bs, sn_info);
22047cdb1f6dSMORITA Kazutaka     if (bs->file)
22057cdb1f6dSMORITA Kazutaka         return bdrv_snapshot_create(bs->file, sn_info);
22067cdb1f6dSMORITA Kazutaka     return -ENOTSUP;
2207faea38e7Sbellard }
2208faea38e7Sbellard 
2209faea38e7Sbellard int bdrv_snapshot_goto(BlockDriverState *bs,
2210faea38e7Sbellard                        const char *snapshot_id)
2211faea38e7Sbellard {
2212faea38e7Sbellard     BlockDriver *drv = bs->drv;
22137cdb1f6dSMORITA Kazutaka     int ret, open_ret;
22147cdb1f6dSMORITA Kazutaka 
2215faea38e7Sbellard     if (!drv)
221619cb3738Sbellard         return -ENOMEDIUM;
22177cdb1f6dSMORITA Kazutaka     if (drv->bdrv_snapshot_goto)
2218faea38e7Sbellard         return drv->bdrv_snapshot_goto(bs, snapshot_id);
22197cdb1f6dSMORITA Kazutaka 
22207cdb1f6dSMORITA Kazutaka     if (bs->file) {
22217cdb1f6dSMORITA Kazutaka         drv->bdrv_close(bs);
22227cdb1f6dSMORITA Kazutaka         ret = bdrv_snapshot_goto(bs->file, snapshot_id);
22237cdb1f6dSMORITA Kazutaka         open_ret = drv->bdrv_open(bs, bs->open_flags);
22247cdb1f6dSMORITA Kazutaka         if (open_ret < 0) {
22257cdb1f6dSMORITA Kazutaka             bdrv_delete(bs->file);
22267cdb1f6dSMORITA Kazutaka             bs->drv = NULL;
22277cdb1f6dSMORITA Kazutaka             return open_ret;
22287cdb1f6dSMORITA Kazutaka         }
22297cdb1f6dSMORITA Kazutaka         return ret;
22307cdb1f6dSMORITA Kazutaka     }
22317cdb1f6dSMORITA Kazutaka 
22327cdb1f6dSMORITA Kazutaka     return -ENOTSUP;
2233faea38e7Sbellard }
2234faea38e7Sbellard 
2235faea38e7Sbellard int bdrv_snapshot_delete(BlockDriverState *bs, const char *snapshot_id)
2236faea38e7Sbellard {
2237faea38e7Sbellard     BlockDriver *drv = bs->drv;
2238faea38e7Sbellard     if (!drv)
223919cb3738Sbellard         return -ENOMEDIUM;
22407cdb1f6dSMORITA Kazutaka     if (drv->bdrv_snapshot_delete)
2241faea38e7Sbellard         return drv->bdrv_snapshot_delete(bs, snapshot_id);
22427cdb1f6dSMORITA Kazutaka     if (bs->file)
22437cdb1f6dSMORITA Kazutaka         return bdrv_snapshot_delete(bs->file, snapshot_id);
22447cdb1f6dSMORITA Kazutaka     return -ENOTSUP;
2245faea38e7Sbellard }
2246faea38e7Sbellard 
2247faea38e7Sbellard int bdrv_snapshot_list(BlockDriverState *bs,
2248faea38e7Sbellard                        QEMUSnapshotInfo **psn_info)
2249faea38e7Sbellard {
2250faea38e7Sbellard     BlockDriver *drv = bs->drv;
2251faea38e7Sbellard     if (!drv)
225219cb3738Sbellard         return -ENOMEDIUM;
22537cdb1f6dSMORITA Kazutaka     if (drv->bdrv_snapshot_list)
2254faea38e7Sbellard         return drv->bdrv_snapshot_list(bs, psn_info);
22557cdb1f6dSMORITA Kazutaka     if (bs->file)
22567cdb1f6dSMORITA Kazutaka         return bdrv_snapshot_list(bs->file, psn_info);
22577cdb1f6dSMORITA Kazutaka     return -ENOTSUP;
2258faea38e7Sbellard }
2259faea38e7Sbellard 
226051ef6727Sedison int bdrv_snapshot_load_tmp(BlockDriverState *bs,
226151ef6727Sedison         const char *snapshot_name)
226251ef6727Sedison {
226351ef6727Sedison     BlockDriver *drv = bs->drv;
226451ef6727Sedison     if (!drv) {
226551ef6727Sedison         return -ENOMEDIUM;
226651ef6727Sedison     }
226751ef6727Sedison     if (!bs->read_only) {
226851ef6727Sedison         return -EINVAL;
226951ef6727Sedison     }
227051ef6727Sedison     if (drv->bdrv_snapshot_load_tmp) {
227151ef6727Sedison         return drv->bdrv_snapshot_load_tmp(bs, snapshot_name);
227251ef6727Sedison     }
227351ef6727Sedison     return -ENOTSUP;
227451ef6727Sedison }
227551ef6727Sedison 
#define NB_SUFFIXES 4

/*
 * Format @size into @buf (at most @buf_size bytes) in a short
 * human-readable form and return @buf.
 *
 * Values up to 999 are printed as a plain integer.  Larger values are
 * scaled by powers of 1024 and get a K, M, G or T suffix: one decimal
 * place while the scaled value is below 10, a rounded integer otherwise.
 * Values too large for the last suffix are still expressed in T.
 */
char *get_human_readable_size(char *buf, int buf_size, int64_t size)
{
    static const char suffixes[NB_SUFFIXES + 1] = "KMGT";
    int64_t base;
    int i;

    if (size <= 999) {
        snprintf(buf, buf_size, "%" PRId64, size);
        return buf;
    }

    base = 1024;
    for (i = 0; i < NB_SUFFIXES; i++) {
        if (size < (10 * base)) {
            snprintf(buf, buf_size, "%0.1f%c",
                     (double)size / base,
                     suffixes[i]);
            break;
        } else if (size < (1000 * base) || i == (NB_SUFFIXES - 1)) {
            /*
             * Round to nearest using quotient and remainder.  Adding
             * base / 2 to size first would overflow int64_t for sizes
             * close to INT64_MAX.
             */
            int64_t rounded = size / base + ((size % base) >= (base >> 1));

            snprintf(buf, buf_size, "%" PRId64 "%c",
                     rounded,
                     suffixes[i]);
            break;
        }
        base = base * 1024;
    }
    return buf;
}
2305faea38e7Sbellard 
2306faea38e7Sbellard char *bdrv_snapshot_dump(char *buf, int buf_size, QEMUSnapshotInfo *sn)
2307faea38e7Sbellard {
2308faea38e7Sbellard     char buf1[128], date_buf[128], clock_buf[128];
23093b9f94e1Sbellard #ifdef _WIN32
23103b9f94e1Sbellard     struct tm *ptm;
23113b9f94e1Sbellard #else
2312faea38e7Sbellard     struct tm tm;
23133b9f94e1Sbellard #endif
2314faea38e7Sbellard     time_t ti;
2315faea38e7Sbellard     int64_t secs;
2316faea38e7Sbellard 
2317faea38e7Sbellard     if (!sn) {
2318faea38e7Sbellard         snprintf(buf, buf_size,
2319faea38e7Sbellard                  "%-10s%-20s%7s%20s%15s",
2320faea38e7Sbellard                  "ID", "TAG", "VM SIZE", "DATE", "VM CLOCK");
2321faea38e7Sbellard     } else {
2322faea38e7Sbellard         ti = sn->date_sec;
23233b9f94e1Sbellard #ifdef _WIN32
23243b9f94e1Sbellard         ptm = localtime(&ti);
23253b9f94e1Sbellard         strftime(date_buf, sizeof(date_buf),
23263b9f94e1Sbellard                  "%Y-%m-%d %H:%M:%S", ptm);
23273b9f94e1Sbellard #else
2328faea38e7Sbellard         localtime_r(&ti, &tm);
2329faea38e7Sbellard         strftime(date_buf, sizeof(date_buf),
2330faea38e7Sbellard                  "%Y-%m-%d %H:%M:%S", &tm);
23313b9f94e1Sbellard #endif
2332faea38e7Sbellard         secs = sn->vm_clock_nsec / 1000000000;
2333faea38e7Sbellard         snprintf(clock_buf, sizeof(clock_buf),
2334faea38e7Sbellard                  "%02d:%02d:%02d.%03d",
2335faea38e7Sbellard                  (int)(secs / 3600),
2336faea38e7Sbellard                  (int)((secs / 60) % 60),
2337faea38e7Sbellard                  (int)(secs % 60),
2338faea38e7Sbellard                  (int)((sn->vm_clock_nsec / 1000000) % 1000));
2339faea38e7Sbellard         snprintf(buf, buf_size,
2340faea38e7Sbellard                  "%-10s%-20s%7s%20s%15s",
2341faea38e7Sbellard                  sn->id_str, sn->name,
2342faea38e7Sbellard                  get_human_readable_size(buf1, sizeof(buf1), sn->vm_state_size),
2343faea38e7Sbellard                  date_buf,
2344faea38e7Sbellard                  clock_buf);
2345faea38e7Sbellard     }
2346faea38e7Sbellard     return buf;
2347faea38e7Sbellard }
2348faea38e7Sbellard 
2349ea2384d3Sbellard /**************************************************************/
235083f64091Sbellard /* async I/Os */
2351ea2384d3Sbellard 
23523b69e4b9Saliguori BlockDriverAIOCB *bdrv_aio_readv(BlockDriverState *bs, int64_t sector_num,
2353f141eafeSaliguori                                  QEMUIOVector *qiov, int nb_sectors,
235483f64091Sbellard                                  BlockDriverCompletionFunc *cb, void *opaque)
2355ea2384d3Sbellard {
235683f64091Sbellard     BlockDriver *drv = bs->drv;
2357ea2384d3Sbellard 
2358bbf0a440SStefan Hajnoczi     trace_bdrv_aio_readv(bs, sector_num, nb_sectors, opaque);
2359bbf0a440SStefan Hajnoczi 
236019cb3738Sbellard     if (!drv)
2361ce1a14dcSpbrook         return NULL;
236271d0770cSaliguori     if (bdrv_check_request(bs, sector_num, nb_sectors))
236371d0770cSaliguori         return NULL;
236483f64091Sbellard 
2365a597e79cSChristoph Hellwig     return drv->bdrv_aio_readv(bs, sector_num, qiov, nb_sectors,
2366f141eafeSaliguori                                cb, opaque);
236783f64091Sbellard }
236883f64091Sbellard 
/*
 * State carried through an asynchronous request so that
 * block_complete_cb() can mark the affected sectors dirty before invoking
 * the caller's completion callback.
 */
typedef struct BlockCompleteData {
    BlockDriverCompletionFunc *cb;  /* caller's completion callback */
    void *opaque;                   /* argument passed to cb */
    BlockDriverState *bs;           /* device whose dirty bitmap is updated */
    int64_t sector_num;             /* first sector of the request */
    int nb_sectors;                 /* number of sectors in the request */
} BlockCompleteData;
23764dcafbb1SMarcelo Tosatti 
23774dcafbb1SMarcelo Tosatti static void block_complete_cb(void *opaque, int ret)
23784dcafbb1SMarcelo Tosatti {
23794dcafbb1SMarcelo Tosatti     BlockCompleteData *b = opaque;
23804dcafbb1SMarcelo Tosatti 
23814dcafbb1SMarcelo Tosatti     if (b->bs->dirty_bitmap) {
23824dcafbb1SMarcelo Tosatti         set_dirty_bitmap(b->bs, b->sector_num, b->nb_sectors, 1);
23834dcafbb1SMarcelo Tosatti     }
23844dcafbb1SMarcelo Tosatti     b->cb(b->opaque, ret);
23857267c094SAnthony Liguori     g_free(b);
23864dcafbb1SMarcelo Tosatti }
23874dcafbb1SMarcelo Tosatti 
23884dcafbb1SMarcelo Tosatti static BlockCompleteData *blk_dirty_cb_alloc(BlockDriverState *bs,
23894dcafbb1SMarcelo Tosatti                                              int64_t sector_num,
23904dcafbb1SMarcelo Tosatti                                              int nb_sectors,
23914dcafbb1SMarcelo Tosatti                                              BlockDriverCompletionFunc *cb,
23924dcafbb1SMarcelo Tosatti                                              void *opaque)
23934dcafbb1SMarcelo Tosatti {
23947267c094SAnthony Liguori     BlockCompleteData *blkdata = g_malloc0(sizeof(BlockCompleteData));
23954dcafbb1SMarcelo Tosatti 
23964dcafbb1SMarcelo Tosatti     blkdata->bs = bs;
23974dcafbb1SMarcelo Tosatti     blkdata->cb = cb;
23984dcafbb1SMarcelo Tosatti     blkdata->opaque = opaque;
23994dcafbb1SMarcelo Tosatti     blkdata->sector_num = sector_num;
24004dcafbb1SMarcelo Tosatti     blkdata->nb_sectors = nb_sectors;
24014dcafbb1SMarcelo Tosatti 
24024dcafbb1SMarcelo Tosatti     return blkdata;
24034dcafbb1SMarcelo Tosatti }
24044dcafbb1SMarcelo Tosatti 
2405f141eafeSaliguori BlockDriverAIOCB *bdrv_aio_writev(BlockDriverState *bs, int64_t sector_num,
2406f141eafeSaliguori                                   QEMUIOVector *qiov, int nb_sectors,
240783f64091Sbellard                                   BlockDriverCompletionFunc *cb, void *opaque)
24087674e7bfSbellard {
240983f64091Sbellard     BlockDriver *drv = bs->drv;
2410a36e69ddSths     BlockDriverAIOCB *ret;
24114dcafbb1SMarcelo Tosatti     BlockCompleteData *blk_cb_data;
241283f64091Sbellard 
2413bbf0a440SStefan Hajnoczi     trace_bdrv_aio_writev(bs, sector_num, nb_sectors, opaque);
2414bbf0a440SStefan Hajnoczi 
241519cb3738Sbellard     if (!drv)
2416ce1a14dcSpbrook         return NULL;
241783f64091Sbellard     if (bs->read_only)
2418ce1a14dcSpbrook         return NULL;
241971d0770cSaliguori     if (bdrv_check_request(bs, sector_num, nb_sectors))
242071d0770cSaliguori         return NULL;
242183f64091Sbellard 
2422c6d22830SJan Kiszka     if (bs->dirty_bitmap) {
24234dcafbb1SMarcelo Tosatti         blk_cb_data = blk_dirty_cb_alloc(bs, sector_num, nb_sectors, cb,
24244dcafbb1SMarcelo Tosatti                                          opaque);
24254dcafbb1SMarcelo Tosatti         cb = &block_complete_cb;
24264dcafbb1SMarcelo Tosatti         opaque = blk_cb_data;
24277cd1e32aSlirans@il.ibm.com     }
24287cd1e32aSlirans@il.ibm.com 
2429f141eafeSaliguori     ret = drv->bdrv_aio_writev(bs, sector_num, qiov, nb_sectors,
2430f141eafeSaliguori                                cb, opaque);
2431a36e69ddSths 
2432a36e69ddSths     if (ret) {
2433294cc35fSKevin Wolf         if (bs->wr_highest_sector < sector_num + nb_sectors - 1) {
2434294cc35fSKevin Wolf             bs->wr_highest_sector = sector_num + nb_sectors - 1;
2435294cc35fSKevin Wolf         }
2436a36e69ddSths     }
2437a36e69ddSths 
2438a36e69ddSths     return ret;
243983f64091Sbellard }
244083f64091Sbellard 
244140b4f539SKevin Wolf 
/*
 * Shared completion state for a group of write requests.  multiwrite_cb()
 * runs once per request; when the last one finishes, every entry of
 * callbacks[] is invoked and its attached resources are released.
 */
typedef struct MultiwriteCB {
    int error;              /* first negative result seen, 0 if none */
    int num_requests;       /* requests still outstanding */
    int num_callbacks;      /* number of valid entries in callbacks[] */
    struct {
        BlockDriverCompletionFunc *cb;  /* caller's completion callback */
        void *opaque;                   /* argument passed to cb */
        QEMUIOVector *free_qiov;        /* destroyed and freed after cb, may be NULL */
        void *free_buf;                 /* released with qemu_vfree() after cb */
    } callbacks[];
} MultiwriteCB;
245340b4f539SKevin Wolf 
245440b4f539SKevin Wolf static void multiwrite_user_cb(MultiwriteCB *mcb)
245540b4f539SKevin Wolf {
245640b4f539SKevin Wolf     int i;
245740b4f539SKevin Wolf 
245840b4f539SKevin Wolf     for (i = 0; i < mcb->num_callbacks; i++) {
245940b4f539SKevin Wolf         mcb->callbacks[i].cb(mcb->callbacks[i].opaque, mcb->error);
24601e1ea48dSStefan Hajnoczi         if (mcb->callbacks[i].free_qiov) {
24611e1ea48dSStefan Hajnoczi             qemu_iovec_destroy(mcb->callbacks[i].free_qiov);
24621e1ea48dSStefan Hajnoczi         }
24637267c094SAnthony Liguori         g_free(mcb->callbacks[i].free_qiov);
2464f8a83245SHerve Poussineau         qemu_vfree(mcb->callbacks[i].free_buf);
246540b4f539SKevin Wolf     }
246640b4f539SKevin Wolf }
246740b4f539SKevin Wolf 
246840b4f539SKevin Wolf static void multiwrite_cb(void *opaque, int ret)
246940b4f539SKevin Wolf {
247040b4f539SKevin Wolf     MultiwriteCB *mcb = opaque;
247140b4f539SKevin Wolf 
24726d519a5fSStefan Hajnoczi     trace_multiwrite_cb(mcb, ret);
24736d519a5fSStefan Hajnoczi 
2474cb6d3ca0SKevin Wolf     if (ret < 0 && !mcb->error) {
247540b4f539SKevin Wolf         mcb->error = ret;
247640b4f539SKevin Wolf     }
247740b4f539SKevin Wolf 
247840b4f539SKevin Wolf     mcb->num_requests--;
247940b4f539SKevin Wolf     if (mcb->num_requests == 0) {
248040b4f539SKevin Wolf         multiwrite_user_cb(mcb);
24817267c094SAnthony Liguori         g_free(mcb);
248240b4f539SKevin Wolf     }
248340b4f539SKevin Wolf }
248440b4f539SKevin Wolf 
248540b4f539SKevin Wolf static int multiwrite_req_compare(const void *a, const void *b)
248640b4f539SKevin Wolf {
248777be4366SChristoph Hellwig     const BlockRequest *req1 = a, *req2 = b;
248877be4366SChristoph Hellwig 
248977be4366SChristoph Hellwig     /*
249077be4366SChristoph Hellwig      * Note that we can't simply subtract req2->sector from req1->sector
249177be4366SChristoph Hellwig      * here as that could overflow the return value.
249277be4366SChristoph Hellwig      */
249377be4366SChristoph Hellwig     if (req1->sector > req2->sector) {
249477be4366SChristoph Hellwig         return 1;
249577be4366SChristoph Hellwig     } else if (req1->sector < req2->sector) {
249677be4366SChristoph Hellwig         return -1;
249777be4366SChristoph Hellwig     } else {
249877be4366SChristoph Hellwig         return 0;
249977be4366SChristoph Hellwig     }
250040b4f539SKevin Wolf }
250140b4f539SKevin Wolf 
250240b4f539SKevin Wolf /*
250340b4f539SKevin Wolf  * Takes a bunch of requests and tries to merge them. Returns the number of
250440b4f539SKevin Wolf  * requests that remain after merging.
250540b4f539SKevin Wolf  */
250640b4f539SKevin Wolf static int multiwrite_merge(BlockDriverState *bs, BlockRequest *reqs,
250740b4f539SKevin Wolf     int num_reqs, MultiwriteCB *mcb)
250840b4f539SKevin Wolf {
250940b4f539SKevin Wolf     int i, outidx;
251040b4f539SKevin Wolf 
251140b4f539SKevin Wolf     // Sort requests by start sector
251240b4f539SKevin Wolf     qsort(reqs, num_reqs, sizeof(*reqs), &multiwrite_req_compare);
251340b4f539SKevin Wolf 
251440b4f539SKevin Wolf     // Check if adjacent requests touch the same clusters. If so, combine them,
251540b4f539SKevin Wolf     // filling up gaps with zero sectors.
251640b4f539SKevin Wolf     outidx = 0;
251740b4f539SKevin Wolf     for (i = 1; i < num_reqs; i++) {
251840b4f539SKevin Wolf         int merge = 0;
251940b4f539SKevin Wolf         int64_t oldreq_last = reqs[outidx].sector + reqs[outidx].nb_sectors;
252040b4f539SKevin Wolf 
252140b4f539SKevin Wolf         // This handles the cases that are valid for all block drivers, namely
252240b4f539SKevin Wolf         // exactly sequential writes and overlapping writes.
252340b4f539SKevin Wolf         if (reqs[i].sector <= oldreq_last) {
252440b4f539SKevin Wolf             merge = 1;
252540b4f539SKevin Wolf         }
252640b4f539SKevin Wolf 
252740b4f539SKevin Wolf         // The block driver may decide that it makes sense to combine requests
252840b4f539SKevin Wolf         // even if there is a gap of some sectors between them. In this case,
252940b4f539SKevin Wolf         // the gap is filled with zeros (therefore only applicable for yet
253040b4f539SKevin Wolf         // unused space in format like qcow2).
253140b4f539SKevin Wolf         if (!merge && bs->drv->bdrv_merge_requests) {
253240b4f539SKevin Wolf             merge = bs->drv->bdrv_merge_requests(bs, &reqs[outidx], &reqs[i]);
253340b4f539SKevin Wolf         }
253440b4f539SKevin Wolf 
2535e2a305fbSChristoph Hellwig         if (reqs[outidx].qiov->niov + reqs[i].qiov->niov + 1 > IOV_MAX) {
2536e2a305fbSChristoph Hellwig             merge = 0;
2537e2a305fbSChristoph Hellwig         }
2538e2a305fbSChristoph Hellwig 
253940b4f539SKevin Wolf         if (merge) {
254040b4f539SKevin Wolf             size_t size;
25417267c094SAnthony Liguori             QEMUIOVector *qiov = g_malloc0(sizeof(*qiov));
254240b4f539SKevin Wolf             qemu_iovec_init(qiov,
254340b4f539SKevin Wolf                 reqs[outidx].qiov->niov + reqs[i].qiov->niov + 1);
254440b4f539SKevin Wolf 
254540b4f539SKevin Wolf             // Add the first request to the merged one. If the requests are
254640b4f539SKevin Wolf             // overlapping, drop the last sectors of the first request.
254740b4f539SKevin Wolf             size = (reqs[i].sector - reqs[outidx].sector) << 9;
254840b4f539SKevin Wolf             qemu_iovec_concat(qiov, reqs[outidx].qiov, size);
254940b4f539SKevin Wolf 
255040b4f539SKevin Wolf             // We might need to add some zeros between the two requests
255140b4f539SKevin Wolf             if (reqs[i].sector > oldreq_last) {
255240b4f539SKevin Wolf                 size_t zero_bytes = (reqs[i].sector - oldreq_last) << 9;
255340b4f539SKevin Wolf                 uint8_t *buf = qemu_blockalign(bs, zero_bytes);
255440b4f539SKevin Wolf                 memset(buf, 0, zero_bytes);
255540b4f539SKevin Wolf                 qemu_iovec_add(qiov, buf, zero_bytes);
255640b4f539SKevin Wolf                 mcb->callbacks[i].free_buf = buf;
255740b4f539SKevin Wolf             }
255840b4f539SKevin Wolf 
255940b4f539SKevin Wolf             // Add the second request
256040b4f539SKevin Wolf             qemu_iovec_concat(qiov, reqs[i].qiov, reqs[i].qiov->size);
256140b4f539SKevin Wolf 
2562cbf1dff2SKevin Wolf             reqs[outidx].nb_sectors = qiov->size >> 9;
256340b4f539SKevin Wolf             reqs[outidx].qiov = qiov;
256440b4f539SKevin Wolf 
256540b4f539SKevin Wolf             mcb->callbacks[i].free_qiov = reqs[outidx].qiov;
256640b4f539SKevin Wolf         } else {
256740b4f539SKevin Wolf             outidx++;
256840b4f539SKevin Wolf             reqs[outidx].sector     = reqs[i].sector;
256940b4f539SKevin Wolf             reqs[outidx].nb_sectors = reqs[i].nb_sectors;
257040b4f539SKevin Wolf             reqs[outidx].qiov       = reqs[i].qiov;
257140b4f539SKevin Wolf         }
257240b4f539SKevin Wolf     }
257340b4f539SKevin Wolf 
257440b4f539SKevin Wolf     return outidx + 1;
257540b4f539SKevin Wolf }
257640b4f539SKevin Wolf 
257740b4f539SKevin Wolf /*
257840b4f539SKevin Wolf  * Submit multiple AIO write requests at once.
257940b4f539SKevin Wolf  *
258040b4f539SKevin Wolf  * On success, the function returns 0 and all requests in the reqs array have
258140b4f539SKevin Wolf  * been submitted. In error case this function returns -1, and any of the
258240b4f539SKevin Wolf  * requests may or may not be submitted yet. In particular, this means that the
258340b4f539SKevin Wolf  * callback will be called for some of the requests, for others it won't. The
258440b4f539SKevin Wolf  * caller must check the error field of the BlockRequest to wait for the right
258540b4f539SKevin Wolf  * callbacks (if error != 0, no callback will be called).
258640b4f539SKevin Wolf  *
258740b4f539SKevin Wolf  * The implementation may modify the contents of the reqs array, e.g. to merge
258840b4f539SKevin Wolf  * requests. However, the fields opaque and error are left unmodified as they
258940b4f539SKevin Wolf  * are used to signal failure for a single request to the caller.
259040b4f539SKevin Wolf  */
259140b4f539SKevin Wolf int bdrv_aio_multiwrite(BlockDriverState *bs, BlockRequest *reqs, int num_reqs)
259240b4f539SKevin Wolf {
259340b4f539SKevin Wolf     BlockDriverAIOCB *acb;
259440b4f539SKevin Wolf     MultiwriteCB *mcb;
259540b4f539SKevin Wolf     int i;
259640b4f539SKevin Wolf 
2597301db7c2SRyan Harper     /* don't submit writes if we don't have a medium */
2598301db7c2SRyan Harper     if (bs->drv == NULL) {
2599301db7c2SRyan Harper         for (i = 0; i < num_reqs; i++) {
2600301db7c2SRyan Harper             reqs[i].error = -ENOMEDIUM;
2601301db7c2SRyan Harper         }
2602301db7c2SRyan Harper         return -1;
2603301db7c2SRyan Harper     }
2604301db7c2SRyan Harper 
260540b4f539SKevin Wolf     if (num_reqs == 0) {
260640b4f539SKevin Wolf         return 0;
260740b4f539SKevin Wolf     }
260840b4f539SKevin Wolf 
260940b4f539SKevin Wolf     // Create MultiwriteCB structure
26107267c094SAnthony Liguori     mcb = g_malloc0(sizeof(*mcb) + num_reqs * sizeof(*mcb->callbacks));
261140b4f539SKevin Wolf     mcb->num_requests = 0;
261240b4f539SKevin Wolf     mcb->num_callbacks = num_reqs;
261340b4f539SKevin Wolf 
261440b4f539SKevin Wolf     for (i = 0; i < num_reqs; i++) {
261540b4f539SKevin Wolf         mcb->callbacks[i].cb = reqs[i].cb;
261640b4f539SKevin Wolf         mcb->callbacks[i].opaque = reqs[i].opaque;
261740b4f539SKevin Wolf     }
261840b4f539SKevin Wolf 
261940b4f539SKevin Wolf     // Check for mergable requests
262040b4f539SKevin Wolf     num_reqs = multiwrite_merge(bs, reqs, num_reqs, mcb);
262140b4f539SKevin Wolf 
26226d519a5fSStefan Hajnoczi     trace_bdrv_aio_multiwrite(mcb, mcb->num_callbacks, num_reqs);
26236d519a5fSStefan Hajnoczi 
2624453f9a16SKevin Wolf     /*
2625453f9a16SKevin Wolf      * Run the aio requests. As soon as one request can't be submitted
2626453f9a16SKevin Wolf      * successfully, fail all requests that are not yet submitted (we must
2627453f9a16SKevin Wolf      * return failure for all requests anyway)
2628453f9a16SKevin Wolf      *
2629453f9a16SKevin Wolf      * num_requests cannot be set to the right value immediately: If
2630453f9a16SKevin Wolf      * bdrv_aio_writev fails for some request, num_requests would be too high
2631453f9a16SKevin Wolf      * and therefore multiwrite_cb() would never recognize the multiwrite
2632453f9a16SKevin Wolf      * request as completed. We also cannot use the loop variable i to set it
2633453f9a16SKevin Wolf      * when the first request fails because the callback may already have been
2634453f9a16SKevin Wolf      * called for previously submitted requests. Thus, num_requests must be
2635453f9a16SKevin Wolf      * incremented for each request that is submitted.
2636453f9a16SKevin Wolf      *
2637453f9a16SKevin Wolf      * The problem that callbacks may be called early also means that we need
2638453f9a16SKevin Wolf      * to take care that num_requests doesn't become 0 before all requests are
2639453f9a16SKevin Wolf      * submitted - multiwrite_cb() would consider the multiwrite request
2640453f9a16SKevin Wolf      * completed. A dummy request that is "completed" by a manual call to
2641453f9a16SKevin Wolf      * multiwrite_cb() takes care of this.
2642453f9a16SKevin Wolf      */
2643453f9a16SKevin Wolf     mcb->num_requests = 1;
2644453f9a16SKevin Wolf 
26456d519a5fSStefan Hajnoczi     // Run the aio requests
264640b4f539SKevin Wolf     for (i = 0; i < num_reqs; i++) {
2647453f9a16SKevin Wolf         mcb->num_requests++;
264840b4f539SKevin Wolf         acb = bdrv_aio_writev(bs, reqs[i].sector, reqs[i].qiov,
264940b4f539SKevin Wolf             reqs[i].nb_sectors, multiwrite_cb, mcb);
265040b4f539SKevin Wolf 
265140b4f539SKevin Wolf         if (acb == NULL) {
265240b4f539SKevin Wolf             // We can only fail the whole thing if no request has been
265340b4f539SKevin Wolf             // submitted yet. Otherwise we'll wait for the submitted AIOs to
265440b4f539SKevin Wolf             // complete and report the error in the callback.
2655453f9a16SKevin Wolf             if (i == 0) {
26566d519a5fSStefan Hajnoczi                 trace_bdrv_aio_multiwrite_earlyfail(mcb);
265740b4f539SKevin Wolf                 goto fail;
265840b4f539SKevin Wolf             } else {
26596d519a5fSStefan Hajnoczi                 trace_bdrv_aio_multiwrite_latefail(mcb, i);
26607eb58a6cSKevin Wolf                 multiwrite_cb(mcb, -EIO);
266140b4f539SKevin Wolf                 break;
266240b4f539SKevin Wolf             }
266340b4f539SKevin Wolf         }
266440b4f539SKevin Wolf     }
266540b4f539SKevin Wolf 
2666453f9a16SKevin Wolf     /* Complete the dummy request */
2667453f9a16SKevin Wolf     multiwrite_cb(mcb, 0);
2668453f9a16SKevin Wolf 
266940b4f539SKevin Wolf     return 0;
267040b4f539SKevin Wolf 
267140b4f539SKevin Wolf fail:
2672453f9a16SKevin Wolf     for (i = 0; i < mcb->num_callbacks; i++) {
2673453f9a16SKevin Wolf         reqs[i].error = -EIO;
2674453f9a16SKevin Wolf     }
26757267c094SAnthony Liguori     g_free(mcb);
267640b4f539SKevin Wolf     return -1;
267740b4f539SKevin Wolf }
267840b4f539SKevin Wolf 
2679b2e12bc6SChristoph Hellwig BlockDriverAIOCB *bdrv_aio_flush(BlockDriverState *bs,
2680b2e12bc6SChristoph Hellwig         BlockDriverCompletionFunc *cb, void *opaque)
2681b2e12bc6SChristoph Hellwig {
2682b2e12bc6SChristoph Hellwig     BlockDriver *drv = bs->drv;
2683b2e12bc6SChristoph Hellwig 
2684a13aac04SStefan Hajnoczi     trace_bdrv_aio_flush(bs, opaque);
2685a13aac04SStefan Hajnoczi 
2686016f5cf6SAlexander Graf     if (bs->open_flags & BDRV_O_NO_FLUSH) {
2687016f5cf6SAlexander Graf         return bdrv_aio_noop_em(bs, cb, opaque);
2688016f5cf6SAlexander Graf     }
2689016f5cf6SAlexander Graf 
2690b2e12bc6SChristoph Hellwig     if (!drv)
2691b2e12bc6SChristoph Hellwig         return NULL;
2692b2e12bc6SChristoph Hellwig     return drv->bdrv_aio_flush(bs, cb, opaque);
2693b2e12bc6SChristoph Hellwig }
2694b2e12bc6SChristoph Hellwig 
269583f64091Sbellard void bdrv_aio_cancel(BlockDriverAIOCB *acb)
269683f64091Sbellard {
26976bbff9a0Saliguori     acb->pool->cancel(acb);
269883f64091Sbellard }
269983f64091Sbellard 
270083f64091Sbellard 
270183f64091Sbellard /**************************************************************/
270283f64091Sbellard /* async block device emulation */
270383f64091Sbellard 
2704c16b5a2cSChristoph Hellwig typedef struct BlockDriverAIOCBSync {
2705c16b5a2cSChristoph Hellwig     BlockDriverAIOCB common;
2706c16b5a2cSChristoph Hellwig     QEMUBH *bh;
2707c16b5a2cSChristoph Hellwig     int ret;
2708c16b5a2cSChristoph Hellwig     /* vector translation state */
2709c16b5a2cSChristoph Hellwig     QEMUIOVector *qiov;
2710c16b5a2cSChristoph Hellwig     uint8_t *bounce;
2711c16b5a2cSChristoph Hellwig     int is_write;
2712c16b5a2cSChristoph Hellwig } BlockDriverAIOCBSync;
2713c16b5a2cSChristoph Hellwig 
2714c16b5a2cSChristoph Hellwig static void bdrv_aio_cancel_em(BlockDriverAIOCB *blockacb)
2715c16b5a2cSChristoph Hellwig {
2716b666d239SKevin Wolf     BlockDriverAIOCBSync *acb =
2717b666d239SKevin Wolf         container_of(blockacb, BlockDriverAIOCBSync, common);
27186a7ad299SDor Laor     qemu_bh_delete(acb->bh);
271936afc451SAvi Kivity     acb->bh = NULL;
2720c16b5a2cSChristoph Hellwig     qemu_aio_release(acb);
2721c16b5a2cSChristoph Hellwig }
2722c16b5a2cSChristoph Hellwig 
2723c16b5a2cSChristoph Hellwig static AIOPool bdrv_em_aio_pool = {
2724c16b5a2cSChristoph Hellwig     .aiocb_size         = sizeof(BlockDriverAIOCBSync),
2725c16b5a2cSChristoph Hellwig     .cancel             = bdrv_aio_cancel_em,
2726c16b5a2cSChristoph Hellwig };
2727c16b5a2cSChristoph Hellwig 
272883f64091Sbellard static void bdrv_aio_bh_cb(void *opaque)
2729beac80cdSbellard {
2730ce1a14dcSpbrook     BlockDriverAIOCBSync *acb = opaque;
2731f141eafeSaliguori 
2732f141eafeSaliguori     if (!acb->is_write)
2733f141eafeSaliguori         qemu_iovec_from_buffer(acb->qiov, acb->bounce, acb->qiov->size);
2734ceb42de8Saliguori     qemu_vfree(acb->bounce);
2735ce1a14dcSpbrook     acb->common.cb(acb->common.opaque, acb->ret);
27366a7ad299SDor Laor     qemu_bh_delete(acb->bh);
273736afc451SAvi Kivity     acb->bh = NULL;
2738ce1a14dcSpbrook     qemu_aio_release(acb);
2739beac80cdSbellard }
2740beac80cdSbellard 
2741f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_rw_vector(BlockDriverState *bs,
2742f141eafeSaliguori                                             int64_t sector_num,
2743f141eafeSaliguori                                             QEMUIOVector *qiov,
2744f141eafeSaliguori                                             int nb_sectors,
2745f141eafeSaliguori                                             BlockDriverCompletionFunc *cb,
2746f141eafeSaliguori                                             void *opaque,
2747f141eafeSaliguori                                             int is_write)
2748f141eafeSaliguori 
2749ea2384d3Sbellard {
2750ce1a14dcSpbrook     BlockDriverAIOCBSync *acb;
275183f64091Sbellard 
2752c16b5a2cSChristoph Hellwig     acb = qemu_aio_get(&bdrv_em_aio_pool, bs, cb, opaque);
2753f141eafeSaliguori     acb->is_write = is_write;
2754f141eafeSaliguori     acb->qiov = qiov;
2755e268ca52Saliguori     acb->bounce = qemu_blockalign(bs, qiov->size);
2756f141eafeSaliguori 
2757ce1a14dcSpbrook     if (!acb->bh)
2758ce1a14dcSpbrook         acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
2759f141eafeSaliguori 
2760f141eafeSaliguori     if (is_write) {
2761f141eafeSaliguori         qemu_iovec_to_buffer(acb->qiov, acb->bounce);
27621ed20acfSStefan Hajnoczi         acb->ret = bs->drv->bdrv_write(bs, sector_num, acb->bounce, nb_sectors);
2763f141eafeSaliguori     } else {
27641ed20acfSStefan Hajnoczi         acb->ret = bs->drv->bdrv_read(bs, sector_num, acb->bounce, nb_sectors);
2765f141eafeSaliguori     }
2766f141eafeSaliguori 
2767ce1a14dcSpbrook     qemu_bh_schedule(acb->bh);
2768f141eafeSaliguori 
2769ce1a14dcSpbrook     return &acb->common;
27707a6cba61Spbrook }
27717a6cba61Spbrook 
2772f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_readv_em(BlockDriverState *bs,
2773f141eafeSaliguori         int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
2774ce1a14dcSpbrook         BlockDriverCompletionFunc *cb, void *opaque)
277583f64091Sbellard {
2776f141eafeSaliguori     return bdrv_aio_rw_vector(bs, sector_num, qiov, nb_sectors, cb, opaque, 0);
277783f64091Sbellard }
277883f64091Sbellard 
2779f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_writev_em(BlockDriverState *bs,
2780f141eafeSaliguori         int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
2781f141eafeSaliguori         BlockDriverCompletionFunc *cb, void *opaque)
2782f141eafeSaliguori {
2783f141eafeSaliguori     return bdrv_aio_rw_vector(bs, sector_num, qiov, nb_sectors, cb, opaque, 1);
2784f141eafeSaliguori }
2785f141eafeSaliguori 
278668485420SKevin Wolf 
278768485420SKevin Wolf typedef struct BlockDriverAIOCBCoroutine {
278868485420SKevin Wolf     BlockDriverAIOCB common;
278968485420SKevin Wolf     BlockRequest req;
279068485420SKevin Wolf     bool is_write;
279168485420SKevin Wolf     QEMUBH* bh;
279268485420SKevin Wolf } BlockDriverAIOCBCoroutine;
279368485420SKevin Wolf 
279468485420SKevin Wolf static void bdrv_aio_co_cancel_em(BlockDriverAIOCB *blockacb)
279568485420SKevin Wolf {
279668485420SKevin Wolf     qemu_aio_flush();
279768485420SKevin Wolf }
279868485420SKevin Wolf 
279968485420SKevin Wolf static AIOPool bdrv_em_co_aio_pool = {
280068485420SKevin Wolf     .aiocb_size         = sizeof(BlockDriverAIOCBCoroutine),
280168485420SKevin Wolf     .cancel             = bdrv_aio_co_cancel_em,
280268485420SKevin Wolf };
280368485420SKevin Wolf 
280468485420SKevin Wolf static void bdrv_co_rw_bh(void *opaque)
280568485420SKevin Wolf {
280668485420SKevin Wolf     BlockDriverAIOCBCoroutine *acb = opaque;
280768485420SKevin Wolf 
280868485420SKevin Wolf     acb->common.cb(acb->common.opaque, acb->req.error);
280968485420SKevin Wolf     qemu_bh_delete(acb->bh);
281068485420SKevin Wolf     qemu_aio_release(acb);
281168485420SKevin Wolf }
281268485420SKevin Wolf 
281368485420SKevin Wolf static void coroutine_fn bdrv_co_rw(void *opaque)
281468485420SKevin Wolf {
281568485420SKevin Wolf     BlockDriverAIOCBCoroutine *acb = opaque;
281668485420SKevin Wolf     BlockDriverState *bs = acb->common.bs;
281768485420SKevin Wolf 
281868485420SKevin Wolf     if (!acb->is_write) {
281968485420SKevin Wolf         acb->req.error = bs->drv->bdrv_co_readv(bs, acb->req.sector,
282068485420SKevin Wolf             acb->req.nb_sectors, acb->req.qiov);
282168485420SKevin Wolf     } else {
282268485420SKevin Wolf         acb->req.error = bs->drv->bdrv_co_writev(bs, acb->req.sector,
282368485420SKevin Wolf             acb->req.nb_sectors, acb->req.qiov);
282468485420SKevin Wolf     }
282568485420SKevin Wolf 
282668485420SKevin Wolf     acb->bh = qemu_bh_new(bdrv_co_rw_bh, acb);
282768485420SKevin Wolf     qemu_bh_schedule(acb->bh);
282868485420SKevin Wolf }
282968485420SKevin Wolf 
283068485420SKevin Wolf static BlockDriverAIOCB *bdrv_co_aio_rw_vector(BlockDriverState *bs,
283168485420SKevin Wolf                                                int64_t sector_num,
283268485420SKevin Wolf                                                QEMUIOVector *qiov,
283368485420SKevin Wolf                                                int nb_sectors,
283468485420SKevin Wolf                                                BlockDriverCompletionFunc *cb,
283568485420SKevin Wolf                                                void *opaque,
283668485420SKevin Wolf                                                bool is_write)
283768485420SKevin Wolf {
283868485420SKevin Wolf     Coroutine *co;
283968485420SKevin Wolf     BlockDriverAIOCBCoroutine *acb;
284068485420SKevin Wolf 
284168485420SKevin Wolf     acb = qemu_aio_get(&bdrv_em_co_aio_pool, bs, cb, opaque);
284268485420SKevin Wolf     acb->req.sector = sector_num;
284368485420SKevin Wolf     acb->req.nb_sectors = nb_sectors;
284468485420SKevin Wolf     acb->req.qiov = qiov;
284568485420SKevin Wolf     acb->is_write = is_write;
284668485420SKevin Wolf 
284768485420SKevin Wolf     co = qemu_coroutine_create(bdrv_co_rw);
284868485420SKevin Wolf     qemu_coroutine_enter(co, acb);
284968485420SKevin Wolf 
285068485420SKevin Wolf     return &acb->common;
285168485420SKevin Wolf }
285268485420SKevin Wolf 
285368485420SKevin Wolf static BlockDriverAIOCB *bdrv_co_aio_readv_em(BlockDriverState *bs,
285468485420SKevin Wolf         int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
285568485420SKevin Wolf         BlockDriverCompletionFunc *cb, void *opaque)
285668485420SKevin Wolf {
285768485420SKevin Wolf     return bdrv_co_aio_rw_vector(bs, sector_num, qiov, nb_sectors, cb, opaque,
285868485420SKevin Wolf                                  false);
285968485420SKevin Wolf }
286068485420SKevin Wolf 
286168485420SKevin Wolf static BlockDriverAIOCB *bdrv_co_aio_writev_em(BlockDriverState *bs,
286268485420SKevin Wolf         int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
286368485420SKevin Wolf         BlockDriverCompletionFunc *cb, void *opaque)
286468485420SKevin Wolf {
286568485420SKevin Wolf     return bdrv_co_aio_rw_vector(bs, sector_num, qiov, nb_sectors, cb, opaque,
286668485420SKevin Wolf                                  true);
286768485420SKevin Wolf }
286868485420SKevin Wolf 
2869b2e12bc6SChristoph Hellwig static BlockDriverAIOCB *bdrv_aio_flush_em(BlockDriverState *bs,
2870b2e12bc6SChristoph Hellwig         BlockDriverCompletionFunc *cb, void *opaque)
2871b2e12bc6SChristoph Hellwig {
2872b2e12bc6SChristoph Hellwig     BlockDriverAIOCBSync *acb;
2873b2e12bc6SChristoph Hellwig 
2874b2e12bc6SChristoph Hellwig     acb = qemu_aio_get(&bdrv_em_aio_pool, bs, cb, opaque);
2875b2e12bc6SChristoph Hellwig     acb->is_write = 1; /* don't bounce in the completion hadler */
2876b2e12bc6SChristoph Hellwig     acb->qiov = NULL;
2877b2e12bc6SChristoph Hellwig     acb->bounce = NULL;
2878b2e12bc6SChristoph Hellwig     acb->ret = 0;
2879b2e12bc6SChristoph Hellwig 
2880b2e12bc6SChristoph Hellwig     if (!acb->bh)
2881b2e12bc6SChristoph Hellwig         acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
2882b2e12bc6SChristoph Hellwig 
2883b2e12bc6SChristoph Hellwig     bdrv_flush(bs);
2884b2e12bc6SChristoph Hellwig     qemu_bh_schedule(acb->bh);
2885b2e12bc6SChristoph Hellwig     return &acb->common;
2886b2e12bc6SChristoph Hellwig }
2887b2e12bc6SChristoph Hellwig 
2888016f5cf6SAlexander Graf static BlockDriverAIOCB *bdrv_aio_noop_em(BlockDriverState *bs,
2889016f5cf6SAlexander Graf         BlockDriverCompletionFunc *cb, void *opaque)
2890016f5cf6SAlexander Graf {
2891016f5cf6SAlexander Graf     BlockDriverAIOCBSync *acb;
2892016f5cf6SAlexander Graf 
2893016f5cf6SAlexander Graf     acb = qemu_aio_get(&bdrv_em_aio_pool, bs, cb, opaque);
2894016f5cf6SAlexander Graf     acb->is_write = 1; /* don't bounce in the completion handler */
2895016f5cf6SAlexander Graf     acb->qiov = NULL;
2896016f5cf6SAlexander Graf     acb->bounce = NULL;
2897016f5cf6SAlexander Graf     acb->ret = 0;
2898016f5cf6SAlexander Graf 
2899016f5cf6SAlexander Graf     if (!acb->bh) {
2900016f5cf6SAlexander Graf         acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
2901016f5cf6SAlexander Graf     }
2902016f5cf6SAlexander Graf 
2903016f5cf6SAlexander Graf     qemu_bh_schedule(acb->bh);
2904016f5cf6SAlexander Graf     return &acb->common;
2905016f5cf6SAlexander Graf }
2906016f5cf6SAlexander Graf 
290783f64091Sbellard /**************************************************************/
290883f64091Sbellard /* sync block device emulation */
290983f64091Sbellard 
/* Completion callback that stores ret into the int that opaque points to. */
static void bdrv_rw_em_cb(void *opaque, int ret)
{
    int *result = opaque;

    *result = ret;
}

/* Value held by the result variable until bdrv_rw_em_cb() overwrites it */
#define NOT_DONE 0x7fffffff
291683f64091Sbellard 
291783f64091Sbellard static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num,
291883f64091Sbellard                         uint8_t *buf, int nb_sectors)
291983f64091Sbellard {
2920ce1a14dcSpbrook     int async_ret;
2921ce1a14dcSpbrook     BlockDriverAIOCB *acb;
2922f141eafeSaliguori     struct iovec iov;
2923f141eafeSaliguori     QEMUIOVector qiov;
292483f64091Sbellard 
292583f64091Sbellard     async_ret = NOT_DONE;
29263f4cb3d3Sblueswir1     iov.iov_base = (void *)buf;
2927eb5a3165SJes Sorensen     iov.iov_len = nb_sectors * BDRV_SECTOR_SIZE;
2928f141eafeSaliguori     qemu_iovec_init_external(&qiov, &iov, 1);
29291ed20acfSStefan Hajnoczi 
29301ed20acfSStefan Hajnoczi     acb = bs->drv->bdrv_aio_readv(bs, sector_num, &qiov, nb_sectors,
293183f64091Sbellard                                   bdrv_rw_em_cb, &async_ret);
293265d6b3d8SKevin Wolf     if (acb == NULL) {
293365d6b3d8SKevin Wolf         async_ret = -1;
293465d6b3d8SKevin Wolf         goto fail;
293565d6b3d8SKevin Wolf     }
2936baf35cb9Saliguori 
293783f64091Sbellard     while (async_ret == NOT_DONE) {
293883f64091Sbellard         qemu_aio_wait();
293983f64091Sbellard     }
2940baf35cb9Saliguori 
294165d6b3d8SKevin Wolf 
294265d6b3d8SKevin Wolf fail:
294383f64091Sbellard     return async_ret;
294483f64091Sbellard }
294583f64091Sbellard 
294683f64091Sbellard static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num,
294783f64091Sbellard                          const uint8_t *buf, int nb_sectors)
294883f64091Sbellard {
2949ce1a14dcSpbrook     int async_ret;
2950ce1a14dcSpbrook     BlockDriverAIOCB *acb;
2951f141eafeSaliguori     struct iovec iov;
2952f141eafeSaliguori     QEMUIOVector qiov;
295383f64091Sbellard 
295483f64091Sbellard     async_ret = NOT_DONE;
2955f141eafeSaliguori     iov.iov_base = (void *)buf;
2956eb5a3165SJes Sorensen     iov.iov_len = nb_sectors * BDRV_SECTOR_SIZE;
2957f141eafeSaliguori     qemu_iovec_init_external(&qiov, &iov, 1);
29581ed20acfSStefan Hajnoczi 
29591ed20acfSStefan Hajnoczi     acb = bs->drv->bdrv_aio_writev(bs, sector_num, &qiov, nb_sectors,
296083f64091Sbellard                                    bdrv_rw_em_cb, &async_ret);
296165d6b3d8SKevin Wolf     if (acb == NULL) {
296265d6b3d8SKevin Wolf         async_ret = -1;
296365d6b3d8SKevin Wolf         goto fail;
296465d6b3d8SKevin Wolf     }
296583f64091Sbellard     while (async_ret == NOT_DONE) {
296683f64091Sbellard         qemu_aio_wait();
296783f64091Sbellard     }
296865d6b3d8SKevin Wolf 
296965d6b3d8SKevin Wolf fail:
297083f64091Sbellard     return async_ret;
297183f64091Sbellard }
2972ea2384d3Sbellard 
2973ea2384d3Sbellard void bdrv_init(void)
2974ea2384d3Sbellard {
29755efa9d5aSAnthony Liguori     module_call_init(MODULE_INIT_BLOCK);
2976ea2384d3Sbellard }
2977ce1a14dcSpbrook 
2978eb852011SMarkus Armbruster void bdrv_init_with_whitelist(void)
2979eb852011SMarkus Armbruster {
2980eb852011SMarkus Armbruster     use_bdrv_whitelist = 1;
2981eb852011SMarkus Armbruster     bdrv_init();
2982eb852011SMarkus Armbruster }
2983eb852011SMarkus Armbruster 
2984c16b5a2cSChristoph Hellwig void *qemu_aio_get(AIOPool *pool, BlockDriverState *bs,
29856bbff9a0Saliguori                    BlockDriverCompletionFunc *cb, void *opaque)
29866bbff9a0Saliguori {
2987ce1a14dcSpbrook     BlockDriverAIOCB *acb;
2988ce1a14dcSpbrook 
29896bbff9a0Saliguori     if (pool->free_aiocb) {
29906bbff9a0Saliguori         acb = pool->free_aiocb;
29916bbff9a0Saliguori         pool->free_aiocb = acb->next;
2992ce1a14dcSpbrook     } else {
29937267c094SAnthony Liguori         acb = g_malloc0(pool->aiocb_size);
29946bbff9a0Saliguori         acb->pool = pool;
2995ce1a14dcSpbrook     }
2996ce1a14dcSpbrook     acb->bs = bs;
2997ce1a14dcSpbrook     acb->cb = cb;
2998ce1a14dcSpbrook     acb->opaque = opaque;
2999ce1a14dcSpbrook     return acb;
3000ce1a14dcSpbrook }
3001ce1a14dcSpbrook 
3002ce1a14dcSpbrook void qemu_aio_release(void *p)
3003ce1a14dcSpbrook {
30046bbff9a0Saliguori     BlockDriverAIOCB *acb = (BlockDriverAIOCB *)p;
30056bbff9a0Saliguori     AIOPool *pool = acb->pool;
30066bbff9a0Saliguori     acb->next = pool->free_aiocb;
30076bbff9a0Saliguori     pool->free_aiocb = acb;
3008ce1a14dcSpbrook }
300919cb3738Sbellard 
301019cb3738Sbellard /**************************************************************/
3011f9f05dc5SKevin Wolf /* Coroutine block device emulation */
3012f9f05dc5SKevin Wolf 
3013f9f05dc5SKevin Wolf typedef struct CoroutineIOCompletion {
3014f9f05dc5SKevin Wolf     Coroutine *coroutine;
3015f9f05dc5SKevin Wolf     int ret;
3016f9f05dc5SKevin Wolf } CoroutineIOCompletion;
3017f9f05dc5SKevin Wolf 
3018f9f05dc5SKevin Wolf static void bdrv_co_io_em_complete(void *opaque, int ret)
3019f9f05dc5SKevin Wolf {
3020f9f05dc5SKevin Wolf     CoroutineIOCompletion *co = opaque;
3021f9f05dc5SKevin Wolf 
3022f9f05dc5SKevin Wolf     co->ret = ret;
3023f9f05dc5SKevin Wolf     qemu_coroutine_enter(co->coroutine, NULL);
3024f9f05dc5SKevin Wolf }
3025f9f05dc5SKevin Wolf 
3026f9f05dc5SKevin Wolf static int coroutine_fn bdrv_co_io_em(BlockDriverState *bs, int64_t sector_num,
3027f9f05dc5SKevin Wolf                                       int nb_sectors, QEMUIOVector *iov,
3028f9f05dc5SKevin Wolf                                       bool is_write)
3029f9f05dc5SKevin Wolf {
3030f9f05dc5SKevin Wolf     CoroutineIOCompletion co = {
3031f9f05dc5SKevin Wolf         .coroutine = qemu_coroutine_self(),
3032f9f05dc5SKevin Wolf     };
3033f9f05dc5SKevin Wolf     BlockDriverAIOCB *acb;
3034f9f05dc5SKevin Wolf 
3035f9f05dc5SKevin Wolf     if (is_write) {
3036a652d160SStefan Hajnoczi         acb = bs->drv->bdrv_aio_writev(bs, sector_num, iov, nb_sectors,
3037f9f05dc5SKevin Wolf                                        bdrv_co_io_em_complete, &co);
3038f9f05dc5SKevin Wolf     } else {
3039a652d160SStefan Hajnoczi         acb = bs->drv->bdrv_aio_readv(bs, sector_num, iov, nb_sectors,
3040f9f05dc5SKevin Wolf                                       bdrv_co_io_em_complete, &co);
3041f9f05dc5SKevin Wolf     }
3042f9f05dc5SKevin Wolf 
304359370aaaSStefan Hajnoczi     trace_bdrv_co_io_em(bs, sector_num, nb_sectors, is_write, acb);
3044f9f05dc5SKevin Wolf     if (!acb) {
3045f9f05dc5SKevin Wolf         return -EIO;
3046f9f05dc5SKevin Wolf     }
3047f9f05dc5SKevin Wolf     qemu_coroutine_yield();
3048f9f05dc5SKevin Wolf 
3049f9f05dc5SKevin Wolf     return co.ret;
3050f9f05dc5SKevin Wolf }
3051f9f05dc5SKevin Wolf 
3052f9f05dc5SKevin Wolf static int coroutine_fn bdrv_co_readv_em(BlockDriverState *bs,
3053f9f05dc5SKevin Wolf                                          int64_t sector_num, int nb_sectors,
3054f9f05dc5SKevin Wolf                                          QEMUIOVector *iov)
3055f9f05dc5SKevin Wolf {
3056f9f05dc5SKevin Wolf     return bdrv_co_io_em(bs, sector_num, nb_sectors, iov, false);
3057f9f05dc5SKevin Wolf }
3058f9f05dc5SKevin Wolf 
3059f9f05dc5SKevin Wolf static int coroutine_fn bdrv_co_writev_em(BlockDriverState *bs,
3060f9f05dc5SKevin Wolf                                          int64_t sector_num, int nb_sectors,
3061f9f05dc5SKevin Wolf                                          QEMUIOVector *iov)
3062f9f05dc5SKevin Wolf {
3063f9f05dc5SKevin Wolf     return bdrv_co_io_em(bs, sector_num, nb_sectors, iov, true);
3064f9f05dc5SKevin Wolf }
3065f9f05dc5SKevin Wolf 
3066e7a8a783SKevin Wolf static int coroutine_fn bdrv_co_flush_em(BlockDriverState *bs)
3067e7a8a783SKevin Wolf {
3068e7a8a783SKevin Wolf     CoroutineIOCompletion co = {
3069e7a8a783SKevin Wolf         .coroutine = qemu_coroutine_self(),
3070e7a8a783SKevin Wolf     };
3071e7a8a783SKevin Wolf     BlockDriverAIOCB *acb;
3072e7a8a783SKevin Wolf 
3073e7a8a783SKevin Wolf     acb = bdrv_aio_flush(bs, bdrv_co_io_em_complete, &co);
3074e7a8a783SKevin Wolf     if (!acb) {
3075e7a8a783SKevin Wolf         return -EIO;
3076e7a8a783SKevin Wolf     }
3077e7a8a783SKevin Wolf     qemu_coroutine_yield();
3078e7a8a783SKevin Wolf     return co.ret;
3079e7a8a783SKevin Wolf }
3080e7a8a783SKevin Wolf 
3081f9f05dc5SKevin Wolf /**************************************************************/
308219cb3738Sbellard /* removable device support */
308319cb3738Sbellard 
308419cb3738Sbellard /**
308519cb3738Sbellard  * Return TRUE if the media is present
308619cb3738Sbellard  */
308719cb3738Sbellard int bdrv_is_inserted(BlockDriverState *bs)
308819cb3738Sbellard {
308919cb3738Sbellard     BlockDriver *drv = bs->drv;
3090a1aff5bfSMarkus Armbruster 
309119cb3738Sbellard     if (!drv)
309219cb3738Sbellard         return 0;
309319cb3738Sbellard     if (!drv->bdrv_is_inserted)
3094a1aff5bfSMarkus Armbruster         return 1;
3095a1aff5bfSMarkus Armbruster     return drv->bdrv_is_inserted(bs);
309619cb3738Sbellard }
309719cb3738Sbellard 
309819cb3738Sbellard /**
30998e49ca46SMarkus Armbruster  * Return whether the media changed since the last call to this
31008e49ca46SMarkus Armbruster  * function, or -ENOTSUP if we don't know.  Most drivers don't know.
310119cb3738Sbellard  */
310219cb3738Sbellard int bdrv_media_changed(BlockDriverState *bs)
310319cb3738Sbellard {
310419cb3738Sbellard     BlockDriver *drv = bs->drv;
310519cb3738Sbellard 
31068e49ca46SMarkus Armbruster     if (drv && drv->bdrv_media_changed) {
31078e49ca46SMarkus Armbruster         return drv->bdrv_media_changed(bs);
31088e49ca46SMarkus Armbruster     }
31098e49ca46SMarkus Armbruster     return -ENOTSUP;
311019cb3738Sbellard }
311119cb3738Sbellard 
311219cb3738Sbellard /**
311319cb3738Sbellard  * If eject_flag is TRUE, eject the media. Otherwise, close the tray
311419cb3738Sbellard  */
3115fdec4404SMarkus Armbruster void bdrv_eject(BlockDriverState *bs, int eject_flag)
311619cb3738Sbellard {
311719cb3738Sbellard     BlockDriver *drv = bs->drv;
311819cb3738Sbellard 
3119822e1cd1SMarkus Armbruster     if (drv && drv->bdrv_eject) {
3120822e1cd1SMarkus Armbruster         drv->bdrv_eject(bs, eject_flag);
312119cb3738Sbellard     }
312219cb3738Sbellard }
312319cb3738Sbellard 
312419cb3738Sbellard /**
312519cb3738Sbellard  * Lock or unlock the media (if it is locked, the user won't be able
312619cb3738Sbellard  * to eject it manually).
312719cb3738Sbellard  */
3128025e849aSMarkus Armbruster void bdrv_lock_medium(BlockDriverState *bs, bool locked)
312919cb3738Sbellard {
313019cb3738Sbellard     BlockDriver *drv = bs->drv;
313119cb3738Sbellard 
3132025e849aSMarkus Armbruster     trace_bdrv_lock_medium(bs, locked);
3133b8c6d095SStefan Hajnoczi 
3134025e849aSMarkus Armbruster     if (drv && drv->bdrv_lock_medium) {
3135025e849aSMarkus Armbruster         drv->bdrv_lock_medium(bs, locked);
313619cb3738Sbellard     }
313719cb3738Sbellard }
3138985a03b0Sths 
3139985a03b0Sths /* needed for generic scsi interface */
3140985a03b0Sths 
3141985a03b0Sths int bdrv_ioctl(BlockDriverState *bs, unsigned long int req, void *buf)
3142985a03b0Sths {
3143985a03b0Sths     BlockDriver *drv = bs->drv;
3144985a03b0Sths 
3145985a03b0Sths     if (drv && drv->bdrv_ioctl)
3146985a03b0Sths         return drv->bdrv_ioctl(bs, req, buf);
3147985a03b0Sths     return -ENOTSUP;
3148985a03b0Sths }
31497d780669Saliguori 
3150221f715dSaliguori BlockDriverAIOCB *bdrv_aio_ioctl(BlockDriverState *bs,
3151221f715dSaliguori         unsigned long int req, void *buf,
31527d780669Saliguori         BlockDriverCompletionFunc *cb, void *opaque)
31537d780669Saliguori {
3154221f715dSaliguori     BlockDriver *drv = bs->drv;
31557d780669Saliguori 
3156221f715dSaliguori     if (drv && drv->bdrv_aio_ioctl)
3157221f715dSaliguori         return drv->bdrv_aio_ioctl(bs, req, buf, cb, opaque);
3158221f715dSaliguori     return NULL;
31597d780669Saliguori }
3160e268ca52Saliguori 
31617b6f9300SMarkus Armbruster void bdrv_set_buffer_alignment(BlockDriverState *bs, int align)
31627b6f9300SMarkus Armbruster {
31637b6f9300SMarkus Armbruster     bs->buffer_alignment = align;
31647b6f9300SMarkus Armbruster }
31657cd1e32aSlirans@il.ibm.com 
3166e268ca52Saliguori void *qemu_blockalign(BlockDriverState *bs, size_t size)
3167e268ca52Saliguori {
3168e268ca52Saliguori     return qemu_memalign((bs && bs->buffer_alignment) ? bs->buffer_alignment : 512, size);
3169e268ca52Saliguori }
31707cd1e32aSlirans@il.ibm.com 
31717cd1e32aSlirans@il.ibm.com void bdrv_set_dirty_tracking(BlockDriverState *bs, int enable)
31727cd1e32aSlirans@il.ibm.com {
31737cd1e32aSlirans@il.ibm.com     int64_t bitmap_size;
3174a55eb92cSJan Kiszka 
3175aaa0eb75SLiran Schour     bs->dirty_count = 0;
31767cd1e32aSlirans@il.ibm.com     if (enable) {
3177c6d22830SJan Kiszka         if (!bs->dirty_bitmap) {
3178c6d22830SJan Kiszka             bitmap_size = (bdrv_getlength(bs) >> BDRV_SECTOR_BITS) +
3179c6d22830SJan Kiszka                     BDRV_SECTORS_PER_DIRTY_CHUNK * 8 - 1;
3180c6d22830SJan Kiszka             bitmap_size /= BDRV_SECTORS_PER_DIRTY_CHUNK * 8;
31817cd1e32aSlirans@il.ibm.com 
31827267c094SAnthony Liguori             bs->dirty_bitmap = g_malloc0(bitmap_size);
31837cd1e32aSlirans@il.ibm.com         }
31847cd1e32aSlirans@il.ibm.com     } else {
3185c6d22830SJan Kiszka         if (bs->dirty_bitmap) {
31867267c094SAnthony Liguori             g_free(bs->dirty_bitmap);
3187c6d22830SJan Kiszka             bs->dirty_bitmap = NULL;
31887cd1e32aSlirans@il.ibm.com         }
31897cd1e32aSlirans@il.ibm.com     }
31907cd1e32aSlirans@il.ibm.com }
31917cd1e32aSlirans@il.ibm.com 
31927cd1e32aSlirans@il.ibm.com int bdrv_get_dirty(BlockDriverState *bs, int64_t sector)
31937cd1e32aSlirans@il.ibm.com {
31946ea44308SJan Kiszka     int64_t chunk = sector / (int64_t)BDRV_SECTORS_PER_DIRTY_CHUNK;
31957cd1e32aSlirans@il.ibm.com 
3196c6d22830SJan Kiszka     if (bs->dirty_bitmap &&
3197c6d22830SJan Kiszka         (sector << BDRV_SECTOR_BITS) < bdrv_getlength(bs)) {
31986d59fec1SMarcelo Tosatti         return !!(bs->dirty_bitmap[chunk / (sizeof(unsigned long) * 8)] &
31996d59fec1SMarcelo Tosatti             (1UL << (chunk % (sizeof(unsigned long) * 8))));
32007cd1e32aSlirans@il.ibm.com     } else {
32017cd1e32aSlirans@il.ibm.com         return 0;
32027cd1e32aSlirans@il.ibm.com     }
32037cd1e32aSlirans@il.ibm.com }
32047cd1e32aSlirans@il.ibm.com 
32057cd1e32aSlirans@il.ibm.com void bdrv_reset_dirty(BlockDriverState *bs, int64_t cur_sector,
32067cd1e32aSlirans@il.ibm.com                       int nr_sectors)
32077cd1e32aSlirans@il.ibm.com {
32087cd1e32aSlirans@il.ibm.com     set_dirty_bitmap(bs, cur_sector, nr_sectors, 0);
32097cd1e32aSlirans@il.ibm.com }
3210aaa0eb75SLiran Schour 
3211aaa0eb75SLiran Schour int64_t bdrv_get_dirty_count(BlockDriverState *bs)
3212aaa0eb75SLiran Schour {
3213aaa0eb75SLiran Schour     return bs->dirty_count;
3214aaa0eb75SLiran Schour }
3215f88e1a42SJes Sorensen 
3216db593f25SMarcelo Tosatti void bdrv_set_in_use(BlockDriverState *bs, int in_use)
3217db593f25SMarcelo Tosatti {
3218db593f25SMarcelo Tosatti     assert(bs->in_use != in_use);
3219db593f25SMarcelo Tosatti     bs->in_use = in_use;
3220db593f25SMarcelo Tosatti }
3221db593f25SMarcelo Tosatti 
3222db593f25SMarcelo Tosatti int bdrv_in_use(BlockDriverState *bs)
3223db593f25SMarcelo Tosatti {
3224db593f25SMarcelo Tosatti     return bs->in_use;
3225db593f25SMarcelo Tosatti }
3226db593f25SMarcelo Tosatti 
322728a7282aSLuiz Capitulino void bdrv_iostatus_enable(BlockDriverState *bs)
322828a7282aSLuiz Capitulino {
322928a7282aSLuiz Capitulino     bs->iostatus = BDRV_IOS_OK;
323028a7282aSLuiz Capitulino }
323128a7282aSLuiz Capitulino 
323228a7282aSLuiz Capitulino /* The I/O status is only enabled if the drive explicitly
323328a7282aSLuiz Capitulino  * enables it _and_ the VM is configured to stop on errors */
323428a7282aSLuiz Capitulino bool bdrv_iostatus_is_enabled(const BlockDriverState *bs)
323528a7282aSLuiz Capitulino {
323628a7282aSLuiz Capitulino     return (bs->iostatus != BDRV_IOS_INVAL &&
323728a7282aSLuiz Capitulino            (bs->on_write_error == BLOCK_ERR_STOP_ENOSPC ||
323828a7282aSLuiz Capitulino             bs->on_write_error == BLOCK_ERR_STOP_ANY    ||
323928a7282aSLuiz Capitulino             bs->on_read_error == BLOCK_ERR_STOP_ANY));
324028a7282aSLuiz Capitulino }
324128a7282aSLuiz Capitulino 
324228a7282aSLuiz Capitulino void bdrv_iostatus_disable(BlockDriverState *bs)
324328a7282aSLuiz Capitulino {
324428a7282aSLuiz Capitulino     bs->iostatus = BDRV_IOS_INVAL;
324528a7282aSLuiz Capitulino }
324628a7282aSLuiz Capitulino 
324728a7282aSLuiz Capitulino void bdrv_iostatus_reset(BlockDriverState *bs)
324828a7282aSLuiz Capitulino {
324928a7282aSLuiz Capitulino     if (bdrv_iostatus_is_enabled(bs)) {
325028a7282aSLuiz Capitulino         bs->iostatus = BDRV_IOS_OK;
325128a7282aSLuiz Capitulino     }
325228a7282aSLuiz Capitulino }
325328a7282aSLuiz Capitulino 
325428a7282aSLuiz Capitulino /* XXX: Today this is set by device models because it makes the implementation
325528a7282aSLuiz Capitulino    quite simple. However, the block layer knows about the error, so it's
325628a7282aSLuiz Capitulino    possible to implement this without device models being involved */
325728a7282aSLuiz Capitulino void bdrv_iostatus_set_err(BlockDriverState *bs, int error)
325828a7282aSLuiz Capitulino {
325928a7282aSLuiz Capitulino     if (bdrv_iostatus_is_enabled(bs) && bs->iostatus == BDRV_IOS_OK) {
326028a7282aSLuiz Capitulino         assert(error >= 0);
326128a7282aSLuiz Capitulino         bs->iostatus = error == ENOSPC ? BDRV_IOS_ENOSPC : BDRV_IOS_FAILED;
326228a7282aSLuiz Capitulino     }
326328a7282aSLuiz Capitulino }
326428a7282aSLuiz Capitulino 
3265a597e79cSChristoph Hellwig void
3266a597e79cSChristoph Hellwig bdrv_acct_start(BlockDriverState *bs, BlockAcctCookie *cookie, int64_t bytes,
3267a597e79cSChristoph Hellwig         enum BlockAcctType type)
3268a597e79cSChristoph Hellwig {
3269a597e79cSChristoph Hellwig     assert(type < BDRV_MAX_IOTYPE);
3270a597e79cSChristoph Hellwig 
3271a597e79cSChristoph Hellwig     cookie->bytes = bytes;
3272c488c7f6SChristoph Hellwig     cookie->start_time_ns = get_clock();
3273a597e79cSChristoph Hellwig     cookie->type = type;
3274a597e79cSChristoph Hellwig }
3275a597e79cSChristoph Hellwig 
3276a597e79cSChristoph Hellwig void
3277a597e79cSChristoph Hellwig bdrv_acct_done(BlockDriverState *bs, BlockAcctCookie *cookie)
3278a597e79cSChristoph Hellwig {
3279a597e79cSChristoph Hellwig     assert(cookie->type < BDRV_MAX_IOTYPE);
3280a597e79cSChristoph Hellwig 
3281a597e79cSChristoph Hellwig     bs->nr_bytes[cookie->type] += cookie->bytes;
3282a597e79cSChristoph Hellwig     bs->nr_ops[cookie->type]++;
3283c488c7f6SChristoph Hellwig     bs->total_time_ns[cookie->type] += get_clock() - cookie->start_time_ns;
3284a597e79cSChristoph Hellwig }
3285a597e79cSChristoph Hellwig 
3286f88e1a42SJes Sorensen int bdrv_img_create(const char *filename, const char *fmt,
3287f88e1a42SJes Sorensen                     const char *base_filename, const char *base_fmt,
3288f88e1a42SJes Sorensen                     char *options, uint64_t img_size, int flags)
3289f88e1a42SJes Sorensen {
3290f88e1a42SJes Sorensen     QEMUOptionParameter *param = NULL, *create_options = NULL;
3291d220894eSKevin Wolf     QEMUOptionParameter *backing_fmt, *backing_file, *size;
3292f88e1a42SJes Sorensen     BlockDriverState *bs = NULL;
3293f88e1a42SJes Sorensen     BlockDriver *drv, *proto_drv;
329496df67d1SStefan Hajnoczi     BlockDriver *backing_drv = NULL;
3295f88e1a42SJes Sorensen     int ret = 0;
3296f88e1a42SJes Sorensen 
3297f88e1a42SJes Sorensen     /* Find driver and parse its options */
3298f88e1a42SJes Sorensen     drv = bdrv_find_format(fmt);
3299f88e1a42SJes Sorensen     if (!drv) {
3300f88e1a42SJes Sorensen         error_report("Unknown file format '%s'", fmt);
33014f70f249SJes Sorensen         ret = -EINVAL;
3302f88e1a42SJes Sorensen         goto out;
3303f88e1a42SJes Sorensen     }
3304f88e1a42SJes Sorensen 
3305f88e1a42SJes Sorensen     proto_drv = bdrv_find_protocol(filename);
3306f88e1a42SJes Sorensen     if (!proto_drv) {
3307f88e1a42SJes Sorensen         error_report("Unknown protocol '%s'", filename);
33084f70f249SJes Sorensen         ret = -EINVAL;
3309f88e1a42SJes Sorensen         goto out;
3310f88e1a42SJes Sorensen     }
3311f88e1a42SJes Sorensen 
3312f88e1a42SJes Sorensen     create_options = append_option_parameters(create_options,
3313f88e1a42SJes Sorensen                                               drv->create_options);
3314f88e1a42SJes Sorensen     create_options = append_option_parameters(create_options,
3315f88e1a42SJes Sorensen                                               proto_drv->create_options);
3316f88e1a42SJes Sorensen 
3317f88e1a42SJes Sorensen     /* Create parameter list with default values */
3318f88e1a42SJes Sorensen     param = parse_option_parameters("", create_options, param);
3319f88e1a42SJes Sorensen 
3320f88e1a42SJes Sorensen     set_option_parameter_int(param, BLOCK_OPT_SIZE, img_size);
3321f88e1a42SJes Sorensen 
3322f88e1a42SJes Sorensen     /* Parse -o options */
3323f88e1a42SJes Sorensen     if (options) {
3324f88e1a42SJes Sorensen         param = parse_option_parameters(options, create_options, param);
3325f88e1a42SJes Sorensen         if (param == NULL) {
3326f88e1a42SJes Sorensen             error_report("Invalid options for file format '%s'.", fmt);
33274f70f249SJes Sorensen             ret = -EINVAL;
3328f88e1a42SJes Sorensen             goto out;
3329f88e1a42SJes Sorensen         }
3330f88e1a42SJes Sorensen     }
3331f88e1a42SJes Sorensen 
3332f88e1a42SJes Sorensen     if (base_filename) {
3333f88e1a42SJes Sorensen         if (set_option_parameter(param, BLOCK_OPT_BACKING_FILE,
3334f88e1a42SJes Sorensen                                  base_filename)) {
3335f88e1a42SJes Sorensen             error_report("Backing file not supported for file format '%s'",
3336f88e1a42SJes Sorensen                          fmt);
33374f70f249SJes Sorensen             ret = -EINVAL;
3338f88e1a42SJes Sorensen             goto out;
3339f88e1a42SJes Sorensen         }
3340f88e1a42SJes Sorensen     }
3341f88e1a42SJes Sorensen 
3342f88e1a42SJes Sorensen     if (base_fmt) {
3343f88e1a42SJes Sorensen         if (set_option_parameter(param, BLOCK_OPT_BACKING_FMT, base_fmt)) {
3344f88e1a42SJes Sorensen             error_report("Backing file format not supported for file "
3345f88e1a42SJes Sorensen                          "format '%s'", fmt);
33464f70f249SJes Sorensen             ret = -EINVAL;
3347f88e1a42SJes Sorensen             goto out;
3348f88e1a42SJes Sorensen         }
3349f88e1a42SJes Sorensen     }
3350f88e1a42SJes Sorensen 
3351792da93aSJes Sorensen     backing_file = get_option_parameter(param, BLOCK_OPT_BACKING_FILE);
3352792da93aSJes Sorensen     if (backing_file && backing_file->value.s) {
3353792da93aSJes Sorensen         if (!strcmp(filename, backing_file->value.s)) {
3354792da93aSJes Sorensen             error_report("Error: Trying to create an image with the "
3355792da93aSJes Sorensen                          "same filename as the backing file");
33564f70f249SJes Sorensen             ret = -EINVAL;
3357792da93aSJes Sorensen             goto out;
3358792da93aSJes Sorensen         }
3359792da93aSJes Sorensen     }
3360792da93aSJes Sorensen 
3361f88e1a42SJes Sorensen     backing_fmt = get_option_parameter(param, BLOCK_OPT_BACKING_FMT);
3362f88e1a42SJes Sorensen     if (backing_fmt && backing_fmt->value.s) {
336396df67d1SStefan Hajnoczi         backing_drv = bdrv_find_format(backing_fmt->value.s);
336496df67d1SStefan Hajnoczi         if (!backing_drv) {
3365f88e1a42SJes Sorensen             error_report("Unknown backing file format '%s'",
3366f88e1a42SJes Sorensen                          backing_fmt->value.s);
33674f70f249SJes Sorensen             ret = -EINVAL;
3368f88e1a42SJes Sorensen             goto out;
3369f88e1a42SJes Sorensen         }
3370f88e1a42SJes Sorensen     }
3371f88e1a42SJes Sorensen 
3372f88e1a42SJes Sorensen     // The size for the image must always be specified, with one exception:
3373f88e1a42SJes Sorensen     // If we are using a backing file, we can obtain the size from there
3374d220894eSKevin Wolf     size = get_option_parameter(param, BLOCK_OPT_SIZE);
3375d220894eSKevin Wolf     if (size && size->value.n == -1) {
3376f88e1a42SJes Sorensen         if (backing_file && backing_file->value.s) {
3377f88e1a42SJes Sorensen             uint64_t size;
3378f88e1a42SJes Sorensen             char buf[32];
3379f88e1a42SJes Sorensen 
3380f88e1a42SJes Sorensen             bs = bdrv_new("");
3381f88e1a42SJes Sorensen 
338296df67d1SStefan Hajnoczi             ret = bdrv_open(bs, backing_file->value.s, flags, backing_drv);
3383f88e1a42SJes Sorensen             if (ret < 0) {
338496df67d1SStefan Hajnoczi                 error_report("Could not open '%s'", backing_file->value.s);
3385f88e1a42SJes Sorensen                 goto out;
3386f88e1a42SJes Sorensen             }
3387f88e1a42SJes Sorensen             bdrv_get_geometry(bs, &size);
3388f88e1a42SJes Sorensen             size *= 512;
3389f88e1a42SJes Sorensen 
3390f88e1a42SJes Sorensen             snprintf(buf, sizeof(buf), "%" PRId64, size);
3391f88e1a42SJes Sorensen             set_option_parameter(param, BLOCK_OPT_SIZE, buf);
3392f88e1a42SJes Sorensen         } else {
3393f88e1a42SJes Sorensen             error_report("Image creation needs a size parameter");
33944f70f249SJes Sorensen             ret = -EINVAL;
3395f88e1a42SJes Sorensen             goto out;
3396f88e1a42SJes Sorensen         }
3397f88e1a42SJes Sorensen     }
3398f88e1a42SJes Sorensen 
3399f88e1a42SJes Sorensen     printf("Formatting '%s', fmt=%s ", filename, fmt);
3400f88e1a42SJes Sorensen     print_option_parameters(param);
3401f88e1a42SJes Sorensen     puts("");
3402f88e1a42SJes Sorensen 
3403f88e1a42SJes Sorensen     ret = bdrv_create(drv, filename, param);
3404f88e1a42SJes Sorensen 
3405f88e1a42SJes Sorensen     if (ret < 0) {
3406f88e1a42SJes Sorensen         if (ret == -ENOTSUP) {
3407f88e1a42SJes Sorensen             error_report("Formatting or formatting option not supported for "
3408f88e1a42SJes Sorensen                          "file format '%s'", fmt);
3409f88e1a42SJes Sorensen         } else if (ret == -EFBIG) {
3410f88e1a42SJes Sorensen             error_report("The image size is too large for file format '%s'",
3411f88e1a42SJes Sorensen                          fmt);
3412f88e1a42SJes Sorensen         } else {
3413f88e1a42SJes Sorensen             error_report("%s: error while creating %s: %s", filename, fmt,
3414f88e1a42SJes Sorensen                          strerror(-ret));
3415f88e1a42SJes Sorensen         }
3416f88e1a42SJes Sorensen     }
3417f88e1a42SJes Sorensen 
3418f88e1a42SJes Sorensen out:
3419f88e1a42SJes Sorensen     free_option_parameters(create_options);
3420f88e1a42SJes Sorensen     free_option_parameters(param);
3421f88e1a42SJes Sorensen 
3422f88e1a42SJes Sorensen     if (bs) {
3423f88e1a42SJes Sorensen         bdrv_delete(bs);
3424f88e1a42SJes Sorensen     }
34254f70f249SJes Sorensen 
34264f70f249SJes Sorensen     return ret;
3427f88e1a42SJes Sorensen }
3428