1fc01f7e7Sbellard /* 2fc01f7e7Sbellard * QEMU System Emulator block driver 3fc01f7e7Sbellard * 4fc01f7e7Sbellard * Copyright (c) 2003 Fabrice Bellard 5fc01f7e7Sbellard * 6fc01f7e7Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7fc01f7e7Sbellard * of this software and associated documentation files (the "Software"), to deal 8fc01f7e7Sbellard * in the Software without restriction, including without limitation the rights 9fc01f7e7Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10fc01f7e7Sbellard * copies of the Software, and to permit persons to whom the Software is 11fc01f7e7Sbellard * furnished to do so, subject to the following conditions: 12fc01f7e7Sbellard * 13fc01f7e7Sbellard * The above copyright notice and this permission notice shall be included in 14fc01f7e7Sbellard * all copies or substantial portions of the Software. 15fc01f7e7Sbellard * 16fc01f7e7Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17fc01f7e7Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18fc01f7e7Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19fc01f7e7Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20fc01f7e7Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21fc01f7e7Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22fc01f7e7Sbellard * THE SOFTWARE. 23fc01f7e7Sbellard */ 243990d09aSblueswir1 #include "config-host.h" 25faf07963Spbrook #include "qemu-common.h" 266d519a5fSStefan Hajnoczi #include "trace.h" 27376253ecSaliguori #include "monitor.h" 28ea2384d3Sbellard #include "block_int.h" 295efa9d5aSAnthony Liguori #include "module.h" 30d15e5465SLuiz Capitulino #include "qemu-objects.h" 31fc01f7e7Sbellard 3271e72a19SJuan Quintela #ifdef CONFIG_BSD 337674e7bfSbellard #include <sys/types.h> 347674e7bfSbellard #include <sys/stat.h> 357674e7bfSbellard #include <sys/ioctl.h> 3672cf2d4fSBlue Swirl #include <sys/queue.h> 37c5e97233Sblueswir1 #ifndef __DragonFly__ 387674e7bfSbellard #include <sys/disk.h> 397674e7bfSbellard #endif 40c5e97233Sblueswir1 #endif 417674e7bfSbellard 4249dc768dSaliguori #ifdef _WIN32 4349dc768dSaliguori #include <windows.h> 4449dc768dSaliguori #endif 4549dc768dSaliguori 46f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_readv_em(BlockDriverState *bs, 47f141eafeSaliguori int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, 48c87c0672Saliguori BlockDriverCompletionFunc *cb, void *opaque); 49f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_writev_em(BlockDriverState *bs, 50f141eafeSaliguori int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, 51ce1a14dcSpbrook BlockDriverCompletionFunc *cb, void *opaque); 52b2e12bc6SChristoph Hellwig static BlockDriverAIOCB *bdrv_aio_flush_em(BlockDriverState *bs, 53b2e12bc6SChristoph Hellwig BlockDriverCompletionFunc *cb, void *opaque); 54016f5cf6SAlexander Graf static BlockDriverAIOCB *bdrv_aio_noop_em(BlockDriverState *bs, 55016f5cf6SAlexander Graf BlockDriverCompletionFunc *cb, void *opaque); 5683f64091Sbellard static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num, 5783f64091Sbellard uint8_t *buf, int nb_sectors); 5883f64091Sbellard static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num, 5983f64091Sbellard const uint8_t *buf, int nb_sectors); 60ec530c81Sbellard 611b7bdbc1SStefan Hajnoczi static QTAILQ_HEAD(, BlockDriverState) bdrv_states = 621b7bdbc1SStefan Hajnoczi QTAILQ_HEAD_INITIALIZER(bdrv_states); 637ee930d0Sblueswir1 648a22f02aSStefan Hajnoczi static QLIST_HEAD(, BlockDriver) bdrv_drivers = 658a22f02aSStefan Hajnoczi QLIST_HEAD_INITIALIZER(bdrv_drivers); 66ea2384d3Sbellard 67f9092b10SMarkus Armbruster /* The device to use for VM snapshots */ 68f9092b10SMarkus Armbruster static BlockDriverState *bs_snapshots; 69f9092b10SMarkus Armbruster 70eb852011SMarkus Armbruster /* If non-zero, use only whitelisted block drivers */ 71eb852011SMarkus Armbruster static int use_bdrv_whitelist; 72eb852011SMarkus Armbruster 739e0b22f4SStefan Hajnoczi #ifdef _WIN32 749e0b22f4SStefan Hajnoczi static int is_windows_drive_prefix(const char *filename) 759e0b22f4SStefan Hajnoczi { 769e0b22f4SStefan Hajnoczi return (((filename[0] >= 'a' && filename[0] <= 'z') || 779e0b22f4SStefan Hajnoczi (filename[0] >= 'A' && filename[0] <= 'Z')) && 789e0b22f4SStefan Hajnoczi filename[1] == ':'); 799e0b22f4SStefan Hajnoczi } 809e0b22f4SStefan Hajnoczi 819e0b22f4SStefan Hajnoczi int is_windows_drive(const char *filename) 829e0b22f4SStefan Hajnoczi { 839e0b22f4SStefan Hajnoczi if (is_windows_drive_prefix(filename) && 849e0b22f4SStefan Hajnoczi filename[2] == '\0') 859e0b22f4SStefan Hajnoczi return 1; 869e0b22f4SStefan Hajnoczi if (strstart(filename, "\\\\.\\", NULL) || 879e0b22f4SStefan Hajnoczi strstart(filename, "//./", NULL)) 889e0b22f4SStefan Hajnoczi return 1; 899e0b22f4SStefan Hajnoczi return 0; 909e0b22f4SStefan Hajnoczi } 919e0b22f4SStefan Hajnoczi #endif 929e0b22f4SStefan Hajnoczi 939e0b22f4SStefan Hajnoczi /* check if the path starts with "<protocol>:" */ 949e0b22f4SStefan Hajnoczi static int path_has_protocol(const char *path) 959e0b22f4SStefan Hajnoczi { 969e0b22f4SStefan Hajnoczi #ifdef _WIN32 979e0b22f4SStefan Hajnoczi if (is_windows_drive(path) || 989e0b22f4SStefan Hajnoczi is_windows_drive_prefix(path)) { 999e0b22f4SStefan Hajnoczi return 0; 1009e0b22f4SStefan Hajnoczi } 1019e0b22f4SStefan Hajnoczi #endif 1029e0b22f4SStefan Hajnoczi 1039e0b22f4SStefan Hajnoczi return strchr(path, ':') != NULL; 1049e0b22f4SStefan Hajnoczi } 1059e0b22f4SStefan Hajnoczi 10683f64091Sbellard int path_is_absolute(const char *path) 10783f64091Sbellard { 10883f64091Sbellard const char *p; 10921664424Sbellard #ifdef _WIN32 11021664424Sbellard /* specific case for names like: "\\.\d:" */ 11121664424Sbellard if (*path == '/' || *path == '\\') 11221664424Sbellard return 1; 11321664424Sbellard #endif 11483f64091Sbellard p = strchr(path, ':'); 11583f64091Sbellard if (p) 11683f64091Sbellard p++; 11783f64091Sbellard else 11883f64091Sbellard p = path; 1193b9f94e1Sbellard #ifdef _WIN32 1203b9f94e1Sbellard return (*p == '/' || *p == '\\'); 1213b9f94e1Sbellard #else 1223b9f94e1Sbellard return (*p == '/'); 1233b9f94e1Sbellard #endif 12483f64091Sbellard } 12583f64091Sbellard 12683f64091Sbellard /* if filename is absolute, just copy it to dest. Otherwise, build a 12783f64091Sbellard path to it by considering it is relative to base_path. URL are 12883f64091Sbellard supported. */ 12983f64091Sbellard void path_combine(char *dest, int dest_size, 13083f64091Sbellard const char *base_path, 13183f64091Sbellard const char *filename) 13283f64091Sbellard { 13383f64091Sbellard const char *p, *p1; 13483f64091Sbellard int len; 13583f64091Sbellard 13683f64091Sbellard if (dest_size <= 0) 13783f64091Sbellard return; 13883f64091Sbellard if (path_is_absolute(filename)) { 13983f64091Sbellard pstrcpy(dest, dest_size, filename); 14083f64091Sbellard } else { 14183f64091Sbellard p = strchr(base_path, ':'); 14283f64091Sbellard if (p) 14383f64091Sbellard p++; 14483f64091Sbellard else 14583f64091Sbellard p = base_path; 1463b9f94e1Sbellard p1 = strrchr(base_path, '/'); 1473b9f94e1Sbellard #ifdef _WIN32 1483b9f94e1Sbellard { 1493b9f94e1Sbellard const char *p2; 1503b9f94e1Sbellard p2 = strrchr(base_path, '\\'); 1513b9f94e1Sbellard if (!p1 || p2 > p1) 1523b9f94e1Sbellard p1 = p2; 1533b9f94e1Sbellard } 1543b9f94e1Sbellard #endif 15583f64091Sbellard if (p1) 15683f64091Sbellard p1++; 15783f64091Sbellard else 15883f64091Sbellard p1 = base_path; 15983f64091Sbellard if (p1 > p) 16083f64091Sbellard p = p1; 16183f64091Sbellard len = p - base_path; 16283f64091Sbellard if (len > dest_size - 1) 16383f64091Sbellard len = dest_size - 1; 16483f64091Sbellard memcpy(dest, base_path, len); 16583f64091Sbellard dest[len] = '\0'; 16683f64091Sbellard pstrcat(dest, dest_size, filename); 16783f64091Sbellard } 16883f64091Sbellard } 16983f64091Sbellard 1705efa9d5aSAnthony Liguori void bdrv_register(BlockDriver *bdrv) 171ea2384d3Sbellard { 172f141eafeSaliguori if (!bdrv->bdrv_aio_readv) { 17383f64091Sbellard /* add AIO emulation layer */ 174f141eafeSaliguori bdrv->bdrv_aio_readv = bdrv_aio_readv_em; 175f141eafeSaliguori bdrv->bdrv_aio_writev = bdrv_aio_writev_em; 176eda578e5Saliguori } else if (!bdrv->bdrv_read) { 17783f64091Sbellard /* add synchronous IO emulation layer */ 17883f64091Sbellard bdrv->bdrv_read = bdrv_read_em; 17983f64091Sbellard bdrv->bdrv_write = bdrv_write_em; 18083f64091Sbellard } 181b2e12bc6SChristoph Hellwig 182b2e12bc6SChristoph Hellwig if (!bdrv->bdrv_aio_flush) 183b2e12bc6SChristoph Hellwig bdrv->bdrv_aio_flush = bdrv_aio_flush_em; 184b2e12bc6SChristoph Hellwig 1858a22f02aSStefan Hajnoczi QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list); 186ea2384d3Sbellard } 187b338082bSbellard 188b338082bSbellard /* create a new block device (by default it is empty) */ 189b338082bSbellard BlockDriverState *bdrv_new(const char *device_name) 190fc01f7e7Sbellard { 1911b7bdbc1SStefan Hajnoczi BlockDriverState *bs; 192b338082bSbellard 193b338082bSbellard bs = qemu_mallocz(sizeof(BlockDriverState)); 194b338082bSbellard pstrcpy(bs->device_name, sizeof(bs->device_name), device_name); 195ea2384d3Sbellard if (device_name[0] != '\0') { 1961b7bdbc1SStefan Hajnoczi QTAILQ_INSERT_TAIL(&bdrv_states, bs, list); 197ea2384d3Sbellard } 198b338082bSbellard return bs; 199b338082bSbellard } 200b338082bSbellard 201ea2384d3Sbellard BlockDriver *bdrv_find_format(const char *format_name) 202ea2384d3Sbellard { 203ea2384d3Sbellard BlockDriver *drv1; 2048a22f02aSStefan Hajnoczi QLIST_FOREACH(drv1, &bdrv_drivers, list) { 2058a22f02aSStefan Hajnoczi if (!strcmp(drv1->format_name, format_name)) { 206ea2384d3Sbellard return drv1; 207ea2384d3Sbellard } 2088a22f02aSStefan Hajnoczi } 209ea2384d3Sbellard return NULL; 210ea2384d3Sbellard } 211ea2384d3Sbellard 212eb852011SMarkus Armbruster static int bdrv_is_whitelisted(BlockDriver *drv) 213eb852011SMarkus Armbruster { 214eb852011SMarkus Armbruster static const char *whitelist[] = { 215eb852011SMarkus Armbruster CONFIG_BDRV_WHITELIST 216eb852011SMarkus Armbruster }; 217eb852011SMarkus Armbruster const char **p; 218eb852011SMarkus Armbruster 219eb852011SMarkus Armbruster if (!whitelist[0]) 220eb852011SMarkus Armbruster return 1; /* no whitelist, anything goes */ 221eb852011SMarkus Armbruster 222eb852011SMarkus Armbruster for (p = whitelist; *p; p++) { 223eb852011SMarkus Armbruster if (!strcmp(drv->format_name, *p)) { 224eb852011SMarkus Armbruster return 1; 225eb852011SMarkus Armbruster } 226eb852011SMarkus Armbruster } 227eb852011SMarkus Armbruster return 0; 228eb852011SMarkus Armbruster } 229eb852011SMarkus Armbruster 230eb852011SMarkus Armbruster BlockDriver *bdrv_find_whitelisted_format(const char *format_name) 231eb852011SMarkus Armbruster { 232eb852011SMarkus Armbruster BlockDriver *drv = bdrv_find_format(format_name); 233eb852011SMarkus Armbruster return drv && bdrv_is_whitelisted(drv) ? drv : NULL; 234eb852011SMarkus Armbruster } 235eb852011SMarkus Armbruster 2360e7e1989SKevin Wolf int bdrv_create(BlockDriver *drv, const char* filename, 2370e7e1989SKevin Wolf QEMUOptionParameter *options) 238ea2384d3Sbellard { 239ea2384d3Sbellard if (!drv->bdrv_create) 240ea2384d3Sbellard return -ENOTSUP; 2410e7e1989SKevin Wolf 2420e7e1989SKevin Wolf return drv->bdrv_create(filename, options); 243ea2384d3Sbellard } 244ea2384d3Sbellard 24584a12e66SChristoph Hellwig int bdrv_create_file(const char* filename, QEMUOptionParameter *options) 24684a12e66SChristoph Hellwig { 24784a12e66SChristoph Hellwig BlockDriver *drv; 24884a12e66SChristoph Hellwig 249b50cbabcSMORITA Kazutaka drv = bdrv_find_protocol(filename); 25084a12e66SChristoph Hellwig if (drv == NULL) { 25116905d71SStefan Hajnoczi return -ENOENT; 25284a12e66SChristoph Hellwig } 25384a12e66SChristoph Hellwig 25484a12e66SChristoph Hellwig return bdrv_create(drv, filename, options); 25584a12e66SChristoph Hellwig } 25684a12e66SChristoph Hellwig 257d5249393Sbellard #ifdef _WIN32 25895389c86Sbellard void get_tmp_filename(char *filename, int size) 259d5249393Sbellard { 2603b9f94e1Sbellard char temp_dir[MAX_PATH]; 2613b9f94e1Sbellard 2623b9f94e1Sbellard GetTempPath(MAX_PATH, temp_dir); 2633b9f94e1Sbellard GetTempFileName(temp_dir, "qem", 0, filename); 264d5249393Sbellard } 265d5249393Sbellard #else 26695389c86Sbellard void get_tmp_filename(char *filename, int size) 267ea2384d3Sbellard { 268ea2384d3Sbellard int fd; 2697ccfb2ebSblueswir1 const char *tmpdir; 270d5249393Sbellard /* XXX: race condition possible */ 2710badc1eeSaurel32 tmpdir = getenv("TMPDIR"); 2720badc1eeSaurel32 if (!tmpdir) 2730badc1eeSaurel32 tmpdir = "/tmp"; 2740badc1eeSaurel32 snprintf(filename, size, "%s/vl.XXXXXX", tmpdir); 275ea2384d3Sbellard fd = mkstemp(filename); 276ea2384d3Sbellard close(fd); 277ea2384d3Sbellard } 278d5249393Sbellard #endif 279ea2384d3Sbellard 280f3a5d3f8SChristoph Hellwig /* 281f3a5d3f8SChristoph Hellwig * Detect host devices. By convention, /dev/cdrom[N] is always 282f3a5d3f8SChristoph Hellwig * recognized as a host CDROM. 283f3a5d3f8SChristoph Hellwig */ 284f3a5d3f8SChristoph Hellwig static BlockDriver *find_hdev_driver(const char *filename) 285f3a5d3f8SChristoph Hellwig { 286508c7cb3SChristoph Hellwig int score_max = 0, score; 287508c7cb3SChristoph Hellwig BlockDriver *drv = NULL, *d; 288f3a5d3f8SChristoph Hellwig 2898a22f02aSStefan Hajnoczi QLIST_FOREACH(d, &bdrv_drivers, list) { 290508c7cb3SChristoph Hellwig if (d->bdrv_probe_device) { 291508c7cb3SChristoph Hellwig score = d->bdrv_probe_device(filename); 292508c7cb3SChristoph Hellwig if (score > score_max) { 293508c7cb3SChristoph Hellwig score_max = score; 294508c7cb3SChristoph Hellwig drv = d; 295f3a5d3f8SChristoph Hellwig } 296508c7cb3SChristoph Hellwig } 297f3a5d3f8SChristoph Hellwig } 298f3a5d3f8SChristoph Hellwig 299508c7cb3SChristoph Hellwig return drv; 300f3a5d3f8SChristoph Hellwig } 301f3a5d3f8SChristoph Hellwig 302b50cbabcSMORITA Kazutaka BlockDriver *bdrv_find_protocol(const char *filename) 30384a12e66SChristoph Hellwig { 30484a12e66SChristoph Hellwig BlockDriver *drv1; 30584a12e66SChristoph Hellwig char protocol[128]; 30684a12e66SChristoph Hellwig int len; 30784a12e66SChristoph Hellwig const char *p; 30884a12e66SChristoph Hellwig 30966f82ceeSKevin Wolf /* TODO Drivers without bdrv_file_open must be specified explicitly */ 31066f82ceeSKevin Wolf 31139508e7aSChristoph Hellwig /* 31239508e7aSChristoph Hellwig * XXX(hch): we really should not let host device detection 31339508e7aSChristoph Hellwig * override an explicit protocol specification, but moving this 31439508e7aSChristoph Hellwig * later breaks access to device names with colons in them. 31539508e7aSChristoph Hellwig * Thanks to the brain-dead persistent naming schemes on udev- 31639508e7aSChristoph Hellwig * based Linux systems those actually are quite common. 31739508e7aSChristoph Hellwig */ 31884a12e66SChristoph Hellwig drv1 = find_hdev_driver(filename); 31939508e7aSChristoph Hellwig if (drv1) { 32084a12e66SChristoph Hellwig return drv1; 32184a12e66SChristoph Hellwig } 32239508e7aSChristoph Hellwig 3239e0b22f4SStefan Hajnoczi if (!path_has_protocol(filename)) { 32439508e7aSChristoph Hellwig return bdrv_find_format("file"); 32539508e7aSChristoph Hellwig } 3269e0b22f4SStefan Hajnoczi p = strchr(filename, ':'); 3279e0b22f4SStefan Hajnoczi assert(p != NULL); 32884a12e66SChristoph Hellwig len = p - filename; 32984a12e66SChristoph Hellwig if (len > sizeof(protocol) - 1) 33084a12e66SChristoph Hellwig len = sizeof(protocol) - 1; 33184a12e66SChristoph Hellwig memcpy(protocol, filename, len); 33284a12e66SChristoph Hellwig protocol[len] = '\0'; 33384a12e66SChristoph Hellwig QLIST_FOREACH(drv1, &bdrv_drivers, list) { 33484a12e66SChristoph Hellwig if (drv1->protocol_name && 33584a12e66SChristoph Hellwig !strcmp(drv1->protocol_name, protocol)) { 33684a12e66SChristoph Hellwig return drv1; 33784a12e66SChristoph Hellwig } 33884a12e66SChristoph Hellwig } 33984a12e66SChristoph Hellwig return NULL; 34084a12e66SChristoph Hellwig } 34184a12e66SChristoph Hellwig 342c98ac35dSStefan Weil static int find_image_format(const char *filename, BlockDriver **pdrv) 343ea2384d3Sbellard { 34483f64091Sbellard int ret, score, score_max; 345ea2384d3Sbellard BlockDriver *drv1, *drv; 34683f64091Sbellard uint8_t buf[2048]; 34783f64091Sbellard BlockDriverState *bs; 348ea2384d3Sbellard 349f5edb014SNaphtali Sprei ret = bdrv_file_open(&bs, filename, 0); 350c98ac35dSStefan Weil if (ret < 0) { 351c98ac35dSStefan Weil *pdrv = NULL; 352c98ac35dSStefan Weil return ret; 353c98ac35dSStefan Weil } 354f8ea0b00SNicholas Bellinger 35508a00559SKevin Wolf /* Return the raw BlockDriver * to scsi-generic devices or empty drives */ 35608a00559SKevin Wolf if (bs->sg || !bdrv_is_inserted(bs)) { 3571a396859SNicholas A. Bellinger bdrv_delete(bs); 358c98ac35dSStefan Weil drv = bdrv_find_format("raw"); 359c98ac35dSStefan Weil if (!drv) { 360c98ac35dSStefan Weil ret = -ENOENT; 361c98ac35dSStefan Weil } 362c98ac35dSStefan Weil *pdrv = drv; 363c98ac35dSStefan Weil return ret; 3641a396859SNicholas A. Bellinger } 365f8ea0b00SNicholas Bellinger 36683f64091Sbellard ret = bdrv_pread(bs, 0, buf, sizeof(buf)); 36783f64091Sbellard bdrv_delete(bs); 368ea2384d3Sbellard if (ret < 0) { 369c98ac35dSStefan Weil *pdrv = NULL; 370c98ac35dSStefan Weil return ret; 371ea2384d3Sbellard } 372ea2384d3Sbellard 373ea2384d3Sbellard score_max = 0; 37484a12e66SChristoph Hellwig drv = NULL; 3758a22f02aSStefan Hajnoczi QLIST_FOREACH(drv1, &bdrv_drivers, list) { 37683f64091Sbellard if (drv1->bdrv_probe) { 377ea2384d3Sbellard score = drv1->bdrv_probe(buf, ret, filename); 378ea2384d3Sbellard if (score > score_max) { 379ea2384d3Sbellard score_max = score; 380ea2384d3Sbellard drv = drv1; 381ea2384d3Sbellard } 382ea2384d3Sbellard } 38383f64091Sbellard } 384c98ac35dSStefan Weil if (!drv) { 385c98ac35dSStefan Weil ret = -ENOENT; 386c98ac35dSStefan Weil } 387c98ac35dSStefan Weil *pdrv = drv; 388c98ac35dSStefan Weil return ret; 389ea2384d3Sbellard } 390ea2384d3Sbellard 39151762288SStefan Hajnoczi /** 39251762288SStefan Hajnoczi * Set the current 'total_sectors' value 39351762288SStefan Hajnoczi */ 39451762288SStefan Hajnoczi static int refresh_total_sectors(BlockDriverState *bs, int64_t hint) 39551762288SStefan Hajnoczi { 39651762288SStefan Hajnoczi BlockDriver *drv = bs->drv; 39751762288SStefan Hajnoczi 398396759adSNicholas Bellinger /* Do not attempt drv->bdrv_getlength() on scsi-generic devices */ 399396759adSNicholas Bellinger if (bs->sg) 400396759adSNicholas Bellinger return 0; 401396759adSNicholas Bellinger 40251762288SStefan Hajnoczi /* query actual device if possible, otherwise just trust the hint */ 40351762288SStefan Hajnoczi if (drv->bdrv_getlength) { 40451762288SStefan Hajnoczi int64_t length = drv->bdrv_getlength(bs); 40551762288SStefan Hajnoczi if (length < 0) { 40651762288SStefan Hajnoczi return length; 40751762288SStefan Hajnoczi } 40851762288SStefan Hajnoczi hint = length >> BDRV_SECTOR_BITS; 40951762288SStefan Hajnoczi } 41051762288SStefan Hajnoczi 41151762288SStefan Hajnoczi bs->total_sectors = hint; 41251762288SStefan Hajnoczi return 0; 41351762288SStefan Hajnoczi } 41451762288SStefan Hajnoczi 415b6ce07aaSKevin Wolf /* 41657915332SKevin Wolf * Common part for opening disk images and files 41757915332SKevin Wolf */ 41857915332SKevin Wolf static int bdrv_open_common(BlockDriverState *bs, const char *filename, 41957915332SKevin Wolf int flags, BlockDriver *drv) 42057915332SKevin Wolf { 42157915332SKevin Wolf int ret, open_flags; 42257915332SKevin Wolf 42357915332SKevin Wolf assert(drv != NULL); 42457915332SKevin Wolf 42566f82ceeSKevin Wolf bs->file = NULL; 42651762288SStefan Hajnoczi bs->total_sectors = 0; 42757915332SKevin Wolf bs->encrypted = 0; 42857915332SKevin Wolf bs->valid_key = 0; 42957915332SKevin Wolf bs->open_flags = flags; 43057915332SKevin Wolf /* buffer_alignment defaulted to 512, drivers can change this value */ 43157915332SKevin Wolf bs->buffer_alignment = 512; 43257915332SKevin Wolf 43357915332SKevin Wolf pstrcpy(bs->filename, sizeof(bs->filename), filename); 43457915332SKevin Wolf 43557915332SKevin Wolf if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv)) { 43657915332SKevin Wolf return -ENOTSUP; 43757915332SKevin Wolf } 43857915332SKevin Wolf 43957915332SKevin Wolf bs->drv = drv; 44057915332SKevin Wolf bs->opaque = qemu_mallocz(drv->instance_size); 44157915332SKevin Wolf 442a6599793SChristoph Hellwig if (flags & BDRV_O_CACHE_WB) 44357915332SKevin Wolf bs->enable_write_cache = 1; 44457915332SKevin Wolf 44557915332SKevin Wolf /* 44657915332SKevin Wolf * Clear flags that are internal to the block layer before opening the 44757915332SKevin Wolf * image. 44857915332SKevin Wolf */ 44957915332SKevin Wolf open_flags = flags & ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING); 45057915332SKevin Wolf 45157915332SKevin Wolf /* 452ebabb67aSStefan Weil * Snapshots should be writable. 45357915332SKevin Wolf */ 45457915332SKevin Wolf if (bs->is_temporary) { 45557915332SKevin Wolf open_flags |= BDRV_O_RDWR; 45657915332SKevin Wolf } 45757915332SKevin Wolf 45866f82ceeSKevin Wolf /* Open the image, either directly or using a protocol */ 45966f82ceeSKevin Wolf if (drv->bdrv_file_open) { 46066f82ceeSKevin Wolf ret = drv->bdrv_file_open(bs, filename, open_flags); 46166f82ceeSKevin Wolf } else { 46266f82ceeSKevin Wolf ret = bdrv_file_open(&bs->file, filename, open_flags); 46366f82ceeSKevin Wolf if (ret >= 0) { 46466f82ceeSKevin Wolf ret = drv->bdrv_open(bs, open_flags); 46566f82ceeSKevin Wolf } 46666f82ceeSKevin Wolf } 46766f82ceeSKevin Wolf 46857915332SKevin Wolf if (ret < 0) { 46957915332SKevin Wolf goto free_and_fail; 47057915332SKevin Wolf } 47157915332SKevin Wolf 47257915332SKevin Wolf bs->keep_read_only = bs->read_only = !(open_flags & BDRV_O_RDWR); 47351762288SStefan Hajnoczi 47451762288SStefan Hajnoczi ret = refresh_total_sectors(bs, bs->total_sectors); 47551762288SStefan Hajnoczi if (ret < 0) { 47651762288SStefan Hajnoczi goto free_and_fail; 47757915332SKevin Wolf } 47851762288SStefan Hajnoczi 47957915332SKevin Wolf #ifndef _WIN32 48057915332SKevin Wolf if (bs->is_temporary) { 48157915332SKevin Wolf unlink(filename); 48257915332SKevin Wolf } 48357915332SKevin Wolf #endif 48457915332SKevin Wolf return 0; 48557915332SKevin Wolf 48657915332SKevin Wolf free_and_fail: 48766f82ceeSKevin Wolf if (bs->file) { 48866f82ceeSKevin Wolf bdrv_delete(bs->file); 48966f82ceeSKevin Wolf bs->file = NULL; 49066f82ceeSKevin Wolf } 49157915332SKevin Wolf qemu_free(bs->opaque); 49257915332SKevin Wolf bs->opaque = NULL; 49357915332SKevin Wolf bs->drv = NULL; 49457915332SKevin Wolf return ret; 49557915332SKevin Wolf } 49657915332SKevin Wolf 49757915332SKevin Wolf /* 498b6ce07aaSKevin Wolf * Opens a file using a protocol (file, host_device, nbd, ...) 499b6ce07aaSKevin Wolf */ 50083f64091Sbellard int bdrv_file_open(BlockDriverState **pbs, const char *filename, int flags) 501b338082bSbellard { 50283f64091Sbellard BlockDriverState *bs; 5036db95603SChristoph Hellwig BlockDriver *drv; 50483f64091Sbellard int ret; 5053b0d4f61Sbellard 506b50cbabcSMORITA Kazutaka drv = bdrv_find_protocol(filename); 5076db95603SChristoph Hellwig if (!drv) { 5086db95603SChristoph Hellwig return -ENOENT; 5096db95603SChristoph Hellwig } 5106db95603SChristoph Hellwig 51183f64091Sbellard bs = bdrv_new(""); 512b6ce07aaSKevin Wolf ret = bdrv_open_common(bs, filename, flags, drv); 51383f64091Sbellard if (ret < 0) { 51483f64091Sbellard bdrv_delete(bs); 51583f64091Sbellard return ret; 5163b0d4f61Sbellard } 51771d0770cSaliguori bs->growable = 1; 51883f64091Sbellard *pbs = bs; 51983f64091Sbellard return 0; 5203b0d4f61Sbellard } 5213b0d4f61Sbellard 522b6ce07aaSKevin Wolf /* 523b6ce07aaSKevin Wolf * Opens a disk image (raw, qcow2, vmdk, ...) 524b6ce07aaSKevin Wolf */ 525d6e9098eSKevin Wolf int bdrv_open(BlockDriverState *bs, const char *filename, int flags, 526ea2384d3Sbellard BlockDriver *drv) 527ea2384d3Sbellard { 528b6ce07aaSKevin Wolf int ret; 52933e3963eSbellard 53083f64091Sbellard if (flags & BDRV_O_SNAPSHOT) { 531ea2384d3Sbellard BlockDriverState *bs1; 532ea2384d3Sbellard int64_t total_size; 5337c96d46eSaliguori int is_protocol = 0; 53491a073a9SKevin Wolf BlockDriver *bdrv_qcow2; 53591a073a9SKevin Wolf QEMUOptionParameter *options; 536b6ce07aaSKevin Wolf char tmp_filename[PATH_MAX]; 537b6ce07aaSKevin Wolf char backing_filename[PATH_MAX]; 53833e3963eSbellard 539ea2384d3Sbellard /* if snapshot, we create a temporary backing file and open it 540ea2384d3Sbellard instead of opening 'filename' directly */ 541ea2384d3Sbellard 542ea2384d3Sbellard /* if there is a backing file, use it */ 543ea2384d3Sbellard bs1 = bdrv_new(""); 544d6e9098eSKevin Wolf ret = bdrv_open(bs1, filename, 0, drv); 54551d7c00cSaliguori if (ret < 0) { 546ea2384d3Sbellard bdrv_delete(bs1); 54751d7c00cSaliguori return ret; 548ea2384d3Sbellard } 5493e82990bSJes Sorensen total_size = bdrv_getlength(bs1) & BDRV_SECTOR_MASK; 5507c96d46eSaliguori 5517c96d46eSaliguori if (bs1->drv && bs1->drv->protocol_name) 5527c96d46eSaliguori is_protocol = 1; 5537c96d46eSaliguori 554ea2384d3Sbellard bdrv_delete(bs1); 555ea2384d3Sbellard 556ea2384d3Sbellard get_tmp_filename(tmp_filename, sizeof(tmp_filename)); 5577c96d46eSaliguori 5587c96d46eSaliguori /* Real path is meaningless for protocols */ 5597c96d46eSaliguori if (is_protocol) 5607c96d46eSaliguori snprintf(backing_filename, sizeof(backing_filename), 5617c96d46eSaliguori "%s", filename); 562114cdfa9SKirill A. Shutemov else if (!realpath(filename, backing_filename)) 563114cdfa9SKirill A. Shutemov return -errno; 5647c96d46eSaliguori 56591a073a9SKevin Wolf bdrv_qcow2 = bdrv_find_format("qcow2"); 56691a073a9SKevin Wolf options = parse_option_parameters("", bdrv_qcow2->create_options, NULL); 56791a073a9SKevin Wolf 5683e82990bSJes Sorensen set_option_parameter_int(options, BLOCK_OPT_SIZE, total_size); 56991a073a9SKevin Wolf set_option_parameter(options, BLOCK_OPT_BACKING_FILE, backing_filename); 57091a073a9SKevin Wolf if (drv) { 57191a073a9SKevin Wolf set_option_parameter(options, BLOCK_OPT_BACKING_FMT, 57291a073a9SKevin Wolf drv->format_name); 57391a073a9SKevin Wolf } 57491a073a9SKevin Wolf 57591a073a9SKevin Wolf ret = bdrv_create(bdrv_qcow2, tmp_filename, options); 576d748768cSJan Kiszka free_option_parameters(options); 57751d7c00cSaliguori if (ret < 0) { 57851d7c00cSaliguori return ret; 579ea2384d3Sbellard } 58091a073a9SKevin Wolf 581ea2384d3Sbellard filename = tmp_filename; 58291a073a9SKevin Wolf drv = bdrv_qcow2; 583ea2384d3Sbellard bs->is_temporary = 1; 584ea2384d3Sbellard } 585ea2384d3Sbellard 586b6ce07aaSKevin Wolf /* Find the right image format driver */ 5876db95603SChristoph Hellwig if (!drv) { 588c98ac35dSStefan Weil ret = find_image_format(filename, &drv); 589ea2384d3Sbellard } 5906987307cSChristoph Hellwig 59151d7c00cSaliguori if (!drv) { 59251d7c00cSaliguori goto unlink_and_fail; 59383f64091Sbellard } 594b6ce07aaSKevin Wolf 595b6ce07aaSKevin Wolf /* Open the image */ 596b6ce07aaSKevin Wolf ret = bdrv_open_common(bs, filename, flags, drv); 597b6ce07aaSKevin Wolf if (ret < 0) { 5986987307cSChristoph Hellwig goto unlink_and_fail; 5996987307cSChristoph Hellwig } 6006987307cSChristoph Hellwig 601b6ce07aaSKevin Wolf /* If there is a backing file, use it */ 602b6ce07aaSKevin Wolf if ((flags & BDRV_O_NO_BACKING) == 0 && bs->backing_file[0] != '\0') { 603b6ce07aaSKevin Wolf char backing_filename[PATH_MAX]; 604b6ce07aaSKevin Wolf int back_flags; 605b6ce07aaSKevin Wolf BlockDriver *back_drv = NULL; 606b6ce07aaSKevin Wolf 607b6ce07aaSKevin Wolf bs->backing_hd = bdrv_new(""); 608df2dbb4aSStefan Hajnoczi 609df2dbb4aSStefan Hajnoczi if (path_has_protocol(bs->backing_file)) { 610df2dbb4aSStefan Hajnoczi pstrcpy(backing_filename, sizeof(backing_filename), 611df2dbb4aSStefan Hajnoczi bs->backing_file); 612df2dbb4aSStefan Hajnoczi } else { 613b6ce07aaSKevin Wolf path_combine(backing_filename, sizeof(backing_filename), 614b6ce07aaSKevin Wolf filename, bs->backing_file); 615df2dbb4aSStefan Hajnoczi } 616df2dbb4aSStefan Hajnoczi 617df2dbb4aSStefan Hajnoczi if (bs->backing_format[0] != '\0') { 618b6ce07aaSKevin Wolf back_drv = bdrv_find_format(bs->backing_format); 619df2dbb4aSStefan Hajnoczi } 620b6ce07aaSKevin Wolf 621b6ce07aaSKevin Wolf /* backing files always opened read-only */ 622b6ce07aaSKevin Wolf back_flags = 623b6ce07aaSKevin Wolf flags & ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING); 624b6ce07aaSKevin Wolf 625b6ce07aaSKevin Wolf ret = bdrv_open(bs->backing_hd, backing_filename, back_flags, back_drv); 626b6ce07aaSKevin Wolf if (ret < 0) { 627b6ce07aaSKevin Wolf bdrv_close(bs); 628b6ce07aaSKevin Wolf return ret; 629b6ce07aaSKevin Wolf } 630b6ce07aaSKevin Wolf if (bs->is_temporary) { 631b6ce07aaSKevin Wolf bs->backing_hd->keep_read_only = !(flags & BDRV_O_RDWR); 632b6ce07aaSKevin Wolf } else { 633b6ce07aaSKevin Wolf /* base image inherits from "parent" */ 634b6ce07aaSKevin Wolf bs->backing_hd->keep_read_only = bs->keep_read_only; 635b6ce07aaSKevin Wolf } 636b6ce07aaSKevin Wolf } 637b6ce07aaSKevin Wolf 638b6ce07aaSKevin Wolf if (!bdrv_key_required(bs)) { 639b6ce07aaSKevin Wolf /* call the change callback */ 640b6ce07aaSKevin Wolf bs->media_changed = 1; 641b6ce07aaSKevin Wolf if (bs->change_cb) 642db97ee6aSChristoph Hellwig bs->change_cb(bs->change_opaque, CHANGE_MEDIA); 643b6ce07aaSKevin Wolf } 644b6ce07aaSKevin Wolf 645b6ce07aaSKevin Wolf return 0; 646b6ce07aaSKevin Wolf 647b6ce07aaSKevin Wolf unlink_and_fail: 648b6ce07aaSKevin Wolf if (bs->is_temporary) { 649b6ce07aaSKevin Wolf unlink(filename); 650b6ce07aaSKevin Wolf } 651b6ce07aaSKevin Wolf return ret; 652b6ce07aaSKevin Wolf } 653b6ce07aaSKevin Wolf 654fc01f7e7Sbellard void bdrv_close(BlockDriverState *bs) 655fc01f7e7Sbellard { 65619cb3738Sbellard if (bs->drv) { 657f9092b10SMarkus Armbruster if (bs == bs_snapshots) { 658f9092b10SMarkus Armbruster bs_snapshots = NULL; 659f9092b10SMarkus Armbruster } 660557df6acSStefan Hajnoczi if (bs->backing_hd) { 661ea2384d3Sbellard bdrv_delete(bs->backing_hd); 662557df6acSStefan Hajnoczi bs->backing_hd = NULL; 663557df6acSStefan Hajnoczi } 664ea2384d3Sbellard bs->drv->bdrv_close(bs); 665ea2384d3Sbellard qemu_free(bs->opaque); 666ea2384d3Sbellard #ifdef _WIN32 667ea2384d3Sbellard if (bs->is_temporary) { 668ea2384d3Sbellard unlink(bs->filename); 669ea2384d3Sbellard } 67067b915a5Sbellard #endif 671ea2384d3Sbellard bs->opaque = NULL; 672ea2384d3Sbellard bs->drv = NULL; 673b338082bSbellard 67466f82ceeSKevin Wolf if (bs->file != NULL) { 67566f82ceeSKevin Wolf bdrv_close(bs->file); 67666f82ceeSKevin Wolf } 67766f82ceeSKevin Wolf 678b338082bSbellard /* call the change callback */ 67919cb3738Sbellard bs->media_changed = 1; 680b338082bSbellard if (bs->change_cb) 681db97ee6aSChristoph Hellwig bs->change_cb(bs->change_opaque, CHANGE_MEDIA); 682b338082bSbellard } 683b338082bSbellard } 684b338082bSbellard 6852bc93fedSMORITA Kazutaka void bdrv_close_all(void) 6862bc93fedSMORITA Kazutaka { 6872bc93fedSMORITA Kazutaka BlockDriverState *bs; 6882bc93fedSMORITA Kazutaka 6892bc93fedSMORITA Kazutaka QTAILQ_FOREACH(bs, &bdrv_states, list) { 6902bc93fedSMORITA Kazutaka bdrv_close(bs); 6912bc93fedSMORITA Kazutaka } 6922bc93fedSMORITA Kazutaka } 6932bc93fedSMORITA Kazutaka 694d22b2f41SRyan Harper /* make a BlockDriverState anonymous by removing from bdrv_state list. 695d22b2f41SRyan Harper Also, NULL terminate the device_name to prevent double remove */ 696d22b2f41SRyan Harper void bdrv_make_anon(BlockDriverState *bs) 697d22b2f41SRyan Harper { 698d22b2f41SRyan Harper if (bs->device_name[0] != '\0') { 699d22b2f41SRyan Harper QTAILQ_REMOVE(&bdrv_states, bs, list); 700d22b2f41SRyan Harper } 701d22b2f41SRyan Harper bs->device_name[0] = '\0'; 702d22b2f41SRyan Harper } 703d22b2f41SRyan Harper 704b338082bSbellard void bdrv_delete(BlockDriverState *bs) 705b338082bSbellard { 70618846deeSMarkus Armbruster assert(!bs->peer); 70718846deeSMarkus Armbruster 7081b7bdbc1SStefan Hajnoczi /* remove from list, if necessary */ 709d22b2f41SRyan Harper bdrv_make_anon(bs); 71034c6f050Saurel32 711b338082bSbellard bdrv_close(bs); 71266f82ceeSKevin Wolf if (bs->file != NULL) { 71366f82ceeSKevin Wolf bdrv_delete(bs->file); 71466f82ceeSKevin Wolf } 71566f82ceeSKevin Wolf 716f9092b10SMarkus Armbruster assert(bs != bs_snapshots); 717b338082bSbellard qemu_free(bs); 718fc01f7e7Sbellard } 719fc01f7e7Sbellard 72018846deeSMarkus Armbruster int bdrv_attach(BlockDriverState *bs, DeviceState *qdev) 72118846deeSMarkus Armbruster { 72218846deeSMarkus Armbruster if (bs->peer) { 72318846deeSMarkus Armbruster return -EBUSY; 72418846deeSMarkus Armbruster } 72518846deeSMarkus Armbruster bs->peer = qdev; 72618846deeSMarkus Armbruster return 0; 72718846deeSMarkus Armbruster } 72818846deeSMarkus Armbruster 72918846deeSMarkus Armbruster void bdrv_detach(BlockDriverState *bs, DeviceState *qdev) 73018846deeSMarkus Armbruster { 73118846deeSMarkus Armbruster assert(bs->peer == qdev); 73218846deeSMarkus Armbruster bs->peer = NULL; 733a19712b0SMarkus Armbruster bs->change_cb = NULL; 734a19712b0SMarkus Armbruster bs->change_opaque = NULL; 73518846deeSMarkus Armbruster } 73618846deeSMarkus Armbruster 73718846deeSMarkus Armbruster DeviceState *bdrv_get_attached(BlockDriverState *bs) 73818846deeSMarkus Armbruster { 73918846deeSMarkus Armbruster return bs->peer; 74018846deeSMarkus Armbruster } 74118846deeSMarkus Armbruster 742e97fc193Saliguori /* 743e97fc193Saliguori * Run consistency checks on an image 744e97fc193Saliguori * 745e076f338SKevin Wolf * Returns 0 if the check could be completed (it doesn't mean that the image is 746a1c7273bSStefan Weil * free of errors) or -errno when an internal error occurred. The results of the 747e076f338SKevin Wolf * check are stored in res. 748e97fc193Saliguori */ 749e076f338SKevin Wolf int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res) 750e97fc193Saliguori { 751e97fc193Saliguori if (bs->drv->bdrv_check == NULL) { 752e97fc193Saliguori return -ENOTSUP; 753e97fc193Saliguori } 754e97fc193Saliguori 755e076f338SKevin Wolf memset(res, 0, sizeof(*res)); 7569ac228e0SKevin Wolf return bs->drv->bdrv_check(bs, res); 757e97fc193Saliguori } 758e97fc193Saliguori 7598a426614SKevin Wolf #define COMMIT_BUF_SECTORS 2048 7608a426614SKevin Wolf 76133e3963eSbellard /* commit COW file into the raw image */ 76233e3963eSbellard int bdrv_commit(BlockDriverState *bs) 76333e3963eSbellard { 76419cb3738Sbellard BlockDriver *drv = bs->drv; 765ee181196SKevin Wolf BlockDriver *backing_drv; 7668a426614SKevin Wolf int64_t sector, total_sectors; 7678a426614SKevin Wolf int n, ro, open_flags; 7684dca4b63SNaphtali Sprei int ret = 0, rw_ret = 0; 7698a426614SKevin Wolf uint8_t *buf; 7704dca4b63SNaphtali Sprei char filename[1024]; 7714dca4b63SNaphtali Sprei BlockDriverState *bs_rw, *bs_ro; 77233e3963eSbellard 77319cb3738Sbellard if (!drv) 77419cb3738Sbellard return -ENOMEDIUM; 77533e3963eSbellard 7764dca4b63SNaphtali Sprei if (!bs->backing_hd) { 7774dca4b63SNaphtali Sprei return -ENOTSUP; 7784dca4b63SNaphtali Sprei } 7794dca4b63SNaphtali Sprei 7804dca4b63SNaphtali Sprei if (bs->backing_hd->keep_read_only) { 781ea2384d3Sbellard return -EACCES; 78233e3963eSbellard } 78333e3963eSbellard 784ee181196SKevin Wolf backing_drv = bs->backing_hd->drv; 7854dca4b63SNaphtali Sprei ro = bs->backing_hd->read_only; 7864dca4b63SNaphtali Sprei strncpy(filename, bs->backing_hd->filename, sizeof(filename)); 7874dca4b63SNaphtali Sprei open_flags = bs->backing_hd->open_flags; 7884dca4b63SNaphtali Sprei 7894dca4b63SNaphtali Sprei if (ro) { 7904dca4b63SNaphtali Sprei /* re-open as RW */ 7914dca4b63SNaphtali Sprei bdrv_delete(bs->backing_hd); 7924dca4b63SNaphtali Sprei bs->backing_hd = NULL; 7934dca4b63SNaphtali Sprei bs_rw = bdrv_new(""); 794ee181196SKevin Wolf rw_ret = bdrv_open(bs_rw, filename, open_flags | BDRV_O_RDWR, 795ee181196SKevin Wolf backing_drv); 7964dca4b63SNaphtali Sprei if (rw_ret < 0) { 7974dca4b63SNaphtali Sprei bdrv_delete(bs_rw); 7984dca4b63SNaphtali Sprei /* try to re-open read-only */ 7994dca4b63SNaphtali Sprei bs_ro = bdrv_new(""); 800ee181196SKevin Wolf ret = bdrv_open(bs_ro, filename, open_flags & ~BDRV_O_RDWR, 801ee181196SKevin Wolf backing_drv); 8024dca4b63SNaphtali Sprei if (ret < 0) { 8034dca4b63SNaphtali Sprei bdrv_delete(bs_ro); 8044dca4b63SNaphtali Sprei /* drive not functional anymore */ 8054dca4b63SNaphtali Sprei bs->drv = NULL; 8064dca4b63SNaphtali Sprei return ret; 8074dca4b63SNaphtali Sprei } 8084dca4b63SNaphtali Sprei bs->backing_hd = bs_ro; 8094dca4b63SNaphtali Sprei return rw_ret; 8104dca4b63SNaphtali Sprei } 8114dca4b63SNaphtali Sprei bs->backing_hd = bs_rw; 812ea2384d3Sbellard } 813ea2384d3Sbellard 8146ea44308SJan Kiszka total_sectors = bdrv_getlength(bs) >> BDRV_SECTOR_BITS; 8158a426614SKevin Wolf buf = qemu_malloc(COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE); 8168a426614SKevin Wolf 8178a426614SKevin Wolf for (sector = 0; sector < total_sectors; sector += n) { 8188a426614SKevin Wolf if (drv->bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n)) { 8198a426614SKevin Wolf 8208a426614SKevin Wolf if (bdrv_read(bs, sector, buf, n) != 0) { 8214dca4b63SNaphtali Sprei ret = -EIO; 8224dca4b63SNaphtali Sprei goto ro_cleanup; 82333e3963eSbellard } 82433e3963eSbellard 8258a426614SKevin Wolf if (bdrv_write(bs->backing_hd, sector, buf, n) != 0) { 8264dca4b63SNaphtali Sprei ret = -EIO; 8274dca4b63SNaphtali Sprei goto ro_cleanup; 82833e3963eSbellard } 82933e3963eSbellard } 83033e3963eSbellard } 83195389c86Sbellard 8321d44952fSChristoph Hellwig if (drv->bdrv_make_empty) { 8331d44952fSChristoph Hellwig ret = drv->bdrv_make_empty(bs); 8341d44952fSChristoph Hellwig bdrv_flush(bs); 8351d44952fSChristoph Hellwig } 83695389c86Sbellard 8373f5075aeSChristoph Hellwig /* 8383f5075aeSChristoph Hellwig * Make sure all data we wrote to the backing device is actually 8393f5075aeSChristoph Hellwig * stable on disk. 8403f5075aeSChristoph Hellwig */ 8413f5075aeSChristoph Hellwig if (bs->backing_hd) 8423f5075aeSChristoph Hellwig bdrv_flush(bs->backing_hd); 8434dca4b63SNaphtali Sprei 8444dca4b63SNaphtali Sprei ro_cleanup: 8458a426614SKevin Wolf qemu_free(buf); 8464dca4b63SNaphtali Sprei 8474dca4b63SNaphtali Sprei if (ro) { 8484dca4b63SNaphtali Sprei /* re-open as RO */ 8494dca4b63SNaphtali Sprei bdrv_delete(bs->backing_hd); 8504dca4b63SNaphtali Sprei bs->backing_hd = NULL; 8514dca4b63SNaphtali Sprei bs_ro = bdrv_new(""); 852ee181196SKevin Wolf ret = bdrv_open(bs_ro, filename, open_flags & ~BDRV_O_RDWR, 853ee181196SKevin Wolf backing_drv); 8544dca4b63SNaphtali Sprei if (ret < 0) { 8554dca4b63SNaphtali Sprei bdrv_delete(bs_ro); 8564dca4b63SNaphtali Sprei /* drive not functional anymore */ 8574dca4b63SNaphtali Sprei bs->drv = NULL; 8584dca4b63SNaphtali Sprei return ret; 8594dca4b63SNaphtali Sprei } 8604dca4b63SNaphtali Sprei bs->backing_hd = bs_ro; 8614dca4b63SNaphtali Sprei bs->backing_hd->keep_read_only = 0; 8624dca4b63SNaphtali Sprei } 8634dca4b63SNaphtali Sprei 8641d44952fSChristoph Hellwig return ret; 86533e3963eSbellard } 86633e3963eSbellard 8676ab4b5abSMarkus Armbruster void bdrv_commit_all(void) 8686ab4b5abSMarkus Armbruster { 8696ab4b5abSMarkus Armbruster BlockDriverState *bs; 8706ab4b5abSMarkus Armbruster 8716ab4b5abSMarkus Armbruster QTAILQ_FOREACH(bs, &bdrv_states, list) { 8726ab4b5abSMarkus Armbruster bdrv_commit(bs); 8736ab4b5abSMarkus Armbruster } 8746ab4b5abSMarkus Armbruster } 8756ab4b5abSMarkus Armbruster 876756e6736SKevin Wolf /* 877756e6736SKevin Wolf * Return values: 878756e6736SKevin Wolf * 0 - success 879756e6736SKevin Wolf * -EINVAL - backing format specified, but no file 880756e6736SKevin Wolf * -ENOSPC - can't update the backing file because no space is left in the 881756e6736SKevin Wolf * image file header 882756e6736SKevin Wolf * -ENOTSUP - format driver doesn't support changing the backing file 883756e6736SKevin Wolf */ 884756e6736SKevin Wolf int bdrv_change_backing_file(BlockDriverState *bs, 885756e6736SKevin Wolf const char *backing_file, const char *backing_fmt) 886756e6736SKevin Wolf { 887756e6736SKevin Wolf BlockDriver *drv = bs->drv; 888756e6736SKevin Wolf 889756e6736SKevin Wolf if (drv->bdrv_change_backing_file != NULL) { 890756e6736SKevin Wolf return drv->bdrv_change_backing_file(bs, backing_file, backing_fmt); 891756e6736SKevin Wolf } else { 892756e6736SKevin Wolf return -ENOTSUP; 893756e6736SKevin Wolf } 894756e6736SKevin Wolf } 895756e6736SKevin Wolf 89671d0770cSaliguori static int bdrv_check_byte_request(BlockDriverState *bs, int64_t offset, 89771d0770cSaliguori size_t size) 89871d0770cSaliguori { 89971d0770cSaliguori int64_t len; 90071d0770cSaliguori 90171d0770cSaliguori if (!bdrv_is_inserted(bs)) 90271d0770cSaliguori return -ENOMEDIUM; 90371d0770cSaliguori 90471d0770cSaliguori if (bs->growable) 90571d0770cSaliguori return 0; 90671d0770cSaliguori 90771d0770cSaliguori len = bdrv_getlength(bs); 90871d0770cSaliguori 909fbb7b4e0SKevin Wolf if (offset < 0) 910fbb7b4e0SKevin Wolf return -EIO; 911fbb7b4e0SKevin Wolf 912fbb7b4e0SKevin Wolf if ((offset > len) || (len - offset < size)) 91371d0770cSaliguori return -EIO; 91471d0770cSaliguori 91571d0770cSaliguori return 0; 91671d0770cSaliguori } 91771d0770cSaliguori 91871d0770cSaliguori static int bdrv_check_request(BlockDriverState *bs, int64_t sector_num, 91971d0770cSaliguori int nb_sectors) 92071d0770cSaliguori { 921eb5a3165SJes Sorensen return bdrv_check_byte_request(bs, sector_num * BDRV_SECTOR_SIZE, 922eb5a3165SJes Sorensen nb_sectors * BDRV_SECTOR_SIZE); 92371d0770cSaliguori } 92471d0770cSaliguori 92519cb3738Sbellard /* return < 0 if error. See bdrv_write() for the return codes */ 926fc01f7e7Sbellard int bdrv_read(BlockDriverState *bs, int64_t sector_num, 927fc01f7e7Sbellard uint8_t *buf, int nb_sectors) 928fc01f7e7Sbellard { 929ea2384d3Sbellard BlockDriver *drv = bs->drv; 930fc01f7e7Sbellard 93119cb3738Sbellard if (!drv) 93219cb3738Sbellard return -ENOMEDIUM; 93371d0770cSaliguori if (bdrv_check_request(bs, sector_num, nb_sectors)) 93471d0770cSaliguori return -EIO; 935b338082bSbellard 93683f64091Sbellard return drv->bdrv_read(bs, sector_num, buf, nb_sectors); 93783f64091Sbellard } 938fc01f7e7Sbellard 9397cd1e32aSlirans@il.ibm.com static void set_dirty_bitmap(BlockDriverState *bs, int64_t sector_num, 9407cd1e32aSlirans@il.ibm.com int nb_sectors, int dirty) 9417cd1e32aSlirans@il.ibm.com { 9427cd1e32aSlirans@il.ibm.com int64_t start, end; 943c6d22830SJan Kiszka unsigned long val, idx, bit; 944a55eb92cSJan Kiszka 9456ea44308SJan Kiszka start = sector_num / BDRV_SECTORS_PER_DIRTY_CHUNK; 946c6d22830SJan Kiszka end = (sector_num + nb_sectors - 1) / BDRV_SECTORS_PER_DIRTY_CHUNK; 9477cd1e32aSlirans@il.ibm.com 9487cd1e32aSlirans@il.ibm.com for (; start <= end; start++) { 949c6d22830SJan Kiszka idx = start / (sizeof(unsigned long) * 8); 950c6d22830SJan Kiszka bit = start % (sizeof(unsigned long) * 8); 951c6d22830SJan Kiszka val = bs->dirty_bitmap[idx]; 952c6d22830SJan Kiszka if (dirty) { 9536d59fec1SMarcelo Tosatti if (!(val & (1UL << bit))) { 954aaa0eb75SLiran Schour bs->dirty_count++; 9556d59fec1SMarcelo Tosatti val |= 1UL << bit; 956aaa0eb75SLiran Schour } 957c6d22830SJan Kiszka } else { 9586d59fec1SMarcelo Tosatti if (val & (1UL << bit)) { 959aaa0eb75SLiran Schour bs->dirty_count--; 9606d59fec1SMarcelo Tosatti val &= ~(1UL << bit); 961c6d22830SJan Kiszka } 962aaa0eb75SLiran Schour } 963c6d22830SJan Kiszka bs->dirty_bitmap[idx] = val; 9647cd1e32aSlirans@il.ibm.com } 9657cd1e32aSlirans@il.ibm.com } 9667cd1e32aSlirans@il.ibm.com 96719cb3738Sbellard /* Return < 0 if error. Important errors are: 96819cb3738Sbellard -EIO generic I/O error (may happen for all errors) 96919cb3738Sbellard -ENOMEDIUM No media inserted. 97019cb3738Sbellard -EINVAL Invalid sector number or nb_sectors 97119cb3738Sbellard -EACCES Trying to write a read-only device 97219cb3738Sbellard */ 973fc01f7e7Sbellard int bdrv_write(BlockDriverState *bs, int64_t sector_num, 974fc01f7e7Sbellard const uint8_t *buf, int nb_sectors) 975fc01f7e7Sbellard { 97683f64091Sbellard BlockDriver *drv = bs->drv; 97719cb3738Sbellard if (!bs->drv) 97819cb3738Sbellard return -ENOMEDIUM; 9790849bf08Sbellard if (bs->read_only) 98019cb3738Sbellard return -EACCES; 98171d0770cSaliguori if (bdrv_check_request(bs, sector_num, nb_sectors)) 98271d0770cSaliguori return -EIO; 98371d0770cSaliguori 984c6d22830SJan Kiszka if (bs->dirty_bitmap) { 9857cd1e32aSlirans@il.ibm.com set_dirty_bitmap(bs, sector_num, nb_sectors, 1); 9867cd1e32aSlirans@il.ibm.com } 9877cd1e32aSlirans@il.ibm.com 988294cc35fSKevin Wolf if (bs->wr_highest_sector < sector_num + nb_sectors - 1) { 989294cc35fSKevin Wolf bs->wr_highest_sector = sector_num + nb_sectors - 1; 990294cc35fSKevin Wolf } 991294cc35fSKevin Wolf 99283f64091Sbellard return drv->bdrv_write(bs, sector_num, buf, nb_sectors); 99383f64091Sbellard } 99483f64091Sbellard 995eda578e5Saliguori int bdrv_pread(BlockDriverState *bs, int64_t offset, 996eda578e5Saliguori void *buf, int count1) 99783f64091Sbellard { 9986ea44308SJan Kiszka uint8_t tmp_buf[BDRV_SECTOR_SIZE]; 99983f64091Sbellard int len, nb_sectors, count; 100083f64091Sbellard int64_t sector_num; 10019a8c4cceSKevin Wolf int ret; 100283f64091Sbellard 100383f64091Sbellard count = count1; 100483f64091Sbellard /* first read to align to sector start */ 10056ea44308SJan Kiszka len = (BDRV_SECTOR_SIZE - offset) & (BDRV_SECTOR_SIZE - 1); 100683f64091Sbellard if (len > count) 100783f64091Sbellard len = count; 10086ea44308SJan Kiszka sector_num = offset >> BDRV_SECTOR_BITS; 100983f64091Sbellard if (len > 0) { 10109a8c4cceSKevin Wolf if ((ret = bdrv_read(bs, sector_num, tmp_buf, 1)) < 0) 10119a8c4cceSKevin Wolf return ret; 10126ea44308SJan Kiszka memcpy(buf, tmp_buf + (offset & (BDRV_SECTOR_SIZE - 1)), len); 101383f64091Sbellard count -= len; 101483f64091Sbellard if (count == 0) 101583f64091Sbellard return count1; 101683f64091Sbellard sector_num++; 101783f64091Sbellard buf += len; 101883f64091Sbellard } 101983f64091Sbellard 102083f64091Sbellard /* read the sectors "in place" */ 10216ea44308SJan Kiszka nb_sectors = count >> BDRV_SECTOR_BITS; 102283f64091Sbellard if (nb_sectors > 0) { 10239a8c4cceSKevin Wolf if ((ret = bdrv_read(bs, sector_num, buf, nb_sectors)) < 0) 10249a8c4cceSKevin Wolf return ret; 102583f64091Sbellard sector_num += nb_sectors; 10266ea44308SJan Kiszka len = nb_sectors << BDRV_SECTOR_BITS; 102783f64091Sbellard buf += len; 102883f64091Sbellard count -= len; 102983f64091Sbellard } 103083f64091Sbellard 103183f64091Sbellard /* add data from the last sector */ 103283f64091Sbellard if (count > 0) { 10339a8c4cceSKevin Wolf if ((ret = bdrv_read(bs, sector_num, tmp_buf, 1)) < 0) 10349a8c4cceSKevin Wolf return ret; 103583f64091Sbellard memcpy(buf, tmp_buf, count); 103683f64091Sbellard } 103783f64091Sbellard return count1; 103883f64091Sbellard } 103983f64091Sbellard 1040eda578e5Saliguori int bdrv_pwrite(BlockDriverState *bs, int64_t offset, 1041eda578e5Saliguori const void *buf, int count1) 104283f64091Sbellard { 10436ea44308SJan Kiszka uint8_t tmp_buf[BDRV_SECTOR_SIZE]; 104483f64091Sbellard int len, nb_sectors, count; 104583f64091Sbellard int64_t sector_num; 10469a8c4cceSKevin Wolf int ret; 104783f64091Sbellard 104883f64091Sbellard count = count1; 104983f64091Sbellard /* first write to align to sector start */ 10506ea44308SJan Kiszka len = (BDRV_SECTOR_SIZE - offset) & (BDRV_SECTOR_SIZE - 1); 105183f64091Sbellard if (len > count) 105283f64091Sbellard len = count; 10536ea44308SJan Kiszka sector_num = offset >> BDRV_SECTOR_BITS; 105483f64091Sbellard if (len > 0) { 10559a8c4cceSKevin Wolf if ((ret = bdrv_read(bs, sector_num, tmp_buf, 1)) < 0) 10569a8c4cceSKevin Wolf return ret; 10576ea44308SJan Kiszka memcpy(tmp_buf + (offset & (BDRV_SECTOR_SIZE - 1)), buf, len); 10589a8c4cceSKevin Wolf if ((ret = bdrv_write(bs, sector_num, tmp_buf, 1)) < 0) 10599a8c4cceSKevin Wolf return ret; 106083f64091Sbellard count -= len; 106183f64091Sbellard if (count == 0) 106283f64091Sbellard return count1; 106383f64091Sbellard sector_num++; 106483f64091Sbellard buf += len; 106583f64091Sbellard } 106683f64091Sbellard 106783f64091Sbellard /* write the sectors "in place" */ 10686ea44308SJan Kiszka nb_sectors = count >> BDRV_SECTOR_BITS; 106983f64091Sbellard if (nb_sectors > 0) { 10709a8c4cceSKevin Wolf if ((ret = bdrv_write(bs, sector_num, buf, nb_sectors)) < 0) 10719a8c4cceSKevin Wolf return ret; 107283f64091Sbellard sector_num += nb_sectors; 10736ea44308SJan Kiszka len = nb_sectors << BDRV_SECTOR_BITS; 107483f64091Sbellard buf += len; 107583f64091Sbellard count -= len; 107683f64091Sbellard } 107783f64091Sbellard 107883f64091Sbellard /* add data from the last sector */ 107983f64091Sbellard if (count > 0) { 10809a8c4cceSKevin Wolf if ((ret = bdrv_read(bs, sector_num, tmp_buf, 1)) < 0) 10819a8c4cceSKevin Wolf return ret; 108283f64091Sbellard memcpy(tmp_buf, buf, count); 10839a8c4cceSKevin Wolf if ((ret = bdrv_write(bs, sector_num, tmp_buf, 1)) < 0) 10849a8c4cceSKevin Wolf return ret; 108583f64091Sbellard } 108683f64091Sbellard return count1; 108783f64091Sbellard } 108883f64091Sbellard 1089f08145feSKevin Wolf /* 1090f08145feSKevin Wolf * Writes to the file and ensures that no writes are reordered across this 1091f08145feSKevin Wolf * request (acts as a barrier) 1092f08145feSKevin Wolf * 1093f08145feSKevin Wolf * Returns 0 on success, -errno in error cases. 1094f08145feSKevin Wolf */ 1095f08145feSKevin Wolf int bdrv_pwrite_sync(BlockDriverState *bs, int64_t offset, 1096f08145feSKevin Wolf const void *buf, int count) 1097f08145feSKevin Wolf { 1098f08145feSKevin Wolf int ret; 1099f08145feSKevin Wolf 1100f08145feSKevin Wolf ret = bdrv_pwrite(bs, offset, buf, count); 1101f08145feSKevin Wolf if (ret < 0) { 1102f08145feSKevin Wolf return ret; 1103f08145feSKevin Wolf } 1104f08145feSKevin Wolf 1105f08145feSKevin Wolf /* No flush needed for cache=writethrough, it uses O_DSYNC */ 1106f08145feSKevin Wolf if ((bs->open_flags & BDRV_O_CACHE_MASK) != 0) { 1107f08145feSKevin Wolf bdrv_flush(bs); 1108f08145feSKevin Wolf } 1109f08145feSKevin Wolf 1110f08145feSKevin Wolf return 0; 1111f08145feSKevin Wolf } 1112f08145feSKevin Wolf 1113*da1fa91dSKevin Wolf int coroutine_fn bdrv_co_readv(BlockDriverState *bs, int64_t sector_num, 1114*da1fa91dSKevin Wolf int nb_sectors, QEMUIOVector *qiov) 1115*da1fa91dSKevin Wolf { 1116*da1fa91dSKevin Wolf BlockDriver *drv = bs->drv; 1117*da1fa91dSKevin Wolf 1118*da1fa91dSKevin Wolf trace_bdrv_co_readv(bs, sector_num, nb_sectors); 1119*da1fa91dSKevin Wolf 1120*da1fa91dSKevin Wolf if (!drv) { 1121*da1fa91dSKevin Wolf return -ENOMEDIUM; 1122*da1fa91dSKevin Wolf } 1123*da1fa91dSKevin Wolf if (bdrv_check_request(bs, sector_num, nb_sectors)) { 1124*da1fa91dSKevin Wolf return -EIO; 1125*da1fa91dSKevin Wolf } 1126*da1fa91dSKevin Wolf 1127*da1fa91dSKevin Wolf return drv->bdrv_co_readv(bs, sector_num, nb_sectors, qiov); 1128*da1fa91dSKevin Wolf } 1129*da1fa91dSKevin Wolf 1130*da1fa91dSKevin Wolf int coroutine_fn bdrv_co_writev(BlockDriverState *bs, int64_t sector_num, 1131*da1fa91dSKevin Wolf int nb_sectors, QEMUIOVector *qiov) 1132*da1fa91dSKevin Wolf { 1133*da1fa91dSKevin Wolf BlockDriver *drv = bs->drv; 1134*da1fa91dSKevin Wolf 1135*da1fa91dSKevin Wolf trace_bdrv_co_writev(bs, sector_num, nb_sectors); 1136*da1fa91dSKevin Wolf 1137*da1fa91dSKevin Wolf if (!bs->drv) { 1138*da1fa91dSKevin Wolf return -ENOMEDIUM; 1139*da1fa91dSKevin Wolf } 1140*da1fa91dSKevin Wolf if (bs->read_only) { 1141*da1fa91dSKevin Wolf return -EACCES; 1142*da1fa91dSKevin Wolf } 1143*da1fa91dSKevin Wolf if (bdrv_check_request(bs, sector_num, nb_sectors)) { 1144*da1fa91dSKevin Wolf return -EIO; 1145*da1fa91dSKevin Wolf } 1146*da1fa91dSKevin Wolf 1147*da1fa91dSKevin Wolf if (bs->dirty_bitmap) { 1148*da1fa91dSKevin Wolf set_dirty_bitmap(bs, sector_num, nb_sectors, 1); 1149*da1fa91dSKevin Wolf } 1150*da1fa91dSKevin Wolf 1151*da1fa91dSKevin Wolf if (bs->wr_highest_sector < sector_num + nb_sectors - 1) { 1152*da1fa91dSKevin Wolf bs->wr_highest_sector = sector_num + nb_sectors - 1; 1153*da1fa91dSKevin Wolf } 1154*da1fa91dSKevin Wolf 1155*da1fa91dSKevin Wolf return drv->bdrv_co_writev(bs, sector_num, nb_sectors, qiov); 1156*da1fa91dSKevin Wolf } 1157*da1fa91dSKevin Wolf 115883f64091Sbellard /** 115983f64091Sbellard * Truncate file to 'offset' bytes (needed only for file protocols) 116083f64091Sbellard */ 116183f64091Sbellard int bdrv_truncate(BlockDriverState *bs, int64_t offset) 116283f64091Sbellard { 116383f64091Sbellard BlockDriver *drv = bs->drv; 116451762288SStefan Hajnoczi int ret; 116583f64091Sbellard if (!drv) 116619cb3738Sbellard return -ENOMEDIUM; 116783f64091Sbellard if (!drv->bdrv_truncate) 116883f64091Sbellard return -ENOTSUP; 116959f2689dSNaphtali Sprei if (bs->read_only) 117059f2689dSNaphtali Sprei return -EACCES; 11718591675fSMarcelo Tosatti if (bdrv_in_use(bs)) 11728591675fSMarcelo Tosatti return -EBUSY; 117351762288SStefan Hajnoczi ret = drv->bdrv_truncate(bs, offset); 117451762288SStefan Hajnoczi if (ret == 0) { 117551762288SStefan Hajnoczi ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS); 1176db97ee6aSChristoph Hellwig if (bs->change_cb) { 1177db97ee6aSChristoph Hellwig bs->change_cb(bs->change_opaque, CHANGE_SIZE); 1178db97ee6aSChristoph Hellwig } 117951762288SStefan Hajnoczi } 118051762288SStefan Hajnoczi return ret; 118183f64091Sbellard } 118283f64091Sbellard 118383f64091Sbellard /** 11844a1d5e1fSFam Zheng * Length of a allocated file in bytes. Sparse files are counted by actual 11854a1d5e1fSFam Zheng * allocated space. Return < 0 if error or unknown. 11864a1d5e1fSFam Zheng */ 11874a1d5e1fSFam Zheng int64_t bdrv_get_allocated_file_size(BlockDriverState *bs) 11884a1d5e1fSFam Zheng { 11894a1d5e1fSFam Zheng BlockDriver *drv = bs->drv; 11904a1d5e1fSFam Zheng if (!drv) { 11914a1d5e1fSFam Zheng return -ENOMEDIUM; 11924a1d5e1fSFam Zheng } 11934a1d5e1fSFam Zheng if (drv->bdrv_get_allocated_file_size) { 11944a1d5e1fSFam Zheng return drv->bdrv_get_allocated_file_size(bs); 11954a1d5e1fSFam Zheng } 11964a1d5e1fSFam Zheng if (bs->file) { 11974a1d5e1fSFam Zheng return bdrv_get_allocated_file_size(bs->file); 11984a1d5e1fSFam Zheng } 11994a1d5e1fSFam Zheng return -ENOTSUP; 12004a1d5e1fSFam Zheng } 12014a1d5e1fSFam Zheng 12024a1d5e1fSFam Zheng /** 120383f64091Sbellard * Length of a file in bytes. Return < 0 if error or unknown. 120483f64091Sbellard */ 120583f64091Sbellard int64_t bdrv_getlength(BlockDriverState *bs) 120683f64091Sbellard { 120783f64091Sbellard BlockDriver *drv = bs->drv; 120883f64091Sbellard if (!drv) 120919cb3738Sbellard return -ENOMEDIUM; 121051762288SStefan Hajnoczi 121146a4e4e6SStefan Hajnoczi if (bs->growable || bs->removable) { 121246a4e4e6SStefan Hajnoczi if (drv->bdrv_getlength) { 121383f64091Sbellard return drv->bdrv_getlength(bs); 1214fc01f7e7Sbellard } 121546a4e4e6SStefan Hajnoczi } 121646a4e4e6SStefan Hajnoczi return bs->total_sectors * BDRV_SECTOR_SIZE; 121746a4e4e6SStefan Hajnoczi } 1218fc01f7e7Sbellard 121919cb3738Sbellard /* return 0 as number of sectors if no device present or error */ 122096b8f136Sths void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr) 1221fc01f7e7Sbellard { 122219cb3738Sbellard int64_t length; 122319cb3738Sbellard length = bdrv_getlength(bs); 122419cb3738Sbellard if (length < 0) 122519cb3738Sbellard length = 0; 122619cb3738Sbellard else 12276ea44308SJan Kiszka length = length >> BDRV_SECTOR_BITS; 122819cb3738Sbellard *nb_sectors_ptr = length; 1229fc01f7e7Sbellard } 1230cf98951bSbellard 1231f3d54fc4Saliguori struct partition { 1232f3d54fc4Saliguori uint8_t boot_ind; /* 0x80 - active */ 1233f3d54fc4Saliguori uint8_t head; /* starting head */ 1234f3d54fc4Saliguori uint8_t sector; /* starting sector */ 1235f3d54fc4Saliguori uint8_t cyl; /* starting cylinder */ 1236f3d54fc4Saliguori uint8_t sys_ind; /* What partition type */ 1237f3d54fc4Saliguori uint8_t end_head; /* end head */ 1238f3d54fc4Saliguori uint8_t end_sector; /* end sector */ 1239f3d54fc4Saliguori uint8_t end_cyl; /* end cylinder */ 1240f3d54fc4Saliguori uint32_t start_sect; /* starting sector counting from 0 */ 1241f3d54fc4Saliguori uint32_t nr_sects; /* nr of sectors in partition */ 1242f3d54fc4Saliguori } __attribute__((packed)); 1243f3d54fc4Saliguori 1244f3d54fc4Saliguori /* try to guess the disk logical geometry from the MSDOS partition table. Return 0 if OK, -1 if could not guess */ 1245f3d54fc4Saliguori static int guess_disk_lchs(BlockDriverState *bs, 1246f3d54fc4Saliguori int *pcylinders, int *pheads, int *psectors) 1247f3d54fc4Saliguori { 1248eb5a3165SJes Sorensen uint8_t buf[BDRV_SECTOR_SIZE]; 1249f3d54fc4Saliguori int ret, i, heads, sectors, cylinders; 1250f3d54fc4Saliguori struct partition *p; 1251f3d54fc4Saliguori uint32_t nr_sects; 1252a38131b6Sblueswir1 uint64_t nb_sectors; 1253f3d54fc4Saliguori 1254f3d54fc4Saliguori bdrv_get_geometry(bs, &nb_sectors); 1255f3d54fc4Saliguori 1256f3d54fc4Saliguori ret = bdrv_read(bs, 0, buf, 1); 1257f3d54fc4Saliguori if (ret < 0) 1258f3d54fc4Saliguori return -1; 1259f3d54fc4Saliguori /* test msdos magic */ 1260f3d54fc4Saliguori if (buf[510] != 0x55 || buf[511] != 0xaa) 1261f3d54fc4Saliguori return -1; 1262f3d54fc4Saliguori for(i = 0; i < 4; i++) { 1263f3d54fc4Saliguori p = ((struct partition *)(buf + 0x1be)) + i; 1264f3d54fc4Saliguori nr_sects = le32_to_cpu(p->nr_sects); 1265f3d54fc4Saliguori if (nr_sects && p->end_head) { 1266f3d54fc4Saliguori /* We make the assumption that the partition terminates on 1267f3d54fc4Saliguori a cylinder boundary */ 1268f3d54fc4Saliguori heads = p->end_head + 1; 1269f3d54fc4Saliguori sectors = p->end_sector & 63; 1270f3d54fc4Saliguori if (sectors == 0) 1271f3d54fc4Saliguori continue; 1272f3d54fc4Saliguori cylinders = nb_sectors / (heads * sectors); 1273f3d54fc4Saliguori if (cylinders < 1 || cylinders > 16383) 1274f3d54fc4Saliguori continue; 1275f3d54fc4Saliguori *pheads = heads; 1276f3d54fc4Saliguori *psectors = sectors; 1277f3d54fc4Saliguori *pcylinders = cylinders; 1278f3d54fc4Saliguori #if 0 1279f3d54fc4Saliguori printf("guessed geometry: LCHS=%d %d %d\n", 1280f3d54fc4Saliguori cylinders, heads, sectors); 1281f3d54fc4Saliguori #endif 1282f3d54fc4Saliguori return 0; 1283f3d54fc4Saliguori } 1284f3d54fc4Saliguori } 1285f3d54fc4Saliguori return -1; 1286f3d54fc4Saliguori } 1287f3d54fc4Saliguori 1288f3d54fc4Saliguori void bdrv_guess_geometry(BlockDriverState *bs, int *pcyls, int *pheads, int *psecs) 1289f3d54fc4Saliguori { 1290f3d54fc4Saliguori int translation, lba_detected = 0; 1291f3d54fc4Saliguori int cylinders, heads, secs; 1292a38131b6Sblueswir1 uint64_t nb_sectors; 1293f3d54fc4Saliguori 1294f3d54fc4Saliguori /* if a geometry hint is available, use it */ 1295f3d54fc4Saliguori bdrv_get_geometry(bs, &nb_sectors); 1296f3d54fc4Saliguori bdrv_get_geometry_hint(bs, &cylinders, &heads, &secs); 1297f3d54fc4Saliguori translation = bdrv_get_translation_hint(bs); 1298f3d54fc4Saliguori if (cylinders != 0) { 1299f3d54fc4Saliguori *pcyls = cylinders; 1300f3d54fc4Saliguori *pheads = heads; 1301f3d54fc4Saliguori *psecs = secs; 1302f3d54fc4Saliguori } else { 1303f3d54fc4Saliguori if (guess_disk_lchs(bs, &cylinders, &heads, &secs) == 0) { 1304f3d54fc4Saliguori if (heads > 16) { 1305f3d54fc4Saliguori /* if heads > 16, it means that a BIOS LBA 1306f3d54fc4Saliguori translation was active, so the default 1307f3d54fc4Saliguori hardware geometry is OK */ 1308f3d54fc4Saliguori lba_detected = 1; 1309f3d54fc4Saliguori goto default_geometry; 1310f3d54fc4Saliguori } else { 1311f3d54fc4Saliguori *pcyls = cylinders; 1312f3d54fc4Saliguori *pheads = heads; 1313f3d54fc4Saliguori *psecs = secs; 1314f3d54fc4Saliguori /* disable any translation to be in sync with 1315f3d54fc4Saliguori the logical geometry */ 1316f3d54fc4Saliguori if (translation == BIOS_ATA_TRANSLATION_AUTO) { 1317f3d54fc4Saliguori bdrv_set_translation_hint(bs, 1318f3d54fc4Saliguori BIOS_ATA_TRANSLATION_NONE); 1319f3d54fc4Saliguori } 1320f3d54fc4Saliguori } 1321f3d54fc4Saliguori } else { 1322f3d54fc4Saliguori default_geometry: 1323f3d54fc4Saliguori /* if no geometry, use a standard physical disk geometry */ 1324f3d54fc4Saliguori cylinders = nb_sectors / (16 * 63); 1325f3d54fc4Saliguori 1326f3d54fc4Saliguori if (cylinders > 16383) 1327f3d54fc4Saliguori cylinders = 16383; 1328f3d54fc4Saliguori else if (cylinders < 2) 1329f3d54fc4Saliguori cylinders = 2; 1330f3d54fc4Saliguori *pcyls = cylinders; 1331f3d54fc4Saliguori *pheads = 16; 1332f3d54fc4Saliguori *psecs = 63; 1333f3d54fc4Saliguori if ((lba_detected == 1) && (translation == BIOS_ATA_TRANSLATION_AUTO)) { 1334f3d54fc4Saliguori if ((*pcyls * *pheads) <= 131072) { 1335f3d54fc4Saliguori bdrv_set_translation_hint(bs, 1336f3d54fc4Saliguori BIOS_ATA_TRANSLATION_LARGE); 1337f3d54fc4Saliguori } else { 1338f3d54fc4Saliguori bdrv_set_translation_hint(bs, 1339f3d54fc4Saliguori BIOS_ATA_TRANSLATION_LBA); 1340f3d54fc4Saliguori } 1341f3d54fc4Saliguori } 1342f3d54fc4Saliguori } 1343f3d54fc4Saliguori bdrv_set_geometry_hint(bs, *pcyls, *pheads, *psecs); 1344f3d54fc4Saliguori } 1345f3d54fc4Saliguori } 1346f3d54fc4Saliguori 1347b338082bSbellard void bdrv_set_geometry_hint(BlockDriverState *bs, 1348b338082bSbellard int cyls, int heads, int secs) 1349b338082bSbellard { 1350b338082bSbellard bs->cyls = cyls; 1351b338082bSbellard bs->heads = heads; 1352b338082bSbellard bs->secs = secs; 1353b338082bSbellard } 1354b338082bSbellard 135546d4767dSbellard void bdrv_set_translation_hint(BlockDriverState *bs, int translation) 135646d4767dSbellard { 135746d4767dSbellard bs->translation = translation; 135846d4767dSbellard } 135946d4767dSbellard 1360b338082bSbellard void bdrv_get_geometry_hint(BlockDriverState *bs, 1361b338082bSbellard int *pcyls, int *pheads, int *psecs) 1362b338082bSbellard { 1363b338082bSbellard *pcyls = bs->cyls; 1364b338082bSbellard *pheads = bs->heads; 1365b338082bSbellard *psecs = bs->secs; 1366b338082bSbellard } 1367b338082bSbellard 13685bbdbb46SBlue Swirl /* Recognize floppy formats */ 13695bbdbb46SBlue Swirl typedef struct FDFormat { 13705bbdbb46SBlue Swirl FDriveType drive; 13715bbdbb46SBlue Swirl uint8_t last_sect; 13725bbdbb46SBlue Swirl uint8_t max_track; 13735bbdbb46SBlue Swirl uint8_t max_head; 13745bbdbb46SBlue Swirl } FDFormat; 13755bbdbb46SBlue Swirl 13765bbdbb46SBlue Swirl static const FDFormat fd_formats[] = { 13775bbdbb46SBlue Swirl /* First entry is default format */ 13785bbdbb46SBlue Swirl /* 1.44 MB 3"1/2 floppy disks */ 13795bbdbb46SBlue Swirl { FDRIVE_DRV_144, 18, 80, 1, }, 13805bbdbb46SBlue Swirl { FDRIVE_DRV_144, 20, 80, 1, }, 13815bbdbb46SBlue Swirl { FDRIVE_DRV_144, 21, 80, 1, }, 13825bbdbb46SBlue Swirl { FDRIVE_DRV_144, 21, 82, 1, }, 13835bbdbb46SBlue Swirl { FDRIVE_DRV_144, 21, 83, 1, }, 13845bbdbb46SBlue Swirl { FDRIVE_DRV_144, 22, 80, 1, }, 13855bbdbb46SBlue Swirl { FDRIVE_DRV_144, 23, 80, 1, }, 13865bbdbb46SBlue Swirl { FDRIVE_DRV_144, 24, 80, 1, }, 13875bbdbb46SBlue Swirl /* 2.88 MB 3"1/2 floppy disks */ 13885bbdbb46SBlue Swirl { FDRIVE_DRV_288, 36, 80, 1, }, 13895bbdbb46SBlue Swirl { FDRIVE_DRV_288, 39, 80, 1, }, 13905bbdbb46SBlue Swirl { FDRIVE_DRV_288, 40, 80, 1, }, 13915bbdbb46SBlue Swirl { FDRIVE_DRV_288, 44, 80, 1, }, 13925bbdbb46SBlue Swirl { FDRIVE_DRV_288, 48, 80, 1, }, 13935bbdbb46SBlue Swirl /* 720 kB 3"1/2 floppy disks */ 13945bbdbb46SBlue Swirl { FDRIVE_DRV_144, 9, 80, 1, }, 13955bbdbb46SBlue Swirl { FDRIVE_DRV_144, 10, 80, 1, }, 13965bbdbb46SBlue Swirl { FDRIVE_DRV_144, 10, 82, 1, }, 13975bbdbb46SBlue Swirl { FDRIVE_DRV_144, 10, 83, 1, }, 13985bbdbb46SBlue Swirl { FDRIVE_DRV_144, 13, 80, 1, }, 13995bbdbb46SBlue Swirl { FDRIVE_DRV_144, 14, 80, 1, }, 14005bbdbb46SBlue Swirl /* 1.2 MB 5"1/4 floppy disks */ 14015bbdbb46SBlue Swirl { FDRIVE_DRV_120, 15, 80, 1, }, 14025bbdbb46SBlue Swirl { FDRIVE_DRV_120, 18, 80, 1, }, 14035bbdbb46SBlue Swirl { FDRIVE_DRV_120, 18, 82, 1, }, 14045bbdbb46SBlue Swirl { FDRIVE_DRV_120, 18, 83, 1, }, 14055bbdbb46SBlue Swirl { FDRIVE_DRV_120, 20, 80, 1, }, 14065bbdbb46SBlue Swirl /* 720 kB 5"1/4 floppy disks */ 14075bbdbb46SBlue Swirl { FDRIVE_DRV_120, 9, 80, 1, }, 14085bbdbb46SBlue Swirl { FDRIVE_DRV_120, 11, 80, 1, }, 14095bbdbb46SBlue Swirl /* 360 kB 5"1/4 floppy disks */ 14105bbdbb46SBlue Swirl { FDRIVE_DRV_120, 9, 40, 1, }, 14115bbdbb46SBlue Swirl { FDRIVE_DRV_120, 9, 40, 0, }, 14125bbdbb46SBlue Swirl { FDRIVE_DRV_120, 10, 41, 1, }, 14135bbdbb46SBlue Swirl { FDRIVE_DRV_120, 10, 42, 1, }, 14145bbdbb46SBlue Swirl /* 320 kB 5"1/4 floppy disks */ 14155bbdbb46SBlue Swirl { FDRIVE_DRV_120, 8, 40, 1, }, 14165bbdbb46SBlue Swirl { FDRIVE_DRV_120, 8, 40, 0, }, 14175bbdbb46SBlue Swirl /* 360 kB must match 5"1/4 better than 3"1/2... */ 14185bbdbb46SBlue Swirl { FDRIVE_DRV_144, 9, 80, 0, }, 14195bbdbb46SBlue Swirl /* end */ 14205bbdbb46SBlue Swirl { FDRIVE_DRV_NONE, -1, -1, 0, }, 14215bbdbb46SBlue Swirl }; 14225bbdbb46SBlue Swirl 14235bbdbb46SBlue Swirl void bdrv_get_floppy_geometry_hint(BlockDriverState *bs, int *nb_heads, 14245bbdbb46SBlue Swirl int *max_track, int *last_sect, 14255bbdbb46SBlue Swirl FDriveType drive_in, FDriveType *drive) 14265bbdbb46SBlue Swirl { 14275bbdbb46SBlue Swirl const FDFormat *parse; 14285bbdbb46SBlue Swirl uint64_t nb_sectors, size; 14295bbdbb46SBlue Swirl int i, first_match, match; 14305bbdbb46SBlue Swirl 14315bbdbb46SBlue Swirl bdrv_get_geometry_hint(bs, nb_heads, max_track, last_sect); 14325bbdbb46SBlue Swirl if (*nb_heads != 0 && *max_track != 0 && *last_sect != 0) { 14335bbdbb46SBlue Swirl /* User defined disk */ 14345bbdbb46SBlue Swirl } else { 14355bbdbb46SBlue Swirl bdrv_get_geometry(bs, &nb_sectors); 14365bbdbb46SBlue Swirl match = -1; 14375bbdbb46SBlue Swirl first_match = -1; 14385bbdbb46SBlue Swirl for (i = 0; ; i++) { 14395bbdbb46SBlue Swirl parse = &fd_formats[i]; 14405bbdbb46SBlue Swirl if (parse->drive == FDRIVE_DRV_NONE) { 14415bbdbb46SBlue Swirl break; 14425bbdbb46SBlue Swirl } 14435bbdbb46SBlue Swirl if (drive_in == parse->drive || 14445bbdbb46SBlue Swirl drive_in == FDRIVE_DRV_NONE) { 14455bbdbb46SBlue Swirl size = (parse->max_head + 1) * parse->max_track * 14465bbdbb46SBlue Swirl parse->last_sect; 14475bbdbb46SBlue Swirl if (nb_sectors == size) { 14485bbdbb46SBlue Swirl match = i; 14495bbdbb46SBlue Swirl break; 14505bbdbb46SBlue Swirl } 14515bbdbb46SBlue Swirl if (first_match == -1) { 14525bbdbb46SBlue Swirl first_match = i; 14535bbdbb46SBlue Swirl } 14545bbdbb46SBlue Swirl } 14555bbdbb46SBlue Swirl } 14565bbdbb46SBlue Swirl if (match == -1) { 14575bbdbb46SBlue Swirl if (first_match == -1) { 14585bbdbb46SBlue Swirl match = 1; 14595bbdbb46SBlue Swirl } else { 14605bbdbb46SBlue Swirl match = first_match; 14615bbdbb46SBlue Swirl } 14625bbdbb46SBlue Swirl parse = &fd_formats[match]; 14635bbdbb46SBlue Swirl } 14645bbdbb46SBlue Swirl *nb_heads = parse->max_head + 1; 14655bbdbb46SBlue Swirl *max_track = parse->max_track; 14665bbdbb46SBlue Swirl *last_sect = parse->last_sect; 14675bbdbb46SBlue Swirl *drive = parse->drive; 14685bbdbb46SBlue Swirl } 14695bbdbb46SBlue Swirl } 14705bbdbb46SBlue Swirl 147146d4767dSbellard int bdrv_get_translation_hint(BlockDriverState *bs) 147246d4767dSbellard { 147346d4767dSbellard return bs->translation; 147446d4767dSbellard } 147546d4767dSbellard 1476abd7f68dSMarkus Armbruster void bdrv_set_on_error(BlockDriverState *bs, BlockErrorAction on_read_error, 1477abd7f68dSMarkus Armbruster BlockErrorAction on_write_error) 1478abd7f68dSMarkus Armbruster { 1479abd7f68dSMarkus Armbruster bs->on_read_error = on_read_error; 1480abd7f68dSMarkus Armbruster bs->on_write_error = on_write_error; 1481abd7f68dSMarkus Armbruster } 1482abd7f68dSMarkus Armbruster 1483abd7f68dSMarkus Armbruster BlockErrorAction bdrv_get_on_error(BlockDriverState *bs, int is_read) 1484abd7f68dSMarkus Armbruster { 1485abd7f68dSMarkus Armbruster return is_read ? bs->on_read_error : bs->on_write_error; 1486abd7f68dSMarkus Armbruster } 1487abd7f68dSMarkus Armbruster 14887d0d6950SMarkus Armbruster void bdrv_set_removable(BlockDriverState *bs, int removable) 14897d0d6950SMarkus Armbruster { 14907d0d6950SMarkus Armbruster bs->removable = removable; 14917d0d6950SMarkus Armbruster if (removable && bs == bs_snapshots) { 14927d0d6950SMarkus Armbruster bs_snapshots = NULL; 14937d0d6950SMarkus Armbruster } 14947d0d6950SMarkus Armbruster } 14957d0d6950SMarkus Armbruster 1496b338082bSbellard int bdrv_is_removable(BlockDriverState *bs) 1497b338082bSbellard { 1498b338082bSbellard return bs->removable; 1499b338082bSbellard } 1500b338082bSbellard 1501b338082bSbellard int bdrv_is_read_only(BlockDriverState *bs) 1502b338082bSbellard { 1503b338082bSbellard return bs->read_only; 1504b338082bSbellard } 1505b338082bSbellard 1506985a03b0Sths int bdrv_is_sg(BlockDriverState *bs) 1507985a03b0Sths { 1508985a03b0Sths return bs->sg; 1509985a03b0Sths } 1510985a03b0Sths 1511e900a7b7SChristoph Hellwig int bdrv_enable_write_cache(BlockDriverState *bs) 1512e900a7b7SChristoph Hellwig { 1513e900a7b7SChristoph Hellwig return bs->enable_write_cache; 1514e900a7b7SChristoph Hellwig } 1515e900a7b7SChristoph Hellwig 151619cb3738Sbellard /* XXX: no longer used */ 1517b338082bSbellard void bdrv_set_change_cb(BlockDriverState *bs, 1518db97ee6aSChristoph Hellwig void (*change_cb)(void *opaque, int reason), 1519db97ee6aSChristoph Hellwig void *opaque) 1520b338082bSbellard { 1521b338082bSbellard bs->change_cb = change_cb; 1522b338082bSbellard bs->change_opaque = opaque; 1523b338082bSbellard } 1524b338082bSbellard 1525ea2384d3Sbellard int bdrv_is_encrypted(BlockDriverState *bs) 1526ea2384d3Sbellard { 1527ea2384d3Sbellard if (bs->backing_hd && bs->backing_hd->encrypted) 1528ea2384d3Sbellard return 1; 1529ea2384d3Sbellard return bs->encrypted; 1530ea2384d3Sbellard } 1531ea2384d3Sbellard 1532c0f4ce77Saliguori int bdrv_key_required(BlockDriverState *bs) 1533c0f4ce77Saliguori { 1534c0f4ce77Saliguori BlockDriverState *backing_hd = bs->backing_hd; 1535c0f4ce77Saliguori 1536c0f4ce77Saliguori if (backing_hd && backing_hd->encrypted && !backing_hd->valid_key) 1537c0f4ce77Saliguori return 1; 1538c0f4ce77Saliguori return (bs->encrypted && !bs->valid_key); 1539c0f4ce77Saliguori } 1540c0f4ce77Saliguori 1541ea2384d3Sbellard int bdrv_set_key(BlockDriverState *bs, const char *key) 1542ea2384d3Sbellard { 1543ea2384d3Sbellard int ret; 1544ea2384d3Sbellard if (bs->backing_hd && bs->backing_hd->encrypted) { 1545ea2384d3Sbellard ret = bdrv_set_key(bs->backing_hd, key); 1546ea2384d3Sbellard if (ret < 0) 1547ea2384d3Sbellard return ret; 1548ea2384d3Sbellard if (!bs->encrypted) 1549ea2384d3Sbellard return 0; 1550ea2384d3Sbellard } 1551fd04a2aeSShahar Havivi if (!bs->encrypted) { 1552fd04a2aeSShahar Havivi return -EINVAL; 1553fd04a2aeSShahar Havivi } else if (!bs->drv || !bs->drv->bdrv_set_key) { 1554fd04a2aeSShahar Havivi return -ENOMEDIUM; 1555fd04a2aeSShahar Havivi } 1556c0f4ce77Saliguori ret = bs->drv->bdrv_set_key(bs, key); 1557bb5fc20fSaliguori if (ret < 0) { 1558bb5fc20fSaliguori bs->valid_key = 0; 1559bb5fc20fSaliguori } else if (!bs->valid_key) { 1560bb5fc20fSaliguori bs->valid_key = 1; 1561bb5fc20fSaliguori /* call the change callback now, we skipped it on open */ 1562bb5fc20fSaliguori bs->media_changed = 1; 1563bb5fc20fSaliguori if (bs->change_cb) 1564db97ee6aSChristoph Hellwig bs->change_cb(bs->change_opaque, CHANGE_MEDIA); 1565bb5fc20fSaliguori } 1566c0f4ce77Saliguori return ret; 1567ea2384d3Sbellard } 1568ea2384d3Sbellard 1569ea2384d3Sbellard void bdrv_get_format(BlockDriverState *bs, char *buf, int buf_size) 1570ea2384d3Sbellard { 157119cb3738Sbellard if (!bs->drv) { 1572ea2384d3Sbellard buf[0] = '\0'; 1573ea2384d3Sbellard } else { 1574ea2384d3Sbellard pstrcpy(buf, buf_size, bs->drv->format_name); 1575ea2384d3Sbellard } 1576ea2384d3Sbellard } 1577ea2384d3Sbellard 1578ea2384d3Sbellard void bdrv_iterate_format(void (*it)(void *opaque, const char *name), 1579ea2384d3Sbellard void *opaque) 1580ea2384d3Sbellard { 1581ea2384d3Sbellard BlockDriver *drv; 1582ea2384d3Sbellard 15838a22f02aSStefan Hajnoczi QLIST_FOREACH(drv, &bdrv_drivers, list) { 1584ea2384d3Sbellard it(opaque, drv->format_name); 1585ea2384d3Sbellard } 1586ea2384d3Sbellard } 1587ea2384d3Sbellard 1588b338082bSbellard BlockDriverState *bdrv_find(const char *name) 1589b338082bSbellard { 1590b338082bSbellard BlockDriverState *bs; 1591b338082bSbellard 15921b7bdbc1SStefan Hajnoczi QTAILQ_FOREACH(bs, &bdrv_states, list) { 15931b7bdbc1SStefan Hajnoczi if (!strcmp(name, bs->device_name)) { 1594b338082bSbellard return bs; 1595b338082bSbellard } 15961b7bdbc1SStefan Hajnoczi } 1597b338082bSbellard return NULL; 1598b338082bSbellard } 1599b338082bSbellard 16002f399b0aSMarkus Armbruster BlockDriverState *bdrv_next(BlockDriverState *bs) 16012f399b0aSMarkus Armbruster { 16022f399b0aSMarkus Armbruster if (!bs) { 16032f399b0aSMarkus Armbruster return QTAILQ_FIRST(&bdrv_states); 16042f399b0aSMarkus Armbruster } 16052f399b0aSMarkus Armbruster return QTAILQ_NEXT(bs, list); 16062f399b0aSMarkus Armbruster } 16072f399b0aSMarkus Armbruster 160851de9760Saliguori void bdrv_iterate(void (*it)(void *opaque, BlockDriverState *bs), void *opaque) 160981d0912dSbellard { 161081d0912dSbellard BlockDriverState *bs; 161181d0912dSbellard 16121b7bdbc1SStefan Hajnoczi QTAILQ_FOREACH(bs, &bdrv_states, list) { 161351de9760Saliguori it(opaque, bs); 161481d0912dSbellard } 161581d0912dSbellard } 161681d0912dSbellard 1617ea2384d3Sbellard const char *bdrv_get_device_name(BlockDriverState *bs) 1618ea2384d3Sbellard { 1619ea2384d3Sbellard return bs->device_name; 1620ea2384d3Sbellard } 1621ea2384d3Sbellard 1622205ef796SKevin Wolf int bdrv_flush(BlockDriverState *bs) 16237a6cba61Spbrook { 1624016f5cf6SAlexander Graf if (bs->open_flags & BDRV_O_NO_FLUSH) { 1625205ef796SKevin Wolf return 0; 1626016f5cf6SAlexander Graf } 1627016f5cf6SAlexander Graf 1628205ef796SKevin Wolf if (bs->drv && bs->drv->bdrv_flush) { 1629205ef796SKevin Wolf return bs->drv->bdrv_flush(bs); 1630205ef796SKevin Wolf } 1631205ef796SKevin Wolf 1632205ef796SKevin Wolf /* 1633205ef796SKevin Wolf * Some block drivers always operate in either writethrough or unsafe mode 1634205ef796SKevin Wolf * and don't support bdrv_flush therefore. Usually qemu doesn't know how 1635205ef796SKevin Wolf * the server works (because the behaviour is hardcoded or depends on 1636205ef796SKevin Wolf * server-side configuration), so we can't ensure that everything is safe 1637205ef796SKevin Wolf * on disk. Returning an error doesn't work because that would break guests 1638205ef796SKevin Wolf * even if the server operates in writethrough mode. 1639205ef796SKevin Wolf * 1640205ef796SKevin Wolf * Let's hope the user knows what he's doing. 1641205ef796SKevin Wolf */ 1642205ef796SKevin Wolf return 0; 16437a6cba61Spbrook } 16447a6cba61Spbrook 1645c6ca28d6Saliguori void bdrv_flush_all(void) 1646c6ca28d6Saliguori { 1647c6ca28d6Saliguori BlockDriverState *bs; 1648c6ca28d6Saliguori 16491b7bdbc1SStefan Hajnoczi QTAILQ_FOREACH(bs, &bdrv_states, list) { 1650c6ca28d6Saliguori if (bs->drv && !bdrv_is_read_only(bs) && 16511b7bdbc1SStefan Hajnoczi (!bdrv_is_removable(bs) || bdrv_is_inserted(bs))) { 1652c6ca28d6Saliguori bdrv_flush(bs); 1653c6ca28d6Saliguori } 16541b7bdbc1SStefan Hajnoczi } 16551b7bdbc1SStefan Hajnoczi } 1656c6ca28d6Saliguori 1657f2feebbdSKevin Wolf int bdrv_has_zero_init(BlockDriverState *bs) 1658f2feebbdSKevin Wolf { 1659f2feebbdSKevin Wolf assert(bs->drv); 1660f2feebbdSKevin Wolf 1661336c1c12SKevin Wolf if (bs->drv->bdrv_has_zero_init) { 1662336c1c12SKevin Wolf return bs->drv->bdrv_has_zero_init(bs); 1663f2feebbdSKevin Wolf } 1664f2feebbdSKevin Wolf 1665f2feebbdSKevin Wolf return 1; 1666f2feebbdSKevin Wolf } 1667f2feebbdSKevin Wolf 1668bb8bf76fSChristoph Hellwig int bdrv_discard(BlockDriverState *bs, int64_t sector_num, int nb_sectors) 1669bb8bf76fSChristoph Hellwig { 1670bb8bf76fSChristoph Hellwig if (!bs->drv) { 1671bb8bf76fSChristoph Hellwig return -ENOMEDIUM; 1672bb8bf76fSChristoph Hellwig } 1673bb8bf76fSChristoph Hellwig if (!bs->drv->bdrv_discard) { 1674bb8bf76fSChristoph Hellwig return 0; 1675bb8bf76fSChristoph Hellwig } 1676bb8bf76fSChristoph Hellwig return bs->drv->bdrv_discard(bs, sector_num, nb_sectors); 1677bb8bf76fSChristoph Hellwig } 1678bb8bf76fSChristoph Hellwig 1679f58c7b35Sths /* 1680f58c7b35Sths * Returns true iff the specified sector is present in the disk image. Drivers 1681f58c7b35Sths * not implementing the functionality are assumed to not support backing files, 1682f58c7b35Sths * hence all their sectors are reported as allocated. 1683f58c7b35Sths * 1684f58c7b35Sths * 'pnum' is set to the number of sectors (including and immediately following 1685f58c7b35Sths * the specified sector) that are known to be in the same 1686f58c7b35Sths * allocated/unallocated state. 1687f58c7b35Sths * 1688f58c7b35Sths * 'nb_sectors' is the max value 'pnum' should be set to. 1689f58c7b35Sths */ 1690f58c7b35Sths int bdrv_is_allocated(BlockDriverState *bs, int64_t sector_num, int nb_sectors, 1691f58c7b35Sths int *pnum) 1692f58c7b35Sths { 1693f58c7b35Sths int64_t n; 1694f58c7b35Sths if (!bs->drv->bdrv_is_allocated) { 1695f58c7b35Sths if (sector_num >= bs->total_sectors) { 1696f58c7b35Sths *pnum = 0; 1697f58c7b35Sths return 0; 1698f58c7b35Sths } 1699f58c7b35Sths n = bs->total_sectors - sector_num; 1700f58c7b35Sths *pnum = (n < nb_sectors) ? (n) : (nb_sectors); 1701f58c7b35Sths return 1; 1702f58c7b35Sths } 1703f58c7b35Sths return bs->drv->bdrv_is_allocated(bs, sector_num, nb_sectors, pnum); 1704f58c7b35Sths } 1705f58c7b35Sths 17062582bfedSLuiz Capitulino void bdrv_mon_event(const BlockDriverState *bdrv, 17072582bfedSLuiz Capitulino BlockMonEventAction action, int is_read) 17082582bfedSLuiz Capitulino { 17092582bfedSLuiz Capitulino QObject *data; 17102582bfedSLuiz Capitulino const char *action_str; 17112582bfedSLuiz Capitulino 17122582bfedSLuiz Capitulino switch (action) { 17132582bfedSLuiz Capitulino case BDRV_ACTION_REPORT: 17142582bfedSLuiz Capitulino action_str = "report"; 17152582bfedSLuiz Capitulino break; 17162582bfedSLuiz Capitulino case BDRV_ACTION_IGNORE: 17172582bfedSLuiz Capitulino action_str = "ignore"; 17182582bfedSLuiz Capitulino break; 17192582bfedSLuiz Capitulino case BDRV_ACTION_STOP: 17202582bfedSLuiz Capitulino action_str = "stop"; 17212582bfedSLuiz Capitulino break; 17222582bfedSLuiz Capitulino default: 17232582bfedSLuiz Capitulino abort(); 17242582bfedSLuiz Capitulino } 17252582bfedSLuiz Capitulino 17262582bfedSLuiz Capitulino data = qobject_from_jsonf("{ 'device': %s, 'action': %s, 'operation': %s }", 17272582bfedSLuiz Capitulino bdrv->device_name, 17282582bfedSLuiz Capitulino action_str, 17292582bfedSLuiz Capitulino is_read ? "read" : "write"); 17302582bfedSLuiz Capitulino monitor_protocol_event(QEVENT_BLOCK_IO_ERROR, data); 17312582bfedSLuiz Capitulino 17322582bfedSLuiz Capitulino qobject_decref(data); 17332582bfedSLuiz Capitulino } 17342582bfedSLuiz Capitulino 1735d15e5465SLuiz Capitulino static void bdrv_print_dict(QObject *obj, void *opaque) 1736b338082bSbellard { 1737d15e5465SLuiz Capitulino QDict *bs_dict; 1738d15e5465SLuiz Capitulino Monitor *mon = opaque; 1739b338082bSbellard 1740d15e5465SLuiz Capitulino bs_dict = qobject_to_qdict(obj); 1741d15e5465SLuiz Capitulino 1742d8aeeb31SMarkus Armbruster monitor_printf(mon, "%s: removable=%d", 1743d15e5465SLuiz Capitulino qdict_get_str(bs_dict, "device"), 1744d15e5465SLuiz Capitulino qdict_get_bool(bs_dict, "removable")); 1745d15e5465SLuiz Capitulino 1746d15e5465SLuiz Capitulino if (qdict_get_bool(bs_dict, "removable")) { 1747d15e5465SLuiz Capitulino monitor_printf(mon, " locked=%d", qdict_get_bool(bs_dict, "locked")); 1748b338082bSbellard } 1749d15e5465SLuiz Capitulino 1750d15e5465SLuiz Capitulino if (qdict_haskey(bs_dict, "inserted")) { 1751d15e5465SLuiz Capitulino QDict *qdict = qobject_to_qdict(qdict_get(bs_dict, "inserted")); 1752d15e5465SLuiz Capitulino 1753376253ecSaliguori monitor_printf(mon, " file="); 1754d15e5465SLuiz Capitulino monitor_print_filename(mon, qdict_get_str(qdict, "file")); 1755d15e5465SLuiz Capitulino if (qdict_haskey(qdict, "backing_file")) { 1756376253ecSaliguori monitor_printf(mon, " backing_file="); 1757d15e5465SLuiz Capitulino monitor_print_filename(mon, qdict_get_str(qdict, "backing_file")); 1758fef30743Sths } 1759d15e5465SLuiz Capitulino monitor_printf(mon, " ro=%d drv=%s encrypted=%d", 1760d15e5465SLuiz Capitulino qdict_get_bool(qdict, "ro"), 1761d15e5465SLuiz Capitulino qdict_get_str(qdict, "drv"), 1762d15e5465SLuiz Capitulino qdict_get_bool(qdict, "encrypted")); 1763b338082bSbellard } else { 1764376253ecSaliguori monitor_printf(mon, " [not inserted]"); 1765b338082bSbellard } 1766d15e5465SLuiz Capitulino 1767376253ecSaliguori monitor_printf(mon, "\n"); 1768b338082bSbellard } 1769d15e5465SLuiz Capitulino 1770d15e5465SLuiz Capitulino void bdrv_info_print(Monitor *mon, const QObject *data) 1771d15e5465SLuiz Capitulino { 1772d15e5465SLuiz Capitulino qlist_iter(qobject_to_qlist(data), bdrv_print_dict, mon); 1773d15e5465SLuiz Capitulino } 1774d15e5465SLuiz Capitulino 1775d15e5465SLuiz Capitulino void bdrv_info(Monitor *mon, QObject **ret_data) 1776d15e5465SLuiz Capitulino { 1777d15e5465SLuiz Capitulino QList *bs_list; 1778d15e5465SLuiz Capitulino BlockDriverState *bs; 1779d15e5465SLuiz Capitulino 1780d15e5465SLuiz Capitulino bs_list = qlist_new(); 1781d15e5465SLuiz Capitulino 17821b7bdbc1SStefan Hajnoczi QTAILQ_FOREACH(bs, &bdrv_states, list) { 1783d15e5465SLuiz Capitulino QObject *bs_obj; 1784d15e5465SLuiz Capitulino 1785d8aeeb31SMarkus Armbruster bs_obj = qobject_from_jsonf("{ 'device': %s, 'type': 'unknown', " 1786d15e5465SLuiz Capitulino "'removable': %i, 'locked': %i }", 1787d8aeeb31SMarkus Armbruster bs->device_name, bs->removable, 1788d15e5465SLuiz Capitulino bs->locked); 1789d15e5465SLuiz Capitulino 1790d15e5465SLuiz Capitulino if (bs->drv) { 1791d15e5465SLuiz Capitulino QObject *obj; 1792d15e5465SLuiz Capitulino QDict *bs_dict = qobject_to_qdict(bs_obj); 1793d15e5465SLuiz Capitulino 1794d15e5465SLuiz Capitulino obj = qobject_from_jsonf("{ 'file': %s, 'ro': %i, 'drv': %s, " 1795d15e5465SLuiz Capitulino "'encrypted': %i }", 1796d15e5465SLuiz Capitulino bs->filename, bs->read_only, 1797d15e5465SLuiz Capitulino bs->drv->format_name, 1798d15e5465SLuiz Capitulino bdrv_is_encrypted(bs)); 1799d15e5465SLuiz Capitulino if (bs->backing_file[0] != '\0') { 1800d15e5465SLuiz Capitulino QDict *qdict = qobject_to_qdict(obj); 1801d15e5465SLuiz Capitulino qdict_put(qdict, "backing_file", 1802d15e5465SLuiz Capitulino qstring_from_str(bs->backing_file)); 1803d15e5465SLuiz Capitulino } 1804d15e5465SLuiz Capitulino 1805d15e5465SLuiz Capitulino qdict_put_obj(bs_dict, "inserted", obj); 1806d15e5465SLuiz Capitulino } 1807d15e5465SLuiz Capitulino qlist_append_obj(bs_list, bs_obj); 1808d15e5465SLuiz Capitulino } 1809d15e5465SLuiz Capitulino 1810d15e5465SLuiz Capitulino *ret_data = QOBJECT(bs_list); 1811b338082bSbellard } 1812a36e69ddSths 1813218a536aSLuiz Capitulino static void bdrv_stats_iter(QObject *data, void *opaque) 1814a36e69ddSths { 1815218a536aSLuiz Capitulino QDict *qdict; 1816218a536aSLuiz Capitulino Monitor *mon = opaque; 1817218a536aSLuiz Capitulino 1818218a536aSLuiz Capitulino qdict = qobject_to_qdict(data); 1819218a536aSLuiz Capitulino monitor_printf(mon, "%s:", qdict_get_str(qdict, "device")); 1820218a536aSLuiz Capitulino 1821218a536aSLuiz Capitulino qdict = qobject_to_qdict(qdict_get(qdict, "stats")); 1822218a536aSLuiz Capitulino monitor_printf(mon, " rd_bytes=%" PRId64 1823218a536aSLuiz Capitulino " wr_bytes=%" PRId64 1824218a536aSLuiz Capitulino " rd_operations=%" PRId64 1825218a536aSLuiz Capitulino " wr_operations=%" PRId64 1826218a536aSLuiz Capitulino "\n", 1827218a536aSLuiz Capitulino qdict_get_int(qdict, "rd_bytes"), 1828218a536aSLuiz Capitulino qdict_get_int(qdict, "wr_bytes"), 1829218a536aSLuiz Capitulino qdict_get_int(qdict, "rd_operations"), 1830218a536aSLuiz Capitulino qdict_get_int(qdict, "wr_operations")); 1831218a536aSLuiz Capitulino } 1832218a536aSLuiz Capitulino 1833218a536aSLuiz Capitulino void bdrv_stats_print(Monitor *mon, const QObject *data) 1834218a536aSLuiz Capitulino { 1835218a536aSLuiz Capitulino qlist_iter(qobject_to_qlist(data), bdrv_stats_iter, mon); 1836218a536aSLuiz Capitulino } 1837218a536aSLuiz Capitulino 1838294cc35fSKevin Wolf static QObject* bdrv_info_stats_bs(BlockDriverState *bs) 1839294cc35fSKevin Wolf { 1840294cc35fSKevin Wolf QObject *res; 1841294cc35fSKevin Wolf QDict *dict; 1842294cc35fSKevin Wolf 1843294cc35fSKevin Wolf res = qobject_from_jsonf("{ 'stats': {" 1844294cc35fSKevin Wolf "'rd_bytes': %" PRId64 "," 1845294cc35fSKevin Wolf "'wr_bytes': %" PRId64 "," 1846294cc35fSKevin Wolf "'rd_operations': %" PRId64 "," 1847294cc35fSKevin Wolf "'wr_operations': %" PRId64 "," 1848294cc35fSKevin Wolf "'wr_highest_offset': %" PRId64 1849294cc35fSKevin Wolf "} }", 1850294cc35fSKevin Wolf bs->rd_bytes, bs->wr_bytes, 1851294cc35fSKevin Wolf bs->rd_ops, bs->wr_ops, 18525ffbbc67SBlue Swirl bs->wr_highest_sector * 18535ffbbc67SBlue Swirl (uint64_t)BDRV_SECTOR_SIZE); 1854294cc35fSKevin Wolf dict = qobject_to_qdict(res); 1855294cc35fSKevin Wolf 1856294cc35fSKevin Wolf if (*bs->device_name) { 1857294cc35fSKevin Wolf qdict_put(dict, "device", qstring_from_str(bs->device_name)); 1858294cc35fSKevin Wolf } 1859294cc35fSKevin Wolf 1860294cc35fSKevin Wolf if (bs->file) { 1861294cc35fSKevin Wolf QObject *parent = bdrv_info_stats_bs(bs->file); 1862294cc35fSKevin Wolf qdict_put_obj(dict, "parent", parent); 1863294cc35fSKevin Wolf } 1864294cc35fSKevin Wolf 1865294cc35fSKevin Wolf return res; 1866294cc35fSKevin Wolf } 1867294cc35fSKevin Wolf 1868218a536aSLuiz Capitulino void bdrv_info_stats(Monitor *mon, QObject **ret_data) 1869218a536aSLuiz Capitulino { 1870218a536aSLuiz Capitulino QObject *obj; 1871218a536aSLuiz Capitulino QList *devices; 1872a36e69ddSths BlockDriverState *bs; 1873a36e69ddSths 1874218a536aSLuiz Capitulino devices = qlist_new(); 1875218a536aSLuiz Capitulino 18761b7bdbc1SStefan Hajnoczi QTAILQ_FOREACH(bs, &bdrv_states, list) { 1877294cc35fSKevin Wolf obj = bdrv_info_stats_bs(bs); 1878218a536aSLuiz Capitulino qlist_append_obj(devices, obj); 1879a36e69ddSths } 1880218a536aSLuiz Capitulino 1881218a536aSLuiz Capitulino *ret_data = QOBJECT(devices); 1882a36e69ddSths } 1883ea2384d3Sbellard 1884045df330Saliguori const char *bdrv_get_encrypted_filename(BlockDriverState *bs) 1885045df330Saliguori { 1886045df330Saliguori if (bs->backing_hd && bs->backing_hd->encrypted) 1887045df330Saliguori return bs->backing_file; 1888045df330Saliguori else if (bs->encrypted) 1889045df330Saliguori return bs->filename; 1890045df330Saliguori else 1891045df330Saliguori return NULL; 1892045df330Saliguori } 1893045df330Saliguori 189483f64091Sbellard void bdrv_get_backing_filename(BlockDriverState *bs, 189583f64091Sbellard char *filename, int filename_size) 189683f64091Sbellard { 1897b783e409SKevin Wolf if (!bs->backing_file) { 189883f64091Sbellard pstrcpy(filename, filename_size, ""); 189983f64091Sbellard } else { 190083f64091Sbellard pstrcpy(filename, filename_size, bs->backing_file); 190183f64091Sbellard } 190283f64091Sbellard } 190383f64091Sbellard 1904faea38e7Sbellard int bdrv_write_compressed(BlockDriverState *bs, int64_t sector_num, 1905faea38e7Sbellard const uint8_t *buf, int nb_sectors) 1906faea38e7Sbellard { 1907faea38e7Sbellard BlockDriver *drv = bs->drv; 1908faea38e7Sbellard if (!drv) 190919cb3738Sbellard return -ENOMEDIUM; 1910faea38e7Sbellard if (!drv->bdrv_write_compressed) 1911faea38e7Sbellard return -ENOTSUP; 1912fbb7b4e0SKevin Wolf if (bdrv_check_request(bs, sector_num, nb_sectors)) 1913fbb7b4e0SKevin Wolf return -EIO; 19147cd1e32aSlirans@il.ibm.com 1915c6d22830SJan Kiszka if (bs->dirty_bitmap) { 19167cd1e32aSlirans@il.ibm.com set_dirty_bitmap(bs, sector_num, nb_sectors, 1); 19177cd1e32aSlirans@il.ibm.com } 19187cd1e32aSlirans@il.ibm.com 1919faea38e7Sbellard return drv->bdrv_write_compressed(bs, sector_num, buf, nb_sectors); 1920faea38e7Sbellard } 1921faea38e7Sbellard 1922faea38e7Sbellard int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi) 1923faea38e7Sbellard { 1924faea38e7Sbellard BlockDriver *drv = bs->drv; 1925faea38e7Sbellard if (!drv) 192619cb3738Sbellard return -ENOMEDIUM; 1927faea38e7Sbellard if (!drv->bdrv_get_info) 1928faea38e7Sbellard return -ENOTSUP; 1929faea38e7Sbellard memset(bdi, 0, sizeof(*bdi)); 1930faea38e7Sbellard return drv->bdrv_get_info(bs, bdi); 1931faea38e7Sbellard } 1932faea38e7Sbellard 193345566e9cSChristoph Hellwig int bdrv_save_vmstate(BlockDriverState *bs, const uint8_t *buf, 193445566e9cSChristoph Hellwig int64_t pos, int size) 1935178e08a5Saliguori { 1936178e08a5Saliguori BlockDriver *drv = bs->drv; 1937178e08a5Saliguori if (!drv) 1938178e08a5Saliguori return -ENOMEDIUM; 19397cdb1f6dSMORITA Kazutaka if (drv->bdrv_save_vmstate) 194045566e9cSChristoph Hellwig return drv->bdrv_save_vmstate(bs, buf, pos, size); 19417cdb1f6dSMORITA Kazutaka if (bs->file) 19427cdb1f6dSMORITA Kazutaka return bdrv_save_vmstate(bs->file, buf, pos, size); 19437cdb1f6dSMORITA Kazutaka return -ENOTSUP; 1944178e08a5Saliguori } 1945178e08a5Saliguori 194645566e9cSChristoph Hellwig int bdrv_load_vmstate(BlockDriverState *bs, uint8_t *buf, 194745566e9cSChristoph Hellwig int64_t pos, int size) 1948178e08a5Saliguori { 1949178e08a5Saliguori BlockDriver *drv = bs->drv; 1950178e08a5Saliguori if (!drv) 1951178e08a5Saliguori return -ENOMEDIUM; 19527cdb1f6dSMORITA Kazutaka if (drv->bdrv_load_vmstate) 195345566e9cSChristoph Hellwig return drv->bdrv_load_vmstate(bs, buf, pos, size); 19547cdb1f6dSMORITA Kazutaka if (bs->file) 19557cdb1f6dSMORITA Kazutaka return bdrv_load_vmstate(bs->file, buf, pos, size); 19567cdb1f6dSMORITA Kazutaka return -ENOTSUP; 1957178e08a5Saliguori } 1958178e08a5Saliguori 19598b9b0cc2SKevin Wolf void bdrv_debug_event(BlockDriverState *bs, BlkDebugEvent event) 19608b9b0cc2SKevin Wolf { 19618b9b0cc2SKevin Wolf BlockDriver *drv = bs->drv; 19628b9b0cc2SKevin Wolf 19638b9b0cc2SKevin Wolf if (!drv || !drv->bdrv_debug_event) { 19648b9b0cc2SKevin Wolf return; 19658b9b0cc2SKevin Wolf } 19668b9b0cc2SKevin Wolf 19678b9b0cc2SKevin Wolf return drv->bdrv_debug_event(bs, event); 19688b9b0cc2SKevin Wolf 19698b9b0cc2SKevin Wolf } 19708b9b0cc2SKevin Wolf 1971faea38e7Sbellard /**************************************************************/ 1972faea38e7Sbellard /* handling of snapshots */ 1973faea38e7Sbellard 1974feeee5acSMiguel Di Ciurcio Filho int bdrv_can_snapshot(BlockDriverState *bs) 1975feeee5acSMiguel Di Ciurcio Filho { 1976feeee5acSMiguel Di Ciurcio Filho BlockDriver *drv = bs->drv; 1977feeee5acSMiguel Di Ciurcio Filho if (!drv || bdrv_is_removable(bs) || bdrv_is_read_only(bs)) { 1978feeee5acSMiguel Di Ciurcio Filho return 0; 1979feeee5acSMiguel Di Ciurcio Filho } 1980feeee5acSMiguel Di Ciurcio Filho 1981feeee5acSMiguel Di Ciurcio Filho if (!drv->bdrv_snapshot_create) { 1982feeee5acSMiguel Di Ciurcio Filho if (bs->file != NULL) { 1983feeee5acSMiguel Di Ciurcio Filho return bdrv_can_snapshot(bs->file); 1984feeee5acSMiguel Di Ciurcio Filho } 1985feeee5acSMiguel Di Ciurcio Filho return 0; 1986feeee5acSMiguel Di Ciurcio Filho } 1987feeee5acSMiguel Di Ciurcio Filho 1988feeee5acSMiguel Di Ciurcio Filho return 1; 1989feeee5acSMiguel Di Ciurcio Filho } 1990feeee5acSMiguel Di Ciurcio Filho 1991199630b6SBlue Swirl int bdrv_is_snapshot(BlockDriverState *bs) 1992199630b6SBlue Swirl { 1993199630b6SBlue Swirl return !!(bs->open_flags & BDRV_O_SNAPSHOT); 1994199630b6SBlue Swirl } 1995199630b6SBlue Swirl 1996f9092b10SMarkus Armbruster BlockDriverState *bdrv_snapshots(void) 1997f9092b10SMarkus Armbruster { 1998f9092b10SMarkus Armbruster BlockDriverState *bs; 1999f9092b10SMarkus Armbruster 20003ac906f7SMarkus Armbruster if (bs_snapshots) { 2001f9092b10SMarkus Armbruster return bs_snapshots; 20023ac906f7SMarkus Armbruster } 2003f9092b10SMarkus Armbruster 2004f9092b10SMarkus Armbruster bs = NULL; 2005f9092b10SMarkus Armbruster while ((bs = bdrv_next(bs))) { 2006f9092b10SMarkus Armbruster if (bdrv_can_snapshot(bs)) { 20073ac906f7SMarkus Armbruster bs_snapshots = bs; 20083ac906f7SMarkus Armbruster return bs; 2009f9092b10SMarkus Armbruster } 2010f9092b10SMarkus Armbruster } 2011f9092b10SMarkus Armbruster return NULL; 2012f9092b10SMarkus Armbruster } 2013f9092b10SMarkus Armbruster 2014faea38e7Sbellard int bdrv_snapshot_create(BlockDriverState *bs, 2015faea38e7Sbellard QEMUSnapshotInfo *sn_info) 2016faea38e7Sbellard { 2017faea38e7Sbellard BlockDriver *drv = bs->drv; 2018faea38e7Sbellard if (!drv) 201919cb3738Sbellard return -ENOMEDIUM; 20207cdb1f6dSMORITA Kazutaka if (drv->bdrv_snapshot_create) 2021faea38e7Sbellard return drv->bdrv_snapshot_create(bs, sn_info); 20227cdb1f6dSMORITA Kazutaka if (bs->file) 20237cdb1f6dSMORITA Kazutaka return bdrv_snapshot_create(bs->file, sn_info); 20247cdb1f6dSMORITA Kazutaka return -ENOTSUP; 2025faea38e7Sbellard } 2026faea38e7Sbellard 2027faea38e7Sbellard int bdrv_snapshot_goto(BlockDriverState *bs, 2028faea38e7Sbellard const char *snapshot_id) 2029faea38e7Sbellard { 2030faea38e7Sbellard BlockDriver *drv = bs->drv; 20317cdb1f6dSMORITA Kazutaka int ret, open_ret; 20327cdb1f6dSMORITA Kazutaka 2033faea38e7Sbellard if (!drv) 203419cb3738Sbellard return -ENOMEDIUM; 20357cdb1f6dSMORITA Kazutaka if (drv->bdrv_snapshot_goto) 2036faea38e7Sbellard return drv->bdrv_snapshot_goto(bs, snapshot_id); 20377cdb1f6dSMORITA Kazutaka 20387cdb1f6dSMORITA Kazutaka if (bs->file) { 20397cdb1f6dSMORITA Kazutaka drv->bdrv_close(bs); 20407cdb1f6dSMORITA Kazutaka ret = bdrv_snapshot_goto(bs->file, snapshot_id); 20417cdb1f6dSMORITA Kazutaka open_ret = drv->bdrv_open(bs, bs->open_flags); 20427cdb1f6dSMORITA Kazutaka if (open_ret < 0) { 20437cdb1f6dSMORITA Kazutaka bdrv_delete(bs->file); 20447cdb1f6dSMORITA Kazutaka bs->drv = NULL; 20457cdb1f6dSMORITA Kazutaka return open_ret; 20467cdb1f6dSMORITA Kazutaka } 20477cdb1f6dSMORITA Kazutaka return ret; 20487cdb1f6dSMORITA Kazutaka } 20497cdb1f6dSMORITA Kazutaka 20507cdb1f6dSMORITA Kazutaka return -ENOTSUP; 2051faea38e7Sbellard } 2052faea38e7Sbellard 2053faea38e7Sbellard int bdrv_snapshot_delete(BlockDriverState *bs, const char *snapshot_id) 2054faea38e7Sbellard { 2055faea38e7Sbellard BlockDriver *drv = bs->drv; 2056faea38e7Sbellard if (!drv) 205719cb3738Sbellard return -ENOMEDIUM; 20587cdb1f6dSMORITA Kazutaka if (drv->bdrv_snapshot_delete) 2059faea38e7Sbellard return drv->bdrv_snapshot_delete(bs, snapshot_id); 20607cdb1f6dSMORITA Kazutaka if (bs->file) 20617cdb1f6dSMORITA Kazutaka return bdrv_snapshot_delete(bs->file, snapshot_id); 20627cdb1f6dSMORITA Kazutaka return -ENOTSUP; 2063faea38e7Sbellard } 2064faea38e7Sbellard 2065faea38e7Sbellard int bdrv_snapshot_list(BlockDriverState *bs, 2066faea38e7Sbellard QEMUSnapshotInfo **psn_info) 2067faea38e7Sbellard { 2068faea38e7Sbellard BlockDriver *drv = bs->drv; 2069faea38e7Sbellard if (!drv) 207019cb3738Sbellard return -ENOMEDIUM; 20717cdb1f6dSMORITA Kazutaka if (drv->bdrv_snapshot_list) 2072faea38e7Sbellard return drv->bdrv_snapshot_list(bs, psn_info); 20737cdb1f6dSMORITA Kazutaka if (bs->file) 20747cdb1f6dSMORITA Kazutaka return bdrv_snapshot_list(bs->file, psn_info); 20757cdb1f6dSMORITA Kazutaka return -ENOTSUP; 2076faea38e7Sbellard } 2077faea38e7Sbellard 207851ef6727Sedison int bdrv_snapshot_load_tmp(BlockDriverState *bs, 207951ef6727Sedison const char *snapshot_name) 208051ef6727Sedison { 208151ef6727Sedison BlockDriver *drv = bs->drv; 208251ef6727Sedison if (!drv) { 208351ef6727Sedison return -ENOMEDIUM; 208451ef6727Sedison } 208551ef6727Sedison if (!bs->read_only) { 208651ef6727Sedison return -EINVAL; 208751ef6727Sedison } 208851ef6727Sedison if (drv->bdrv_snapshot_load_tmp) { 208951ef6727Sedison return drv->bdrv_snapshot_load_tmp(bs, snapshot_name); 209051ef6727Sedison } 209151ef6727Sedison return -ENOTSUP; 209251ef6727Sedison } 209351ef6727Sedison 2094faea38e7Sbellard #define NB_SUFFIXES 4 2095faea38e7Sbellard 2096faea38e7Sbellard char *get_human_readable_size(char *buf, int buf_size, int64_t size) 2097faea38e7Sbellard { 2098faea38e7Sbellard static const char suffixes[NB_SUFFIXES] = "KMGT"; 2099faea38e7Sbellard int64_t base; 2100faea38e7Sbellard int i; 2101faea38e7Sbellard 2102faea38e7Sbellard if (size <= 999) { 2103faea38e7Sbellard snprintf(buf, buf_size, "%" PRId64, size); 2104faea38e7Sbellard } else { 2105faea38e7Sbellard base = 1024; 2106faea38e7Sbellard for(i = 0; i < NB_SUFFIXES; i++) { 2107faea38e7Sbellard if (size < (10 * base)) { 2108faea38e7Sbellard snprintf(buf, buf_size, "%0.1f%c", 2109faea38e7Sbellard (double)size / base, 2110faea38e7Sbellard suffixes[i]); 2111faea38e7Sbellard break; 2112faea38e7Sbellard } else if (size < (1000 * base) || i == (NB_SUFFIXES - 1)) { 2113faea38e7Sbellard snprintf(buf, buf_size, "%" PRId64 "%c", 2114faea38e7Sbellard ((size + (base >> 1)) / base), 2115faea38e7Sbellard suffixes[i]); 2116faea38e7Sbellard break; 2117faea38e7Sbellard } 2118faea38e7Sbellard base = base * 1024; 2119faea38e7Sbellard } 2120faea38e7Sbellard } 2121faea38e7Sbellard return buf; 2122faea38e7Sbellard } 2123faea38e7Sbellard 2124faea38e7Sbellard char *bdrv_snapshot_dump(char *buf, int buf_size, QEMUSnapshotInfo *sn) 2125faea38e7Sbellard { 2126faea38e7Sbellard char buf1[128], date_buf[128], clock_buf[128]; 21273b9f94e1Sbellard #ifdef _WIN32 21283b9f94e1Sbellard struct tm *ptm; 21293b9f94e1Sbellard #else 2130faea38e7Sbellard struct tm tm; 21313b9f94e1Sbellard #endif 2132faea38e7Sbellard time_t ti; 2133faea38e7Sbellard int64_t secs; 2134faea38e7Sbellard 2135faea38e7Sbellard if (!sn) { 2136faea38e7Sbellard snprintf(buf, buf_size, 2137faea38e7Sbellard "%-10s%-20s%7s%20s%15s", 2138faea38e7Sbellard "ID", "TAG", "VM SIZE", "DATE", "VM CLOCK"); 2139faea38e7Sbellard } else { 2140faea38e7Sbellard ti = sn->date_sec; 21413b9f94e1Sbellard #ifdef _WIN32 21423b9f94e1Sbellard ptm = localtime(&ti); 21433b9f94e1Sbellard strftime(date_buf, sizeof(date_buf), 21443b9f94e1Sbellard "%Y-%m-%d %H:%M:%S", ptm); 21453b9f94e1Sbellard #else 2146faea38e7Sbellard localtime_r(&ti, &tm); 2147faea38e7Sbellard strftime(date_buf, sizeof(date_buf), 2148faea38e7Sbellard "%Y-%m-%d %H:%M:%S", &tm); 21493b9f94e1Sbellard #endif 2150faea38e7Sbellard secs = sn->vm_clock_nsec / 1000000000; 2151faea38e7Sbellard snprintf(clock_buf, sizeof(clock_buf), 2152faea38e7Sbellard "%02d:%02d:%02d.%03d", 2153faea38e7Sbellard (int)(secs / 3600), 2154faea38e7Sbellard (int)((secs / 60) % 60), 2155faea38e7Sbellard (int)(secs % 60), 2156faea38e7Sbellard (int)((sn->vm_clock_nsec / 1000000) % 1000)); 2157faea38e7Sbellard snprintf(buf, buf_size, 2158faea38e7Sbellard "%-10s%-20s%7s%20s%15s", 2159faea38e7Sbellard sn->id_str, sn->name, 2160faea38e7Sbellard get_human_readable_size(buf1, sizeof(buf1), sn->vm_state_size), 2161faea38e7Sbellard date_buf, 2162faea38e7Sbellard clock_buf); 2163faea38e7Sbellard } 2164faea38e7Sbellard return buf; 2165faea38e7Sbellard } 2166faea38e7Sbellard 216783f64091Sbellard 2168ea2384d3Sbellard /**************************************************************/ 216983f64091Sbellard /* async I/Os */ 2170ea2384d3Sbellard 21713b69e4b9Saliguori BlockDriverAIOCB *bdrv_aio_readv(BlockDriverState *bs, int64_t sector_num, 2172f141eafeSaliguori QEMUIOVector *qiov, int nb_sectors, 217383f64091Sbellard BlockDriverCompletionFunc *cb, void *opaque) 2174ea2384d3Sbellard { 217583f64091Sbellard BlockDriver *drv = bs->drv; 2176a36e69ddSths BlockDriverAIOCB *ret; 2177ea2384d3Sbellard 2178bbf0a440SStefan Hajnoczi trace_bdrv_aio_readv(bs, sector_num, nb_sectors, opaque); 2179bbf0a440SStefan Hajnoczi 218019cb3738Sbellard if (!drv) 2181ce1a14dcSpbrook return NULL; 218271d0770cSaliguori if (bdrv_check_request(bs, sector_num, nb_sectors)) 218371d0770cSaliguori return NULL; 218483f64091Sbellard 2185f141eafeSaliguori ret = drv->bdrv_aio_readv(bs, sector_num, qiov, nb_sectors, 2186f141eafeSaliguori cb, opaque); 2187a36e69ddSths 2188a36e69ddSths if (ret) { 2189a36e69ddSths /* Update stats even though technically transfer has not happened. */ 21906ea44308SJan Kiszka bs->rd_bytes += (unsigned) nb_sectors * BDRV_SECTOR_SIZE; 2191a36e69ddSths bs->rd_ops ++; 2192a36e69ddSths } 2193a36e69ddSths 2194a36e69ddSths return ret; 219583f64091Sbellard } 219683f64091Sbellard 21974dcafbb1SMarcelo Tosatti typedef struct BlockCompleteData { 21984dcafbb1SMarcelo Tosatti BlockDriverCompletionFunc *cb; 21994dcafbb1SMarcelo Tosatti void *opaque; 22004dcafbb1SMarcelo Tosatti BlockDriverState *bs; 22014dcafbb1SMarcelo Tosatti int64_t sector_num; 22024dcafbb1SMarcelo Tosatti int nb_sectors; 22034dcafbb1SMarcelo Tosatti } BlockCompleteData; 22044dcafbb1SMarcelo Tosatti 22054dcafbb1SMarcelo Tosatti static void block_complete_cb(void *opaque, int ret) 22064dcafbb1SMarcelo Tosatti { 22074dcafbb1SMarcelo Tosatti BlockCompleteData *b = opaque; 22084dcafbb1SMarcelo Tosatti 22094dcafbb1SMarcelo Tosatti if (b->bs->dirty_bitmap) { 22104dcafbb1SMarcelo Tosatti set_dirty_bitmap(b->bs, b->sector_num, b->nb_sectors, 1); 22114dcafbb1SMarcelo Tosatti } 22124dcafbb1SMarcelo Tosatti b->cb(b->opaque, ret); 22134dcafbb1SMarcelo Tosatti qemu_free(b); 22144dcafbb1SMarcelo Tosatti } 22154dcafbb1SMarcelo Tosatti 22164dcafbb1SMarcelo Tosatti static BlockCompleteData *blk_dirty_cb_alloc(BlockDriverState *bs, 22174dcafbb1SMarcelo Tosatti int64_t sector_num, 22184dcafbb1SMarcelo Tosatti int nb_sectors, 22194dcafbb1SMarcelo Tosatti BlockDriverCompletionFunc *cb, 22204dcafbb1SMarcelo Tosatti void *opaque) 22214dcafbb1SMarcelo Tosatti { 22224dcafbb1SMarcelo Tosatti BlockCompleteData *blkdata = qemu_mallocz(sizeof(BlockCompleteData)); 22234dcafbb1SMarcelo Tosatti 22244dcafbb1SMarcelo Tosatti blkdata->bs = bs; 22254dcafbb1SMarcelo Tosatti blkdata->cb = cb; 22264dcafbb1SMarcelo Tosatti blkdata->opaque = opaque; 22274dcafbb1SMarcelo Tosatti blkdata->sector_num = sector_num; 22284dcafbb1SMarcelo Tosatti blkdata->nb_sectors = nb_sectors; 22294dcafbb1SMarcelo Tosatti 22304dcafbb1SMarcelo Tosatti return blkdata; 22314dcafbb1SMarcelo Tosatti } 22324dcafbb1SMarcelo Tosatti 2233f141eafeSaliguori BlockDriverAIOCB *bdrv_aio_writev(BlockDriverState *bs, int64_t sector_num, 2234f141eafeSaliguori QEMUIOVector *qiov, int nb_sectors, 223583f64091Sbellard BlockDriverCompletionFunc *cb, void *opaque) 22367674e7bfSbellard { 223783f64091Sbellard BlockDriver *drv = bs->drv; 2238a36e69ddSths BlockDriverAIOCB *ret; 22394dcafbb1SMarcelo Tosatti BlockCompleteData *blk_cb_data; 224083f64091Sbellard 2241bbf0a440SStefan Hajnoczi trace_bdrv_aio_writev(bs, sector_num, nb_sectors, opaque); 2242bbf0a440SStefan Hajnoczi 224319cb3738Sbellard if (!drv) 2244ce1a14dcSpbrook return NULL; 224583f64091Sbellard if (bs->read_only) 2246ce1a14dcSpbrook return NULL; 224771d0770cSaliguori if (bdrv_check_request(bs, sector_num, nb_sectors)) 224871d0770cSaliguori return NULL; 224983f64091Sbellard 2250c6d22830SJan Kiszka if (bs->dirty_bitmap) { 22514dcafbb1SMarcelo Tosatti blk_cb_data = blk_dirty_cb_alloc(bs, sector_num, nb_sectors, cb, 22524dcafbb1SMarcelo Tosatti opaque); 22534dcafbb1SMarcelo Tosatti cb = &block_complete_cb; 22544dcafbb1SMarcelo Tosatti opaque = blk_cb_data; 22557cd1e32aSlirans@il.ibm.com } 22567cd1e32aSlirans@il.ibm.com 2257f141eafeSaliguori ret = drv->bdrv_aio_writev(bs, sector_num, qiov, nb_sectors, 2258f141eafeSaliguori cb, opaque); 2259a36e69ddSths 2260a36e69ddSths if (ret) { 2261a36e69ddSths /* Update stats even though technically transfer has not happened. */ 22626ea44308SJan Kiszka bs->wr_bytes += (unsigned) nb_sectors * BDRV_SECTOR_SIZE; 2263a36e69ddSths bs->wr_ops ++; 2264294cc35fSKevin Wolf if (bs->wr_highest_sector < sector_num + nb_sectors - 1) { 2265294cc35fSKevin Wolf bs->wr_highest_sector = sector_num + nb_sectors - 1; 2266294cc35fSKevin Wolf } 2267a36e69ddSths } 2268a36e69ddSths 2269a36e69ddSths return ret; 227083f64091Sbellard } 227183f64091Sbellard 227240b4f539SKevin Wolf 227340b4f539SKevin Wolf typedef struct MultiwriteCB { 227440b4f539SKevin Wolf int error; 227540b4f539SKevin Wolf int num_requests; 227640b4f539SKevin Wolf int num_callbacks; 227740b4f539SKevin Wolf struct { 227840b4f539SKevin Wolf BlockDriverCompletionFunc *cb; 227940b4f539SKevin Wolf void *opaque; 228040b4f539SKevin Wolf QEMUIOVector *free_qiov; 228140b4f539SKevin Wolf void *free_buf; 228240b4f539SKevin Wolf } callbacks[]; 228340b4f539SKevin Wolf } MultiwriteCB; 228440b4f539SKevin Wolf 228540b4f539SKevin Wolf static void multiwrite_user_cb(MultiwriteCB *mcb) 228640b4f539SKevin Wolf { 228740b4f539SKevin Wolf int i; 228840b4f539SKevin Wolf 228940b4f539SKevin Wolf for (i = 0; i < mcb->num_callbacks; i++) { 229040b4f539SKevin Wolf mcb->callbacks[i].cb(mcb->callbacks[i].opaque, mcb->error); 22911e1ea48dSStefan Hajnoczi if (mcb->callbacks[i].free_qiov) { 22921e1ea48dSStefan Hajnoczi qemu_iovec_destroy(mcb->callbacks[i].free_qiov); 22931e1ea48dSStefan Hajnoczi } 229440b4f539SKevin Wolf qemu_free(mcb->callbacks[i].free_qiov); 2295f8a83245SHerve Poussineau qemu_vfree(mcb->callbacks[i].free_buf); 229640b4f539SKevin Wolf } 229740b4f539SKevin Wolf } 229840b4f539SKevin Wolf 229940b4f539SKevin Wolf static void multiwrite_cb(void *opaque, int ret) 230040b4f539SKevin Wolf { 230140b4f539SKevin Wolf MultiwriteCB *mcb = opaque; 230240b4f539SKevin Wolf 23036d519a5fSStefan Hajnoczi trace_multiwrite_cb(mcb, ret); 23046d519a5fSStefan Hajnoczi 2305cb6d3ca0SKevin Wolf if (ret < 0 && !mcb->error) { 230640b4f539SKevin Wolf mcb->error = ret; 230740b4f539SKevin Wolf } 230840b4f539SKevin Wolf 230940b4f539SKevin Wolf mcb->num_requests--; 231040b4f539SKevin Wolf if (mcb->num_requests == 0) { 231140b4f539SKevin Wolf multiwrite_user_cb(mcb); 231240b4f539SKevin Wolf qemu_free(mcb); 231340b4f539SKevin Wolf } 231440b4f539SKevin Wolf } 231540b4f539SKevin Wolf 231640b4f539SKevin Wolf static int multiwrite_req_compare(const void *a, const void *b) 231740b4f539SKevin Wolf { 231877be4366SChristoph Hellwig const BlockRequest *req1 = a, *req2 = b; 231977be4366SChristoph Hellwig 232077be4366SChristoph Hellwig /* 232177be4366SChristoph Hellwig * Note that we can't simply subtract req2->sector from req1->sector 232277be4366SChristoph Hellwig * here as that could overflow the return value. 232377be4366SChristoph Hellwig */ 232477be4366SChristoph Hellwig if (req1->sector > req2->sector) { 232577be4366SChristoph Hellwig return 1; 232677be4366SChristoph Hellwig } else if (req1->sector < req2->sector) { 232777be4366SChristoph Hellwig return -1; 232877be4366SChristoph Hellwig } else { 232977be4366SChristoph Hellwig return 0; 233077be4366SChristoph Hellwig } 233140b4f539SKevin Wolf } 233240b4f539SKevin Wolf 233340b4f539SKevin Wolf /* 233440b4f539SKevin Wolf * Takes a bunch of requests and tries to merge them. Returns the number of 233540b4f539SKevin Wolf * requests that remain after merging. 233640b4f539SKevin Wolf */ 233740b4f539SKevin Wolf static int multiwrite_merge(BlockDriverState *bs, BlockRequest *reqs, 233840b4f539SKevin Wolf int num_reqs, MultiwriteCB *mcb) 233940b4f539SKevin Wolf { 234040b4f539SKevin Wolf int i, outidx; 234140b4f539SKevin Wolf 234240b4f539SKevin Wolf // Sort requests by start sector 234340b4f539SKevin Wolf qsort(reqs, num_reqs, sizeof(*reqs), &multiwrite_req_compare); 234440b4f539SKevin Wolf 234540b4f539SKevin Wolf // Check if adjacent requests touch the same clusters. If so, combine them, 234640b4f539SKevin Wolf // filling up gaps with zero sectors. 234740b4f539SKevin Wolf outidx = 0; 234840b4f539SKevin Wolf for (i = 1; i < num_reqs; i++) { 234940b4f539SKevin Wolf int merge = 0; 235040b4f539SKevin Wolf int64_t oldreq_last = reqs[outidx].sector + reqs[outidx].nb_sectors; 235140b4f539SKevin Wolf 235240b4f539SKevin Wolf // This handles the cases that are valid for all block drivers, namely 235340b4f539SKevin Wolf // exactly sequential writes and overlapping writes. 235440b4f539SKevin Wolf if (reqs[i].sector <= oldreq_last) { 235540b4f539SKevin Wolf merge = 1; 235640b4f539SKevin Wolf } 235740b4f539SKevin Wolf 235840b4f539SKevin Wolf // The block driver may decide that it makes sense to combine requests 235940b4f539SKevin Wolf // even if there is a gap of some sectors between them. In this case, 236040b4f539SKevin Wolf // the gap is filled with zeros (therefore only applicable for yet 236140b4f539SKevin Wolf // unused space in format like qcow2). 236240b4f539SKevin Wolf if (!merge && bs->drv->bdrv_merge_requests) { 236340b4f539SKevin Wolf merge = bs->drv->bdrv_merge_requests(bs, &reqs[outidx], &reqs[i]); 236440b4f539SKevin Wolf } 236540b4f539SKevin Wolf 2366e2a305fbSChristoph Hellwig if (reqs[outidx].qiov->niov + reqs[i].qiov->niov + 1 > IOV_MAX) { 2367e2a305fbSChristoph Hellwig merge = 0; 2368e2a305fbSChristoph Hellwig } 2369e2a305fbSChristoph Hellwig 237040b4f539SKevin Wolf if (merge) { 237140b4f539SKevin Wolf size_t size; 237240b4f539SKevin Wolf QEMUIOVector *qiov = qemu_mallocz(sizeof(*qiov)); 237340b4f539SKevin Wolf qemu_iovec_init(qiov, 237440b4f539SKevin Wolf reqs[outidx].qiov->niov + reqs[i].qiov->niov + 1); 237540b4f539SKevin Wolf 237640b4f539SKevin Wolf // Add the first request to the merged one. If the requests are 237740b4f539SKevin Wolf // overlapping, drop the last sectors of the first request. 237840b4f539SKevin Wolf size = (reqs[i].sector - reqs[outidx].sector) << 9; 237940b4f539SKevin Wolf qemu_iovec_concat(qiov, reqs[outidx].qiov, size); 238040b4f539SKevin Wolf 238140b4f539SKevin Wolf // We might need to add some zeros between the two requests 238240b4f539SKevin Wolf if (reqs[i].sector > oldreq_last) { 238340b4f539SKevin Wolf size_t zero_bytes = (reqs[i].sector - oldreq_last) << 9; 238440b4f539SKevin Wolf uint8_t *buf = qemu_blockalign(bs, zero_bytes); 238540b4f539SKevin Wolf memset(buf, 0, zero_bytes); 238640b4f539SKevin Wolf qemu_iovec_add(qiov, buf, zero_bytes); 238740b4f539SKevin Wolf mcb->callbacks[i].free_buf = buf; 238840b4f539SKevin Wolf } 238940b4f539SKevin Wolf 239040b4f539SKevin Wolf // Add the second request 239140b4f539SKevin Wolf qemu_iovec_concat(qiov, reqs[i].qiov, reqs[i].qiov->size); 239240b4f539SKevin Wolf 2393cbf1dff2SKevin Wolf reqs[outidx].nb_sectors = qiov->size >> 9; 239440b4f539SKevin Wolf reqs[outidx].qiov = qiov; 239540b4f539SKevin Wolf 239640b4f539SKevin Wolf mcb->callbacks[i].free_qiov = reqs[outidx].qiov; 239740b4f539SKevin Wolf } else { 239840b4f539SKevin Wolf outidx++; 239940b4f539SKevin Wolf reqs[outidx].sector = reqs[i].sector; 240040b4f539SKevin Wolf reqs[outidx].nb_sectors = reqs[i].nb_sectors; 240140b4f539SKevin Wolf reqs[outidx].qiov = reqs[i].qiov; 240240b4f539SKevin Wolf } 240340b4f539SKevin Wolf } 240440b4f539SKevin Wolf 240540b4f539SKevin Wolf return outidx + 1; 240640b4f539SKevin Wolf } 240740b4f539SKevin Wolf 240840b4f539SKevin Wolf /* 240940b4f539SKevin Wolf * Submit multiple AIO write requests at once. 241040b4f539SKevin Wolf * 241140b4f539SKevin Wolf * On success, the function returns 0 and all requests in the reqs array have 241240b4f539SKevin Wolf * been submitted. In error case this function returns -1, and any of the 241340b4f539SKevin Wolf * requests may or may not be submitted yet. In particular, this means that the 241440b4f539SKevin Wolf * callback will be called for some of the requests, for others it won't. The 241540b4f539SKevin Wolf * caller must check the error field of the BlockRequest to wait for the right 241640b4f539SKevin Wolf * callbacks (if error != 0, no callback will be called). 241740b4f539SKevin Wolf * 241840b4f539SKevin Wolf * The implementation may modify the contents of the reqs array, e.g. to merge 241940b4f539SKevin Wolf * requests. However, the fields opaque and error are left unmodified as they 242040b4f539SKevin Wolf * are used to signal failure for a single request to the caller. 242140b4f539SKevin Wolf */ 242240b4f539SKevin Wolf int bdrv_aio_multiwrite(BlockDriverState *bs, BlockRequest *reqs, int num_reqs) 242340b4f539SKevin Wolf { 242440b4f539SKevin Wolf BlockDriverAIOCB *acb; 242540b4f539SKevin Wolf MultiwriteCB *mcb; 242640b4f539SKevin Wolf int i; 242740b4f539SKevin Wolf 2428301db7c2SRyan Harper /* don't submit writes if we don't have a medium */ 2429301db7c2SRyan Harper if (bs->drv == NULL) { 2430301db7c2SRyan Harper for (i = 0; i < num_reqs; i++) { 2431301db7c2SRyan Harper reqs[i].error = -ENOMEDIUM; 2432301db7c2SRyan Harper } 2433301db7c2SRyan Harper return -1; 2434301db7c2SRyan Harper } 2435301db7c2SRyan Harper 243640b4f539SKevin Wolf if (num_reqs == 0) { 243740b4f539SKevin Wolf return 0; 243840b4f539SKevin Wolf } 243940b4f539SKevin Wolf 244040b4f539SKevin Wolf // Create MultiwriteCB structure 244140b4f539SKevin Wolf mcb = qemu_mallocz(sizeof(*mcb) + num_reqs * sizeof(*mcb->callbacks)); 244240b4f539SKevin Wolf mcb->num_requests = 0; 244340b4f539SKevin Wolf mcb->num_callbacks = num_reqs; 244440b4f539SKevin Wolf 244540b4f539SKevin Wolf for (i = 0; i < num_reqs; i++) { 244640b4f539SKevin Wolf mcb->callbacks[i].cb = reqs[i].cb; 244740b4f539SKevin Wolf mcb->callbacks[i].opaque = reqs[i].opaque; 244840b4f539SKevin Wolf } 244940b4f539SKevin Wolf 245040b4f539SKevin Wolf // Check for mergable requests 245140b4f539SKevin Wolf num_reqs = multiwrite_merge(bs, reqs, num_reqs, mcb); 245240b4f539SKevin Wolf 24536d519a5fSStefan Hajnoczi trace_bdrv_aio_multiwrite(mcb, mcb->num_callbacks, num_reqs); 24546d519a5fSStefan Hajnoczi 2455453f9a16SKevin Wolf /* 2456453f9a16SKevin Wolf * Run the aio requests. As soon as one request can't be submitted 2457453f9a16SKevin Wolf * successfully, fail all requests that are not yet submitted (we must 2458453f9a16SKevin Wolf * return failure for all requests anyway) 2459453f9a16SKevin Wolf * 2460453f9a16SKevin Wolf * num_requests cannot be set to the right value immediately: If 2461453f9a16SKevin Wolf * bdrv_aio_writev fails for some request, num_requests would be too high 2462453f9a16SKevin Wolf * and therefore multiwrite_cb() would never recognize the multiwrite 2463453f9a16SKevin Wolf * request as completed. We also cannot use the loop variable i to set it 2464453f9a16SKevin Wolf * when the first request fails because the callback may already have been 2465453f9a16SKevin Wolf * called for previously submitted requests. Thus, num_requests must be 2466453f9a16SKevin Wolf * incremented for each request that is submitted. 2467453f9a16SKevin Wolf * 2468453f9a16SKevin Wolf * The problem that callbacks may be called early also means that we need 2469453f9a16SKevin Wolf * to take care that num_requests doesn't become 0 before all requests are 2470453f9a16SKevin Wolf * submitted - multiwrite_cb() would consider the multiwrite request 2471453f9a16SKevin Wolf * completed. A dummy request that is "completed" by a manual call to 2472453f9a16SKevin Wolf * multiwrite_cb() takes care of this. 2473453f9a16SKevin Wolf */ 2474453f9a16SKevin Wolf mcb->num_requests = 1; 2475453f9a16SKevin Wolf 24766d519a5fSStefan Hajnoczi // Run the aio requests 247740b4f539SKevin Wolf for (i = 0; i < num_reqs; i++) { 2478453f9a16SKevin Wolf mcb->num_requests++; 247940b4f539SKevin Wolf acb = bdrv_aio_writev(bs, reqs[i].sector, reqs[i].qiov, 248040b4f539SKevin Wolf reqs[i].nb_sectors, multiwrite_cb, mcb); 248140b4f539SKevin Wolf 248240b4f539SKevin Wolf if (acb == NULL) { 248340b4f539SKevin Wolf // We can only fail the whole thing if no request has been 248440b4f539SKevin Wolf // submitted yet. Otherwise we'll wait for the submitted AIOs to 248540b4f539SKevin Wolf // complete and report the error in the callback. 2486453f9a16SKevin Wolf if (i == 0) { 24876d519a5fSStefan Hajnoczi trace_bdrv_aio_multiwrite_earlyfail(mcb); 248840b4f539SKevin Wolf goto fail; 248940b4f539SKevin Wolf } else { 24906d519a5fSStefan Hajnoczi trace_bdrv_aio_multiwrite_latefail(mcb, i); 24917eb58a6cSKevin Wolf multiwrite_cb(mcb, -EIO); 249240b4f539SKevin Wolf break; 249340b4f539SKevin Wolf } 249440b4f539SKevin Wolf } 249540b4f539SKevin Wolf } 249640b4f539SKevin Wolf 2497453f9a16SKevin Wolf /* Complete the dummy request */ 2498453f9a16SKevin Wolf multiwrite_cb(mcb, 0); 2499453f9a16SKevin Wolf 250040b4f539SKevin Wolf return 0; 250140b4f539SKevin Wolf 250240b4f539SKevin Wolf fail: 2503453f9a16SKevin Wolf for (i = 0; i < mcb->num_callbacks; i++) { 2504453f9a16SKevin Wolf reqs[i].error = -EIO; 2505453f9a16SKevin Wolf } 2506af474591SBruce Rogers qemu_free(mcb); 250740b4f539SKevin Wolf return -1; 250840b4f539SKevin Wolf } 250940b4f539SKevin Wolf 2510b2e12bc6SChristoph Hellwig BlockDriverAIOCB *bdrv_aio_flush(BlockDriverState *bs, 2511b2e12bc6SChristoph Hellwig BlockDriverCompletionFunc *cb, void *opaque) 2512b2e12bc6SChristoph Hellwig { 2513b2e12bc6SChristoph Hellwig BlockDriver *drv = bs->drv; 2514b2e12bc6SChristoph Hellwig 2515a13aac04SStefan Hajnoczi trace_bdrv_aio_flush(bs, opaque); 2516a13aac04SStefan Hajnoczi 2517016f5cf6SAlexander Graf if (bs->open_flags & BDRV_O_NO_FLUSH) { 2518016f5cf6SAlexander Graf return bdrv_aio_noop_em(bs, cb, opaque); 2519016f5cf6SAlexander Graf } 2520016f5cf6SAlexander Graf 2521b2e12bc6SChristoph Hellwig if (!drv) 2522b2e12bc6SChristoph Hellwig return NULL; 2523b2e12bc6SChristoph Hellwig return drv->bdrv_aio_flush(bs, cb, opaque); 2524b2e12bc6SChristoph Hellwig } 2525b2e12bc6SChristoph Hellwig 252683f64091Sbellard void bdrv_aio_cancel(BlockDriverAIOCB *acb) 252783f64091Sbellard { 25286bbff9a0Saliguori acb->pool->cancel(acb); 252983f64091Sbellard } 253083f64091Sbellard 253183f64091Sbellard 253283f64091Sbellard /**************************************************************/ 253383f64091Sbellard /* async block device emulation */ 253483f64091Sbellard 2535c16b5a2cSChristoph Hellwig typedef struct BlockDriverAIOCBSync { 2536c16b5a2cSChristoph Hellwig BlockDriverAIOCB common; 2537c16b5a2cSChristoph Hellwig QEMUBH *bh; 2538c16b5a2cSChristoph Hellwig int ret; 2539c16b5a2cSChristoph Hellwig /* vector translation state */ 2540c16b5a2cSChristoph Hellwig QEMUIOVector *qiov; 2541c16b5a2cSChristoph Hellwig uint8_t *bounce; 2542c16b5a2cSChristoph Hellwig int is_write; 2543c16b5a2cSChristoph Hellwig } BlockDriverAIOCBSync; 2544c16b5a2cSChristoph Hellwig 2545c16b5a2cSChristoph Hellwig static void bdrv_aio_cancel_em(BlockDriverAIOCB *blockacb) 2546c16b5a2cSChristoph Hellwig { 2547b666d239SKevin Wolf BlockDriverAIOCBSync *acb = 2548b666d239SKevin Wolf container_of(blockacb, BlockDriverAIOCBSync, common); 25496a7ad299SDor Laor qemu_bh_delete(acb->bh); 255036afc451SAvi Kivity acb->bh = NULL; 2551c16b5a2cSChristoph Hellwig qemu_aio_release(acb); 2552c16b5a2cSChristoph Hellwig } 2553c16b5a2cSChristoph Hellwig 2554c16b5a2cSChristoph Hellwig static AIOPool bdrv_em_aio_pool = { 2555c16b5a2cSChristoph Hellwig .aiocb_size = sizeof(BlockDriverAIOCBSync), 2556c16b5a2cSChristoph Hellwig .cancel = bdrv_aio_cancel_em, 2557c16b5a2cSChristoph Hellwig }; 2558c16b5a2cSChristoph Hellwig 255983f64091Sbellard static void bdrv_aio_bh_cb(void *opaque) 2560beac80cdSbellard { 2561ce1a14dcSpbrook BlockDriverAIOCBSync *acb = opaque; 2562f141eafeSaliguori 2563f141eafeSaliguori if (!acb->is_write) 2564f141eafeSaliguori qemu_iovec_from_buffer(acb->qiov, acb->bounce, acb->qiov->size); 2565ceb42de8Saliguori qemu_vfree(acb->bounce); 2566ce1a14dcSpbrook acb->common.cb(acb->common.opaque, acb->ret); 25676a7ad299SDor Laor qemu_bh_delete(acb->bh); 256836afc451SAvi Kivity acb->bh = NULL; 2569ce1a14dcSpbrook qemu_aio_release(acb); 2570beac80cdSbellard } 2571beac80cdSbellard 2572f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_rw_vector(BlockDriverState *bs, 2573f141eafeSaliguori int64_t sector_num, 2574f141eafeSaliguori QEMUIOVector *qiov, 2575f141eafeSaliguori int nb_sectors, 2576f141eafeSaliguori BlockDriverCompletionFunc *cb, 2577f141eafeSaliguori void *opaque, 2578f141eafeSaliguori int is_write) 2579f141eafeSaliguori 2580ea2384d3Sbellard { 2581ce1a14dcSpbrook BlockDriverAIOCBSync *acb; 258283f64091Sbellard 2583c16b5a2cSChristoph Hellwig acb = qemu_aio_get(&bdrv_em_aio_pool, bs, cb, opaque); 2584f141eafeSaliguori acb->is_write = is_write; 2585f141eafeSaliguori acb->qiov = qiov; 2586e268ca52Saliguori acb->bounce = qemu_blockalign(bs, qiov->size); 2587f141eafeSaliguori 2588ce1a14dcSpbrook if (!acb->bh) 2589ce1a14dcSpbrook acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb); 2590f141eafeSaliguori 2591f141eafeSaliguori if (is_write) { 2592f141eafeSaliguori qemu_iovec_to_buffer(acb->qiov, acb->bounce); 2593f141eafeSaliguori acb->ret = bdrv_write(bs, sector_num, acb->bounce, nb_sectors); 2594f141eafeSaliguori } else { 2595f141eafeSaliguori acb->ret = bdrv_read(bs, sector_num, acb->bounce, nb_sectors); 2596f141eafeSaliguori } 2597f141eafeSaliguori 2598ce1a14dcSpbrook qemu_bh_schedule(acb->bh); 2599f141eafeSaliguori 2600ce1a14dcSpbrook return &acb->common; 26017a6cba61Spbrook } 26027a6cba61Spbrook 2603f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_readv_em(BlockDriverState *bs, 2604f141eafeSaliguori int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, 2605ce1a14dcSpbrook BlockDriverCompletionFunc *cb, void *opaque) 260683f64091Sbellard { 2607f141eafeSaliguori return bdrv_aio_rw_vector(bs, sector_num, qiov, nb_sectors, cb, opaque, 0); 260883f64091Sbellard } 260983f64091Sbellard 2610f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_writev_em(BlockDriverState *bs, 2611f141eafeSaliguori int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, 2612f141eafeSaliguori BlockDriverCompletionFunc *cb, void *opaque) 2613f141eafeSaliguori { 2614f141eafeSaliguori return bdrv_aio_rw_vector(bs, sector_num, qiov, nb_sectors, cb, opaque, 1); 2615f141eafeSaliguori } 2616f141eafeSaliguori 2617b2e12bc6SChristoph Hellwig static BlockDriverAIOCB *bdrv_aio_flush_em(BlockDriverState *bs, 2618b2e12bc6SChristoph Hellwig BlockDriverCompletionFunc *cb, void *opaque) 2619b2e12bc6SChristoph Hellwig { 2620b2e12bc6SChristoph Hellwig BlockDriverAIOCBSync *acb; 2621b2e12bc6SChristoph Hellwig 2622b2e12bc6SChristoph Hellwig acb = qemu_aio_get(&bdrv_em_aio_pool, bs, cb, opaque); 2623b2e12bc6SChristoph Hellwig acb->is_write = 1; /* don't bounce in the completion hadler */ 2624b2e12bc6SChristoph Hellwig acb->qiov = NULL; 2625b2e12bc6SChristoph Hellwig acb->bounce = NULL; 2626b2e12bc6SChristoph Hellwig acb->ret = 0; 2627b2e12bc6SChristoph Hellwig 2628b2e12bc6SChristoph Hellwig if (!acb->bh) 2629b2e12bc6SChristoph Hellwig acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb); 2630b2e12bc6SChristoph Hellwig 2631b2e12bc6SChristoph Hellwig bdrv_flush(bs); 2632b2e12bc6SChristoph Hellwig qemu_bh_schedule(acb->bh); 2633b2e12bc6SChristoph Hellwig return &acb->common; 2634b2e12bc6SChristoph Hellwig } 2635b2e12bc6SChristoph Hellwig 2636016f5cf6SAlexander Graf static BlockDriverAIOCB *bdrv_aio_noop_em(BlockDriverState *bs, 2637016f5cf6SAlexander Graf BlockDriverCompletionFunc *cb, void *opaque) 2638016f5cf6SAlexander Graf { 2639016f5cf6SAlexander Graf BlockDriverAIOCBSync *acb; 2640016f5cf6SAlexander Graf 2641016f5cf6SAlexander Graf acb = qemu_aio_get(&bdrv_em_aio_pool, bs, cb, opaque); 2642016f5cf6SAlexander Graf acb->is_write = 1; /* don't bounce in the completion handler */ 2643016f5cf6SAlexander Graf acb->qiov = NULL; 2644016f5cf6SAlexander Graf acb->bounce = NULL; 2645016f5cf6SAlexander Graf acb->ret = 0; 2646016f5cf6SAlexander Graf 2647016f5cf6SAlexander Graf if (!acb->bh) { 2648016f5cf6SAlexander Graf acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb); 2649016f5cf6SAlexander Graf } 2650016f5cf6SAlexander Graf 2651016f5cf6SAlexander Graf qemu_bh_schedule(acb->bh); 2652016f5cf6SAlexander Graf return &acb->common; 2653016f5cf6SAlexander Graf } 2654016f5cf6SAlexander Graf 265583f64091Sbellard /**************************************************************/ 265683f64091Sbellard /* sync block device emulation */ 265783f64091Sbellard 265883f64091Sbellard static void bdrv_rw_em_cb(void *opaque, int ret) 265983f64091Sbellard { 266083f64091Sbellard *(int *)opaque = ret; 266183f64091Sbellard } 266283f64091Sbellard 266383f64091Sbellard #define NOT_DONE 0x7fffffff 266483f64091Sbellard 266583f64091Sbellard static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num, 266683f64091Sbellard uint8_t *buf, int nb_sectors) 266783f64091Sbellard { 2668ce1a14dcSpbrook int async_ret; 2669ce1a14dcSpbrook BlockDriverAIOCB *acb; 2670f141eafeSaliguori struct iovec iov; 2671f141eafeSaliguori QEMUIOVector qiov; 267283f64091Sbellard 267365d6b3d8SKevin Wolf async_context_push(); 267465d6b3d8SKevin Wolf 267583f64091Sbellard async_ret = NOT_DONE; 26763f4cb3d3Sblueswir1 iov.iov_base = (void *)buf; 2677eb5a3165SJes Sorensen iov.iov_len = nb_sectors * BDRV_SECTOR_SIZE; 2678f141eafeSaliguori qemu_iovec_init_external(&qiov, &iov, 1); 2679f141eafeSaliguori acb = bdrv_aio_readv(bs, sector_num, &qiov, nb_sectors, 268083f64091Sbellard bdrv_rw_em_cb, &async_ret); 268165d6b3d8SKevin Wolf if (acb == NULL) { 268265d6b3d8SKevin Wolf async_ret = -1; 268365d6b3d8SKevin Wolf goto fail; 268465d6b3d8SKevin Wolf } 2685baf35cb9Saliguori 268683f64091Sbellard while (async_ret == NOT_DONE) { 268783f64091Sbellard qemu_aio_wait(); 268883f64091Sbellard } 2689baf35cb9Saliguori 269065d6b3d8SKevin Wolf 269165d6b3d8SKevin Wolf fail: 269265d6b3d8SKevin Wolf async_context_pop(); 269383f64091Sbellard return async_ret; 269483f64091Sbellard } 269583f64091Sbellard 269683f64091Sbellard static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num, 269783f64091Sbellard const uint8_t *buf, int nb_sectors) 269883f64091Sbellard { 2699ce1a14dcSpbrook int async_ret; 2700ce1a14dcSpbrook BlockDriverAIOCB *acb; 2701f141eafeSaliguori struct iovec iov; 2702f141eafeSaliguori QEMUIOVector qiov; 270383f64091Sbellard 270465d6b3d8SKevin Wolf async_context_push(); 270565d6b3d8SKevin Wolf 270683f64091Sbellard async_ret = NOT_DONE; 2707f141eafeSaliguori iov.iov_base = (void *)buf; 2708eb5a3165SJes Sorensen iov.iov_len = nb_sectors * BDRV_SECTOR_SIZE; 2709f141eafeSaliguori qemu_iovec_init_external(&qiov, &iov, 1); 2710f141eafeSaliguori acb = bdrv_aio_writev(bs, sector_num, &qiov, nb_sectors, 271183f64091Sbellard bdrv_rw_em_cb, &async_ret); 271265d6b3d8SKevin Wolf if (acb == NULL) { 271365d6b3d8SKevin Wolf async_ret = -1; 271465d6b3d8SKevin Wolf goto fail; 271565d6b3d8SKevin Wolf } 271683f64091Sbellard while (async_ret == NOT_DONE) { 271783f64091Sbellard qemu_aio_wait(); 271883f64091Sbellard } 271965d6b3d8SKevin Wolf 272065d6b3d8SKevin Wolf fail: 272165d6b3d8SKevin Wolf async_context_pop(); 272283f64091Sbellard return async_ret; 272383f64091Sbellard } 2724ea2384d3Sbellard 2725ea2384d3Sbellard void bdrv_init(void) 2726ea2384d3Sbellard { 27275efa9d5aSAnthony Liguori module_call_init(MODULE_INIT_BLOCK); 2728ea2384d3Sbellard } 2729ce1a14dcSpbrook 2730eb852011SMarkus Armbruster void bdrv_init_with_whitelist(void) 2731eb852011SMarkus Armbruster { 2732eb852011SMarkus Armbruster use_bdrv_whitelist = 1; 2733eb852011SMarkus Armbruster bdrv_init(); 2734eb852011SMarkus Armbruster } 2735eb852011SMarkus Armbruster 2736c16b5a2cSChristoph Hellwig void *qemu_aio_get(AIOPool *pool, BlockDriverState *bs, 27376bbff9a0Saliguori BlockDriverCompletionFunc *cb, void *opaque) 27386bbff9a0Saliguori { 2739ce1a14dcSpbrook BlockDriverAIOCB *acb; 2740ce1a14dcSpbrook 27416bbff9a0Saliguori if (pool->free_aiocb) { 27426bbff9a0Saliguori acb = pool->free_aiocb; 27436bbff9a0Saliguori pool->free_aiocb = acb->next; 2744ce1a14dcSpbrook } else { 27456bbff9a0Saliguori acb = qemu_mallocz(pool->aiocb_size); 27466bbff9a0Saliguori acb->pool = pool; 2747ce1a14dcSpbrook } 2748ce1a14dcSpbrook acb->bs = bs; 2749ce1a14dcSpbrook acb->cb = cb; 2750ce1a14dcSpbrook acb->opaque = opaque; 2751ce1a14dcSpbrook return acb; 2752ce1a14dcSpbrook } 2753ce1a14dcSpbrook 2754ce1a14dcSpbrook void qemu_aio_release(void *p) 2755ce1a14dcSpbrook { 27566bbff9a0Saliguori BlockDriverAIOCB *acb = (BlockDriverAIOCB *)p; 27576bbff9a0Saliguori AIOPool *pool = acb->pool; 27586bbff9a0Saliguori acb->next = pool->free_aiocb; 27596bbff9a0Saliguori pool->free_aiocb = acb; 2760ce1a14dcSpbrook } 276119cb3738Sbellard 276219cb3738Sbellard /**************************************************************/ 276319cb3738Sbellard /* removable device support */ 276419cb3738Sbellard 276519cb3738Sbellard /** 276619cb3738Sbellard * Return TRUE if the media is present 276719cb3738Sbellard */ 276819cb3738Sbellard int bdrv_is_inserted(BlockDriverState *bs) 276919cb3738Sbellard { 277019cb3738Sbellard BlockDriver *drv = bs->drv; 277119cb3738Sbellard int ret; 277219cb3738Sbellard if (!drv) 277319cb3738Sbellard return 0; 277419cb3738Sbellard if (!drv->bdrv_is_inserted) 27754be9762aSMarkus Armbruster return !bs->tray_open; 277619cb3738Sbellard ret = drv->bdrv_is_inserted(bs); 277719cb3738Sbellard return ret; 277819cb3738Sbellard } 277919cb3738Sbellard 278019cb3738Sbellard /** 278119cb3738Sbellard * Return TRUE if the media changed since the last call to this 278219cb3738Sbellard * function. It is currently only used for floppy disks 278319cb3738Sbellard */ 278419cb3738Sbellard int bdrv_media_changed(BlockDriverState *bs) 278519cb3738Sbellard { 278619cb3738Sbellard BlockDriver *drv = bs->drv; 278719cb3738Sbellard int ret; 278819cb3738Sbellard 278919cb3738Sbellard if (!drv || !drv->bdrv_media_changed) 279019cb3738Sbellard ret = -ENOTSUP; 279119cb3738Sbellard else 279219cb3738Sbellard ret = drv->bdrv_media_changed(bs); 279319cb3738Sbellard if (ret == -ENOTSUP) 279419cb3738Sbellard ret = bs->media_changed; 279519cb3738Sbellard bs->media_changed = 0; 279619cb3738Sbellard return ret; 279719cb3738Sbellard } 279819cb3738Sbellard 279919cb3738Sbellard /** 280019cb3738Sbellard * If eject_flag is TRUE, eject the media. Otherwise, close the tray 280119cb3738Sbellard */ 2802aea2a33cSMark McLoughlin int bdrv_eject(BlockDriverState *bs, int eject_flag) 280319cb3738Sbellard { 280419cb3738Sbellard BlockDriver *drv = bs->drv; 280519cb3738Sbellard 280649aa46bbSMarkus Armbruster if (eject_flag && bs->locked) { 2807aea2a33cSMark McLoughlin return -EBUSY; 2808aea2a33cSMark McLoughlin } 2809aea2a33cSMark McLoughlin 2810822e1cd1SMarkus Armbruster if (drv && drv->bdrv_eject) { 2811822e1cd1SMarkus Armbruster drv->bdrv_eject(bs, eject_flag); 281219cb3738Sbellard } 28134be9762aSMarkus Armbruster bs->tray_open = eject_flag; 2814822e1cd1SMarkus Armbruster return 0; 281519cb3738Sbellard } 281619cb3738Sbellard 281719cb3738Sbellard int bdrv_is_locked(BlockDriverState *bs) 281819cb3738Sbellard { 281919cb3738Sbellard return bs->locked; 282019cb3738Sbellard } 282119cb3738Sbellard 282219cb3738Sbellard /** 282319cb3738Sbellard * Lock or unlock the media (if it is locked, the user won't be able 282419cb3738Sbellard * to eject it manually). 282519cb3738Sbellard */ 282619cb3738Sbellard void bdrv_set_locked(BlockDriverState *bs, int locked) 282719cb3738Sbellard { 282819cb3738Sbellard BlockDriver *drv = bs->drv; 282919cb3738Sbellard 2830b8c6d095SStefan Hajnoczi trace_bdrv_set_locked(bs, locked); 2831b8c6d095SStefan Hajnoczi 283219cb3738Sbellard bs->locked = locked; 283319cb3738Sbellard if (drv && drv->bdrv_set_locked) { 283419cb3738Sbellard drv->bdrv_set_locked(bs, locked); 283519cb3738Sbellard } 283619cb3738Sbellard } 2837985a03b0Sths 2838985a03b0Sths /* needed for generic scsi interface */ 2839985a03b0Sths 2840985a03b0Sths int bdrv_ioctl(BlockDriverState *bs, unsigned long int req, void *buf) 2841985a03b0Sths { 2842985a03b0Sths BlockDriver *drv = bs->drv; 2843985a03b0Sths 2844985a03b0Sths if (drv && drv->bdrv_ioctl) 2845985a03b0Sths return drv->bdrv_ioctl(bs, req, buf); 2846985a03b0Sths return -ENOTSUP; 2847985a03b0Sths } 28487d780669Saliguori 2849221f715dSaliguori BlockDriverAIOCB *bdrv_aio_ioctl(BlockDriverState *bs, 2850221f715dSaliguori unsigned long int req, void *buf, 28517d780669Saliguori BlockDriverCompletionFunc *cb, void *opaque) 28527d780669Saliguori { 2853221f715dSaliguori BlockDriver *drv = bs->drv; 28547d780669Saliguori 2855221f715dSaliguori if (drv && drv->bdrv_aio_ioctl) 2856221f715dSaliguori return drv->bdrv_aio_ioctl(bs, req, buf, cb, opaque); 2857221f715dSaliguori return NULL; 28587d780669Saliguori } 2859e268ca52Saliguori 28607cd1e32aSlirans@il.ibm.com 28617cd1e32aSlirans@il.ibm.com 2862e268ca52Saliguori void *qemu_blockalign(BlockDriverState *bs, size_t size) 2863e268ca52Saliguori { 2864e268ca52Saliguori return qemu_memalign((bs && bs->buffer_alignment) ? bs->buffer_alignment : 512, size); 2865e268ca52Saliguori } 28667cd1e32aSlirans@il.ibm.com 28677cd1e32aSlirans@il.ibm.com void bdrv_set_dirty_tracking(BlockDriverState *bs, int enable) 28687cd1e32aSlirans@il.ibm.com { 28697cd1e32aSlirans@il.ibm.com int64_t bitmap_size; 2870a55eb92cSJan Kiszka 2871aaa0eb75SLiran Schour bs->dirty_count = 0; 28727cd1e32aSlirans@il.ibm.com if (enable) { 2873c6d22830SJan Kiszka if (!bs->dirty_bitmap) { 2874c6d22830SJan Kiszka bitmap_size = (bdrv_getlength(bs) >> BDRV_SECTOR_BITS) + 2875c6d22830SJan Kiszka BDRV_SECTORS_PER_DIRTY_CHUNK * 8 - 1; 2876c6d22830SJan Kiszka bitmap_size /= BDRV_SECTORS_PER_DIRTY_CHUNK * 8; 28777cd1e32aSlirans@il.ibm.com 28787cd1e32aSlirans@il.ibm.com bs->dirty_bitmap = qemu_mallocz(bitmap_size); 28797cd1e32aSlirans@il.ibm.com } 28807cd1e32aSlirans@il.ibm.com } else { 2881c6d22830SJan Kiszka if (bs->dirty_bitmap) { 28827cd1e32aSlirans@il.ibm.com qemu_free(bs->dirty_bitmap); 2883c6d22830SJan Kiszka bs->dirty_bitmap = NULL; 28847cd1e32aSlirans@il.ibm.com } 28857cd1e32aSlirans@il.ibm.com } 28867cd1e32aSlirans@il.ibm.com } 28877cd1e32aSlirans@il.ibm.com 28887cd1e32aSlirans@il.ibm.com int bdrv_get_dirty(BlockDriverState *bs, int64_t sector) 28897cd1e32aSlirans@il.ibm.com { 28906ea44308SJan Kiszka int64_t chunk = sector / (int64_t)BDRV_SECTORS_PER_DIRTY_CHUNK; 28917cd1e32aSlirans@il.ibm.com 2892c6d22830SJan Kiszka if (bs->dirty_bitmap && 2893c6d22830SJan Kiszka (sector << BDRV_SECTOR_BITS) < bdrv_getlength(bs)) { 28946d59fec1SMarcelo Tosatti return !!(bs->dirty_bitmap[chunk / (sizeof(unsigned long) * 8)] & 28956d59fec1SMarcelo Tosatti (1UL << (chunk % (sizeof(unsigned long) * 8)))); 28967cd1e32aSlirans@il.ibm.com } else { 28977cd1e32aSlirans@il.ibm.com return 0; 28987cd1e32aSlirans@il.ibm.com } 28997cd1e32aSlirans@il.ibm.com } 29007cd1e32aSlirans@il.ibm.com 29017cd1e32aSlirans@il.ibm.com void bdrv_reset_dirty(BlockDriverState *bs, int64_t cur_sector, 29027cd1e32aSlirans@il.ibm.com int nr_sectors) 29037cd1e32aSlirans@il.ibm.com { 29047cd1e32aSlirans@il.ibm.com set_dirty_bitmap(bs, cur_sector, nr_sectors, 0); 29057cd1e32aSlirans@il.ibm.com } 2906aaa0eb75SLiran Schour 2907aaa0eb75SLiran Schour int64_t bdrv_get_dirty_count(BlockDriverState *bs) 2908aaa0eb75SLiran Schour { 2909aaa0eb75SLiran Schour return bs->dirty_count; 2910aaa0eb75SLiran Schour } 2911f88e1a42SJes Sorensen 2912db593f25SMarcelo Tosatti void bdrv_set_in_use(BlockDriverState *bs, int in_use) 2913db593f25SMarcelo Tosatti { 2914db593f25SMarcelo Tosatti assert(bs->in_use != in_use); 2915db593f25SMarcelo Tosatti bs->in_use = in_use; 2916db593f25SMarcelo Tosatti } 2917db593f25SMarcelo Tosatti 2918db593f25SMarcelo Tosatti int bdrv_in_use(BlockDriverState *bs) 2919db593f25SMarcelo Tosatti { 2920db593f25SMarcelo Tosatti return bs->in_use; 2921db593f25SMarcelo Tosatti } 2922db593f25SMarcelo Tosatti 2923f88e1a42SJes Sorensen int bdrv_img_create(const char *filename, const char *fmt, 2924f88e1a42SJes Sorensen const char *base_filename, const char *base_fmt, 2925f88e1a42SJes Sorensen char *options, uint64_t img_size, int flags) 2926f88e1a42SJes Sorensen { 2927f88e1a42SJes Sorensen QEMUOptionParameter *param = NULL, *create_options = NULL; 2928d220894eSKevin Wolf QEMUOptionParameter *backing_fmt, *backing_file, *size; 2929f88e1a42SJes Sorensen BlockDriverState *bs = NULL; 2930f88e1a42SJes Sorensen BlockDriver *drv, *proto_drv; 293196df67d1SStefan Hajnoczi BlockDriver *backing_drv = NULL; 2932f88e1a42SJes Sorensen int ret = 0; 2933f88e1a42SJes Sorensen 2934f88e1a42SJes Sorensen /* Find driver and parse its options */ 2935f88e1a42SJes Sorensen drv = bdrv_find_format(fmt); 2936f88e1a42SJes Sorensen if (!drv) { 2937f88e1a42SJes Sorensen error_report("Unknown file format '%s'", fmt); 29384f70f249SJes Sorensen ret = -EINVAL; 2939f88e1a42SJes Sorensen goto out; 2940f88e1a42SJes Sorensen } 2941f88e1a42SJes Sorensen 2942f88e1a42SJes Sorensen proto_drv = bdrv_find_protocol(filename); 2943f88e1a42SJes Sorensen if (!proto_drv) { 2944f88e1a42SJes Sorensen error_report("Unknown protocol '%s'", filename); 29454f70f249SJes Sorensen ret = -EINVAL; 2946f88e1a42SJes Sorensen goto out; 2947f88e1a42SJes Sorensen } 2948f88e1a42SJes Sorensen 2949f88e1a42SJes Sorensen create_options = append_option_parameters(create_options, 2950f88e1a42SJes Sorensen drv->create_options); 2951f88e1a42SJes Sorensen create_options = append_option_parameters(create_options, 2952f88e1a42SJes Sorensen proto_drv->create_options); 2953f88e1a42SJes Sorensen 2954f88e1a42SJes Sorensen /* Create parameter list with default values */ 2955f88e1a42SJes Sorensen param = parse_option_parameters("", create_options, param); 2956f88e1a42SJes Sorensen 2957f88e1a42SJes Sorensen set_option_parameter_int(param, BLOCK_OPT_SIZE, img_size); 2958f88e1a42SJes Sorensen 2959f88e1a42SJes Sorensen /* Parse -o options */ 2960f88e1a42SJes Sorensen if (options) { 2961f88e1a42SJes Sorensen param = parse_option_parameters(options, create_options, param); 2962f88e1a42SJes Sorensen if (param == NULL) { 2963f88e1a42SJes Sorensen error_report("Invalid options for file format '%s'.", fmt); 29644f70f249SJes Sorensen ret = -EINVAL; 2965f88e1a42SJes Sorensen goto out; 2966f88e1a42SJes Sorensen } 2967f88e1a42SJes Sorensen } 2968f88e1a42SJes Sorensen 2969f88e1a42SJes Sorensen if (base_filename) { 2970f88e1a42SJes Sorensen if (set_option_parameter(param, BLOCK_OPT_BACKING_FILE, 2971f88e1a42SJes Sorensen base_filename)) { 2972f88e1a42SJes Sorensen error_report("Backing file not supported for file format '%s'", 2973f88e1a42SJes Sorensen fmt); 29744f70f249SJes Sorensen ret = -EINVAL; 2975f88e1a42SJes Sorensen goto out; 2976f88e1a42SJes Sorensen } 2977f88e1a42SJes Sorensen } 2978f88e1a42SJes Sorensen 2979f88e1a42SJes Sorensen if (base_fmt) { 2980f88e1a42SJes Sorensen if (set_option_parameter(param, BLOCK_OPT_BACKING_FMT, base_fmt)) { 2981f88e1a42SJes Sorensen error_report("Backing file format not supported for file " 2982f88e1a42SJes Sorensen "format '%s'", fmt); 29834f70f249SJes Sorensen ret = -EINVAL; 2984f88e1a42SJes Sorensen goto out; 2985f88e1a42SJes Sorensen } 2986f88e1a42SJes Sorensen } 2987f88e1a42SJes Sorensen 2988792da93aSJes Sorensen backing_file = get_option_parameter(param, BLOCK_OPT_BACKING_FILE); 2989792da93aSJes Sorensen if (backing_file && backing_file->value.s) { 2990792da93aSJes Sorensen if (!strcmp(filename, backing_file->value.s)) { 2991792da93aSJes Sorensen error_report("Error: Trying to create an image with the " 2992792da93aSJes Sorensen "same filename as the backing file"); 29934f70f249SJes Sorensen ret = -EINVAL; 2994792da93aSJes Sorensen goto out; 2995792da93aSJes Sorensen } 2996792da93aSJes Sorensen } 2997792da93aSJes Sorensen 2998f88e1a42SJes Sorensen backing_fmt = get_option_parameter(param, BLOCK_OPT_BACKING_FMT); 2999f88e1a42SJes Sorensen if (backing_fmt && backing_fmt->value.s) { 300096df67d1SStefan Hajnoczi backing_drv = bdrv_find_format(backing_fmt->value.s); 300196df67d1SStefan Hajnoczi if (!backing_drv) { 3002f88e1a42SJes Sorensen error_report("Unknown backing file format '%s'", 3003f88e1a42SJes Sorensen backing_fmt->value.s); 30044f70f249SJes Sorensen ret = -EINVAL; 3005f88e1a42SJes Sorensen goto out; 3006f88e1a42SJes Sorensen } 3007f88e1a42SJes Sorensen } 3008f88e1a42SJes Sorensen 3009f88e1a42SJes Sorensen // The size for the image must always be specified, with one exception: 3010f88e1a42SJes Sorensen // If we are using a backing file, we can obtain the size from there 3011d220894eSKevin Wolf size = get_option_parameter(param, BLOCK_OPT_SIZE); 3012d220894eSKevin Wolf if (size && size->value.n == -1) { 3013f88e1a42SJes Sorensen if (backing_file && backing_file->value.s) { 3014f88e1a42SJes Sorensen uint64_t size; 3015f88e1a42SJes Sorensen char buf[32]; 3016f88e1a42SJes Sorensen 3017f88e1a42SJes Sorensen bs = bdrv_new(""); 3018f88e1a42SJes Sorensen 301996df67d1SStefan Hajnoczi ret = bdrv_open(bs, backing_file->value.s, flags, backing_drv); 3020f88e1a42SJes Sorensen if (ret < 0) { 302196df67d1SStefan Hajnoczi error_report("Could not open '%s'", backing_file->value.s); 3022f88e1a42SJes Sorensen goto out; 3023f88e1a42SJes Sorensen } 3024f88e1a42SJes Sorensen bdrv_get_geometry(bs, &size); 3025f88e1a42SJes Sorensen size *= 512; 3026f88e1a42SJes Sorensen 3027f88e1a42SJes Sorensen snprintf(buf, sizeof(buf), "%" PRId64, size); 3028f88e1a42SJes Sorensen set_option_parameter(param, BLOCK_OPT_SIZE, buf); 3029f88e1a42SJes Sorensen } else { 3030f88e1a42SJes Sorensen error_report("Image creation needs a size parameter"); 30314f70f249SJes Sorensen ret = -EINVAL; 3032f88e1a42SJes Sorensen goto out; 3033f88e1a42SJes Sorensen } 3034f88e1a42SJes Sorensen } 3035f88e1a42SJes Sorensen 3036f88e1a42SJes Sorensen printf("Formatting '%s', fmt=%s ", filename, fmt); 3037f88e1a42SJes Sorensen print_option_parameters(param); 3038f88e1a42SJes Sorensen puts(""); 3039f88e1a42SJes Sorensen 3040f88e1a42SJes Sorensen ret = bdrv_create(drv, filename, param); 3041f88e1a42SJes Sorensen 3042f88e1a42SJes Sorensen if (ret < 0) { 3043f88e1a42SJes Sorensen if (ret == -ENOTSUP) { 3044f88e1a42SJes Sorensen error_report("Formatting or formatting option not supported for " 3045f88e1a42SJes Sorensen "file format '%s'", fmt); 3046f88e1a42SJes Sorensen } else if (ret == -EFBIG) { 3047f88e1a42SJes Sorensen error_report("The image size is too large for file format '%s'", 3048f88e1a42SJes Sorensen fmt); 3049f88e1a42SJes Sorensen } else { 3050f88e1a42SJes Sorensen error_report("%s: error while creating %s: %s", filename, fmt, 3051f88e1a42SJes Sorensen strerror(-ret)); 3052f88e1a42SJes Sorensen } 3053f88e1a42SJes Sorensen } 3054f88e1a42SJes Sorensen 3055f88e1a42SJes Sorensen out: 3056f88e1a42SJes Sorensen free_option_parameters(create_options); 3057f88e1a42SJes Sorensen free_option_parameters(param); 3058f88e1a42SJes Sorensen 3059f88e1a42SJes Sorensen if (bs) { 3060f88e1a42SJes Sorensen bdrv_delete(bs); 3061f88e1a42SJes Sorensen } 30624f70f249SJes Sorensen 30634f70f249SJes Sorensen return ret; 3064f88e1a42SJes Sorensen } 3065