1fc01f7e7Sbellard /* 2fc01f7e7Sbellard * QEMU System Emulator block driver 3fc01f7e7Sbellard * 4fc01f7e7Sbellard * Copyright (c) 2003 Fabrice Bellard 5fc01f7e7Sbellard * 6fc01f7e7Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7fc01f7e7Sbellard * of this software and associated documentation files (the "Software"), to deal 8fc01f7e7Sbellard * in the Software without restriction, including without limitation the rights 9fc01f7e7Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10fc01f7e7Sbellard * copies of the Software, and to permit persons to whom the Software is 11fc01f7e7Sbellard * furnished to do so, subject to the following conditions: 12fc01f7e7Sbellard * 13fc01f7e7Sbellard * The above copyright notice and this permission notice shall be included in 14fc01f7e7Sbellard * all copies or substantial portions of the Software. 15fc01f7e7Sbellard * 16fc01f7e7Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17fc01f7e7Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18fc01f7e7Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19fc01f7e7Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20fc01f7e7Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21fc01f7e7Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22fc01f7e7Sbellard * THE SOFTWARE. 23fc01f7e7Sbellard */ 243990d09aSblueswir1 #include "config-host.h" 25faf07963Spbrook #include "qemu-common.h" 26376253ecSaliguori #include "monitor.h" 27ea2384d3Sbellard #include "block_int.h" 285efa9d5aSAnthony Liguori #include "module.h" 29fc01f7e7Sbellard 3071e72a19SJuan Quintela #ifdef CONFIG_BSD 317674e7bfSbellard #include <sys/types.h> 327674e7bfSbellard #include <sys/stat.h> 337674e7bfSbellard #include <sys/ioctl.h> 3472cf2d4fSBlue Swirl #include <sys/queue.h> 35c5e97233Sblueswir1 #ifndef __DragonFly__ 367674e7bfSbellard #include <sys/disk.h> 377674e7bfSbellard #endif 38c5e97233Sblueswir1 #endif 397674e7bfSbellard 4049dc768dSaliguori #ifdef _WIN32 4149dc768dSaliguori #include <windows.h> 4249dc768dSaliguori #endif 4349dc768dSaliguori 44f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_readv_em(BlockDriverState *bs, 45f141eafeSaliguori int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, 46c87c0672Saliguori BlockDriverCompletionFunc *cb, void *opaque); 47f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_writev_em(BlockDriverState *bs, 48f141eafeSaliguori int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, 49ce1a14dcSpbrook BlockDriverCompletionFunc *cb, void *opaque); 50b2e12bc6SChristoph Hellwig static BlockDriverAIOCB *bdrv_aio_flush_em(BlockDriverState *bs, 51b2e12bc6SChristoph Hellwig BlockDriverCompletionFunc *cb, void *opaque); 5283f64091Sbellard static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num, 5383f64091Sbellard uint8_t *buf, int nb_sectors); 5483f64091Sbellard static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num, 5583f64091Sbellard const uint8_t *buf, int nb_sectors); 56ec530c81Sbellard 577ee930d0Sblueswir1 BlockDriverState *bdrv_first; 587ee930d0Sblueswir1 59ea2384d3Sbellard static BlockDriver *first_drv; 60ea2384d3Sbellard 61eb852011SMarkus Armbruster /* If non-zero, use only whitelisted block drivers */ 62eb852011SMarkus Armbruster static int use_bdrv_whitelist; 63eb852011SMarkus Armbruster 6483f64091Sbellard int path_is_absolute(const char *path) 6583f64091Sbellard { 6683f64091Sbellard const char *p; 6721664424Sbellard #ifdef _WIN32 6821664424Sbellard /* specific case for names like: "\\.\d:" */ 6921664424Sbellard if (*path == '/' || *path == '\\') 7021664424Sbellard return 1; 7121664424Sbellard #endif 7283f64091Sbellard p = strchr(path, ':'); 7383f64091Sbellard if (p) 7483f64091Sbellard p++; 7583f64091Sbellard else 7683f64091Sbellard p = path; 773b9f94e1Sbellard #ifdef _WIN32 783b9f94e1Sbellard return (*p == '/' || *p == '\\'); 793b9f94e1Sbellard #else 803b9f94e1Sbellard return (*p == '/'); 813b9f94e1Sbellard #endif 8283f64091Sbellard } 8383f64091Sbellard 8483f64091Sbellard /* if filename is absolute, just copy it to dest. Otherwise, build a 8583f64091Sbellard path to it by considering it is relative to base_path. URL are 8683f64091Sbellard supported. */ 8783f64091Sbellard void path_combine(char *dest, int dest_size, 8883f64091Sbellard const char *base_path, 8983f64091Sbellard const char *filename) 9083f64091Sbellard { 9183f64091Sbellard const char *p, *p1; 9283f64091Sbellard int len; 9383f64091Sbellard 9483f64091Sbellard if (dest_size <= 0) 9583f64091Sbellard return; 9683f64091Sbellard if (path_is_absolute(filename)) { 9783f64091Sbellard pstrcpy(dest, dest_size, filename); 9883f64091Sbellard } else { 9983f64091Sbellard p = strchr(base_path, ':'); 10083f64091Sbellard if (p) 10183f64091Sbellard p++; 10283f64091Sbellard else 10383f64091Sbellard p = base_path; 1043b9f94e1Sbellard p1 = strrchr(base_path, '/'); 1053b9f94e1Sbellard #ifdef _WIN32 1063b9f94e1Sbellard { 1073b9f94e1Sbellard const char *p2; 1083b9f94e1Sbellard p2 = strrchr(base_path, '\\'); 1093b9f94e1Sbellard if (!p1 || p2 > p1) 1103b9f94e1Sbellard p1 = p2; 1113b9f94e1Sbellard } 1123b9f94e1Sbellard #endif 11383f64091Sbellard if (p1) 11483f64091Sbellard p1++; 11583f64091Sbellard else 11683f64091Sbellard p1 = base_path; 11783f64091Sbellard if (p1 > p) 11883f64091Sbellard p = p1; 11983f64091Sbellard len = p - base_path; 12083f64091Sbellard if (len > dest_size - 1) 12183f64091Sbellard len = dest_size - 1; 12283f64091Sbellard memcpy(dest, base_path, len); 12383f64091Sbellard dest[len] = '\0'; 12483f64091Sbellard pstrcat(dest, dest_size, filename); 12583f64091Sbellard } 12683f64091Sbellard } 12783f64091Sbellard 1285efa9d5aSAnthony Liguori void bdrv_register(BlockDriver *bdrv) 129ea2384d3Sbellard { 130f141eafeSaliguori if (!bdrv->bdrv_aio_readv) { 13183f64091Sbellard /* add AIO emulation layer */ 132f141eafeSaliguori bdrv->bdrv_aio_readv = bdrv_aio_readv_em; 133f141eafeSaliguori bdrv->bdrv_aio_writev = bdrv_aio_writev_em; 134eda578e5Saliguori } else if (!bdrv->bdrv_read) { 13583f64091Sbellard /* add synchronous IO emulation layer */ 13683f64091Sbellard bdrv->bdrv_read = bdrv_read_em; 13783f64091Sbellard bdrv->bdrv_write = bdrv_write_em; 13883f64091Sbellard } 139b2e12bc6SChristoph Hellwig 140b2e12bc6SChristoph Hellwig if (!bdrv->bdrv_aio_flush) 141b2e12bc6SChristoph Hellwig bdrv->bdrv_aio_flush = bdrv_aio_flush_em; 142b2e12bc6SChristoph Hellwig 143ea2384d3Sbellard bdrv->next = first_drv; 144ea2384d3Sbellard first_drv = bdrv; 145ea2384d3Sbellard } 146b338082bSbellard 147b338082bSbellard /* create a new block device (by default it is empty) */ 148b338082bSbellard BlockDriverState *bdrv_new(const char *device_name) 149fc01f7e7Sbellard { 150b338082bSbellard BlockDriverState **pbs, *bs; 151b338082bSbellard 152b338082bSbellard bs = qemu_mallocz(sizeof(BlockDriverState)); 153b338082bSbellard pstrcpy(bs->device_name, sizeof(bs->device_name), device_name); 154ea2384d3Sbellard if (device_name[0] != '\0') { 155b338082bSbellard /* insert at the end */ 156b338082bSbellard pbs = &bdrv_first; 157b338082bSbellard while (*pbs != NULL) 158b338082bSbellard pbs = &(*pbs)->next; 159b338082bSbellard *pbs = bs; 160ea2384d3Sbellard } 161b338082bSbellard return bs; 162b338082bSbellard } 163b338082bSbellard 164ea2384d3Sbellard BlockDriver *bdrv_find_format(const char *format_name) 165ea2384d3Sbellard { 166ea2384d3Sbellard BlockDriver *drv1; 167ea2384d3Sbellard for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) { 168ea2384d3Sbellard if (!strcmp(drv1->format_name, format_name)) 169ea2384d3Sbellard return drv1; 170ea2384d3Sbellard } 171ea2384d3Sbellard return NULL; 172ea2384d3Sbellard } 173ea2384d3Sbellard 174eb852011SMarkus Armbruster static int bdrv_is_whitelisted(BlockDriver *drv) 175eb852011SMarkus Armbruster { 176eb852011SMarkus Armbruster static const char *whitelist[] = { 177eb852011SMarkus Armbruster CONFIG_BDRV_WHITELIST 178eb852011SMarkus Armbruster }; 179eb852011SMarkus Armbruster const char **p; 180eb852011SMarkus Armbruster 181eb852011SMarkus Armbruster if (!whitelist[0]) 182eb852011SMarkus Armbruster return 1; /* no whitelist, anything goes */ 183eb852011SMarkus Armbruster 184eb852011SMarkus Armbruster for (p = whitelist; *p; p++) { 185eb852011SMarkus Armbruster if (!strcmp(drv->format_name, *p)) { 186eb852011SMarkus Armbruster return 1; 187eb852011SMarkus Armbruster } 188eb852011SMarkus Armbruster } 189eb852011SMarkus Armbruster return 0; 190eb852011SMarkus Armbruster } 191eb852011SMarkus Armbruster 192eb852011SMarkus Armbruster BlockDriver *bdrv_find_whitelisted_format(const char *format_name) 193eb852011SMarkus Armbruster { 194eb852011SMarkus Armbruster BlockDriver *drv = bdrv_find_format(format_name); 195eb852011SMarkus Armbruster return drv && bdrv_is_whitelisted(drv) ? drv : NULL; 196eb852011SMarkus Armbruster } 197eb852011SMarkus Armbruster 1980e7e1989SKevin Wolf int bdrv_create(BlockDriver *drv, const char* filename, 1990e7e1989SKevin Wolf QEMUOptionParameter *options) 200ea2384d3Sbellard { 201ea2384d3Sbellard if (!drv->bdrv_create) 202ea2384d3Sbellard return -ENOTSUP; 2030e7e1989SKevin Wolf 2040e7e1989SKevin Wolf return drv->bdrv_create(filename, options); 205ea2384d3Sbellard } 206ea2384d3Sbellard 207d5249393Sbellard #ifdef _WIN32 20895389c86Sbellard void get_tmp_filename(char *filename, int size) 209d5249393Sbellard { 2103b9f94e1Sbellard char temp_dir[MAX_PATH]; 2113b9f94e1Sbellard 2123b9f94e1Sbellard GetTempPath(MAX_PATH, temp_dir); 2133b9f94e1Sbellard GetTempFileName(temp_dir, "qem", 0, filename); 214d5249393Sbellard } 215d5249393Sbellard #else 21695389c86Sbellard void get_tmp_filename(char *filename, int size) 217ea2384d3Sbellard { 218ea2384d3Sbellard int fd; 2197ccfb2ebSblueswir1 const char *tmpdir; 220d5249393Sbellard /* XXX: race condition possible */ 2210badc1eeSaurel32 tmpdir = getenv("TMPDIR"); 2220badc1eeSaurel32 if (!tmpdir) 2230badc1eeSaurel32 tmpdir = "/tmp"; 2240badc1eeSaurel32 snprintf(filename, size, "%s/vl.XXXXXX", tmpdir); 225ea2384d3Sbellard fd = mkstemp(filename); 226ea2384d3Sbellard close(fd); 227ea2384d3Sbellard } 228d5249393Sbellard #endif 229ea2384d3Sbellard 23019cb3738Sbellard #ifdef _WIN32 231f45512feSbellard static int is_windows_drive_prefix(const char *filename) 232f45512feSbellard { 233f45512feSbellard return (((filename[0] >= 'a' && filename[0] <= 'z') || 234f45512feSbellard (filename[0] >= 'A' && filename[0] <= 'Z')) && 235f45512feSbellard filename[1] == ':'); 236f45512feSbellard } 237f45512feSbellard 238508c7cb3SChristoph Hellwig int is_windows_drive(const char *filename) 23919cb3738Sbellard { 240f45512feSbellard if (is_windows_drive_prefix(filename) && 241f45512feSbellard filename[2] == '\0') 24219cb3738Sbellard return 1; 24319cb3738Sbellard if (strstart(filename, "\\\\.\\", NULL) || 24419cb3738Sbellard strstart(filename, "//./", NULL)) 24519cb3738Sbellard return 1; 24619cb3738Sbellard return 0; 24719cb3738Sbellard } 24819cb3738Sbellard #endif 24919cb3738Sbellard 25083f64091Sbellard static BlockDriver *find_protocol(const char *filename) 25183f64091Sbellard { 25283f64091Sbellard BlockDriver *drv1; 25383f64091Sbellard char protocol[128]; 2541cec71e3SAnthony Liguori int len; 25583f64091Sbellard const char *p; 25619cb3738Sbellard 25719cb3738Sbellard #ifdef _WIN32 258f45512feSbellard if (is_windows_drive(filename) || 259f45512feSbellard is_windows_drive_prefix(filename)) 2605efa9d5aSAnthony Liguori return bdrv_find_format("raw"); 26119cb3738Sbellard #endif 2621cec71e3SAnthony Liguori p = strchr(filename, ':'); 2631cec71e3SAnthony Liguori if (!p) 2645efa9d5aSAnthony Liguori return bdrv_find_format("raw"); 2651cec71e3SAnthony Liguori len = p - filename; 2661cec71e3SAnthony Liguori if (len > sizeof(protocol) - 1) 2671cec71e3SAnthony Liguori len = sizeof(protocol) - 1; 2681cec71e3SAnthony Liguori memcpy(protocol, filename, len); 2691cec71e3SAnthony Liguori protocol[len] = '\0'; 27083f64091Sbellard for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) { 27183f64091Sbellard if (drv1->protocol_name && 27283f64091Sbellard !strcmp(drv1->protocol_name, protocol)) 27383f64091Sbellard return drv1; 27483f64091Sbellard } 27583f64091Sbellard return NULL; 27683f64091Sbellard } 27783f64091Sbellard 278f3a5d3f8SChristoph Hellwig /* 279f3a5d3f8SChristoph Hellwig * Detect host devices. By convention, /dev/cdrom[N] is always 280f3a5d3f8SChristoph Hellwig * recognized as a host CDROM. 281f3a5d3f8SChristoph Hellwig */ 282f3a5d3f8SChristoph Hellwig static BlockDriver *find_hdev_driver(const char *filename) 283f3a5d3f8SChristoph Hellwig { 284508c7cb3SChristoph Hellwig int score_max = 0, score; 285508c7cb3SChristoph Hellwig BlockDriver *drv = NULL, *d; 286f3a5d3f8SChristoph Hellwig 287508c7cb3SChristoph Hellwig for (d = first_drv; d; d = d->next) { 288508c7cb3SChristoph Hellwig if (d->bdrv_probe_device) { 289508c7cb3SChristoph Hellwig score = d->bdrv_probe_device(filename); 290508c7cb3SChristoph Hellwig if (score > score_max) { 291508c7cb3SChristoph Hellwig score_max = score; 292508c7cb3SChristoph Hellwig drv = d; 293f3a5d3f8SChristoph Hellwig } 294508c7cb3SChristoph Hellwig } 295f3a5d3f8SChristoph Hellwig } 296f3a5d3f8SChristoph Hellwig 297508c7cb3SChristoph Hellwig return drv; 298f3a5d3f8SChristoph Hellwig } 299f3a5d3f8SChristoph Hellwig 300ea2384d3Sbellard static BlockDriver *find_image_format(const char *filename) 301ea2384d3Sbellard { 30283f64091Sbellard int ret, score, score_max; 303ea2384d3Sbellard BlockDriver *drv1, *drv; 30483f64091Sbellard uint8_t buf[2048]; 30583f64091Sbellard BlockDriverState *bs; 306ea2384d3Sbellard 30783f64091Sbellard drv = find_protocol(filename); 30819cb3738Sbellard /* no need to test disk image formats for vvfat */ 309c833ab73SAnthony Liguori if (drv && strcmp(drv->format_name, "vvfat") == 0) 31083f64091Sbellard return drv; 31183f64091Sbellard 31283f64091Sbellard ret = bdrv_file_open(&bs, filename, BDRV_O_RDONLY); 31383f64091Sbellard if (ret < 0) 3147674e7bfSbellard return NULL; 31583f64091Sbellard ret = bdrv_pread(bs, 0, buf, sizeof(buf)); 31683f64091Sbellard bdrv_delete(bs); 317ea2384d3Sbellard if (ret < 0) { 318ea2384d3Sbellard return NULL; 319ea2384d3Sbellard } 320ea2384d3Sbellard 321ea2384d3Sbellard score_max = 0; 322ea2384d3Sbellard for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) { 32383f64091Sbellard if (drv1->bdrv_probe) { 324ea2384d3Sbellard score = drv1->bdrv_probe(buf, ret, filename); 325ea2384d3Sbellard if (score > score_max) { 326ea2384d3Sbellard score_max = score; 327ea2384d3Sbellard drv = drv1; 328ea2384d3Sbellard } 329ea2384d3Sbellard } 33083f64091Sbellard } 331ea2384d3Sbellard return drv; 332ea2384d3Sbellard } 333ea2384d3Sbellard 33483f64091Sbellard int bdrv_file_open(BlockDriverState **pbs, const char *filename, int flags) 335b338082bSbellard { 33683f64091Sbellard BlockDriverState *bs; 33783f64091Sbellard int ret; 3383b0d4f61Sbellard 33983f64091Sbellard bs = bdrv_new(""); 34083f64091Sbellard ret = bdrv_open2(bs, filename, flags | BDRV_O_FILE, NULL); 34183f64091Sbellard if (ret < 0) { 34283f64091Sbellard bdrv_delete(bs); 34383f64091Sbellard return ret; 3443b0d4f61Sbellard } 34571d0770cSaliguori bs->growable = 1; 34683f64091Sbellard *pbs = bs; 34783f64091Sbellard return 0; 3483b0d4f61Sbellard } 3493b0d4f61Sbellard 35083f64091Sbellard int bdrv_open(BlockDriverState *bs, const char *filename, int flags) 35183f64091Sbellard { 35283f64091Sbellard return bdrv_open2(bs, filename, flags, NULL); 353ea2384d3Sbellard } 354ea2384d3Sbellard 35583f64091Sbellard int bdrv_open2(BlockDriverState *bs, const char *filename, int flags, 356ea2384d3Sbellard BlockDriver *drv) 357ea2384d3Sbellard { 35859f2689dSNaphtali Sprei int ret, open_flags, try_rw; 359eb5c851fSths char tmp_filename[PATH_MAX]; 360eb5c851fSths char backing_filename[PATH_MAX]; 361fc01f7e7Sbellard 362ea2384d3Sbellard bs->is_temporary = 0; 363ea2384d3Sbellard bs->encrypted = 0; 364c0f4ce77Saliguori bs->valid_key = 0; 365e268ca52Saliguori /* buffer_alignment defaulted to 512, drivers can change this value */ 366e268ca52Saliguori bs->buffer_alignment = 512; 36733e3963eSbellard 36883f64091Sbellard if (flags & BDRV_O_SNAPSHOT) { 369ea2384d3Sbellard BlockDriverState *bs1; 370ea2384d3Sbellard int64_t total_size; 3717c96d46eSaliguori int is_protocol = 0; 37291a073a9SKevin Wolf BlockDriver *bdrv_qcow2; 37391a073a9SKevin Wolf QEMUOptionParameter *options; 37433e3963eSbellard 375ea2384d3Sbellard /* if snapshot, we create a temporary backing file and open it 376ea2384d3Sbellard instead of opening 'filename' directly */ 377ea2384d3Sbellard 378ea2384d3Sbellard /* if there is a backing file, use it */ 379ea2384d3Sbellard bs1 = bdrv_new(""); 3805eb45639Saliguori ret = bdrv_open2(bs1, filename, 0, drv); 38151d7c00cSaliguori if (ret < 0) { 382ea2384d3Sbellard bdrv_delete(bs1); 38351d7c00cSaliguori return ret; 384ea2384d3Sbellard } 3856ea44308SJan Kiszka total_size = bdrv_getlength(bs1) >> BDRV_SECTOR_BITS; 3867c96d46eSaliguori 3877c96d46eSaliguori if (bs1->drv && bs1->drv->protocol_name) 3887c96d46eSaliguori is_protocol = 1; 3897c96d46eSaliguori 390ea2384d3Sbellard bdrv_delete(bs1); 391ea2384d3Sbellard 392ea2384d3Sbellard get_tmp_filename(tmp_filename, sizeof(tmp_filename)); 3937c96d46eSaliguori 3947c96d46eSaliguori /* Real path is meaningless for protocols */ 3957c96d46eSaliguori if (is_protocol) 3967c96d46eSaliguori snprintf(backing_filename, sizeof(backing_filename), 3977c96d46eSaliguori "%s", filename); 3987c96d46eSaliguori else 399a817d936Sbellard realpath(filename, backing_filename); 4007c96d46eSaliguori 40191a073a9SKevin Wolf bdrv_qcow2 = bdrv_find_format("qcow2"); 40291a073a9SKevin Wolf options = parse_option_parameters("", bdrv_qcow2->create_options, NULL); 40391a073a9SKevin Wolf 40491a073a9SKevin Wolf set_option_parameter_int(options, BLOCK_OPT_SIZE, total_size * 512); 40591a073a9SKevin Wolf set_option_parameter(options, BLOCK_OPT_BACKING_FILE, backing_filename); 40691a073a9SKevin Wolf if (drv) { 40791a073a9SKevin Wolf set_option_parameter(options, BLOCK_OPT_BACKING_FMT, 40891a073a9SKevin Wolf drv->format_name); 40991a073a9SKevin Wolf } 41091a073a9SKevin Wolf 41191a073a9SKevin Wolf ret = bdrv_create(bdrv_qcow2, tmp_filename, options); 41251d7c00cSaliguori if (ret < 0) { 41351d7c00cSaliguori return ret; 414ea2384d3Sbellard } 41591a073a9SKevin Wolf 416ea2384d3Sbellard filename = tmp_filename; 41791a073a9SKevin Wolf drv = bdrv_qcow2; 418ea2384d3Sbellard bs->is_temporary = 1; 419ea2384d3Sbellard } 420ea2384d3Sbellard 421ea2384d3Sbellard pstrcpy(bs->filename, sizeof(bs->filename), filename); 42283f64091Sbellard if (flags & BDRV_O_FILE) { 42383f64091Sbellard drv = find_protocol(filename); 42451d7c00cSaliguori } else if (!drv) { 425f3a5d3f8SChristoph Hellwig drv = find_hdev_driver(filename); 426f3a5d3f8SChristoph Hellwig if (!drv) { 427ea2384d3Sbellard drv = find_image_format(filename); 428ea2384d3Sbellard } 429f3a5d3f8SChristoph Hellwig } 43051d7c00cSaliguori if (!drv) { 43151d7c00cSaliguori ret = -ENOENT; 43251d7c00cSaliguori goto unlink_and_fail; 43383f64091Sbellard } 434ea2384d3Sbellard bs->drv = drv; 435ea2384d3Sbellard bs->opaque = qemu_mallocz(drv->instance_size); 436e900a7b7SChristoph Hellwig 437e900a7b7SChristoph Hellwig /* 438e900a7b7SChristoph Hellwig * Yes, BDRV_O_NOCACHE aka O_DIRECT means we have to present a 439e900a7b7SChristoph Hellwig * write cache to the guest. We do need the fdatasync to flush 440e900a7b7SChristoph Hellwig * out transactions for block allocations, and we maybe have a 441e900a7b7SChristoph Hellwig * volatile write cache in our backing device to deal with. 442e900a7b7SChristoph Hellwig */ 443e900a7b7SChristoph Hellwig if (flags & (BDRV_O_CACHE_WB|BDRV_O_NOCACHE)) 444e900a7b7SChristoph Hellwig bs->enable_write_cache = 1; 445e900a7b7SChristoph Hellwig 44683f64091Sbellard /* Note: for compatibility, we open disk image files as RDWR, and 44783f64091Sbellard RDONLY as fallback */ 44859f2689dSNaphtali Sprei try_rw = !bs->read_only || bs->is_temporary; 44983f64091Sbellard if (!(flags & BDRV_O_FILE)) 45059f2689dSNaphtali Sprei open_flags = (try_rw ? BDRV_O_RDWR : 0) | 4515c6c3a6cSChristoph Hellwig (flags & (BDRV_O_CACHE_MASK|BDRV_O_NATIVE_AIO)); 45283f64091Sbellard else 45383f64091Sbellard open_flags = flags & ~(BDRV_O_FILE | BDRV_O_SNAPSHOT); 454eb852011SMarkus Armbruster if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv)) 455eb852011SMarkus Armbruster ret = -ENOTSUP; 456eb852011SMarkus Armbruster else 4571cec71e3SAnthony Liguori ret = drv->bdrv_open(bs, filename, open_flags); 458a0a83536Saurel32 if ((ret == -EACCES || ret == -EPERM) && !(flags & BDRV_O_FILE)) { 4591cec71e3SAnthony Liguori ret = drv->bdrv_open(bs, filename, open_flags & ~BDRV_O_RDWR); 46083f64091Sbellard bs->read_only = 1; 46183f64091Sbellard } 462ea2384d3Sbellard if (ret < 0) { 463ea2384d3Sbellard qemu_free(bs->opaque); 4646b21b973Sbellard bs->opaque = NULL; 4656b21b973Sbellard bs->drv = NULL; 46651d7c00cSaliguori unlink_and_fail: 46751d7c00cSaliguori if (bs->is_temporary) 46851d7c00cSaliguori unlink(filename); 46983f64091Sbellard return ret; 470ea2384d3Sbellard } 471d15a771dSbellard if (drv->bdrv_getlength) { 4726ea44308SJan Kiszka bs->total_sectors = bdrv_getlength(bs) >> BDRV_SECTOR_BITS; 473d15a771dSbellard } 474ea2384d3Sbellard #ifndef _WIN32 475ea2384d3Sbellard if (bs->is_temporary) { 476ea2384d3Sbellard unlink(filename); 47733e3963eSbellard } 47867b915a5Sbellard #endif 47983f64091Sbellard if (bs->backing_file[0] != '\0') { 480ea2384d3Sbellard /* if there is a backing file, use it */ 4815eb45639Saliguori BlockDriver *back_drv = NULL; 482ea2384d3Sbellard bs->backing_hd = bdrv_new(""); 48359f2689dSNaphtali Sprei /* pass on read_only property to the backing_hd */ 48459f2689dSNaphtali Sprei bs->backing_hd->read_only = bs->read_only; 48583f64091Sbellard path_combine(backing_filename, sizeof(backing_filename), 48683f64091Sbellard filename, bs->backing_file); 4875eb45639Saliguori if (bs->backing_format[0] != '\0') 4885eb45639Saliguori back_drv = bdrv_find_format(bs->backing_format); 4895eb45639Saliguori ret = bdrv_open2(bs->backing_hd, backing_filename, open_flags, 4905eb45639Saliguori back_drv); 49151d7c00cSaliguori if (ret < 0) { 49251d7c00cSaliguori bdrv_close(bs); 49351d7c00cSaliguori return ret; 49451d7c00cSaliguori } 495ea2384d3Sbellard } 49633e3963eSbellard 497bb5fc20fSaliguori if (!bdrv_key_required(bs)) { 498b338082bSbellard /* call the change callback */ 49919cb3738Sbellard bs->media_changed = 1; 500b338082bSbellard if (bs->change_cb) 501b338082bSbellard bs->change_cb(bs->change_opaque); 502bb5fc20fSaliguori } 503b338082bSbellard return 0; 504fc01f7e7Sbellard } 505fc01f7e7Sbellard 506fc01f7e7Sbellard void bdrv_close(BlockDriverState *bs) 507fc01f7e7Sbellard { 50819cb3738Sbellard if (bs->drv) { 509ea2384d3Sbellard if (bs->backing_hd) 510ea2384d3Sbellard bdrv_delete(bs->backing_hd); 511ea2384d3Sbellard bs->drv->bdrv_close(bs); 512ea2384d3Sbellard qemu_free(bs->opaque); 513ea2384d3Sbellard #ifdef _WIN32 514ea2384d3Sbellard if (bs->is_temporary) { 515ea2384d3Sbellard unlink(bs->filename); 516ea2384d3Sbellard } 51767b915a5Sbellard #endif 518ea2384d3Sbellard bs->opaque = NULL; 519ea2384d3Sbellard bs->drv = NULL; 520b338082bSbellard 521b338082bSbellard /* call the change callback */ 52219cb3738Sbellard bs->media_changed = 1; 523b338082bSbellard if (bs->change_cb) 524b338082bSbellard bs->change_cb(bs->change_opaque); 525b338082bSbellard } 526b338082bSbellard } 527b338082bSbellard 528b338082bSbellard void bdrv_delete(BlockDriverState *bs) 529b338082bSbellard { 53034c6f050Saurel32 BlockDriverState **pbs; 53134c6f050Saurel32 53234c6f050Saurel32 pbs = &bdrv_first; 53334c6f050Saurel32 while (*pbs != bs && *pbs != NULL) 53434c6f050Saurel32 pbs = &(*pbs)->next; 53534c6f050Saurel32 if (*pbs == bs) 53634c6f050Saurel32 *pbs = bs->next; 53734c6f050Saurel32 538b338082bSbellard bdrv_close(bs); 539b338082bSbellard qemu_free(bs); 540fc01f7e7Sbellard } 541fc01f7e7Sbellard 542e97fc193Saliguori /* 543e97fc193Saliguori * Run consistency checks on an image 544e97fc193Saliguori * 545e97fc193Saliguori * Returns the number of errors or -errno when an internal error occurs 546e97fc193Saliguori */ 547e97fc193Saliguori int bdrv_check(BlockDriverState *bs) 548e97fc193Saliguori { 549e97fc193Saliguori if (bs->drv->bdrv_check == NULL) { 550e97fc193Saliguori return -ENOTSUP; 551e97fc193Saliguori } 552e97fc193Saliguori 553e97fc193Saliguori return bs->drv->bdrv_check(bs); 554e97fc193Saliguori } 555e97fc193Saliguori 55633e3963eSbellard /* commit COW file into the raw image */ 55733e3963eSbellard int bdrv_commit(BlockDriverState *bs) 55833e3963eSbellard { 55919cb3738Sbellard BlockDriver *drv = bs->drv; 56083f64091Sbellard int64_t i, total_sectors; 561ea2384d3Sbellard int n, j; 562ea2384d3Sbellard unsigned char sector[512]; 56333e3963eSbellard 56419cb3738Sbellard if (!drv) 56519cb3738Sbellard return -ENOMEDIUM; 56633e3963eSbellard 56733e3963eSbellard if (bs->read_only) { 568ea2384d3Sbellard return -EACCES; 56933e3963eSbellard } 57033e3963eSbellard 571ea2384d3Sbellard if (!bs->backing_hd) { 572ea2384d3Sbellard return -ENOTSUP; 573ea2384d3Sbellard } 574ea2384d3Sbellard 5756ea44308SJan Kiszka total_sectors = bdrv_getlength(bs) >> BDRV_SECTOR_BITS; 57683f64091Sbellard for (i = 0; i < total_sectors;) { 57719cb3738Sbellard if (drv->bdrv_is_allocated(bs, i, 65536, &n)) { 578ea2384d3Sbellard for(j = 0; j < n; j++) { 57933e3963eSbellard if (bdrv_read(bs, i, sector, 1) != 0) { 580ea2384d3Sbellard return -EIO; 58133e3963eSbellard } 58233e3963eSbellard 583ea2384d3Sbellard if (bdrv_write(bs->backing_hd, i, sector, 1) != 0) { 584ea2384d3Sbellard return -EIO; 58533e3963eSbellard } 586ea2384d3Sbellard i++; 587ea2384d3Sbellard } 588ea2384d3Sbellard } else { 589ea2384d3Sbellard i += n; 59033e3963eSbellard } 59133e3963eSbellard } 59295389c86Sbellard 59319cb3738Sbellard if (drv->bdrv_make_empty) 59419cb3738Sbellard return drv->bdrv_make_empty(bs); 59595389c86Sbellard 59633e3963eSbellard return 0; 59733e3963eSbellard } 59833e3963eSbellard 59971d0770cSaliguori static int bdrv_check_byte_request(BlockDriverState *bs, int64_t offset, 60071d0770cSaliguori size_t size) 60171d0770cSaliguori { 60271d0770cSaliguori int64_t len; 60371d0770cSaliguori 60471d0770cSaliguori if (!bdrv_is_inserted(bs)) 60571d0770cSaliguori return -ENOMEDIUM; 60671d0770cSaliguori 60771d0770cSaliguori if (bs->growable) 60871d0770cSaliguori return 0; 60971d0770cSaliguori 61071d0770cSaliguori len = bdrv_getlength(bs); 61171d0770cSaliguori 612fbb7b4e0SKevin Wolf if (offset < 0) 613fbb7b4e0SKevin Wolf return -EIO; 614fbb7b4e0SKevin Wolf 615fbb7b4e0SKevin Wolf if ((offset > len) || (len - offset < size)) 61671d0770cSaliguori return -EIO; 61771d0770cSaliguori 61871d0770cSaliguori return 0; 61971d0770cSaliguori } 62071d0770cSaliguori 62171d0770cSaliguori static int bdrv_check_request(BlockDriverState *bs, int64_t sector_num, 62271d0770cSaliguori int nb_sectors) 62371d0770cSaliguori { 624999dec57Saliguori return bdrv_check_byte_request(bs, sector_num * 512, nb_sectors * 512); 62571d0770cSaliguori } 62671d0770cSaliguori 62719cb3738Sbellard /* return < 0 if error. See bdrv_write() for the return codes */ 628fc01f7e7Sbellard int bdrv_read(BlockDriverState *bs, int64_t sector_num, 629fc01f7e7Sbellard uint8_t *buf, int nb_sectors) 630fc01f7e7Sbellard { 631ea2384d3Sbellard BlockDriver *drv = bs->drv; 632fc01f7e7Sbellard 63319cb3738Sbellard if (!drv) 63419cb3738Sbellard return -ENOMEDIUM; 63571d0770cSaliguori if (bdrv_check_request(bs, sector_num, nb_sectors)) 63671d0770cSaliguori return -EIO; 637b338082bSbellard 63883f64091Sbellard return drv->bdrv_read(bs, sector_num, buf, nb_sectors); 63983f64091Sbellard } 640fc01f7e7Sbellard 6417cd1e32aSlirans@il.ibm.com static void set_dirty_bitmap(BlockDriverState *bs, int64_t sector_num, 6427cd1e32aSlirans@il.ibm.com int nb_sectors, int dirty) 6437cd1e32aSlirans@il.ibm.com { 6447cd1e32aSlirans@il.ibm.com int64_t start, end; 645*c6d22830SJan Kiszka unsigned long val, idx, bit; 646a55eb92cSJan Kiszka 6476ea44308SJan Kiszka start = sector_num / BDRV_SECTORS_PER_DIRTY_CHUNK; 648*c6d22830SJan Kiszka end = (sector_num + nb_sectors - 1) / BDRV_SECTORS_PER_DIRTY_CHUNK; 6497cd1e32aSlirans@il.ibm.com 6507cd1e32aSlirans@il.ibm.com for (; start <= end; start++) { 651*c6d22830SJan Kiszka idx = start / (sizeof(unsigned long) * 8); 652*c6d22830SJan Kiszka bit = start % (sizeof(unsigned long) * 8); 653*c6d22830SJan Kiszka val = bs->dirty_bitmap[idx]; 654*c6d22830SJan Kiszka if (dirty) { 655*c6d22830SJan Kiszka val |= 1 << bit; 656*c6d22830SJan Kiszka } else { 657*c6d22830SJan Kiszka val &= ~(1 << bit); 658*c6d22830SJan Kiszka } 659*c6d22830SJan Kiszka bs->dirty_bitmap[idx] = val; 6607cd1e32aSlirans@il.ibm.com } 6617cd1e32aSlirans@il.ibm.com } 6627cd1e32aSlirans@il.ibm.com 66319cb3738Sbellard /* Return < 0 if error. Important errors are: 66419cb3738Sbellard -EIO generic I/O error (may happen for all errors) 66519cb3738Sbellard -ENOMEDIUM No media inserted. 66619cb3738Sbellard -EINVAL Invalid sector number or nb_sectors 66719cb3738Sbellard -EACCES Trying to write a read-only device 66819cb3738Sbellard */ 669fc01f7e7Sbellard int bdrv_write(BlockDriverState *bs, int64_t sector_num, 670fc01f7e7Sbellard const uint8_t *buf, int nb_sectors) 671fc01f7e7Sbellard { 67283f64091Sbellard BlockDriver *drv = bs->drv; 67319cb3738Sbellard if (!bs->drv) 67419cb3738Sbellard return -ENOMEDIUM; 6750849bf08Sbellard if (bs->read_only) 67619cb3738Sbellard return -EACCES; 67771d0770cSaliguori if (bdrv_check_request(bs, sector_num, nb_sectors)) 67871d0770cSaliguori return -EIO; 67971d0770cSaliguori 680*c6d22830SJan Kiszka if (bs->dirty_bitmap) { 6817cd1e32aSlirans@il.ibm.com set_dirty_bitmap(bs, sector_num, nb_sectors, 1); 6827cd1e32aSlirans@il.ibm.com } 6837cd1e32aSlirans@il.ibm.com 68483f64091Sbellard return drv->bdrv_write(bs, sector_num, buf, nb_sectors); 68583f64091Sbellard } 68683f64091Sbellard 687eda578e5Saliguori int bdrv_pread(BlockDriverState *bs, int64_t offset, 688eda578e5Saliguori void *buf, int count1) 68983f64091Sbellard { 6906ea44308SJan Kiszka uint8_t tmp_buf[BDRV_SECTOR_SIZE]; 69183f64091Sbellard int len, nb_sectors, count; 69283f64091Sbellard int64_t sector_num; 69383f64091Sbellard 69483f64091Sbellard count = count1; 69583f64091Sbellard /* first read to align to sector start */ 6966ea44308SJan Kiszka len = (BDRV_SECTOR_SIZE - offset) & (BDRV_SECTOR_SIZE - 1); 69783f64091Sbellard if (len > count) 69883f64091Sbellard len = count; 6996ea44308SJan Kiszka sector_num = offset >> BDRV_SECTOR_BITS; 70083f64091Sbellard if (len > 0) { 70183f64091Sbellard if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0) 70283f64091Sbellard return -EIO; 7036ea44308SJan Kiszka memcpy(buf, tmp_buf + (offset & (BDRV_SECTOR_SIZE - 1)), len); 70483f64091Sbellard count -= len; 70583f64091Sbellard if (count == 0) 70683f64091Sbellard return count1; 70783f64091Sbellard sector_num++; 70883f64091Sbellard buf += len; 70983f64091Sbellard } 71083f64091Sbellard 71183f64091Sbellard /* read the sectors "in place" */ 7126ea44308SJan Kiszka nb_sectors = count >> BDRV_SECTOR_BITS; 71383f64091Sbellard if (nb_sectors > 0) { 71483f64091Sbellard if (bdrv_read(bs, sector_num, buf, nb_sectors) < 0) 71583f64091Sbellard return -EIO; 71683f64091Sbellard sector_num += nb_sectors; 7176ea44308SJan Kiszka len = nb_sectors << BDRV_SECTOR_BITS; 71883f64091Sbellard buf += len; 71983f64091Sbellard count -= len; 72083f64091Sbellard } 72183f64091Sbellard 72283f64091Sbellard /* add data from the last sector */ 72383f64091Sbellard if (count > 0) { 72483f64091Sbellard if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0) 72583f64091Sbellard return -EIO; 72683f64091Sbellard memcpy(buf, tmp_buf, count); 72783f64091Sbellard } 72883f64091Sbellard return count1; 72983f64091Sbellard } 73083f64091Sbellard 731eda578e5Saliguori int bdrv_pwrite(BlockDriverState *bs, int64_t offset, 732eda578e5Saliguori const void *buf, int count1) 73383f64091Sbellard { 7346ea44308SJan Kiszka uint8_t tmp_buf[BDRV_SECTOR_SIZE]; 73583f64091Sbellard int len, nb_sectors, count; 73683f64091Sbellard int64_t sector_num; 73783f64091Sbellard 73883f64091Sbellard count = count1; 73983f64091Sbellard /* first write to align to sector start */ 7406ea44308SJan Kiszka len = (BDRV_SECTOR_SIZE - offset) & (BDRV_SECTOR_SIZE - 1); 74183f64091Sbellard if (len > count) 74283f64091Sbellard len = count; 7436ea44308SJan Kiszka sector_num = offset >> BDRV_SECTOR_BITS; 74483f64091Sbellard if (len > 0) { 74583f64091Sbellard if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0) 74683f64091Sbellard return -EIO; 7476ea44308SJan Kiszka memcpy(tmp_buf + (offset & (BDRV_SECTOR_SIZE - 1)), buf, len); 74883f64091Sbellard if (bdrv_write(bs, sector_num, tmp_buf, 1) < 0) 74983f64091Sbellard return -EIO; 75083f64091Sbellard count -= len; 75183f64091Sbellard if (count == 0) 75283f64091Sbellard return count1; 75383f64091Sbellard sector_num++; 75483f64091Sbellard buf += len; 75583f64091Sbellard } 75683f64091Sbellard 75783f64091Sbellard /* write the sectors "in place" */ 7586ea44308SJan Kiszka nb_sectors = count >> BDRV_SECTOR_BITS; 75983f64091Sbellard if (nb_sectors > 0) { 76083f64091Sbellard if (bdrv_write(bs, sector_num, buf, nb_sectors) < 0) 76183f64091Sbellard return -EIO; 76283f64091Sbellard sector_num += nb_sectors; 7636ea44308SJan Kiszka len = nb_sectors << BDRV_SECTOR_BITS; 76483f64091Sbellard buf += len; 76583f64091Sbellard count -= len; 76683f64091Sbellard } 76783f64091Sbellard 76883f64091Sbellard /* add data from the last sector */ 76983f64091Sbellard if (count > 0) { 77083f64091Sbellard if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0) 77183f64091Sbellard return -EIO; 77283f64091Sbellard memcpy(tmp_buf, buf, count); 77383f64091Sbellard if (bdrv_write(bs, sector_num, tmp_buf, 1) < 0) 77483f64091Sbellard return -EIO; 77583f64091Sbellard } 77683f64091Sbellard return count1; 77783f64091Sbellard } 77883f64091Sbellard 77983f64091Sbellard /** 78083f64091Sbellard * Truncate file to 'offset' bytes (needed only for file protocols) 78183f64091Sbellard */ 78283f64091Sbellard int bdrv_truncate(BlockDriverState *bs, int64_t offset) 78383f64091Sbellard { 78483f64091Sbellard BlockDriver *drv = bs->drv; 78583f64091Sbellard if (!drv) 78619cb3738Sbellard return -ENOMEDIUM; 78783f64091Sbellard if (!drv->bdrv_truncate) 78883f64091Sbellard return -ENOTSUP; 78959f2689dSNaphtali Sprei if (bs->read_only) 79059f2689dSNaphtali Sprei return -EACCES; 79183f64091Sbellard return drv->bdrv_truncate(bs, offset); 79283f64091Sbellard } 79383f64091Sbellard 79483f64091Sbellard /** 79583f64091Sbellard * Length of a file in bytes. Return < 0 if error or unknown. 79683f64091Sbellard */ 79783f64091Sbellard int64_t bdrv_getlength(BlockDriverState *bs) 79883f64091Sbellard { 79983f64091Sbellard BlockDriver *drv = bs->drv; 80083f64091Sbellard if (!drv) 80119cb3738Sbellard return -ENOMEDIUM; 80283f64091Sbellard if (!drv->bdrv_getlength) { 80383f64091Sbellard /* legacy mode */ 8046ea44308SJan Kiszka return bs->total_sectors * BDRV_SECTOR_SIZE; 80583f64091Sbellard } 80683f64091Sbellard return drv->bdrv_getlength(bs); 807fc01f7e7Sbellard } 808fc01f7e7Sbellard 80919cb3738Sbellard /* return 0 as number of sectors if no device present or error */ 81096b8f136Sths void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr) 811fc01f7e7Sbellard { 81219cb3738Sbellard int64_t length; 81319cb3738Sbellard length = bdrv_getlength(bs); 81419cb3738Sbellard if (length < 0) 81519cb3738Sbellard length = 0; 81619cb3738Sbellard else 8176ea44308SJan Kiszka length = length >> BDRV_SECTOR_BITS; 81819cb3738Sbellard *nb_sectors_ptr = length; 819fc01f7e7Sbellard } 820cf98951bSbellard 821f3d54fc4Saliguori struct partition { 822f3d54fc4Saliguori uint8_t boot_ind; /* 0x80 - active */ 823f3d54fc4Saliguori uint8_t head; /* starting head */ 824f3d54fc4Saliguori uint8_t sector; /* starting sector */ 825f3d54fc4Saliguori uint8_t cyl; /* starting cylinder */ 826f3d54fc4Saliguori uint8_t sys_ind; /* What partition type */ 827f3d54fc4Saliguori uint8_t end_head; /* end head */ 828f3d54fc4Saliguori uint8_t end_sector; /* end sector */ 829f3d54fc4Saliguori uint8_t end_cyl; /* end cylinder */ 830f3d54fc4Saliguori uint32_t start_sect; /* starting sector counting from 0 */ 831f3d54fc4Saliguori uint32_t nr_sects; /* nr of sectors in partition */ 832f3d54fc4Saliguori } __attribute__((packed)); 833f3d54fc4Saliguori 834f3d54fc4Saliguori /* try to guess the disk logical geometry from the MSDOS partition table. Return 0 if OK, -1 if could not guess */ 835f3d54fc4Saliguori static int guess_disk_lchs(BlockDriverState *bs, 836f3d54fc4Saliguori int *pcylinders, int *pheads, int *psectors) 837f3d54fc4Saliguori { 838f3d54fc4Saliguori uint8_t buf[512]; 839f3d54fc4Saliguori int ret, i, heads, sectors, cylinders; 840f3d54fc4Saliguori struct partition *p; 841f3d54fc4Saliguori uint32_t nr_sects; 842a38131b6Sblueswir1 uint64_t nb_sectors; 843f3d54fc4Saliguori 844f3d54fc4Saliguori bdrv_get_geometry(bs, &nb_sectors); 845f3d54fc4Saliguori 846f3d54fc4Saliguori ret = bdrv_read(bs, 0, buf, 1); 847f3d54fc4Saliguori if (ret < 0) 848f3d54fc4Saliguori return -1; 849f3d54fc4Saliguori /* test msdos magic */ 850f3d54fc4Saliguori if (buf[510] != 0x55 || buf[511] != 0xaa) 851f3d54fc4Saliguori return -1; 852f3d54fc4Saliguori for(i = 0; i < 4; i++) { 853f3d54fc4Saliguori p = ((struct partition *)(buf + 0x1be)) + i; 854f3d54fc4Saliguori nr_sects = le32_to_cpu(p->nr_sects); 855f3d54fc4Saliguori if (nr_sects && p->end_head) { 856f3d54fc4Saliguori /* We make the assumption that the partition terminates on 857f3d54fc4Saliguori a cylinder boundary */ 858f3d54fc4Saliguori heads = p->end_head + 1; 859f3d54fc4Saliguori sectors = p->end_sector & 63; 860f3d54fc4Saliguori if (sectors == 0) 861f3d54fc4Saliguori continue; 862f3d54fc4Saliguori cylinders = nb_sectors / (heads * sectors); 863f3d54fc4Saliguori if (cylinders < 1 || cylinders > 16383) 864f3d54fc4Saliguori continue; 865f3d54fc4Saliguori *pheads = heads; 866f3d54fc4Saliguori *psectors = sectors; 867f3d54fc4Saliguori *pcylinders = cylinders; 868f3d54fc4Saliguori #if 0 869f3d54fc4Saliguori printf("guessed geometry: LCHS=%d %d %d\n", 870f3d54fc4Saliguori cylinders, heads, sectors); 871f3d54fc4Saliguori #endif 872f3d54fc4Saliguori return 0; 873f3d54fc4Saliguori } 874f3d54fc4Saliguori } 875f3d54fc4Saliguori return -1; 876f3d54fc4Saliguori } 877f3d54fc4Saliguori 878f3d54fc4Saliguori void bdrv_guess_geometry(BlockDriverState *bs, int *pcyls, int *pheads, int *psecs) 879f3d54fc4Saliguori { 880f3d54fc4Saliguori int translation, lba_detected = 0; 881f3d54fc4Saliguori int cylinders, heads, secs; 882a38131b6Sblueswir1 uint64_t nb_sectors; 883f3d54fc4Saliguori 884f3d54fc4Saliguori /* if a geometry hint is available, use it */ 885f3d54fc4Saliguori bdrv_get_geometry(bs, &nb_sectors); 886f3d54fc4Saliguori bdrv_get_geometry_hint(bs, &cylinders, &heads, &secs); 887f3d54fc4Saliguori translation = bdrv_get_translation_hint(bs); 888f3d54fc4Saliguori if (cylinders != 0) { 889f3d54fc4Saliguori *pcyls = cylinders; 890f3d54fc4Saliguori *pheads = heads; 891f3d54fc4Saliguori *psecs = secs; 892f3d54fc4Saliguori } else { 893f3d54fc4Saliguori if (guess_disk_lchs(bs, &cylinders, &heads, &secs) == 0) { 894f3d54fc4Saliguori if (heads > 16) { 895f3d54fc4Saliguori /* if heads > 16, it means that a BIOS LBA 896f3d54fc4Saliguori translation was active, so the default 897f3d54fc4Saliguori hardware geometry is OK */ 898f3d54fc4Saliguori lba_detected = 1; 899f3d54fc4Saliguori goto default_geometry; 900f3d54fc4Saliguori } else { 901f3d54fc4Saliguori *pcyls = cylinders; 902f3d54fc4Saliguori *pheads = heads; 903f3d54fc4Saliguori *psecs = secs; 904f3d54fc4Saliguori /* disable any translation to be in sync with 905f3d54fc4Saliguori the logical geometry */ 906f3d54fc4Saliguori if (translation == BIOS_ATA_TRANSLATION_AUTO) { 907f3d54fc4Saliguori bdrv_set_translation_hint(bs, 908f3d54fc4Saliguori BIOS_ATA_TRANSLATION_NONE); 909f3d54fc4Saliguori } 910f3d54fc4Saliguori } 911f3d54fc4Saliguori } else { 912f3d54fc4Saliguori default_geometry: 913f3d54fc4Saliguori /* if no geometry, use a standard physical disk geometry */ 914f3d54fc4Saliguori cylinders = nb_sectors / (16 * 63); 915f3d54fc4Saliguori 916f3d54fc4Saliguori if (cylinders > 16383) 917f3d54fc4Saliguori cylinders = 16383; 918f3d54fc4Saliguori else if (cylinders < 2) 919f3d54fc4Saliguori cylinders = 2; 920f3d54fc4Saliguori *pcyls = cylinders; 921f3d54fc4Saliguori *pheads = 16; 922f3d54fc4Saliguori *psecs = 63; 923f3d54fc4Saliguori if ((lba_detected == 1) && (translation == BIOS_ATA_TRANSLATION_AUTO)) { 924f3d54fc4Saliguori if ((*pcyls * *pheads) <= 131072) { 925f3d54fc4Saliguori bdrv_set_translation_hint(bs, 926f3d54fc4Saliguori BIOS_ATA_TRANSLATION_LARGE); 927f3d54fc4Saliguori } else { 928f3d54fc4Saliguori bdrv_set_translation_hint(bs, 929f3d54fc4Saliguori BIOS_ATA_TRANSLATION_LBA); 930f3d54fc4Saliguori } 931f3d54fc4Saliguori } 932f3d54fc4Saliguori } 933f3d54fc4Saliguori bdrv_set_geometry_hint(bs, *pcyls, *pheads, *psecs); 934f3d54fc4Saliguori } 935f3d54fc4Saliguori } 936f3d54fc4Saliguori 937b338082bSbellard void bdrv_set_geometry_hint(BlockDriverState *bs, 938b338082bSbellard int cyls, int heads, int secs) 939b338082bSbellard { 940b338082bSbellard bs->cyls = cyls; 941b338082bSbellard bs->heads = heads; 942b338082bSbellard bs->secs = secs; 943b338082bSbellard } 944b338082bSbellard 945b338082bSbellard void bdrv_set_type_hint(BlockDriverState *bs, int type) 946b338082bSbellard { 947b338082bSbellard bs->type = type; 948b338082bSbellard bs->removable = ((type == BDRV_TYPE_CDROM || 949b338082bSbellard type == BDRV_TYPE_FLOPPY)); 950b338082bSbellard } 951b338082bSbellard 95246d4767dSbellard void bdrv_set_translation_hint(BlockDriverState *bs, int translation) 95346d4767dSbellard { 95446d4767dSbellard bs->translation = translation; 95546d4767dSbellard } 95646d4767dSbellard 957b338082bSbellard void bdrv_get_geometry_hint(BlockDriverState *bs, 958b338082bSbellard int *pcyls, int *pheads, int *psecs) 959b338082bSbellard { 960b338082bSbellard *pcyls = bs->cyls; 961b338082bSbellard *pheads = bs->heads; 962b338082bSbellard *psecs = bs->secs; 963b338082bSbellard } 964b338082bSbellard 965b338082bSbellard int bdrv_get_type_hint(BlockDriverState *bs) 966b338082bSbellard { 967b338082bSbellard return bs->type; 968b338082bSbellard } 969b338082bSbellard 97046d4767dSbellard int bdrv_get_translation_hint(BlockDriverState *bs) 97146d4767dSbellard { 97246d4767dSbellard return bs->translation; 97346d4767dSbellard } 97446d4767dSbellard 975b338082bSbellard int bdrv_is_removable(BlockDriverState *bs) 976b338082bSbellard { 977b338082bSbellard return bs->removable; 978b338082bSbellard } 979b338082bSbellard 980b338082bSbellard int bdrv_is_read_only(BlockDriverState *bs) 981b338082bSbellard { 982b338082bSbellard return bs->read_only; 983b338082bSbellard } 984b338082bSbellard 98559f2689dSNaphtali Sprei int bdrv_set_read_only(BlockDriverState *bs, int read_only) 98659f2689dSNaphtali Sprei { 98759f2689dSNaphtali Sprei int ret = bs->read_only; 98859f2689dSNaphtali Sprei bs->read_only = read_only; 98959f2689dSNaphtali Sprei return ret; 99059f2689dSNaphtali Sprei } 99159f2689dSNaphtali Sprei 992985a03b0Sths int bdrv_is_sg(BlockDriverState *bs) 993985a03b0Sths { 994985a03b0Sths return bs->sg; 995985a03b0Sths } 996985a03b0Sths 997e900a7b7SChristoph Hellwig int bdrv_enable_write_cache(BlockDriverState *bs) 998e900a7b7SChristoph Hellwig { 999e900a7b7SChristoph Hellwig return bs->enable_write_cache; 1000e900a7b7SChristoph Hellwig } 1001e900a7b7SChristoph Hellwig 100219cb3738Sbellard /* XXX: no longer used */ 1003b338082bSbellard void bdrv_set_change_cb(BlockDriverState *bs, 1004b338082bSbellard void (*change_cb)(void *opaque), void *opaque) 1005b338082bSbellard { 1006b338082bSbellard bs->change_cb = change_cb; 1007b338082bSbellard bs->change_opaque = opaque; 1008b338082bSbellard } 1009b338082bSbellard 1010ea2384d3Sbellard int bdrv_is_encrypted(BlockDriverState *bs) 1011ea2384d3Sbellard { 1012ea2384d3Sbellard if (bs->backing_hd && bs->backing_hd->encrypted) 1013ea2384d3Sbellard return 1; 1014ea2384d3Sbellard return bs->encrypted; 1015ea2384d3Sbellard } 1016ea2384d3Sbellard 1017c0f4ce77Saliguori int bdrv_key_required(BlockDriverState *bs) 1018c0f4ce77Saliguori { 1019c0f4ce77Saliguori BlockDriverState *backing_hd = bs->backing_hd; 1020c0f4ce77Saliguori 1021c0f4ce77Saliguori if (backing_hd && backing_hd->encrypted && !backing_hd->valid_key) 1022c0f4ce77Saliguori return 1; 1023c0f4ce77Saliguori return (bs->encrypted && !bs->valid_key); 1024c0f4ce77Saliguori } 1025c0f4ce77Saliguori 1026ea2384d3Sbellard int bdrv_set_key(BlockDriverState *bs, const char *key) 1027ea2384d3Sbellard { 1028ea2384d3Sbellard int ret; 1029ea2384d3Sbellard if (bs->backing_hd && bs->backing_hd->encrypted) { 1030ea2384d3Sbellard ret = bdrv_set_key(bs->backing_hd, key); 1031ea2384d3Sbellard if (ret < 0) 1032ea2384d3Sbellard return ret; 1033ea2384d3Sbellard if (!bs->encrypted) 1034ea2384d3Sbellard return 0; 1035ea2384d3Sbellard } 1036ea2384d3Sbellard if (!bs->encrypted || !bs->drv || !bs->drv->bdrv_set_key) 1037ea2384d3Sbellard return -1; 1038c0f4ce77Saliguori ret = bs->drv->bdrv_set_key(bs, key); 1039bb5fc20fSaliguori if (ret < 0) { 1040bb5fc20fSaliguori bs->valid_key = 0; 1041bb5fc20fSaliguori } else if (!bs->valid_key) { 1042bb5fc20fSaliguori bs->valid_key = 1; 1043bb5fc20fSaliguori /* call the change callback now, we skipped it on open */ 1044bb5fc20fSaliguori bs->media_changed = 1; 1045bb5fc20fSaliguori if (bs->change_cb) 1046bb5fc20fSaliguori bs->change_cb(bs->change_opaque); 1047bb5fc20fSaliguori } 1048c0f4ce77Saliguori return ret; 1049ea2384d3Sbellard } 1050ea2384d3Sbellard 1051ea2384d3Sbellard void bdrv_get_format(BlockDriverState *bs, char *buf, int buf_size) 1052ea2384d3Sbellard { 105319cb3738Sbellard if (!bs->drv) { 1054ea2384d3Sbellard buf[0] = '\0'; 1055ea2384d3Sbellard } else { 1056ea2384d3Sbellard pstrcpy(buf, buf_size, bs->drv->format_name); 1057ea2384d3Sbellard } 1058ea2384d3Sbellard } 1059ea2384d3Sbellard 1060ea2384d3Sbellard void bdrv_iterate_format(void (*it)(void *opaque, const char *name), 1061ea2384d3Sbellard void *opaque) 1062ea2384d3Sbellard { 1063ea2384d3Sbellard BlockDriver *drv; 1064ea2384d3Sbellard 1065ea2384d3Sbellard for (drv = first_drv; drv != NULL; drv = drv->next) { 1066ea2384d3Sbellard it(opaque, drv->format_name); 1067ea2384d3Sbellard } 1068ea2384d3Sbellard } 1069ea2384d3Sbellard 1070b338082bSbellard BlockDriverState *bdrv_find(const char *name) 1071b338082bSbellard { 1072b338082bSbellard BlockDriverState *bs; 1073b338082bSbellard 1074b338082bSbellard for (bs = bdrv_first; bs != NULL; bs = bs->next) { 1075b338082bSbellard if (!strcmp(name, bs->device_name)) 1076b338082bSbellard return bs; 1077b338082bSbellard } 1078b338082bSbellard return NULL; 1079b338082bSbellard } 1080b338082bSbellard 108151de9760Saliguori void bdrv_iterate(void (*it)(void *opaque, BlockDriverState *bs), void *opaque) 108281d0912dSbellard { 108381d0912dSbellard BlockDriverState *bs; 108481d0912dSbellard 108581d0912dSbellard for (bs = bdrv_first; bs != NULL; bs = bs->next) { 108651de9760Saliguori it(opaque, bs); 108781d0912dSbellard } 108881d0912dSbellard } 108981d0912dSbellard 1090ea2384d3Sbellard const char *bdrv_get_device_name(BlockDriverState *bs) 1091ea2384d3Sbellard { 1092ea2384d3Sbellard return bs->device_name; 1093ea2384d3Sbellard } 1094ea2384d3Sbellard 10957a6cba61Spbrook void bdrv_flush(BlockDriverState *bs) 10967a6cba61Spbrook { 1097081501daSaliguori if (!bs->drv) 1098081501daSaliguori return; 10997a6cba61Spbrook if (bs->drv->bdrv_flush) 11007a6cba61Spbrook bs->drv->bdrv_flush(bs); 11017a6cba61Spbrook if (bs->backing_hd) 11027a6cba61Spbrook bdrv_flush(bs->backing_hd); 11037a6cba61Spbrook } 11047a6cba61Spbrook 1105c6ca28d6Saliguori void bdrv_flush_all(void) 1106c6ca28d6Saliguori { 1107c6ca28d6Saliguori BlockDriverState *bs; 1108c6ca28d6Saliguori 1109c6ca28d6Saliguori for (bs = bdrv_first; bs != NULL; bs = bs->next) 1110c6ca28d6Saliguori if (bs->drv && !bdrv_is_read_only(bs) && 1111c6ca28d6Saliguori (!bdrv_is_removable(bs) || bdrv_is_inserted(bs))) 1112c6ca28d6Saliguori bdrv_flush(bs); 1113c6ca28d6Saliguori } 1114c6ca28d6Saliguori 1115f58c7b35Sths /* 1116f58c7b35Sths * Returns true iff the specified sector is present in the disk image. Drivers 1117f58c7b35Sths * not implementing the functionality are assumed to not support backing files, 1118f58c7b35Sths * hence all their sectors are reported as allocated. 1119f58c7b35Sths * 1120f58c7b35Sths * 'pnum' is set to the number of sectors (including and immediately following 1121f58c7b35Sths * the specified sector) that are known to be in the same 1122f58c7b35Sths * allocated/unallocated state. 1123f58c7b35Sths * 1124f58c7b35Sths * 'nb_sectors' is the max value 'pnum' should be set to. 1125f58c7b35Sths */ 1126f58c7b35Sths int bdrv_is_allocated(BlockDriverState *bs, int64_t sector_num, int nb_sectors, 1127f58c7b35Sths int *pnum) 1128f58c7b35Sths { 1129f58c7b35Sths int64_t n; 1130f58c7b35Sths if (!bs->drv->bdrv_is_allocated) { 1131f58c7b35Sths if (sector_num >= bs->total_sectors) { 1132f58c7b35Sths *pnum = 0; 1133f58c7b35Sths return 0; 1134f58c7b35Sths } 1135f58c7b35Sths n = bs->total_sectors - sector_num; 1136f58c7b35Sths *pnum = (n < nb_sectors) ? (n) : (nb_sectors); 1137f58c7b35Sths return 1; 1138f58c7b35Sths } 1139f58c7b35Sths return bs->drv->bdrv_is_allocated(bs, sector_num, nb_sectors, pnum); 1140f58c7b35Sths } 1141f58c7b35Sths 1142376253ecSaliguori void bdrv_info(Monitor *mon) 1143b338082bSbellard { 1144b338082bSbellard BlockDriverState *bs; 1145b338082bSbellard 1146b338082bSbellard for (bs = bdrv_first; bs != NULL; bs = bs->next) { 1147376253ecSaliguori monitor_printf(mon, "%s:", bs->device_name); 1148376253ecSaliguori monitor_printf(mon, " type="); 1149b338082bSbellard switch(bs->type) { 1150b338082bSbellard case BDRV_TYPE_HD: 1151376253ecSaliguori monitor_printf(mon, "hd"); 1152b338082bSbellard break; 1153b338082bSbellard case BDRV_TYPE_CDROM: 1154376253ecSaliguori monitor_printf(mon, "cdrom"); 1155b338082bSbellard break; 1156b338082bSbellard case BDRV_TYPE_FLOPPY: 1157376253ecSaliguori monitor_printf(mon, "floppy"); 1158b338082bSbellard break; 1159b338082bSbellard } 1160376253ecSaliguori monitor_printf(mon, " removable=%d", bs->removable); 1161b338082bSbellard if (bs->removable) { 1162376253ecSaliguori monitor_printf(mon, " locked=%d", bs->locked); 1163b338082bSbellard } 116419cb3738Sbellard if (bs->drv) { 1165376253ecSaliguori monitor_printf(mon, " file="); 1166376253ecSaliguori monitor_print_filename(mon, bs->filename); 1167fef30743Sths if (bs->backing_file[0] != '\0') { 1168376253ecSaliguori monitor_printf(mon, " backing_file="); 1169376253ecSaliguori monitor_print_filename(mon, bs->backing_file); 1170fef30743Sths } 1171376253ecSaliguori monitor_printf(mon, " ro=%d", bs->read_only); 1172376253ecSaliguori monitor_printf(mon, " drv=%s", bs->drv->format_name); 1173376253ecSaliguori monitor_printf(mon, " encrypted=%d", bdrv_is_encrypted(bs)); 1174b338082bSbellard } else { 1175376253ecSaliguori monitor_printf(mon, " [not inserted]"); 1176b338082bSbellard } 1177376253ecSaliguori monitor_printf(mon, "\n"); 1178b338082bSbellard } 1179b338082bSbellard } 1180a36e69ddSths 1181a36e69ddSths /* The "info blockstats" command. */ 1182376253ecSaliguori void bdrv_info_stats(Monitor *mon) 1183a36e69ddSths { 1184a36e69ddSths BlockDriverState *bs; 1185a36e69ddSths 1186a36e69ddSths for (bs = bdrv_first; bs != NULL; bs = bs->next) { 1187376253ecSaliguori monitor_printf(mon, "%s:" 1188a36e69ddSths " rd_bytes=%" PRIu64 1189a36e69ddSths " wr_bytes=%" PRIu64 1190a36e69ddSths " rd_operations=%" PRIu64 1191a36e69ddSths " wr_operations=%" PRIu64 1192ebf53fcdSaliguori "\n", 1193a36e69ddSths bs->device_name, 1194a36e69ddSths bs->rd_bytes, bs->wr_bytes, 1195a36e69ddSths bs->rd_ops, bs->wr_ops); 1196a36e69ddSths } 1197a36e69ddSths } 1198ea2384d3Sbellard 1199045df330Saliguori const char *bdrv_get_encrypted_filename(BlockDriverState *bs) 1200045df330Saliguori { 1201045df330Saliguori if (bs->backing_hd && bs->backing_hd->encrypted) 1202045df330Saliguori return bs->backing_file; 1203045df330Saliguori else if (bs->encrypted) 1204045df330Saliguori return bs->filename; 1205045df330Saliguori else 1206045df330Saliguori return NULL; 1207045df330Saliguori } 1208045df330Saliguori 120983f64091Sbellard void bdrv_get_backing_filename(BlockDriverState *bs, 121083f64091Sbellard char *filename, int filename_size) 121183f64091Sbellard { 121283f64091Sbellard if (!bs->backing_hd) { 121383f64091Sbellard pstrcpy(filename, filename_size, ""); 121483f64091Sbellard } else { 121583f64091Sbellard pstrcpy(filename, filename_size, bs->backing_file); 121683f64091Sbellard } 121783f64091Sbellard } 121883f64091Sbellard 1219faea38e7Sbellard int bdrv_write_compressed(BlockDriverState *bs, int64_t sector_num, 1220faea38e7Sbellard const uint8_t *buf, int nb_sectors) 1221faea38e7Sbellard { 1222faea38e7Sbellard BlockDriver *drv = bs->drv; 1223faea38e7Sbellard if (!drv) 122419cb3738Sbellard return -ENOMEDIUM; 1225faea38e7Sbellard if (!drv->bdrv_write_compressed) 1226faea38e7Sbellard return -ENOTSUP; 1227fbb7b4e0SKevin Wolf if (bdrv_check_request(bs, sector_num, nb_sectors)) 1228fbb7b4e0SKevin Wolf return -EIO; 12297cd1e32aSlirans@il.ibm.com 1230*c6d22830SJan Kiszka if (bs->dirty_bitmap) { 12317cd1e32aSlirans@il.ibm.com set_dirty_bitmap(bs, sector_num, nb_sectors, 1); 12327cd1e32aSlirans@il.ibm.com } 12337cd1e32aSlirans@il.ibm.com 1234faea38e7Sbellard return drv->bdrv_write_compressed(bs, sector_num, buf, nb_sectors); 1235faea38e7Sbellard } 1236faea38e7Sbellard 1237faea38e7Sbellard int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi) 1238faea38e7Sbellard { 1239faea38e7Sbellard BlockDriver *drv = bs->drv; 1240faea38e7Sbellard if (!drv) 124119cb3738Sbellard return -ENOMEDIUM; 1242faea38e7Sbellard if (!drv->bdrv_get_info) 1243faea38e7Sbellard return -ENOTSUP; 1244faea38e7Sbellard memset(bdi, 0, sizeof(*bdi)); 1245faea38e7Sbellard return drv->bdrv_get_info(bs, bdi); 1246faea38e7Sbellard } 1247faea38e7Sbellard 124845566e9cSChristoph Hellwig int bdrv_save_vmstate(BlockDriverState *bs, const uint8_t *buf, 124945566e9cSChristoph Hellwig int64_t pos, int size) 1250178e08a5Saliguori { 1251178e08a5Saliguori BlockDriver *drv = bs->drv; 1252178e08a5Saliguori if (!drv) 1253178e08a5Saliguori return -ENOMEDIUM; 125445566e9cSChristoph Hellwig if (!drv->bdrv_save_vmstate) 1255178e08a5Saliguori return -ENOTSUP; 125645566e9cSChristoph Hellwig return drv->bdrv_save_vmstate(bs, buf, pos, size); 1257178e08a5Saliguori } 1258178e08a5Saliguori 125945566e9cSChristoph Hellwig int bdrv_load_vmstate(BlockDriverState *bs, uint8_t *buf, 126045566e9cSChristoph Hellwig int64_t pos, int size) 1261178e08a5Saliguori { 1262178e08a5Saliguori BlockDriver *drv = bs->drv; 1263178e08a5Saliguori if (!drv) 1264178e08a5Saliguori return -ENOMEDIUM; 126545566e9cSChristoph Hellwig if (!drv->bdrv_load_vmstate) 1266178e08a5Saliguori return -ENOTSUP; 126745566e9cSChristoph Hellwig return drv->bdrv_load_vmstate(bs, buf, pos, size); 1268178e08a5Saliguori } 1269178e08a5Saliguori 1270faea38e7Sbellard /**************************************************************/ 1271faea38e7Sbellard /* handling of snapshots */ 1272faea38e7Sbellard 1273faea38e7Sbellard int bdrv_snapshot_create(BlockDriverState *bs, 1274faea38e7Sbellard QEMUSnapshotInfo *sn_info) 1275faea38e7Sbellard { 1276faea38e7Sbellard BlockDriver *drv = bs->drv; 1277faea38e7Sbellard if (!drv) 127819cb3738Sbellard return -ENOMEDIUM; 1279faea38e7Sbellard if (!drv->bdrv_snapshot_create) 1280faea38e7Sbellard return -ENOTSUP; 1281faea38e7Sbellard return drv->bdrv_snapshot_create(bs, sn_info); 1282faea38e7Sbellard } 1283faea38e7Sbellard 1284faea38e7Sbellard int bdrv_snapshot_goto(BlockDriverState *bs, 1285faea38e7Sbellard const char *snapshot_id) 1286faea38e7Sbellard { 1287faea38e7Sbellard BlockDriver *drv = bs->drv; 1288faea38e7Sbellard if (!drv) 128919cb3738Sbellard return -ENOMEDIUM; 1290faea38e7Sbellard if (!drv->bdrv_snapshot_goto) 1291faea38e7Sbellard return -ENOTSUP; 1292faea38e7Sbellard return drv->bdrv_snapshot_goto(bs, snapshot_id); 1293faea38e7Sbellard } 1294faea38e7Sbellard 1295faea38e7Sbellard int bdrv_snapshot_delete(BlockDriverState *bs, const char *snapshot_id) 1296faea38e7Sbellard { 1297faea38e7Sbellard BlockDriver *drv = bs->drv; 1298faea38e7Sbellard if (!drv) 129919cb3738Sbellard return -ENOMEDIUM; 1300faea38e7Sbellard if (!drv->bdrv_snapshot_delete) 1301faea38e7Sbellard return -ENOTSUP; 1302faea38e7Sbellard return drv->bdrv_snapshot_delete(bs, snapshot_id); 1303faea38e7Sbellard } 1304faea38e7Sbellard 1305faea38e7Sbellard int bdrv_snapshot_list(BlockDriverState *bs, 1306faea38e7Sbellard QEMUSnapshotInfo **psn_info) 1307faea38e7Sbellard { 1308faea38e7Sbellard BlockDriver *drv = bs->drv; 1309faea38e7Sbellard if (!drv) 131019cb3738Sbellard return -ENOMEDIUM; 1311faea38e7Sbellard if (!drv->bdrv_snapshot_list) 1312faea38e7Sbellard return -ENOTSUP; 1313faea38e7Sbellard return drv->bdrv_snapshot_list(bs, psn_info); 1314faea38e7Sbellard } 1315faea38e7Sbellard 1316faea38e7Sbellard #define NB_SUFFIXES 4 1317faea38e7Sbellard 1318faea38e7Sbellard char *get_human_readable_size(char *buf, int buf_size, int64_t size) 1319faea38e7Sbellard { 1320faea38e7Sbellard static const char suffixes[NB_SUFFIXES] = "KMGT"; 1321faea38e7Sbellard int64_t base; 1322faea38e7Sbellard int i; 1323faea38e7Sbellard 1324faea38e7Sbellard if (size <= 999) { 1325faea38e7Sbellard snprintf(buf, buf_size, "%" PRId64, size); 1326faea38e7Sbellard } else { 1327faea38e7Sbellard base = 1024; 1328faea38e7Sbellard for(i = 0; i < NB_SUFFIXES; i++) { 1329faea38e7Sbellard if (size < (10 * base)) { 1330faea38e7Sbellard snprintf(buf, buf_size, "%0.1f%c", 1331faea38e7Sbellard (double)size / base, 1332faea38e7Sbellard suffixes[i]); 1333faea38e7Sbellard break; 1334faea38e7Sbellard } else if (size < (1000 * base) || i == (NB_SUFFIXES - 1)) { 1335faea38e7Sbellard snprintf(buf, buf_size, "%" PRId64 "%c", 1336faea38e7Sbellard ((size + (base >> 1)) / base), 1337faea38e7Sbellard suffixes[i]); 1338faea38e7Sbellard break; 1339faea38e7Sbellard } 1340faea38e7Sbellard base = base * 1024; 1341faea38e7Sbellard } 1342faea38e7Sbellard } 1343faea38e7Sbellard return buf; 1344faea38e7Sbellard } 1345faea38e7Sbellard 1346faea38e7Sbellard char *bdrv_snapshot_dump(char *buf, int buf_size, QEMUSnapshotInfo *sn) 1347faea38e7Sbellard { 1348faea38e7Sbellard char buf1[128], date_buf[128], clock_buf[128]; 13493b9f94e1Sbellard #ifdef _WIN32 13503b9f94e1Sbellard struct tm *ptm; 13513b9f94e1Sbellard #else 1352faea38e7Sbellard struct tm tm; 13533b9f94e1Sbellard #endif 1354faea38e7Sbellard time_t ti; 1355faea38e7Sbellard int64_t secs; 1356faea38e7Sbellard 1357faea38e7Sbellard if (!sn) { 1358faea38e7Sbellard snprintf(buf, buf_size, 1359faea38e7Sbellard "%-10s%-20s%7s%20s%15s", 1360faea38e7Sbellard "ID", "TAG", "VM SIZE", "DATE", "VM CLOCK"); 1361faea38e7Sbellard } else { 1362faea38e7Sbellard ti = sn->date_sec; 13633b9f94e1Sbellard #ifdef _WIN32 13643b9f94e1Sbellard ptm = localtime(&ti); 13653b9f94e1Sbellard strftime(date_buf, sizeof(date_buf), 13663b9f94e1Sbellard "%Y-%m-%d %H:%M:%S", ptm); 13673b9f94e1Sbellard #else 1368faea38e7Sbellard localtime_r(&ti, &tm); 1369faea38e7Sbellard strftime(date_buf, sizeof(date_buf), 1370faea38e7Sbellard "%Y-%m-%d %H:%M:%S", &tm); 13713b9f94e1Sbellard #endif 1372faea38e7Sbellard secs = sn->vm_clock_nsec / 1000000000; 1373faea38e7Sbellard snprintf(clock_buf, sizeof(clock_buf), 1374faea38e7Sbellard "%02d:%02d:%02d.%03d", 1375faea38e7Sbellard (int)(secs / 3600), 1376faea38e7Sbellard (int)((secs / 60) % 60), 1377faea38e7Sbellard (int)(secs % 60), 1378faea38e7Sbellard (int)((sn->vm_clock_nsec / 1000000) % 1000)); 1379faea38e7Sbellard snprintf(buf, buf_size, 1380faea38e7Sbellard "%-10s%-20s%7s%20s%15s", 1381faea38e7Sbellard sn->id_str, sn->name, 1382faea38e7Sbellard get_human_readable_size(buf1, sizeof(buf1), sn->vm_state_size), 1383faea38e7Sbellard date_buf, 1384faea38e7Sbellard clock_buf); 1385faea38e7Sbellard } 1386faea38e7Sbellard return buf; 1387faea38e7Sbellard } 1388faea38e7Sbellard 138983f64091Sbellard 1390ea2384d3Sbellard /**************************************************************/ 139183f64091Sbellard /* async I/Os */ 1392ea2384d3Sbellard 13933b69e4b9Saliguori BlockDriverAIOCB *bdrv_aio_readv(BlockDriverState *bs, int64_t sector_num, 1394f141eafeSaliguori QEMUIOVector *qiov, int nb_sectors, 139583f64091Sbellard BlockDriverCompletionFunc *cb, void *opaque) 1396ea2384d3Sbellard { 139783f64091Sbellard BlockDriver *drv = bs->drv; 1398a36e69ddSths BlockDriverAIOCB *ret; 1399ea2384d3Sbellard 140019cb3738Sbellard if (!drv) 1401ce1a14dcSpbrook return NULL; 140271d0770cSaliguori if (bdrv_check_request(bs, sector_num, nb_sectors)) 140371d0770cSaliguori return NULL; 140483f64091Sbellard 1405f141eafeSaliguori ret = drv->bdrv_aio_readv(bs, sector_num, qiov, nb_sectors, 1406f141eafeSaliguori cb, opaque); 1407a36e69ddSths 1408a36e69ddSths if (ret) { 1409a36e69ddSths /* Update stats even though technically transfer has not happened. */ 14106ea44308SJan Kiszka bs->rd_bytes += (unsigned) nb_sectors * BDRV_SECTOR_SIZE; 1411a36e69ddSths bs->rd_ops ++; 1412a36e69ddSths } 1413a36e69ddSths 1414a36e69ddSths return ret; 141583f64091Sbellard } 141683f64091Sbellard 1417f141eafeSaliguori BlockDriverAIOCB *bdrv_aio_writev(BlockDriverState *bs, int64_t sector_num, 1418f141eafeSaliguori QEMUIOVector *qiov, int nb_sectors, 141983f64091Sbellard BlockDriverCompletionFunc *cb, void *opaque) 14207674e7bfSbellard { 142183f64091Sbellard BlockDriver *drv = bs->drv; 1422a36e69ddSths BlockDriverAIOCB *ret; 142383f64091Sbellard 142419cb3738Sbellard if (!drv) 1425ce1a14dcSpbrook return NULL; 142683f64091Sbellard if (bs->read_only) 1427ce1a14dcSpbrook return NULL; 142871d0770cSaliguori if (bdrv_check_request(bs, sector_num, nb_sectors)) 142971d0770cSaliguori return NULL; 143083f64091Sbellard 1431*c6d22830SJan Kiszka if (bs->dirty_bitmap) { 14327cd1e32aSlirans@il.ibm.com set_dirty_bitmap(bs, sector_num, nb_sectors, 1); 14337cd1e32aSlirans@il.ibm.com } 14347cd1e32aSlirans@il.ibm.com 1435f141eafeSaliguori ret = drv->bdrv_aio_writev(bs, sector_num, qiov, nb_sectors, 1436f141eafeSaliguori cb, opaque); 1437a36e69ddSths 1438a36e69ddSths if (ret) { 1439a36e69ddSths /* Update stats even though technically transfer has not happened. */ 14406ea44308SJan Kiszka bs->wr_bytes += (unsigned) nb_sectors * BDRV_SECTOR_SIZE; 1441a36e69ddSths bs->wr_ops ++; 1442a36e69ddSths } 1443a36e69ddSths 1444a36e69ddSths return ret; 144583f64091Sbellard } 144683f64091Sbellard 144740b4f539SKevin Wolf 144840b4f539SKevin Wolf typedef struct MultiwriteCB { 144940b4f539SKevin Wolf int error; 145040b4f539SKevin Wolf int num_requests; 145140b4f539SKevin Wolf int num_callbacks; 145240b4f539SKevin Wolf struct { 145340b4f539SKevin Wolf BlockDriverCompletionFunc *cb; 145440b4f539SKevin Wolf void *opaque; 145540b4f539SKevin Wolf QEMUIOVector *free_qiov; 145640b4f539SKevin Wolf void *free_buf; 145740b4f539SKevin Wolf } callbacks[]; 145840b4f539SKevin Wolf } MultiwriteCB; 145940b4f539SKevin Wolf 146040b4f539SKevin Wolf static void multiwrite_user_cb(MultiwriteCB *mcb) 146140b4f539SKevin Wolf { 146240b4f539SKevin Wolf int i; 146340b4f539SKevin Wolf 146440b4f539SKevin Wolf for (i = 0; i < mcb->num_callbacks; i++) { 146540b4f539SKevin Wolf mcb->callbacks[i].cb(mcb->callbacks[i].opaque, mcb->error); 146640b4f539SKevin Wolf qemu_free(mcb->callbacks[i].free_qiov); 146740b4f539SKevin Wolf qemu_free(mcb->callbacks[i].free_buf); 146840b4f539SKevin Wolf } 146940b4f539SKevin Wolf } 147040b4f539SKevin Wolf 147140b4f539SKevin Wolf static void multiwrite_cb(void *opaque, int ret) 147240b4f539SKevin Wolf { 147340b4f539SKevin Wolf MultiwriteCB *mcb = opaque; 147440b4f539SKevin Wolf 147540b4f539SKevin Wolf if (ret < 0) { 147640b4f539SKevin Wolf mcb->error = ret; 147740b4f539SKevin Wolf multiwrite_user_cb(mcb); 147840b4f539SKevin Wolf } 147940b4f539SKevin Wolf 148040b4f539SKevin Wolf mcb->num_requests--; 148140b4f539SKevin Wolf if (mcb->num_requests == 0) { 148240b4f539SKevin Wolf if (mcb->error == 0) { 148340b4f539SKevin Wolf multiwrite_user_cb(mcb); 148440b4f539SKevin Wolf } 148540b4f539SKevin Wolf qemu_free(mcb); 148640b4f539SKevin Wolf } 148740b4f539SKevin Wolf } 148840b4f539SKevin Wolf 148940b4f539SKevin Wolf static int multiwrite_req_compare(const void *a, const void *b) 149040b4f539SKevin Wolf { 149140b4f539SKevin Wolf return (((BlockRequest*) a)->sector - ((BlockRequest*) b)->sector); 149240b4f539SKevin Wolf } 149340b4f539SKevin Wolf 149440b4f539SKevin Wolf /* 149540b4f539SKevin Wolf * Takes a bunch of requests and tries to merge them. Returns the number of 149640b4f539SKevin Wolf * requests that remain after merging. 149740b4f539SKevin Wolf */ 149840b4f539SKevin Wolf static int multiwrite_merge(BlockDriverState *bs, BlockRequest *reqs, 149940b4f539SKevin Wolf int num_reqs, MultiwriteCB *mcb) 150040b4f539SKevin Wolf { 150140b4f539SKevin Wolf int i, outidx; 150240b4f539SKevin Wolf 150340b4f539SKevin Wolf // Sort requests by start sector 150440b4f539SKevin Wolf qsort(reqs, num_reqs, sizeof(*reqs), &multiwrite_req_compare); 150540b4f539SKevin Wolf 150640b4f539SKevin Wolf // Check if adjacent requests touch the same clusters. If so, combine them, 150740b4f539SKevin Wolf // filling up gaps with zero sectors. 150840b4f539SKevin Wolf outidx = 0; 150940b4f539SKevin Wolf for (i = 1; i < num_reqs; i++) { 151040b4f539SKevin Wolf int merge = 0; 151140b4f539SKevin Wolf int64_t oldreq_last = reqs[outidx].sector + reqs[outidx].nb_sectors; 151240b4f539SKevin Wolf 151340b4f539SKevin Wolf // This handles the cases that are valid for all block drivers, namely 151440b4f539SKevin Wolf // exactly sequential writes and overlapping writes. 151540b4f539SKevin Wolf if (reqs[i].sector <= oldreq_last) { 151640b4f539SKevin Wolf merge = 1; 151740b4f539SKevin Wolf } 151840b4f539SKevin Wolf 151940b4f539SKevin Wolf // The block driver may decide that it makes sense to combine requests 152040b4f539SKevin Wolf // even if there is a gap of some sectors between them. In this case, 152140b4f539SKevin Wolf // the gap is filled with zeros (therefore only applicable for yet 152240b4f539SKevin Wolf // unused space in format like qcow2). 152340b4f539SKevin Wolf if (!merge && bs->drv->bdrv_merge_requests) { 152440b4f539SKevin Wolf merge = bs->drv->bdrv_merge_requests(bs, &reqs[outidx], &reqs[i]); 152540b4f539SKevin Wolf } 152640b4f539SKevin Wolf 152740b4f539SKevin Wolf if (merge) { 152840b4f539SKevin Wolf size_t size; 152940b4f539SKevin Wolf QEMUIOVector *qiov = qemu_mallocz(sizeof(*qiov)); 153040b4f539SKevin Wolf qemu_iovec_init(qiov, 153140b4f539SKevin Wolf reqs[outidx].qiov->niov + reqs[i].qiov->niov + 1); 153240b4f539SKevin Wolf 153340b4f539SKevin Wolf // Add the first request to the merged one. If the requests are 153440b4f539SKevin Wolf // overlapping, drop the last sectors of the first request. 153540b4f539SKevin Wolf size = (reqs[i].sector - reqs[outidx].sector) << 9; 153640b4f539SKevin Wolf qemu_iovec_concat(qiov, reqs[outidx].qiov, size); 153740b4f539SKevin Wolf 153840b4f539SKevin Wolf // We might need to add some zeros between the two requests 153940b4f539SKevin Wolf if (reqs[i].sector > oldreq_last) { 154040b4f539SKevin Wolf size_t zero_bytes = (reqs[i].sector - oldreq_last) << 9; 154140b4f539SKevin Wolf uint8_t *buf = qemu_blockalign(bs, zero_bytes); 154240b4f539SKevin Wolf memset(buf, 0, zero_bytes); 154340b4f539SKevin Wolf qemu_iovec_add(qiov, buf, zero_bytes); 154440b4f539SKevin Wolf mcb->callbacks[i].free_buf = buf; 154540b4f539SKevin Wolf } 154640b4f539SKevin Wolf 154740b4f539SKevin Wolf // Add the second request 154840b4f539SKevin Wolf qemu_iovec_concat(qiov, reqs[i].qiov, reqs[i].qiov->size); 154940b4f539SKevin Wolf 155040b4f539SKevin Wolf reqs[outidx].nb_sectors += reqs[i].nb_sectors; 155140b4f539SKevin Wolf reqs[outidx].qiov = qiov; 155240b4f539SKevin Wolf 155340b4f539SKevin Wolf mcb->callbacks[i].free_qiov = reqs[outidx].qiov; 155440b4f539SKevin Wolf } else { 155540b4f539SKevin Wolf outidx++; 155640b4f539SKevin Wolf reqs[outidx].sector = reqs[i].sector; 155740b4f539SKevin Wolf reqs[outidx].nb_sectors = reqs[i].nb_sectors; 155840b4f539SKevin Wolf reqs[outidx].qiov = reqs[i].qiov; 155940b4f539SKevin Wolf } 156040b4f539SKevin Wolf } 156140b4f539SKevin Wolf 156240b4f539SKevin Wolf return outidx + 1; 156340b4f539SKevin Wolf } 156440b4f539SKevin Wolf 156540b4f539SKevin Wolf /* 156640b4f539SKevin Wolf * Submit multiple AIO write requests at once. 156740b4f539SKevin Wolf * 156840b4f539SKevin Wolf * On success, the function returns 0 and all requests in the reqs array have 156940b4f539SKevin Wolf * been submitted. In error case this function returns -1, and any of the 157040b4f539SKevin Wolf * requests may or may not be submitted yet. In particular, this means that the 157140b4f539SKevin Wolf * callback will be called for some of the requests, for others it won't. The 157240b4f539SKevin Wolf * caller must check the error field of the BlockRequest to wait for the right 157340b4f539SKevin Wolf * callbacks (if error != 0, no callback will be called). 157440b4f539SKevin Wolf * 157540b4f539SKevin Wolf * The implementation may modify the contents of the reqs array, e.g. to merge 157640b4f539SKevin Wolf * requests. However, the fields opaque and error are left unmodified as they 157740b4f539SKevin Wolf * are used to signal failure for a single request to the caller. 157840b4f539SKevin Wolf */ 157940b4f539SKevin Wolf int bdrv_aio_multiwrite(BlockDriverState *bs, BlockRequest *reqs, int num_reqs) 158040b4f539SKevin Wolf { 158140b4f539SKevin Wolf BlockDriverAIOCB *acb; 158240b4f539SKevin Wolf MultiwriteCB *mcb; 158340b4f539SKevin Wolf int i; 158440b4f539SKevin Wolf 158540b4f539SKevin Wolf if (num_reqs == 0) { 158640b4f539SKevin Wolf return 0; 158740b4f539SKevin Wolf } 158840b4f539SKevin Wolf 158940b4f539SKevin Wolf // Create MultiwriteCB structure 159040b4f539SKevin Wolf mcb = qemu_mallocz(sizeof(*mcb) + num_reqs * sizeof(*mcb->callbacks)); 159140b4f539SKevin Wolf mcb->num_requests = 0; 159240b4f539SKevin Wolf mcb->num_callbacks = num_reqs; 159340b4f539SKevin Wolf 159440b4f539SKevin Wolf for (i = 0; i < num_reqs; i++) { 159540b4f539SKevin Wolf mcb->callbacks[i].cb = reqs[i].cb; 159640b4f539SKevin Wolf mcb->callbacks[i].opaque = reqs[i].opaque; 159740b4f539SKevin Wolf } 159840b4f539SKevin Wolf 159940b4f539SKevin Wolf // Check for mergable requests 160040b4f539SKevin Wolf num_reqs = multiwrite_merge(bs, reqs, num_reqs, mcb); 160140b4f539SKevin Wolf 160240b4f539SKevin Wolf // Run the aio requests 160340b4f539SKevin Wolf for (i = 0; i < num_reqs; i++) { 160440b4f539SKevin Wolf acb = bdrv_aio_writev(bs, reqs[i].sector, reqs[i].qiov, 160540b4f539SKevin Wolf reqs[i].nb_sectors, multiwrite_cb, mcb); 160640b4f539SKevin Wolf 160740b4f539SKevin Wolf if (acb == NULL) { 160840b4f539SKevin Wolf // We can only fail the whole thing if no request has been 160940b4f539SKevin Wolf // submitted yet. Otherwise we'll wait for the submitted AIOs to 161040b4f539SKevin Wolf // complete and report the error in the callback. 161140b4f539SKevin Wolf if (mcb->num_requests == 0) { 161240b4f539SKevin Wolf reqs[i].error = EIO; 161340b4f539SKevin Wolf goto fail; 161440b4f539SKevin Wolf } else { 161540b4f539SKevin Wolf mcb->error = EIO; 161640b4f539SKevin Wolf break; 161740b4f539SKevin Wolf } 161840b4f539SKevin Wolf } else { 161940b4f539SKevin Wolf mcb->num_requests++; 162040b4f539SKevin Wolf } 162140b4f539SKevin Wolf } 162240b4f539SKevin Wolf 162340b4f539SKevin Wolf return 0; 162440b4f539SKevin Wolf 162540b4f539SKevin Wolf fail: 162640b4f539SKevin Wolf free(mcb); 162740b4f539SKevin Wolf return -1; 162840b4f539SKevin Wolf } 162940b4f539SKevin Wolf 1630b2e12bc6SChristoph Hellwig BlockDriverAIOCB *bdrv_aio_flush(BlockDriverState *bs, 1631b2e12bc6SChristoph Hellwig BlockDriverCompletionFunc *cb, void *opaque) 1632b2e12bc6SChristoph Hellwig { 1633b2e12bc6SChristoph Hellwig BlockDriver *drv = bs->drv; 1634b2e12bc6SChristoph Hellwig 1635b2e12bc6SChristoph Hellwig if (!drv) 1636b2e12bc6SChristoph Hellwig return NULL; 1637b2e12bc6SChristoph Hellwig 1638b2e12bc6SChristoph Hellwig /* 1639b2e12bc6SChristoph Hellwig * Note that unlike bdrv_flush the driver is reponsible for flushing a 1640b2e12bc6SChristoph Hellwig * backing image if it exists. 1641b2e12bc6SChristoph Hellwig */ 1642b2e12bc6SChristoph Hellwig return drv->bdrv_aio_flush(bs, cb, opaque); 1643b2e12bc6SChristoph Hellwig } 1644b2e12bc6SChristoph Hellwig 164583f64091Sbellard void bdrv_aio_cancel(BlockDriverAIOCB *acb) 164683f64091Sbellard { 16476bbff9a0Saliguori acb->pool->cancel(acb); 164883f64091Sbellard } 164983f64091Sbellard 165083f64091Sbellard 165183f64091Sbellard /**************************************************************/ 165283f64091Sbellard /* async block device emulation */ 165383f64091Sbellard 1654c16b5a2cSChristoph Hellwig typedef struct BlockDriverAIOCBSync { 1655c16b5a2cSChristoph Hellwig BlockDriverAIOCB common; 1656c16b5a2cSChristoph Hellwig QEMUBH *bh; 1657c16b5a2cSChristoph Hellwig int ret; 1658c16b5a2cSChristoph Hellwig /* vector translation state */ 1659c16b5a2cSChristoph Hellwig QEMUIOVector *qiov; 1660c16b5a2cSChristoph Hellwig uint8_t *bounce; 1661c16b5a2cSChristoph Hellwig int is_write; 1662c16b5a2cSChristoph Hellwig } BlockDriverAIOCBSync; 1663c16b5a2cSChristoph Hellwig 1664c16b5a2cSChristoph Hellwig static void bdrv_aio_cancel_em(BlockDriverAIOCB *blockacb) 1665c16b5a2cSChristoph Hellwig { 1666c16b5a2cSChristoph Hellwig BlockDriverAIOCBSync *acb = (BlockDriverAIOCBSync *)blockacb; 16676a7ad299SDor Laor qemu_bh_delete(acb->bh); 166836afc451SAvi Kivity acb->bh = NULL; 1669c16b5a2cSChristoph Hellwig qemu_aio_release(acb); 1670c16b5a2cSChristoph Hellwig } 1671c16b5a2cSChristoph Hellwig 1672c16b5a2cSChristoph Hellwig static AIOPool bdrv_em_aio_pool = { 1673c16b5a2cSChristoph Hellwig .aiocb_size = sizeof(BlockDriverAIOCBSync), 1674c16b5a2cSChristoph Hellwig .cancel = bdrv_aio_cancel_em, 1675c16b5a2cSChristoph Hellwig }; 1676c16b5a2cSChristoph Hellwig 167783f64091Sbellard static void bdrv_aio_bh_cb(void *opaque) 1678beac80cdSbellard { 1679ce1a14dcSpbrook BlockDriverAIOCBSync *acb = opaque; 1680f141eafeSaliguori 1681f141eafeSaliguori if (!acb->is_write) 1682f141eafeSaliguori qemu_iovec_from_buffer(acb->qiov, acb->bounce, acb->qiov->size); 1683ceb42de8Saliguori qemu_vfree(acb->bounce); 1684ce1a14dcSpbrook acb->common.cb(acb->common.opaque, acb->ret); 16856a7ad299SDor Laor qemu_bh_delete(acb->bh); 168636afc451SAvi Kivity acb->bh = NULL; 1687ce1a14dcSpbrook qemu_aio_release(acb); 1688beac80cdSbellard } 1689beac80cdSbellard 1690f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_rw_vector(BlockDriverState *bs, 1691f141eafeSaliguori int64_t sector_num, 1692f141eafeSaliguori QEMUIOVector *qiov, 1693f141eafeSaliguori int nb_sectors, 1694f141eafeSaliguori BlockDriverCompletionFunc *cb, 1695f141eafeSaliguori void *opaque, 1696f141eafeSaliguori int is_write) 1697f141eafeSaliguori 1698ea2384d3Sbellard { 1699ce1a14dcSpbrook BlockDriverAIOCBSync *acb; 170083f64091Sbellard 1701c16b5a2cSChristoph Hellwig acb = qemu_aio_get(&bdrv_em_aio_pool, bs, cb, opaque); 1702f141eafeSaliguori acb->is_write = is_write; 1703f141eafeSaliguori acb->qiov = qiov; 1704e268ca52Saliguori acb->bounce = qemu_blockalign(bs, qiov->size); 1705f141eafeSaliguori 1706ce1a14dcSpbrook if (!acb->bh) 1707ce1a14dcSpbrook acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb); 1708f141eafeSaliguori 1709f141eafeSaliguori if (is_write) { 1710f141eafeSaliguori qemu_iovec_to_buffer(acb->qiov, acb->bounce); 1711f141eafeSaliguori acb->ret = bdrv_write(bs, sector_num, acb->bounce, nb_sectors); 1712f141eafeSaliguori } else { 1713f141eafeSaliguori acb->ret = bdrv_read(bs, sector_num, acb->bounce, nb_sectors); 1714f141eafeSaliguori } 1715f141eafeSaliguori 1716ce1a14dcSpbrook qemu_bh_schedule(acb->bh); 1717f141eafeSaliguori 1718ce1a14dcSpbrook return &acb->common; 17197a6cba61Spbrook } 17207a6cba61Spbrook 1721f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_readv_em(BlockDriverState *bs, 1722f141eafeSaliguori int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, 1723ce1a14dcSpbrook BlockDriverCompletionFunc *cb, void *opaque) 172483f64091Sbellard { 1725f141eafeSaliguori return bdrv_aio_rw_vector(bs, sector_num, qiov, nb_sectors, cb, opaque, 0); 172683f64091Sbellard } 172783f64091Sbellard 1728f141eafeSaliguori static BlockDriverAIOCB *bdrv_aio_writev_em(BlockDriverState *bs, 1729f141eafeSaliguori int64_t sector_num, QEMUIOVector *qiov, int nb_sectors, 1730f141eafeSaliguori BlockDriverCompletionFunc *cb, void *opaque) 1731f141eafeSaliguori { 1732f141eafeSaliguori return bdrv_aio_rw_vector(bs, sector_num, qiov, nb_sectors, cb, opaque, 1); 1733f141eafeSaliguori } 1734f141eafeSaliguori 1735b2e12bc6SChristoph Hellwig static BlockDriverAIOCB *bdrv_aio_flush_em(BlockDriverState *bs, 1736b2e12bc6SChristoph Hellwig BlockDriverCompletionFunc *cb, void *opaque) 1737b2e12bc6SChristoph Hellwig { 1738b2e12bc6SChristoph Hellwig BlockDriverAIOCBSync *acb; 1739b2e12bc6SChristoph Hellwig 1740b2e12bc6SChristoph Hellwig acb = qemu_aio_get(&bdrv_em_aio_pool, bs, cb, opaque); 1741b2e12bc6SChristoph Hellwig acb->is_write = 1; /* don't bounce in the completion hadler */ 1742b2e12bc6SChristoph Hellwig acb->qiov = NULL; 1743b2e12bc6SChristoph Hellwig acb->bounce = NULL; 1744b2e12bc6SChristoph Hellwig acb->ret = 0; 1745b2e12bc6SChristoph Hellwig 1746b2e12bc6SChristoph Hellwig if (!acb->bh) 1747b2e12bc6SChristoph Hellwig acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb); 1748b2e12bc6SChristoph Hellwig 1749b2e12bc6SChristoph Hellwig bdrv_flush(bs); 1750b2e12bc6SChristoph Hellwig qemu_bh_schedule(acb->bh); 1751b2e12bc6SChristoph Hellwig return &acb->common; 1752b2e12bc6SChristoph Hellwig } 1753b2e12bc6SChristoph Hellwig 175483f64091Sbellard /**************************************************************/ 175583f64091Sbellard /* sync block device emulation */ 175683f64091Sbellard 175783f64091Sbellard static void bdrv_rw_em_cb(void *opaque, int ret) 175883f64091Sbellard { 175983f64091Sbellard *(int *)opaque = ret; 176083f64091Sbellard } 176183f64091Sbellard 176283f64091Sbellard #define NOT_DONE 0x7fffffff 176383f64091Sbellard 176483f64091Sbellard static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num, 176583f64091Sbellard uint8_t *buf, int nb_sectors) 176683f64091Sbellard { 1767ce1a14dcSpbrook int async_ret; 1768ce1a14dcSpbrook BlockDriverAIOCB *acb; 1769f141eafeSaliguori struct iovec iov; 1770f141eafeSaliguori QEMUIOVector qiov; 177183f64091Sbellard 177265d6b3d8SKevin Wolf async_context_push(); 177365d6b3d8SKevin Wolf 177483f64091Sbellard async_ret = NOT_DONE; 17753f4cb3d3Sblueswir1 iov.iov_base = (void *)buf; 1776f141eafeSaliguori iov.iov_len = nb_sectors * 512; 1777f141eafeSaliguori qemu_iovec_init_external(&qiov, &iov, 1); 1778f141eafeSaliguori acb = bdrv_aio_readv(bs, sector_num, &qiov, nb_sectors, 177983f64091Sbellard bdrv_rw_em_cb, &async_ret); 178065d6b3d8SKevin Wolf if (acb == NULL) { 178165d6b3d8SKevin Wolf async_ret = -1; 178265d6b3d8SKevin Wolf goto fail; 178365d6b3d8SKevin Wolf } 1784baf35cb9Saliguori 178583f64091Sbellard while (async_ret == NOT_DONE) { 178683f64091Sbellard qemu_aio_wait(); 178783f64091Sbellard } 1788baf35cb9Saliguori 178965d6b3d8SKevin Wolf 179065d6b3d8SKevin Wolf fail: 179165d6b3d8SKevin Wolf async_context_pop(); 179283f64091Sbellard return async_ret; 179383f64091Sbellard } 179483f64091Sbellard 179583f64091Sbellard static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num, 179683f64091Sbellard const uint8_t *buf, int nb_sectors) 179783f64091Sbellard { 1798ce1a14dcSpbrook int async_ret; 1799ce1a14dcSpbrook BlockDriverAIOCB *acb; 1800f141eafeSaliguori struct iovec iov; 1801f141eafeSaliguori QEMUIOVector qiov; 180283f64091Sbellard 180365d6b3d8SKevin Wolf async_context_push(); 180465d6b3d8SKevin Wolf 180583f64091Sbellard async_ret = NOT_DONE; 1806f141eafeSaliguori iov.iov_base = (void *)buf; 1807f141eafeSaliguori iov.iov_len = nb_sectors * 512; 1808f141eafeSaliguori qemu_iovec_init_external(&qiov, &iov, 1); 1809f141eafeSaliguori acb = bdrv_aio_writev(bs, sector_num, &qiov, nb_sectors, 181083f64091Sbellard bdrv_rw_em_cb, &async_ret); 181165d6b3d8SKevin Wolf if (acb == NULL) { 181265d6b3d8SKevin Wolf async_ret = -1; 181365d6b3d8SKevin Wolf goto fail; 181465d6b3d8SKevin Wolf } 181583f64091Sbellard while (async_ret == NOT_DONE) { 181683f64091Sbellard qemu_aio_wait(); 181783f64091Sbellard } 181865d6b3d8SKevin Wolf 181965d6b3d8SKevin Wolf fail: 182065d6b3d8SKevin Wolf async_context_pop(); 182183f64091Sbellard return async_ret; 182283f64091Sbellard } 1823ea2384d3Sbellard 1824ea2384d3Sbellard void bdrv_init(void) 1825ea2384d3Sbellard { 18265efa9d5aSAnthony Liguori module_call_init(MODULE_INIT_BLOCK); 1827ea2384d3Sbellard } 1828ce1a14dcSpbrook 1829eb852011SMarkus Armbruster void bdrv_init_with_whitelist(void) 1830eb852011SMarkus Armbruster { 1831eb852011SMarkus Armbruster use_bdrv_whitelist = 1; 1832eb852011SMarkus Armbruster bdrv_init(); 1833eb852011SMarkus Armbruster } 1834eb852011SMarkus Armbruster 1835c16b5a2cSChristoph Hellwig void *qemu_aio_get(AIOPool *pool, BlockDriverState *bs, 18366bbff9a0Saliguori BlockDriverCompletionFunc *cb, void *opaque) 18376bbff9a0Saliguori { 1838ce1a14dcSpbrook BlockDriverAIOCB *acb; 1839ce1a14dcSpbrook 18406bbff9a0Saliguori if (pool->free_aiocb) { 18416bbff9a0Saliguori acb = pool->free_aiocb; 18426bbff9a0Saliguori pool->free_aiocb = acb->next; 1843ce1a14dcSpbrook } else { 18446bbff9a0Saliguori acb = qemu_mallocz(pool->aiocb_size); 18456bbff9a0Saliguori acb->pool = pool; 1846ce1a14dcSpbrook } 1847ce1a14dcSpbrook acb->bs = bs; 1848ce1a14dcSpbrook acb->cb = cb; 1849ce1a14dcSpbrook acb->opaque = opaque; 1850ce1a14dcSpbrook return acb; 1851ce1a14dcSpbrook } 1852ce1a14dcSpbrook 1853ce1a14dcSpbrook void qemu_aio_release(void *p) 1854ce1a14dcSpbrook { 18556bbff9a0Saliguori BlockDriverAIOCB *acb = (BlockDriverAIOCB *)p; 18566bbff9a0Saliguori AIOPool *pool = acb->pool; 18576bbff9a0Saliguori acb->next = pool->free_aiocb; 18586bbff9a0Saliguori pool->free_aiocb = acb; 1859ce1a14dcSpbrook } 186019cb3738Sbellard 186119cb3738Sbellard /**************************************************************/ 186219cb3738Sbellard /* removable device support */ 186319cb3738Sbellard 186419cb3738Sbellard /** 186519cb3738Sbellard * Return TRUE if the media is present 186619cb3738Sbellard */ 186719cb3738Sbellard int bdrv_is_inserted(BlockDriverState *bs) 186819cb3738Sbellard { 186919cb3738Sbellard BlockDriver *drv = bs->drv; 187019cb3738Sbellard int ret; 187119cb3738Sbellard if (!drv) 187219cb3738Sbellard return 0; 187319cb3738Sbellard if (!drv->bdrv_is_inserted) 187419cb3738Sbellard return 1; 187519cb3738Sbellard ret = drv->bdrv_is_inserted(bs); 187619cb3738Sbellard return ret; 187719cb3738Sbellard } 187819cb3738Sbellard 187919cb3738Sbellard /** 188019cb3738Sbellard * Return TRUE if the media changed since the last call to this 188119cb3738Sbellard * function. It is currently only used for floppy disks 188219cb3738Sbellard */ 188319cb3738Sbellard int bdrv_media_changed(BlockDriverState *bs) 188419cb3738Sbellard { 188519cb3738Sbellard BlockDriver *drv = bs->drv; 188619cb3738Sbellard int ret; 188719cb3738Sbellard 188819cb3738Sbellard if (!drv || !drv->bdrv_media_changed) 188919cb3738Sbellard ret = -ENOTSUP; 189019cb3738Sbellard else 189119cb3738Sbellard ret = drv->bdrv_media_changed(bs); 189219cb3738Sbellard if (ret == -ENOTSUP) 189319cb3738Sbellard ret = bs->media_changed; 189419cb3738Sbellard bs->media_changed = 0; 189519cb3738Sbellard return ret; 189619cb3738Sbellard } 189719cb3738Sbellard 189819cb3738Sbellard /** 189919cb3738Sbellard * If eject_flag is TRUE, eject the media. Otherwise, close the tray 190019cb3738Sbellard */ 1901aea2a33cSMark McLoughlin int bdrv_eject(BlockDriverState *bs, int eject_flag) 190219cb3738Sbellard { 190319cb3738Sbellard BlockDriver *drv = bs->drv; 190419cb3738Sbellard int ret; 190519cb3738Sbellard 1906aea2a33cSMark McLoughlin if (bs->locked) { 1907aea2a33cSMark McLoughlin return -EBUSY; 1908aea2a33cSMark McLoughlin } 1909aea2a33cSMark McLoughlin 191019cb3738Sbellard if (!drv || !drv->bdrv_eject) { 191119cb3738Sbellard ret = -ENOTSUP; 191219cb3738Sbellard } else { 191319cb3738Sbellard ret = drv->bdrv_eject(bs, eject_flag); 191419cb3738Sbellard } 191519cb3738Sbellard if (ret == -ENOTSUP) { 191619cb3738Sbellard if (eject_flag) 191719cb3738Sbellard bdrv_close(bs); 1918aea2a33cSMark McLoughlin ret = 0; 191919cb3738Sbellard } 1920aea2a33cSMark McLoughlin 1921aea2a33cSMark McLoughlin return ret; 192219cb3738Sbellard } 192319cb3738Sbellard 192419cb3738Sbellard int bdrv_is_locked(BlockDriverState *bs) 192519cb3738Sbellard { 192619cb3738Sbellard return bs->locked; 192719cb3738Sbellard } 192819cb3738Sbellard 192919cb3738Sbellard /** 193019cb3738Sbellard * Lock or unlock the media (if it is locked, the user won't be able 193119cb3738Sbellard * to eject it manually). 193219cb3738Sbellard */ 193319cb3738Sbellard void bdrv_set_locked(BlockDriverState *bs, int locked) 193419cb3738Sbellard { 193519cb3738Sbellard BlockDriver *drv = bs->drv; 193619cb3738Sbellard 193719cb3738Sbellard bs->locked = locked; 193819cb3738Sbellard if (drv && drv->bdrv_set_locked) { 193919cb3738Sbellard drv->bdrv_set_locked(bs, locked); 194019cb3738Sbellard } 194119cb3738Sbellard } 1942985a03b0Sths 1943985a03b0Sths /* needed for generic scsi interface */ 1944985a03b0Sths 1945985a03b0Sths int bdrv_ioctl(BlockDriverState *bs, unsigned long int req, void *buf) 1946985a03b0Sths { 1947985a03b0Sths BlockDriver *drv = bs->drv; 1948985a03b0Sths 1949985a03b0Sths if (drv && drv->bdrv_ioctl) 1950985a03b0Sths return drv->bdrv_ioctl(bs, req, buf); 1951985a03b0Sths return -ENOTSUP; 1952985a03b0Sths } 19537d780669Saliguori 1954221f715dSaliguori BlockDriverAIOCB *bdrv_aio_ioctl(BlockDriverState *bs, 1955221f715dSaliguori unsigned long int req, void *buf, 19567d780669Saliguori BlockDriverCompletionFunc *cb, void *opaque) 19577d780669Saliguori { 1958221f715dSaliguori BlockDriver *drv = bs->drv; 19597d780669Saliguori 1960221f715dSaliguori if (drv && drv->bdrv_aio_ioctl) 1961221f715dSaliguori return drv->bdrv_aio_ioctl(bs, req, buf, cb, opaque); 1962221f715dSaliguori return NULL; 19637d780669Saliguori } 1964e268ca52Saliguori 19657cd1e32aSlirans@il.ibm.com 19667cd1e32aSlirans@il.ibm.com 1967e268ca52Saliguori void *qemu_blockalign(BlockDriverState *bs, size_t size) 1968e268ca52Saliguori { 1969e268ca52Saliguori return qemu_memalign((bs && bs->buffer_alignment) ? bs->buffer_alignment : 512, size); 1970e268ca52Saliguori } 19717cd1e32aSlirans@il.ibm.com 19727cd1e32aSlirans@il.ibm.com void bdrv_set_dirty_tracking(BlockDriverState *bs, int enable) 19737cd1e32aSlirans@il.ibm.com { 19747cd1e32aSlirans@il.ibm.com int64_t bitmap_size; 1975a55eb92cSJan Kiszka 19767cd1e32aSlirans@il.ibm.com if (enable) { 1977*c6d22830SJan Kiszka if (!bs->dirty_bitmap) { 1978*c6d22830SJan Kiszka bitmap_size = (bdrv_getlength(bs) >> BDRV_SECTOR_BITS) + 1979*c6d22830SJan Kiszka BDRV_SECTORS_PER_DIRTY_CHUNK * 8 - 1; 1980*c6d22830SJan Kiszka bitmap_size /= BDRV_SECTORS_PER_DIRTY_CHUNK * 8; 19817cd1e32aSlirans@il.ibm.com 19827cd1e32aSlirans@il.ibm.com bs->dirty_bitmap = qemu_mallocz(bitmap_size); 19837cd1e32aSlirans@il.ibm.com } 19847cd1e32aSlirans@il.ibm.com } else { 1985*c6d22830SJan Kiszka if (bs->dirty_bitmap) { 19867cd1e32aSlirans@il.ibm.com qemu_free(bs->dirty_bitmap); 1987*c6d22830SJan Kiszka bs->dirty_bitmap = NULL; 19887cd1e32aSlirans@il.ibm.com } 19897cd1e32aSlirans@il.ibm.com } 19907cd1e32aSlirans@il.ibm.com } 19917cd1e32aSlirans@il.ibm.com 19927cd1e32aSlirans@il.ibm.com int bdrv_get_dirty(BlockDriverState *bs, int64_t sector) 19937cd1e32aSlirans@il.ibm.com { 19946ea44308SJan Kiszka int64_t chunk = sector / (int64_t)BDRV_SECTORS_PER_DIRTY_CHUNK; 19957cd1e32aSlirans@il.ibm.com 1996*c6d22830SJan Kiszka if (bs->dirty_bitmap && 1997*c6d22830SJan Kiszka (sector << BDRV_SECTOR_BITS) < bdrv_getlength(bs)) { 1998*c6d22830SJan Kiszka return bs->dirty_bitmap[chunk / (sizeof(unsigned long) * 8)] & 1999*c6d22830SJan Kiszka (1 << (chunk % (sizeof(unsigned long) * 8))); 20007cd1e32aSlirans@il.ibm.com } else { 20017cd1e32aSlirans@il.ibm.com return 0; 20027cd1e32aSlirans@il.ibm.com } 20037cd1e32aSlirans@il.ibm.com } 20047cd1e32aSlirans@il.ibm.com 20057cd1e32aSlirans@il.ibm.com void bdrv_reset_dirty(BlockDriverState *bs, int64_t cur_sector, 20067cd1e32aSlirans@il.ibm.com int nr_sectors) 20077cd1e32aSlirans@il.ibm.com { 20087cd1e32aSlirans@il.ibm.com set_dirty_bitmap(bs, cur_sector, nr_sectors, 0); 20097cd1e32aSlirans@il.ibm.com } 2010