1019d6b8fSAnthony Liguori /* 2019d6b8fSAnthony Liguori * Block driver for the various disk image formats used by Bochs 3019d6b8fSAnthony Liguori * Currently only for "growing" type in read-only mode 4019d6b8fSAnthony Liguori * 5019d6b8fSAnthony Liguori * Copyright (c) 2005 Alex Beregszaszi 6019d6b8fSAnthony Liguori * 7019d6b8fSAnthony Liguori * Permission is hereby granted, free of charge, to any person obtaining a copy 8019d6b8fSAnthony Liguori * of this software and associated documentation files (the "Software"), to deal 9019d6b8fSAnthony Liguori * in the Software without restriction, including without limitation the rights 10019d6b8fSAnthony Liguori * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 11019d6b8fSAnthony Liguori * copies of the Software, and to permit persons to whom the Software is 12019d6b8fSAnthony Liguori * furnished to do so, subject to the following conditions: 13019d6b8fSAnthony Liguori * 14019d6b8fSAnthony Liguori * The above copyright notice and this permission notice shall be included in 15019d6b8fSAnthony Liguori * all copies or substantial portions of the Software. 16019d6b8fSAnthony Liguori * 17019d6b8fSAnthony Liguori * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 18019d6b8fSAnthony Liguori * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 19019d6b8fSAnthony Liguori * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 20019d6b8fSAnthony Liguori * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 21019d6b8fSAnthony Liguori * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 22019d6b8fSAnthony Liguori * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 23019d6b8fSAnthony Liguori * THE SOFTWARE. 24019d6b8fSAnthony Liguori */ 2580c71a24SPeter Maydell #include "qemu/osdep.h" 26da34e65cSMarkus Armbruster #include "qapi/error.h" 27737e150eSPaolo Bonzini #include "block/block_int.h" 281de7afc9SPaolo Bonzini #include "qemu/module.h" 2958369e22SPaolo Bonzini #include "qemu/bswap.h" 30398e6ad0SKevin Wolf #include "qemu/error-report.h" 31019d6b8fSAnthony Liguori 32019d6b8fSAnthony Liguori /**************************************************************/ 33019d6b8fSAnthony Liguori 34019d6b8fSAnthony Liguori #define HEADER_MAGIC "Bochs Virtual HD Image" 35019d6b8fSAnthony Liguori #define HEADER_VERSION 0x00020000 36019d6b8fSAnthony Liguori #define HEADER_V1 0x00010000 37019d6b8fSAnthony Liguori #define HEADER_SIZE 512 38019d6b8fSAnthony Liguori 39019d6b8fSAnthony Liguori #define REDOLOG_TYPE "Redolog" 40019d6b8fSAnthony Liguori #define GROWING_TYPE "Growing" 41019d6b8fSAnthony Liguori 42019d6b8fSAnthony Liguori // not allocated: 0xffffffff 43019d6b8fSAnthony Liguori 44019d6b8fSAnthony Liguori // always little-endian 45019d6b8fSAnthony Liguori struct bochs_header { 463dd8a676SKevin Wolf char magic[32]; /* "Bochs Virtual HD Image" */ 473dd8a676SKevin Wolf char type[16]; /* "Redolog" */ 483dd8a676SKevin Wolf char subtype[16]; /* "Undoable" / "Volatile" / "Growing" */ 49019d6b8fSAnthony Liguori uint32_t version; 503dd8a676SKevin Wolf uint32_t header; /* size of header */ 513dd8a676SKevin Wolf 523dd8a676SKevin Wolf uint32_t catalog; /* num of entries */ 533dd8a676SKevin Wolf uint32_t bitmap; /* bitmap size */ 543dd8a676SKevin Wolf uint32_t extent; /* extent size */ 55019d6b8fSAnthony Liguori 56019d6b8fSAnthony Liguori union { 57019d6b8fSAnthony Liguori struct { 583dd8a676SKevin Wolf uint32_t reserved; /* for ??? */ 593dd8a676SKevin Wolf uint64_t disk; /* disk size */ 603dd8a676SKevin Wolf char padding[HEADER_SIZE - 64 - 20 - 12]; 613dd8a676SKevin Wolf } QEMU_PACKED redolog; 623dd8a676SKevin Wolf struct { 633dd8a676SKevin Wolf uint64_t disk; /* disk size */ 643dd8a676SKevin Wolf char padding[HEADER_SIZE - 64 - 20 - 8]; 653dd8a676SKevin Wolf } QEMU_PACKED redolog_v1; 663dd8a676SKevin Wolf char padding[HEADER_SIZE - 64 - 20]; 67019d6b8fSAnthony Liguori } extra; 683dd8a676SKevin Wolf } QEMU_PACKED; 69019d6b8fSAnthony Liguori 70019d6b8fSAnthony Liguori typedef struct BDRVBochsState { 71848c66e8SPaolo Bonzini CoMutex lock; 72019d6b8fSAnthony Liguori uint32_t *catalog_bitmap; 73246f6583SKevin Wolf uint32_t catalog_size; 74019d6b8fSAnthony Liguori 75246f6583SKevin Wolf uint32_t data_offset; 76019d6b8fSAnthony Liguori 77246f6583SKevin Wolf uint32_t bitmap_blocks; 78246f6583SKevin Wolf uint32_t extent_blocks; 79246f6583SKevin Wolf uint32_t extent_size; 80019d6b8fSAnthony Liguori } BDRVBochsState; 81019d6b8fSAnthony Liguori 82019d6b8fSAnthony Liguori static int bochs_probe(const uint8_t *buf, int buf_size, const char *filename) 83019d6b8fSAnthony Liguori { 84019d6b8fSAnthony Liguori const struct bochs_header *bochs = (const void *)buf; 85019d6b8fSAnthony Liguori 86019d6b8fSAnthony Liguori if (buf_size < HEADER_SIZE) 87019d6b8fSAnthony Liguori return 0; 88019d6b8fSAnthony Liguori 89019d6b8fSAnthony Liguori if (!strcmp(bochs->magic, HEADER_MAGIC) && 90019d6b8fSAnthony Liguori !strcmp(bochs->type, REDOLOG_TYPE) && 91019d6b8fSAnthony Liguori !strcmp(bochs->subtype, GROWING_TYPE) && 92019d6b8fSAnthony Liguori ((le32_to_cpu(bochs->version) == HEADER_VERSION) || 93019d6b8fSAnthony Liguori (le32_to_cpu(bochs->version) == HEADER_V1))) 94019d6b8fSAnthony Liguori return 100; 95019d6b8fSAnthony Liguori 96019d6b8fSAnthony Liguori return 0; 97019d6b8fSAnthony Liguori } 98019d6b8fSAnthony Liguori 99015a1036SMax Reitz static int bochs_open(BlockDriverState *bs, QDict *options, int flags, 100015a1036SMax Reitz Error **errp) 101019d6b8fSAnthony Liguori { 102019d6b8fSAnthony Liguori BDRVBochsState *s = bs->opaque; 103246f6583SKevin Wolf uint32_t i; 104019d6b8fSAnthony Liguori struct bochs_header bochs; 1055b7d7dfdSKevin Wolf int ret; 106019d6b8fSAnthony Liguori 107eaa2410fSKevin Wolf /* No write support yet */ 108eaa2410fSKevin Wolf ret = bdrv_apply_auto_read_only(bs, NULL, errp); 109eaa2410fSKevin Wolf if (ret < 0) { 110eaa2410fSKevin Wolf return ret; 111eaa2410fSKevin Wolf } 112eaa2410fSKevin Wolf 1134e4bf5c4SKevin Wolf bs->file = bdrv_open_child(NULL, options, "file", bs, &child_file, 1144e4bf5c4SKevin Wolf false, errp); 1154e4bf5c4SKevin Wolf if (!bs->file) { 1164e4bf5c4SKevin Wolf return -EINVAL; 1174e4bf5c4SKevin Wolf } 1184e4bf5c4SKevin Wolf 119cf2ab8fcSKevin Wolf ret = bdrv_pread(bs->file, 0, &bochs, sizeof(bochs)); 1205b7d7dfdSKevin Wolf if (ret < 0) { 1215b7d7dfdSKevin Wolf return ret; 122019d6b8fSAnthony Liguori } 123019d6b8fSAnthony Liguori 124019d6b8fSAnthony Liguori if (strcmp(bochs.magic, HEADER_MAGIC) || 125019d6b8fSAnthony Liguori strcmp(bochs.type, REDOLOG_TYPE) || 126019d6b8fSAnthony Liguori strcmp(bochs.subtype, GROWING_TYPE) || 127019d6b8fSAnthony Liguori ((le32_to_cpu(bochs.version) != HEADER_VERSION) && 128019d6b8fSAnthony Liguori (le32_to_cpu(bochs.version) != HEADER_V1))) { 12976abe407SPaolo Bonzini error_setg(errp, "Image not in Bochs format"); 13076abe407SPaolo Bonzini return -EINVAL; 131019d6b8fSAnthony Liguori } 132019d6b8fSAnthony Liguori 133019d6b8fSAnthony Liguori if (le32_to_cpu(bochs.version) == HEADER_V1) { 1343dd8a676SKevin Wolf bs->total_sectors = le64_to_cpu(bochs.extra.redolog_v1.disk) / 512; 135019d6b8fSAnthony Liguori } else { 136019d6b8fSAnthony Liguori bs->total_sectors = le64_to_cpu(bochs.extra.redolog.disk) / 512; 137019d6b8fSAnthony Liguori } 138019d6b8fSAnthony Liguori 139e3737b82SKevin Wolf /* Limit to 1M entries to avoid unbounded allocation. This is what is 140e3737b82SKevin Wolf * needed for the largest image that bximage can create (~8 TB). */ 1413dd8a676SKevin Wolf s->catalog_size = le32_to_cpu(bochs.catalog); 142e3737b82SKevin Wolf if (s->catalog_size > 0x100000) { 143e3737b82SKevin Wolf error_setg(errp, "Catalog size is too large"); 144e3737b82SKevin Wolf return -EFBIG; 145e3737b82SKevin Wolf } 146e3737b82SKevin Wolf 14702c4f26bSMarkus Armbruster s->catalog_bitmap = g_try_new(uint32_t, s->catalog_size); 1487bf665eeSKevin Wolf if (s->catalog_size && s->catalog_bitmap == NULL) { 1497bf665eeSKevin Wolf error_setg(errp, "Could not allocate memory for catalog"); 1507bf665eeSKevin Wolf return -ENOMEM; 1517bf665eeSKevin Wolf } 1525b7d7dfdSKevin Wolf 153cf2ab8fcSKevin Wolf ret = bdrv_pread(bs->file, le32_to_cpu(bochs.header), s->catalog_bitmap, 1545b7d7dfdSKevin Wolf s->catalog_size * 4); 1555b7d7dfdSKevin Wolf if (ret < 0) { 156019d6b8fSAnthony Liguori goto fail; 1575b7d7dfdSKevin Wolf } 1585b7d7dfdSKevin Wolf 159019d6b8fSAnthony Liguori for (i = 0; i < s->catalog_size; i++) 160019d6b8fSAnthony Liguori le32_to_cpus(&s->catalog_bitmap[i]); 161019d6b8fSAnthony Liguori 162019d6b8fSAnthony Liguori s->data_offset = le32_to_cpu(bochs.header) + (s->catalog_size * 4); 163019d6b8fSAnthony Liguori 1643dd8a676SKevin Wolf s->bitmap_blocks = 1 + (le32_to_cpu(bochs.bitmap) - 1) / 512; 1653dd8a676SKevin Wolf s->extent_blocks = 1 + (le32_to_cpu(bochs.extent) - 1) / 512; 166019d6b8fSAnthony Liguori 1673dd8a676SKevin Wolf s->extent_size = le32_to_cpu(bochs.extent); 168715c3f60SKevin Wolf if (s->extent_size < BDRV_SECTOR_SIZE) { 169715c3f60SKevin Wolf /* bximage actually never creates extents smaller than 4k */ 170715c3f60SKevin Wolf error_setg(errp, "Extent size must be at least 512"); 171715c3f60SKevin Wolf ret = -EINVAL; 172715c3f60SKevin Wolf goto fail; 173715c3f60SKevin Wolf } else if (!is_power_of_2(s->extent_size)) { 174715c3f60SKevin Wolf error_setg(errp, "Extent size %" PRIu32 " is not a power of two", 175715c3f60SKevin Wolf s->extent_size); 17628ec11bcSKevin Wolf ret = -EINVAL; 17728ec11bcSKevin Wolf goto fail; 1788e53abbcSKevin Wolf } else if (s->extent_size > 0x800000) { 1798e53abbcSKevin Wolf error_setg(errp, "Extent size %" PRIu32 " is too large", 1808e53abbcSKevin Wolf s->extent_size); 18128ec11bcSKevin Wolf ret = -EINVAL; 18228ec11bcSKevin Wolf goto fail; 1838e53abbcSKevin Wolf } 184019d6b8fSAnthony Liguori 185715c3f60SKevin Wolf if (s->catalog_size < DIV_ROUND_UP(bs->total_sectors, 186715c3f60SKevin Wolf s->extent_size / BDRV_SECTOR_SIZE)) 187715c3f60SKevin Wolf { 188e3737b82SKevin Wolf error_setg(errp, "Catalog size is too small for this disk size"); 189e3737b82SKevin Wolf ret = -EINVAL; 190e3737b82SKevin Wolf goto fail; 191e3737b82SKevin Wolf } 192e3737b82SKevin Wolf 193848c66e8SPaolo Bonzini qemu_co_mutex_init(&s->lock); 194019d6b8fSAnthony Liguori return 0; 1955b7d7dfdSKevin Wolf 196019d6b8fSAnthony Liguori fail: 1975b7d7dfdSKevin Wolf g_free(s->catalog_bitmap); 1985b7d7dfdSKevin Wolf return ret; 199019d6b8fSAnthony Liguori } 200019d6b8fSAnthony Liguori 201a6506481SEric Blake static void bochs_refresh_limits(BlockDriverState *bs, Error **errp) 202a6506481SEric Blake { 203a5b8dd2cSEric Blake bs->bl.request_alignment = BDRV_SECTOR_SIZE; /* No sub-sector I/O */ 204a6506481SEric Blake } 205a6506481SEric Blake 206efbca10fSChristoph Hellwig static int64_t seek_to_sector(BlockDriverState *bs, int64_t sector_num) 207019d6b8fSAnthony Liguori { 208019d6b8fSAnthony Liguori BDRVBochsState *s = bs->opaque; 209246f6583SKevin Wolf uint64_t offset = sector_num * 512; 210246f6583SKevin Wolf uint64_t extent_index, extent_offset, bitmap_offset; 211019d6b8fSAnthony Liguori char bitmap_entry; 212e1b42f45SMax Reitz int ret; 213019d6b8fSAnthony Liguori 214019d6b8fSAnthony Liguori // seek to sector 215019d6b8fSAnthony Liguori extent_index = offset / s->extent_size; 216019d6b8fSAnthony Liguori extent_offset = (offset % s->extent_size) / 512; 217019d6b8fSAnthony Liguori 218efbca10fSChristoph Hellwig if (s->catalog_bitmap[extent_index] == 0xffffffff) { 219e1b42f45SMax Reitz return 0; /* not allocated */ 220019d6b8fSAnthony Liguori } 221019d6b8fSAnthony Liguori 222a9ba36a4SKevin Wolf bitmap_offset = s->data_offset + 223a9ba36a4SKevin Wolf (512 * (uint64_t) s->catalog_bitmap[extent_index] * 224019d6b8fSAnthony Liguori (s->extent_blocks + s->bitmap_blocks)); 225019d6b8fSAnthony Liguori 226efbca10fSChristoph Hellwig /* read in bitmap for current extent */ 227cf2ab8fcSKevin Wolf ret = bdrv_pread(bs->file, bitmap_offset + (extent_offset / 8), 228e1b42f45SMax Reitz &bitmap_entry, 1); 229e1b42f45SMax Reitz if (ret < 0) { 230e1b42f45SMax Reitz return ret; 231ecbe1576SBlue Swirl } 232019d6b8fSAnthony Liguori 233efbca10fSChristoph Hellwig if (!((bitmap_entry >> (extent_offset % 8)) & 1)) { 234e1b42f45SMax Reitz return 0; /* not allocated */ 235019d6b8fSAnthony Liguori } 236019d6b8fSAnthony Liguori 237efbca10fSChristoph Hellwig return bitmap_offset + (512 * (s->bitmap_blocks + extent_offset)); 238019d6b8fSAnthony Liguori } 239019d6b8fSAnthony Liguori 2403b8fd330SKevin Wolf static int coroutine_fn 2413b8fd330SKevin Wolf bochs_co_preadv(BlockDriverState *bs, uint64_t offset, uint64_t bytes, 2423b8fd330SKevin Wolf QEMUIOVector *qiov, int flags) 243019d6b8fSAnthony Liguori { 2443b8fd330SKevin Wolf BDRVBochsState *s = bs->opaque; 2453b8fd330SKevin Wolf uint64_t sector_num = offset >> BDRV_SECTOR_BITS; 2463b8fd330SKevin Wolf int nb_sectors = bytes >> BDRV_SECTOR_BITS; 2473b8fd330SKevin Wolf uint64_t bytes_done = 0; 2483b8fd330SKevin Wolf QEMUIOVector local_qiov; 249019d6b8fSAnthony Liguori int ret; 250019d6b8fSAnthony Liguori 251*1bbbf32dSNir Soffer assert(QEMU_IS_ALIGNED(offset, BDRV_SECTOR_SIZE)); 252*1bbbf32dSNir Soffer assert(QEMU_IS_ALIGNED(bytes, BDRV_SECTOR_SIZE)); 2533b8fd330SKevin Wolf 2543b8fd330SKevin Wolf qemu_iovec_init(&local_qiov, qiov->niov); 2553b8fd330SKevin Wolf qemu_co_mutex_lock(&s->lock); 2563b8fd330SKevin Wolf 257019d6b8fSAnthony Liguori while (nb_sectors > 0) { 258efbca10fSChristoph Hellwig int64_t block_offset = seek_to_sector(bs, sector_num); 259e1b42f45SMax Reitz if (block_offset < 0) { 2603b8fd330SKevin Wolf ret = block_offset; 2613b8fd330SKevin Wolf goto fail; 2623b8fd330SKevin Wolf } 2633b8fd330SKevin Wolf 2643b8fd330SKevin Wolf qemu_iovec_reset(&local_qiov); 2653b8fd330SKevin Wolf qemu_iovec_concat(&local_qiov, qiov, bytes_done, 512); 2663b8fd330SKevin Wolf 2673b8fd330SKevin Wolf if (block_offset > 0) { 268a03ef88fSKevin Wolf ret = bdrv_co_preadv(bs->file, block_offset, 512, 2693b8fd330SKevin Wolf &local_qiov, 0); 270e1b42f45SMax Reitz if (ret < 0) { 2713b8fd330SKevin Wolf goto fail; 272019d6b8fSAnthony Liguori } 273e1b42f45SMax Reitz } else { 2743b8fd330SKevin Wolf qemu_iovec_memset(&local_qiov, 0, 0, 512); 275e1b42f45SMax Reitz } 276019d6b8fSAnthony Liguori nb_sectors--; 277019d6b8fSAnthony Liguori sector_num++; 2783b8fd330SKevin Wolf bytes_done += 512; 279019d6b8fSAnthony Liguori } 280019d6b8fSAnthony Liguori 2813b8fd330SKevin Wolf ret = 0; 2823b8fd330SKevin Wolf fail: 2832914caa0SPaolo Bonzini qemu_co_mutex_unlock(&s->lock); 2843b8fd330SKevin Wolf qemu_iovec_destroy(&local_qiov); 2853b8fd330SKevin Wolf 2862914caa0SPaolo Bonzini return ret; 2872914caa0SPaolo Bonzini } 2882914caa0SPaolo Bonzini 289019d6b8fSAnthony Liguori static void bochs_close(BlockDriverState *bs) 290019d6b8fSAnthony Liguori { 291019d6b8fSAnthony Liguori BDRVBochsState *s = bs->opaque; 2927267c094SAnthony Liguori g_free(s->catalog_bitmap); 293019d6b8fSAnthony Liguori } 294019d6b8fSAnthony Liguori 295019d6b8fSAnthony Liguori static BlockDriver bdrv_bochs = { 296019d6b8fSAnthony Liguori .format_name = "bochs", 297019d6b8fSAnthony Liguori .instance_size = sizeof(BDRVBochsState), 298019d6b8fSAnthony Liguori .bdrv_probe = bochs_probe, 2997a6f3913SChristoph Hellwig .bdrv_open = bochs_open, 300862f215fSKevin Wolf .bdrv_child_perm = bdrv_format_default_perms, 301a6506481SEric Blake .bdrv_refresh_limits = bochs_refresh_limits, 3023b8fd330SKevin Wolf .bdrv_co_preadv = bochs_co_preadv, 303019d6b8fSAnthony Liguori .bdrv_close = bochs_close, 304019d6b8fSAnthony Liguori }; 305019d6b8fSAnthony Liguori 306019d6b8fSAnthony Liguori static void bdrv_bochs_init(void) 307019d6b8fSAnthony Liguori { 308019d6b8fSAnthony Liguori bdrv_register(&bdrv_bochs); 309019d6b8fSAnthony Liguori } 310019d6b8fSAnthony Liguori 311019d6b8fSAnthony Liguori block_init(bdrv_bochs_init); 312