/*
 * Block driver for the various disk image formats used by Bochs
 * Currently only for "growing" type in read-only mode
 *
 * Copyright (c) 2005 Alex Beregszaszi
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#include "qemu/osdep.h"
#include "qapi/error.h"
#include "block/block-io.h"
#include "block/block_int.h"
#include "qemu/module.h"
#include "qemu/bswap.h"
#include "qemu/error-report.h"

/**************************************************************/

/* Values the image header must carry for this driver to accept it. */
#define HEADER_MAGIC "Bochs Virtual HD Image"
/* The two header versions that probe and open accept. */
#define HEADER_VERSION 0x00020000
#define HEADER_V1 0x00010000
/* Size in bytes of the on-disk header structure. */
#define HEADER_SIZE 512

/* Expected contents of the header's type and subtype strings. */
#define REDOLOG_TYPE "Redolog"
#define GROWING_TYPE "Growing"

/* A catalog entry of 0xffffffff marks an extent that is not allocated. */

45019d6b8fSAnthony Liguori // always little-endian
46019d6b8fSAnthony Liguori struct bochs_header {
473dd8a676SKevin Wolf char magic[32]; /* "Bochs Virtual HD Image" */
483dd8a676SKevin Wolf char type[16]; /* "Redolog" */
493dd8a676SKevin Wolf char subtype[16]; /* "Undoable" / "Volatile" / "Growing" */
50019d6b8fSAnthony Liguori uint32_t version;
513dd8a676SKevin Wolf uint32_t header; /* size of header */
523dd8a676SKevin Wolf
533dd8a676SKevin Wolf uint32_t catalog; /* num of entries */
543dd8a676SKevin Wolf uint32_t bitmap; /* bitmap size */
553dd8a676SKevin Wolf uint32_t extent; /* extent size */
56019d6b8fSAnthony Liguori
57019d6b8fSAnthony Liguori union {
58019d6b8fSAnthony Liguori struct {
593dd8a676SKevin Wolf uint32_t reserved; /* for ??? */
603dd8a676SKevin Wolf uint64_t disk; /* disk size */
613dd8a676SKevin Wolf char padding[HEADER_SIZE - 64 - 20 - 12];
623dd8a676SKevin Wolf } QEMU_PACKED redolog;
633dd8a676SKevin Wolf struct {
643dd8a676SKevin Wolf uint64_t disk; /* disk size */
653dd8a676SKevin Wolf char padding[HEADER_SIZE - 64 - 20 - 8];
663dd8a676SKevin Wolf } QEMU_PACKED redolog_v1;
673dd8a676SKevin Wolf char padding[HEADER_SIZE - 64 - 20];
68019d6b8fSAnthony Liguori } extra;
693dd8a676SKevin Wolf } QEMU_PACKED;
70019d6b8fSAnthony Liguori
71019d6b8fSAnthony Liguori typedef struct BDRVBochsState {
72848c66e8SPaolo Bonzini CoMutex lock;
73019d6b8fSAnthony Liguori uint32_t *catalog_bitmap;
74246f6583SKevin Wolf uint32_t catalog_size;
75019d6b8fSAnthony Liguori
76246f6583SKevin Wolf uint32_t data_offset;
77019d6b8fSAnthony Liguori
78246f6583SKevin Wolf uint32_t bitmap_blocks;
79246f6583SKevin Wolf uint32_t extent_blocks;
80246f6583SKevin Wolf uint32_t extent_size;
81019d6b8fSAnthony Liguori } BDRVBochsState;
82019d6b8fSAnthony Liguori
bochs_probe(const uint8_t * buf,int buf_size,const char * filename)83019d6b8fSAnthony Liguori static int bochs_probe(const uint8_t *buf, int buf_size, const char *filename)
84019d6b8fSAnthony Liguori {
85019d6b8fSAnthony Liguori const struct bochs_header *bochs = (const void *)buf;
86019d6b8fSAnthony Liguori
87019d6b8fSAnthony Liguori if (buf_size < HEADER_SIZE)
88019d6b8fSAnthony Liguori return 0;
89019d6b8fSAnthony Liguori
90019d6b8fSAnthony Liguori if (!strcmp(bochs->magic, HEADER_MAGIC) &&
91019d6b8fSAnthony Liguori !strcmp(bochs->type, REDOLOG_TYPE) &&
92019d6b8fSAnthony Liguori !strcmp(bochs->subtype, GROWING_TYPE) &&
93019d6b8fSAnthony Liguori ((le32_to_cpu(bochs->version) == HEADER_VERSION) ||
94019d6b8fSAnthony Liguori (le32_to_cpu(bochs->version) == HEADER_V1)))
95019d6b8fSAnthony Liguori return 100;
96019d6b8fSAnthony Liguori
97019d6b8fSAnthony Liguori return 0;
98019d6b8fSAnthony Liguori }
99019d6b8fSAnthony Liguori
bochs_open(BlockDriverState * bs,QDict * options,int flags,Error ** errp)100015a1036SMax Reitz static int bochs_open(BlockDriverState *bs, QDict *options, int flags,
101015a1036SMax Reitz Error **errp)
102019d6b8fSAnthony Liguori {
103019d6b8fSAnthony Liguori BDRVBochsState *s = bs->opaque;
104246f6583SKevin Wolf uint32_t i;
105019d6b8fSAnthony Liguori struct bochs_header bochs;
1065b7d7dfdSKevin Wolf int ret;
107019d6b8fSAnthony Liguori
108*a4b740dbSKevin Wolf GLOBAL_STATE_CODE();
109*a4b740dbSKevin Wolf
110eaa2410fSKevin Wolf /* No write support yet */
111018f9deaSKevin Wolf bdrv_graph_rdlock_main_loop();
112eaa2410fSKevin Wolf ret = bdrv_apply_auto_read_only(bs, NULL, errp);
113018f9deaSKevin Wolf bdrv_graph_rdunlock_main_loop();
114eaa2410fSKevin Wolf if (ret < 0) {
115eaa2410fSKevin Wolf return ret;
116eaa2410fSKevin Wolf }
117eaa2410fSKevin Wolf
11883930780SVladimir Sementsov-Ogievskiy ret = bdrv_open_file_child(NULL, options, "file", bs, errp);
11983930780SVladimir Sementsov-Ogievskiy if (ret < 0) {
12083930780SVladimir Sementsov-Ogievskiy return ret;
1214e4bf5c4SKevin Wolf }
1224e4bf5c4SKevin Wolf
123*a4b740dbSKevin Wolf GRAPH_RDLOCK_GUARD_MAINLOOP();
124*a4b740dbSKevin Wolf
12532cc71deSAlberto Faria ret = bdrv_pread(bs->file, 0, sizeof(bochs), &bochs, 0);
1265b7d7dfdSKevin Wolf if (ret < 0) {
1275b7d7dfdSKevin Wolf return ret;
128019d6b8fSAnthony Liguori }
129019d6b8fSAnthony Liguori
130019d6b8fSAnthony Liguori if (strcmp(bochs.magic, HEADER_MAGIC) ||
131019d6b8fSAnthony Liguori strcmp(bochs.type, REDOLOG_TYPE) ||
132019d6b8fSAnthony Liguori strcmp(bochs.subtype, GROWING_TYPE) ||
133019d6b8fSAnthony Liguori ((le32_to_cpu(bochs.version) != HEADER_VERSION) &&
134019d6b8fSAnthony Liguori (le32_to_cpu(bochs.version) != HEADER_V1))) {
13576abe407SPaolo Bonzini error_setg(errp, "Image not in Bochs format");
13676abe407SPaolo Bonzini return -EINVAL;
137019d6b8fSAnthony Liguori }
138019d6b8fSAnthony Liguori
139019d6b8fSAnthony Liguori if (le32_to_cpu(bochs.version) == HEADER_V1) {
1403dd8a676SKevin Wolf bs->total_sectors = le64_to_cpu(bochs.extra.redolog_v1.disk) / 512;
141019d6b8fSAnthony Liguori } else {
142019d6b8fSAnthony Liguori bs->total_sectors = le64_to_cpu(bochs.extra.redolog.disk) / 512;
143019d6b8fSAnthony Liguori }
144019d6b8fSAnthony Liguori
145e3737b82SKevin Wolf /* Limit to 1M entries to avoid unbounded allocation. This is what is
146e3737b82SKevin Wolf * needed for the largest image that bximage can create (~8 TB). */
1473dd8a676SKevin Wolf s->catalog_size = le32_to_cpu(bochs.catalog);
148e3737b82SKevin Wolf if (s->catalog_size > 0x100000) {
149e3737b82SKevin Wolf error_setg(errp, "Catalog size is too large");
150e3737b82SKevin Wolf return -EFBIG;
151e3737b82SKevin Wolf }
152e3737b82SKevin Wolf
15302c4f26bSMarkus Armbruster s->catalog_bitmap = g_try_new(uint32_t, s->catalog_size);
1547bf665eeSKevin Wolf if (s->catalog_size && s->catalog_bitmap == NULL) {
1557bf665eeSKevin Wolf error_setg(errp, "Could not allocate memory for catalog");
1567bf665eeSKevin Wolf return -ENOMEM;
1577bf665eeSKevin Wolf }
1585b7d7dfdSKevin Wolf
15932cc71deSAlberto Faria ret = bdrv_pread(bs->file, le32_to_cpu(bochs.header), s->catalog_size * 4,
16032cc71deSAlberto Faria s->catalog_bitmap, 0);
1615b7d7dfdSKevin Wolf if (ret < 0) {
162019d6b8fSAnthony Liguori goto fail;
1635b7d7dfdSKevin Wolf }
1645b7d7dfdSKevin Wolf
165019d6b8fSAnthony Liguori for (i = 0; i < s->catalog_size; i++)
166019d6b8fSAnthony Liguori le32_to_cpus(&s->catalog_bitmap[i]);
167019d6b8fSAnthony Liguori
168019d6b8fSAnthony Liguori s->data_offset = le32_to_cpu(bochs.header) + (s->catalog_size * 4);
169019d6b8fSAnthony Liguori
1703dd8a676SKevin Wolf s->bitmap_blocks = 1 + (le32_to_cpu(bochs.bitmap) - 1) / 512;
1713dd8a676SKevin Wolf s->extent_blocks = 1 + (le32_to_cpu(bochs.extent) - 1) / 512;
172019d6b8fSAnthony Liguori
1733dd8a676SKevin Wolf s->extent_size = le32_to_cpu(bochs.extent);
174715c3f60SKevin Wolf if (s->extent_size < BDRV_SECTOR_SIZE) {
175715c3f60SKevin Wolf /* bximage actually never creates extents smaller than 4k */
176715c3f60SKevin Wolf error_setg(errp, "Extent size must be at least 512");
177715c3f60SKevin Wolf ret = -EINVAL;
178715c3f60SKevin Wolf goto fail;
179715c3f60SKevin Wolf } else if (!is_power_of_2(s->extent_size)) {
180715c3f60SKevin Wolf error_setg(errp, "Extent size %" PRIu32 " is not a power of two",
181715c3f60SKevin Wolf s->extent_size);
18228ec11bcSKevin Wolf ret = -EINVAL;
18328ec11bcSKevin Wolf goto fail;
1848e53abbcSKevin Wolf } else if (s->extent_size > 0x800000) {
1858e53abbcSKevin Wolf error_setg(errp, "Extent size %" PRIu32 " is too large",
1868e53abbcSKevin Wolf s->extent_size);
18728ec11bcSKevin Wolf ret = -EINVAL;
18828ec11bcSKevin Wolf goto fail;
1898e53abbcSKevin Wolf }
190019d6b8fSAnthony Liguori
191715c3f60SKevin Wolf if (s->catalog_size < DIV_ROUND_UP(bs->total_sectors,
192715c3f60SKevin Wolf s->extent_size / BDRV_SECTOR_SIZE))
193715c3f60SKevin Wolf {
194e3737b82SKevin Wolf error_setg(errp, "Catalog size is too small for this disk size");
195e3737b82SKevin Wolf ret = -EINVAL;
196e3737b82SKevin Wolf goto fail;
197e3737b82SKevin Wolf }
198e3737b82SKevin Wolf
199848c66e8SPaolo Bonzini qemu_co_mutex_init(&s->lock);
200019d6b8fSAnthony Liguori return 0;
2015b7d7dfdSKevin Wolf
202019d6b8fSAnthony Liguori fail:
2035b7d7dfdSKevin Wolf g_free(s->catalog_bitmap);
2045b7d7dfdSKevin Wolf return ret;
205019d6b8fSAnthony Liguori }
206019d6b8fSAnthony Liguori
bochs_refresh_limits(BlockDriverState * bs,Error ** errp)207a6506481SEric Blake static void bochs_refresh_limits(BlockDriverState *bs, Error **errp)
208a6506481SEric Blake {
209a5b8dd2cSEric Blake bs->bl.request_alignment = BDRV_SECTOR_SIZE; /* No sub-sector I/O */
210a6506481SEric Blake }
211a6506481SEric Blake
212e7918e96SPaolo Bonzini static int64_t coroutine_fn GRAPH_RDLOCK
seek_to_sector(BlockDriverState * bs,int64_t sector_num)213e7918e96SPaolo Bonzini seek_to_sector(BlockDriverState *bs, int64_t sector_num)
214019d6b8fSAnthony Liguori {
215019d6b8fSAnthony Liguori BDRVBochsState *s = bs->opaque;
216246f6583SKevin Wolf uint64_t offset = sector_num * 512;
217246f6583SKevin Wolf uint64_t extent_index, extent_offset, bitmap_offset;
218019d6b8fSAnthony Liguori char bitmap_entry;
219e1b42f45SMax Reitz int ret;
220019d6b8fSAnthony Liguori
221019d6b8fSAnthony Liguori // seek to sector
222019d6b8fSAnthony Liguori extent_index = offset / s->extent_size;
223019d6b8fSAnthony Liguori extent_offset = (offset % s->extent_size) / 512;
224019d6b8fSAnthony Liguori
225efbca10fSChristoph Hellwig if (s->catalog_bitmap[extent_index] == 0xffffffff) {
226e1b42f45SMax Reitz return 0; /* not allocated */
227019d6b8fSAnthony Liguori }
228019d6b8fSAnthony Liguori
229a9ba36a4SKevin Wolf bitmap_offset = s->data_offset +
230a9ba36a4SKevin Wolf (512 * (uint64_t) s->catalog_bitmap[extent_index] *
231019d6b8fSAnthony Liguori (s->extent_blocks + s->bitmap_blocks));
232019d6b8fSAnthony Liguori
233efbca10fSChristoph Hellwig /* read in bitmap for current extent */
234e7918e96SPaolo Bonzini ret = bdrv_co_pread(bs->file, bitmap_offset + (extent_offset / 8), 1,
23532cc71deSAlberto Faria &bitmap_entry, 0);
236e1b42f45SMax Reitz if (ret < 0) {
237e1b42f45SMax Reitz return ret;
238ecbe1576SBlue Swirl }
239019d6b8fSAnthony Liguori
240efbca10fSChristoph Hellwig if (!((bitmap_entry >> (extent_offset % 8)) & 1)) {
241e1b42f45SMax Reitz return 0; /* not allocated */
242019d6b8fSAnthony Liguori }
243019d6b8fSAnthony Liguori
244efbca10fSChristoph Hellwig return bitmap_offset + (512 * (s->bitmap_blocks + extent_offset));
245019d6b8fSAnthony Liguori }
246019d6b8fSAnthony Liguori
247b9b10c35SKevin Wolf static int coroutine_fn GRAPH_RDLOCK
bochs_co_preadv(BlockDriverState * bs,int64_t offset,int64_t bytes,QEMUIOVector * qiov,BdrvRequestFlags flags)248f7ef38ddSVladimir Sementsov-Ogievskiy bochs_co_preadv(BlockDriverState *bs, int64_t offset, int64_t bytes,
249f7ef38ddSVladimir Sementsov-Ogievskiy QEMUIOVector *qiov, BdrvRequestFlags flags)
250019d6b8fSAnthony Liguori {
2513b8fd330SKevin Wolf BDRVBochsState *s = bs->opaque;
2523b8fd330SKevin Wolf uint64_t sector_num = offset >> BDRV_SECTOR_BITS;
2533b8fd330SKevin Wolf int nb_sectors = bytes >> BDRV_SECTOR_BITS;
2543b8fd330SKevin Wolf uint64_t bytes_done = 0;
2553b8fd330SKevin Wolf QEMUIOVector local_qiov;
256019d6b8fSAnthony Liguori int ret;
257019d6b8fSAnthony Liguori
2581bbbf32dSNir Soffer assert(QEMU_IS_ALIGNED(offset, BDRV_SECTOR_SIZE));
2591bbbf32dSNir Soffer assert(QEMU_IS_ALIGNED(bytes, BDRV_SECTOR_SIZE));
2603b8fd330SKevin Wolf
2613b8fd330SKevin Wolf qemu_iovec_init(&local_qiov, qiov->niov);
2623b8fd330SKevin Wolf qemu_co_mutex_lock(&s->lock);
2633b8fd330SKevin Wolf
264019d6b8fSAnthony Liguori while (nb_sectors > 0) {
265efbca10fSChristoph Hellwig int64_t block_offset = seek_to_sector(bs, sector_num);
266e1b42f45SMax Reitz if (block_offset < 0) {
2673b8fd330SKevin Wolf ret = block_offset;
2683b8fd330SKevin Wolf goto fail;
2693b8fd330SKevin Wolf }
2703b8fd330SKevin Wolf
2713b8fd330SKevin Wolf qemu_iovec_reset(&local_qiov);
2723b8fd330SKevin Wolf qemu_iovec_concat(&local_qiov, qiov, bytes_done, 512);
2733b8fd330SKevin Wolf
2743b8fd330SKevin Wolf if (block_offset > 0) {
275a03ef88fSKevin Wolf ret = bdrv_co_preadv(bs->file, block_offset, 512,
2763b8fd330SKevin Wolf &local_qiov, 0);
277e1b42f45SMax Reitz if (ret < 0) {
2783b8fd330SKevin Wolf goto fail;
279019d6b8fSAnthony Liguori }
280e1b42f45SMax Reitz } else {
2813b8fd330SKevin Wolf qemu_iovec_memset(&local_qiov, 0, 0, 512);
282e1b42f45SMax Reitz }
283019d6b8fSAnthony Liguori nb_sectors--;
284019d6b8fSAnthony Liguori sector_num++;
2853b8fd330SKevin Wolf bytes_done += 512;
286019d6b8fSAnthony Liguori }
287019d6b8fSAnthony Liguori
2883b8fd330SKevin Wolf ret = 0;
2893b8fd330SKevin Wolf fail:
2902914caa0SPaolo Bonzini qemu_co_mutex_unlock(&s->lock);
2913b8fd330SKevin Wolf qemu_iovec_destroy(&local_qiov);
2923b8fd330SKevin Wolf
2932914caa0SPaolo Bonzini return ret;
2942914caa0SPaolo Bonzini }
2952914caa0SPaolo Bonzini
/* Release the catalog buffer allocated by bochs_open(). */
static void bochs_close(BlockDriverState *bs)
{
    BDRVBochsState *s = bs->opaque;
    g_free(s->catalog_bitmap);
}

302019d6b8fSAnthony Liguori static BlockDriver bdrv_bochs = {
303019d6b8fSAnthony Liguori .format_name = "bochs",
304019d6b8fSAnthony Liguori .instance_size = sizeof(BDRVBochsState),
305019d6b8fSAnthony Liguori .bdrv_probe = bochs_probe,
3067a6f3913SChristoph Hellwig .bdrv_open = bochs_open,
30769dca43dSMax Reitz .bdrv_child_perm = bdrv_default_perms,
308a6506481SEric Blake .bdrv_refresh_limits = bochs_refresh_limits,
3093b8fd330SKevin Wolf .bdrv_co_preadv = bochs_co_preadv,
310019d6b8fSAnthony Liguori .bdrv_close = bochs_close,
311d67066d8SMax Reitz .is_format = true,
312019d6b8fSAnthony Liguori };
313019d6b8fSAnthony Liguori
bdrv_bochs_init(void)314019d6b8fSAnthony Liguori static void bdrv_bochs_init(void)
315019d6b8fSAnthony Liguori {
316019d6b8fSAnthony Liguori bdrv_register(&bdrv_bochs);
317019d6b8fSAnthony Liguori }
318019d6b8fSAnthony Liguori
319019d6b8fSAnthony Liguori block_init(bdrv_bochs_init);
320