1 /* 2 * QEMU host block devices 3 * 4 * Copyright (c) 2003-2008 Fabrice Bellard 5 * 6 * This work is licensed under the terms of the GNU GPL, version 2 or 7 * later. See the COPYING file in the top-level directory. 8 * 9 * This file incorporates work covered by the following copyright and 10 * permission notice: 11 * 12 * Copyright (c) 2003-2008 Fabrice Bellard 13 * 14 * Permission is hereby granted, free of charge, to any person obtaining a copy 15 * of this software and associated documentation files (the "Software"), to deal 16 * in the Software without restriction, including without limitation the rights 17 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 18 * copies of the Software, and to permit persons to whom the Software is 19 * furnished to do so, subject to the following conditions: 20 * 21 * The above copyright notice and this permission notice shall be included in 22 * all copies or substantial portions of the Software. 23 * 24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 25 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 26 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 27 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 28 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 29 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 30 * THE SOFTWARE. 31 */ 32 33 #include "qemu/osdep.h" 34 #include "sysemu/block-backend.h" 35 #include "sysemu/blockdev.h" 36 #include "hw/block/block.h" 37 #include "block/blockjob.h" 38 #include "block/qdict.h" 39 #include "block/throttle-groups.h" 40 #include "monitor/monitor.h" 41 #include "qemu/error-report.h" 42 #include "qemu/option.h" 43 #include "qemu/qemu-print.h" 44 #include "qemu/config-file.h" 45 #include "qapi/qapi-commands-block.h" 46 #include "qapi/qapi-commands-transaction.h" 47 #include "qapi/qapi-visit-block-core.h" 48 #include "qapi/qmp/qdict.h" 49 #include "qapi/qmp/qnum.h" 50 #include "qapi/qmp/qstring.h" 51 #include "qapi/error.h" 52 #include "qapi/qmp/qerror.h" 53 #include "qapi/qmp/qlist.h" 54 #include "qapi/qobject-output-visitor.h" 55 #include "sysemu/sysemu.h" 56 #include "sysemu/iothread.h" 57 #include "block/block_int.h" 58 #include "block/trace.h" 59 #include "sysemu/arch_init.h" 60 #include "sysemu/runstate.h" 61 #include "sysemu/replay.h" 62 #include "qemu/cutils.h" 63 #include "qemu/help_option.h" 64 #include "qemu/main-loop.h" 65 #include "qemu/throttle-options.h" 66 67 QTAILQ_HEAD(, BlockDriverState) monitor_bdrv_states = 68 QTAILQ_HEAD_INITIALIZER(monitor_bdrv_states); 69 70 void bdrv_set_monitor_owned(BlockDriverState *bs) 71 { 72 QTAILQ_INSERT_TAIL(&monitor_bdrv_states, bs, monitor_list); 73 } 74 75 static const char *const if_name[IF_COUNT] = { 76 [IF_NONE] = "none", 77 [IF_IDE] = "ide", 78 [IF_SCSI] = "scsi", 79 [IF_FLOPPY] = "floppy", 80 [IF_PFLASH] = "pflash", 81 [IF_MTD] = "mtd", 82 [IF_SD] = "sd", 83 [IF_VIRTIO] = "virtio", 84 [IF_XEN] = "xen", 85 }; 86 87 static int if_max_devs[IF_COUNT] = { 88 /* 89 * Do not change these numbers! They govern how drive option 90 * index maps to unit and bus. That mapping is ABI. 91 * 92 * All controllers used to implement if=T drives need to support 93 * if_max_devs[T] units, for any T with if_max_devs[T] != 0. 94 * Otherwise, some index values map to "impossible" bus, unit 95 * values. 96 * 97 * For instance, if you change [IF_SCSI] to 255, -drive 98 * if=scsi,index=12 no longer means bus=1,unit=5, but 99 * bus=0,unit=12. With an lsi53c895a controller (7 units max), 100 * the drive can't be set up. Regression. 101 */ 102 [IF_IDE] = 2, 103 [IF_SCSI] = 7, 104 }; 105 106 /** 107 * Boards may call this to offer board-by-board overrides 108 * of the default, global values. 109 */ 110 void override_max_devs(BlockInterfaceType type, int max_devs) 111 { 112 BlockBackend *blk; 113 DriveInfo *dinfo; 114 115 if (max_devs <= 0) { 116 return; 117 } 118 119 for (blk = blk_next(NULL); blk; blk = blk_next(blk)) { 120 dinfo = blk_legacy_dinfo(blk); 121 if (dinfo->type == type) { 122 fprintf(stderr, "Cannot override units-per-bus property of" 123 " the %s interface, because a drive of that type has" 124 " already been added.\n", if_name[type]); 125 g_assert_not_reached(); 126 } 127 } 128 129 if_max_devs[type] = max_devs; 130 } 131 132 /* 133 * We automatically delete the drive when a device using it gets 134 * unplugged. Questionable feature, but we can't just drop it. 135 * Device models call blockdev_mark_auto_del() to schedule the 136 * automatic deletion, and generic qdev code calls blockdev_auto_del() 137 * when deletion is actually safe. 138 */ 139 void blockdev_mark_auto_del(BlockBackend *blk) 140 { 141 DriveInfo *dinfo = blk_legacy_dinfo(blk); 142 BlockJob *job; 143 144 if (!dinfo) { 145 return; 146 } 147 148 for (job = block_job_next(NULL); job; job = block_job_next(job)) { 149 if (block_job_has_bdrv(job, blk_bs(blk))) { 150 AioContext *aio_context = job->job.aio_context; 151 aio_context_acquire(aio_context); 152 153 job_cancel(&job->job, false); 154 155 aio_context_release(aio_context); 156 } 157 } 158 159 dinfo->auto_del = 1; 160 } 161 162 void blockdev_auto_del(BlockBackend *blk) 163 { 164 DriveInfo *dinfo = blk_legacy_dinfo(blk); 165 166 if (dinfo && dinfo->auto_del) { 167 monitor_remove_blk(blk); 168 blk_unref(blk); 169 } 170 } 171 172 /** 173 * Returns the current mapping of how many units per bus 174 * a particular interface can support. 175 * 176 * A positive integer indicates n units per bus. 177 * 0 implies the mapping has not been established. 178 * -1 indicates an invalid BlockInterfaceType was given. 179 */ 180 int drive_get_max_devs(BlockInterfaceType type) 181 { 182 if (type >= IF_IDE && type < IF_COUNT) { 183 return if_max_devs[type]; 184 } 185 186 return -1; 187 } 188 189 static int drive_index_to_bus_id(BlockInterfaceType type, int index) 190 { 191 int max_devs = if_max_devs[type]; 192 return max_devs ? index / max_devs : 0; 193 } 194 195 static int drive_index_to_unit_id(BlockInterfaceType type, int index) 196 { 197 int max_devs = if_max_devs[type]; 198 return max_devs ? index % max_devs : index; 199 } 200 201 QemuOpts *drive_def(const char *optstr) 202 { 203 return qemu_opts_parse_noisily(qemu_find_opts("drive"), optstr, false); 204 } 205 206 QemuOpts *drive_add(BlockInterfaceType type, int index, const char *file, 207 const char *optstr) 208 { 209 QemuOpts *opts; 210 211 opts = drive_def(optstr); 212 if (!opts) { 213 return NULL; 214 } 215 if (type != IF_DEFAULT) { 216 qemu_opt_set(opts, "if", if_name[type], &error_abort); 217 } 218 if (index >= 0) { 219 qemu_opt_set_number(opts, "index", index, &error_abort); 220 } 221 if (file) 222 qemu_opt_set(opts, "file", file, &error_abort); 223 return opts; 224 } 225 226 DriveInfo *drive_get(BlockInterfaceType type, int bus, int unit) 227 { 228 BlockBackend *blk; 229 DriveInfo *dinfo; 230 231 for (blk = blk_next(NULL); blk; blk = blk_next(blk)) { 232 dinfo = blk_legacy_dinfo(blk); 233 if (dinfo && dinfo->type == type 234 && dinfo->bus == bus && dinfo->unit == unit) { 235 return dinfo; 236 } 237 } 238 239 return NULL; 240 } 241 242 /* 243 * Check board claimed all -drive that are meant to be claimed. 244 * Fatal error if any remain unclaimed. 245 */ 246 void drive_check_orphaned(void) 247 { 248 BlockBackend *blk; 249 DriveInfo *dinfo; 250 Location loc; 251 bool orphans = false; 252 253 for (blk = blk_next(NULL); blk; blk = blk_next(blk)) { 254 dinfo = blk_legacy_dinfo(blk); 255 /* 256 * Ignore default drives, because we create certain default 257 * drives unconditionally, then leave them unclaimed. Not the 258 * users fault. 259 * Ignore IF_VIRTIO, because it gets desugared into -device, 260 * so we can leave failing to -device. 261 * Ignore IF_NONE, because leaving unclaimed IF_NONE remains 262 * available for device_add is a feature. 263 */ 264 if (dinfo->is_default || dinfo->type == IF_VIRTIO 265 || dinfo->type == IF_NONE) { 266 continue; 267 } 268 if (!blk_get_attached_dev(blk)) { 269 loc_push_none(&loc); 270 qemu_opts_loc_restore(dinfo->opts); 271 error_report("machine type does not support" 272 " if=%s,bus=%d,unit=%d", 273 if_name[dinfo->type], dinfo->bus, dinfo->unit); 274 loc_pop(&loc); 275 orphans = true; 276 } 277 } 278 279 if (orphans) { 280 exit(1); 281 } 282 } 283 284 DriveInfo *drive_get_by_index(BlockInterfaceType type, int index) 285 { 286 return drive_get(type, 287 drive_index_to_bus_id(type, index), 288 drive_index_to_unit_id(type, index)); 289 } 290 291 int drive_get_max_bus(BlockInterfaceType type) 292 { 293 int max_bus; 294 BlockBackend *blk; 295 DriveInfo *dinfo; 296 297 max_bus = -1; 298 for (blk = blk_next(NULL); blk; blk = blk_next(blk)) { 299 dinfo = blk_legacy_dinfo(blk); 300 if (dinfo && dinfo->type == type && dinfo->bus > max_bus) { 301 max_bus = dinfo->bus; 302 } 303 } 304 return max_bus; 305 } 306 307 /* Get a block device. This should only be used for single-drive devices 308 (e.g. SD/Floppy/MTD). Multi-disk devices (scsi/ide) should use the 309 appropriate bus. */ 310 DriveInfo *drive_get_next(BlockInterfaceType type) 311 { 312 static int next_block_unit[IF_COUNT]; 313 314 return drive_get(type, 0, next_block_unit[type]++); 315 } 316 317 static void bdrv_format_print(void *opaque, const char *name) 318 { 319 qemu_printf(" %s", name); 320 } 321 322 typedef struct { 323 QEMUBH *bh; 324 BlockDriverState *bs; 325 } BDRVPutRefBH; 326 327 static int parse_block_error_action(const char *buf, bool is_read, Error **errp) 328 { 329 if (!strcmp(buf, "ignore")) { 330 return BLOCKDEV_ON_ERROR_IGNORE; 331 } else if (!is_read && !strcmp(buf, "enospc")) { 332 return BLOCKDEV_ON_ERROR_ENOSPC; 333 } else if (!strcmp(buf, "stop")) { 334 return BLOCKDEV_ON_ERROR_STOP; 335 } else if (!strcmp(buf, "report")) { 336 return BLOCKDEV_ON_ERROR_REPORT; 337 } else { 338 error_setg(errp, "'%s' invalid %s error action", 339 buf, is_read ? "read" : "write"); 340 return -1; 341 } 342 } 343 344 static bool parse_stats_intervals(BlockAcctStats *stats, QList *intervals, 345 Error **errp) 346 { 347 const QListEntry *entry; 348 for (entry = qlist_first(intervals); entry; entry = qlist_next(entry)) { 349 switch (qobject_type(entry->value)) { 350 351 case QTYPE_QSTRING: { 352 unsigned long long length; 353 const char *str = qstring_get_str(qobject_to(QString, 354 entry->value)); 355 if (parse_uint_full(str, &length, 10) == 0 && 356 length > 0 && length <= UINT_MAX) { 357 block_acct_add_interval(stats, (unsigned) length); 358 } else { 359 error_setg(errp, "Invalid interval length: %s", str); 360 return false; 361 } 362 break; 363 } 364 365 case QTYPE_QNUM: { 366 int64_t length = qnum_get_int(qobject_to(QNum, entry->value)); 367 368 if (length > 0 && length <= UINT_MAX) { 369 block_acct_add_interval(stats, (unsigned) length); 370 } else { 371 error_setg(errp, "Invalid interval length: %" PRId64, length); 372 return false; 373 } 374 break; 375 } 376 377 default: 378 error_setg(errp, "The specification of stats-intervals is invalid"); 379 return false; 380 } 381 } 382 return true; 383 } 384 385 typedef enum { MEDIA_DISK, MEDIA_CDROM } DriveMediaType; 386 387 /* All parameters but @opts are optional and may be set to NULL. */ 388 static void extract_common_blockdev_options(QemuOpts *opts, int *bdrv_flags, 389 const char **throttling_group, ThrottleConfig *throttle_cfg, 390 BlockdevDetectZeroesOptions *detect_zeroes, Error **errp) 391 { 392 Error *local_error = NULL; 393 const char *aio; 394 395 if (bdrv_flags) { 396 if (qemu_opt_get_bool(opts, "copy-on-read", false)) { 397 *bdrv_flags |= BDRV_O_COPY_ON_READ; 398 } 399 400 if ((aio = qemu_opt_get(opts, "aio")) != NULL) { 401 if (bdrv_parse_aio(aio, bdrv_flags) < 0) { 402 error_setg(errp, "invalid aio option"); 403 return; 404 } 405 } 406 } 407 408 /* disk I/O throttling */ 409 if (throttling_group) { 410 *throttling_group = qemu_opt_get(opts, "throttling.group"); 411 } 412 413 if (throttle_cfg) { 414 throttle_config_init(throttle_cfg); 415 throttle_cfg->buckets[THROTTLE_BPS_TOTAL].avg = 416 qemu_opt_get_number(opts, "throttling.bps-total", 0); 417 throttle_cfg->buckets[THROTTLE_BPS_READ].avg = 418 qemu_opt_get_number(opts, "throttling.bps-read", 0); 419 throttle_cfg->buckets[THROTTLE_BPS_WRITE].avg = 420 qemu_opt_get_number(opts, "throttling.bps-write", 0); 421 throttle_cfg->buckets[THROTTLE_OPS_TOTAL].avg = 422 qemu_opt_get_number(opts, "throttling.iops-total", 0); 423 throttle_cfg->buckets[THROTTLE_OPS_READ].avg = 424 qemu_opt_get_number(opts, "throttling.iops-read", 0); 425 throttle_cfg->buckets[THROTTLE_OPS_WRITE].avg = 426 qemu_opt_get_number(opts, "throttling.iops-write", 0); 427 428 throttle_cfg->buckets[THROTTLE_BPS_TOTAL].max = 429 qemu_opt_get_number(opts, "throttling.bps-total-max", 0); 430 throttle_cfg->buckets[THROTTLE_BPS_READ].max = 431 qemu_opt_get_number(opts, "throttling.bps-read-max", 0); 432 throttle_cfg->buckets[THROTTLE_BPS_WRITE].max = 433 qemu_opt_get_number(opts, "throttling.bps-write-max", 0); 434 throttle_cfg->buckets[THROTTLE_OPS_TOTAL].max = 435 qemu_opt_get_number(opts, "throttling.iops-total-max", 0); 436 throttle_cfg->buckets[THROTTLE_OPS_READ].max = 437 qemu_opt_get_number(opts, "throttling.iops-read-max", 0); 438 throttle_cfg->buckets[THROTTLE_OPS_WRITE].max = 439 qemu_opt_get_number(opts, "throttling.iops-write-max", 0); 440 441 throttle_cfg->buckets[THROTTLE_BPS_TOTAL].burst_length = 442 qemu_opt_get_number(opts, "throttling.bps-total-max-length", 1); 443 throttle_cfg->buckets[THROTTLE_BPS_READ].burst_length = 444 qemu_opt_get_number(opts, "throttling.bps-read-max-length", 1); 445 throttle_cfg->buckets[THROTTLE_BPS_WRITE].burst_length = 446 qemu_opt_get_number(opts, "throttling.bps-write-max-length", 1); 447 throttle_cfg->buckets[THROTTLE_OPS_TOTAL].burst_length = 448 qemu_opt_get_number(opts, "throttling.iops-total-max-length", 1); 449 throttle_cfg->buckets[THROTTLE_OPS_READ].burst_length = 450 qemu_opt_get_number(opts, "throttling.iops-read-max-length", 1); 451 throttle_cfg->buckets[THROTTLE_OPS_WRITE].burst_length = 452 qemu_opt_get_number(opts, "throttling.iops-write-max-length", 1); 453 454 throttle_cfg->op_size = 455 qemu_opt_get_number(opts, "throttling.iops-size", 0); 456 457 if (!throttle_is_valid(throttle_cfg, errp)) { 458 return; 459 } 460 } 461 462 if (detect_zeroes) { 463 *detect_zeroes = 464 qapi_enum_parse(&BlockdevDetectZeroesOptions_lookup, 465 qemu_opt_get(opts, "detect-zeroes"), 466 BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF, 467 &local_error); 468 if (local_error) { 469 error_propagate(errp, local_error); 470 return; 471 } 472 } 473 } 474 475 /* Takes the ownership of bs_opts */ 476 static BlockBackend *blockdev_init(const char *file, QDict *bs_opts, 477 Error **errp) 478 { 479 const char *buf; 480 int bdrv_flags = 0; 481 int on_read_error, on_write_error; 482 bool account_invalid, account_failed; 483 bool writethrough, read_only; 484 BlockBackend *blk; 485 BlockDriverState *bs; 486 ThrottleConfig cfg; 487 int snapshot = 0; 488 Error *error = NULL; 489 QemuOpts *opts; 490 QDict *interval_dict = NULL; 491 QList *interval_list = NULL; 492 const char *id; 493 BlockdevDetectZeroesOptions detect_zeroes = 494 BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF; 495 const char *throttling_group = NULL; 496 497 /* Check common options by copying from bs_opts to opts, all other options 498 * stay in bs_opts for processing by bdrv_open(). */ 499 id = qdict_get_try_str(bs_opts, "id"); 500 opts = qemu_opts_create(&qemu_common_drive_opts, id, 1, errp); 501 if (!opts) { 502 goto err_no_opts; 503 } 504 505 if (!qemu_opts_absorb_qdict(opts, bs_opts, errp)) { 506 goto early_err; 507 } 508 509 if (id) { 510 qdict_del(bs_opts, "id"); 511 } 512 513 /* extract parameters */ 514 snapshot = qemu_opt_get_bool(opts, "snapshot", 0); 515 516 account_invalid = qemu_opt_get_bool(opts, "stats-account-invalid", true); 517 account_failed = qemu_opt_get_bool(opts, "stats-account-failed", true); 518 519 writethrough = !qemu_opt_get_bool(opts, BDRV_OPT_CACHE_WB, true); 520 521 id = qemu_opts_id(opts); 522 523 qdict_extract_subqdict(bs_opts, &interval_dict, "stats-intervals."); 524 qdict_array_split(interval_dict, &interval_list); 525 526 if (qdict_size(interval_dict) != 0) { 527 error_setg(errp, "Invalid option stats-intervals.%s", 528 qdict_first(interval_dict)->key); 529 goto early_err; 530 } 531 532 extract_common_blockdev_options(opts, &bdrv_flags, &throttling_group, &cfg, 533 &detect_zeroes, &error); 534 if (error) { 535 error_propagate(errp, error); 536 goto early_err; 537 } 538 539 if ((buf = qemu_opt_get(opts, "format")) != NULL) { 540 if (is_help_option(buf)) { 541 qemu_printf("Supported formats:"); 542 bdrv_iterate_format(bdrv_format_print, NULL, false); 543 qemu_printf("\nSupported formats (read-only):"); 544 bdrv_iterate_format(bdrv_format_print, NULL, true); 545 qemu_printf("\n"); 546 goto early_err; 547 } 548 549 if (qdict_haskey(bs_opts, "driver")) { 550 error_setg(errp, "Cannot specify both 'driver' and 'format'"); 551 goto early_err; 552 } 553 qdict_put_str(bs_opts, "driver", buf); 554 } 555 556 on_write_error = BLOCKDEV_ON_ERROR_ENOSPC; 557 if ((buf = qemu_opt_get(opts, "werror")) != NULL) { 558 on_write_error = parse_block_error_action(buf, 0, &error); 559 if (error) { 560 error_propagate(errp, error); 561 goto early_err; 562 } 563 } 564 565 on_read_error = BLOCKDEV_ON_ERROR_REPORT; 566 if ((buf = qemu_opt_get(opts, "rerror")) != NULL) { 567 on_read_error = parse_block_error_action(buf, 1, &error); 568 if (error) { 569 error_propagate(errp, error); 570 goto early_err; 571 } 572 } 573 574 if (snapshot) { 575 bdrv_flags |= BDRV_O_SNAPSHOT; 576 } 577 578 read_only = qemu_opt_get_bool(opts, BDRV_OPT_READ_ONLY, false); 579 580 /* init */ 581 if ((!file || !*file) && !qdict_size(bs_opts)) { 582 BlockBackendRootState *blk_rs; 583 584 blk = blk_new(qemu_get_aio_context(), 0, BLK_PERM_ALL); 585 blk_rs = blk_get_root_state(blk); 586 blk_rs->open_flags = bdrv_flags | (read_only ? 0 : BDRV_O_RDWR); 587 blk_rs->detect_zeroes = detect_zeroes; 588 589 qobject_unref(bs_opts); 590 } else { 591 if (file && !*file) { 592 file = NULL; 593 } 594 595 /* bdrv_open() defaults to the values in bdrv_flags (for compatibility 596 * with other callers) rather than what we want as the real defaults. 597 * Apply the defaults here instead. */ 598 qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_DIRECT, "off"); 599 qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_NO_FLUSH, "off"); 600 qdict_set_default_str(bs_opts, BDRV_OPT_READ_ONLY, 601 read_only ? "on" : "off"); 602 qdict_set_default_str(bs_opts, BDRV_OPT_AUTO_READ_ONLY, "on"); 603 assert((bdrv_flags & BDRV_O_CACHE_MASK) == 0); 604 605 if (runstate_check(RUN_STATE_INMIGRATE)) { 606 bdrv_flags |= BDRV_O_INACTIVE; 607 } 608 609 blk = blk_new_open(file, NULL, bs_opts, bdrv_flags, errp); 610 if (!blk) { 611 goto err_no_bs_opts; 612 } 613 bs = blk_bs(blk); 614 615 bs->detect_zeroes = detect_zeroes; 616 617 block_acct_setup(blk_get_stats(blk), account_invalid, account_failed); 618 619 if (!parse_stats_intervals(blk_get_stats(blk), interval_list, errp)) { 620 blk_unref(blk); 621 blk = NULL; 622 goto err_no_bs_opts; 623 } 624 } 625 626 /* disk I/O throttling */ 627 if (throttle_enabled(&cfg)) { 628 if (!throttling_group) { 629 throttling_group = id; 630 } 631 blk_io_limits_enable(blk, throttling_group); 632 blk_set_io_limits(blk, &cfg); 633 } 634 635 blk_set_enable_write_cache(blk, !writethrough); 636 blk_set_on_error(blk, on_read_error, on_write_error); 637 638 if (!monitor_add_blk(blk, id, errp)) { 639 blk_unref(blk); 640 blk = NULL; 641 goto err_no_bs_opts; 642 } 643 644 err_no_bs_opts: 645 qemu_opts_del(opts); 646 qobject_unref(interval_dict); 647 qobject_unref(interval_list); 648 return blk; 649 650 early_err: 651 qemu_opts_del(opts); 652 qobject_unref(interval_dict); 653 qobject_unref(interval_list); 654 err_no_opts: 655 qobject_unref(bs_opts); 656 return NULL; 657 } 658 659 /* Takes the ownership of bs_opts */ 660 BlockDriverState *bds_tree_init(QDict *bs_opts, Error **errp) 661 { 662 int bdrv_flags = 0; 663 664 /* bdrv_open() defaults to the values in bdrv_flags (for compatibility 665 * with other callers) rather than what we want as the real defaults. 666 * Apply the defaults here instead. */ 667 qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_DIRECT, "off"); 668 qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_NO_FLUSH, "off"); 669 qdict_set_default_str(bs_opts, BDRV_OPT_READ_ONLY, "off"); 670 671 if (runstate_check(RUN_STATE_INMIGRATE)) { 672 bdrv_flags |= BDRV_O_INACTIVE; 673 } 674 675 return bdrv_open(NULL, NULL, bs_opts, bdrv_flags, errp); 676 } 677 678 void blockdev_close_all_bdrv_states(void) 679 { 680 BlockDriverState *bs, *next_bs; 681 682 QTAILQ_FOREACH_SAFE(bs, &monitor_bdrv_states, monitor_list, next_bs) { 683 AioContext *ctx = bdrv_get_aio_context(bs); 684 685 aio_context_acquire(ctx); 686 bdrv_unref(bs); 687 aio_context_release(ctx); 688 } 689 } 690 691 /* Iterates over the list of monitor-owned BlockDriverStates */ 692 BlockDriverState *bdrv_next_monitor_owned(BlockDriverState *bs) 693 { 694 return bs ? QTAILQ_NEXT(bs, monitor_list) 695 : QTAILQ_FIRST(&monitor_bdrv_states); 696 } 697 698 static bool qemu_opt_rename(QemuOpts *opts, const char *from, const char *to, 699 Error **errp) 700 { 701 const char *value; 702 703 value = qemu_opt_get(opts, from); 704 if (value) { 705 if (qemu_opt_find(opts, to)) { 706 error_setg(errp, "'%s' and its alias '%s' can't be used at the " 707 "same time", to, from); 708 return false; 709 } 710 } 711 712 /* rename all items in opts */ 713 while ((value = qemu_opt_get(opts, from))) { 714 qemu_opt_set(opts, to, value, &error_abort); 715 qemu_opt_unset(opts, from); 716 } 717 return true; 718 } 719 720 QemuOptsList qemu_legacy_drive_opts = { 721 .name = "drive", 722 .head = QTAILQ_HEAD_INITIALIZER(qemu_legacy_drive_opts.head), 723 .desc = { 724 { 725 .name = "bus", 726 .type = QEMU_OPT_NUMBER, 727 .help = "bus number", 728 },{ 729 .name = "unit", 730 .type = QEMU_OPT_NUMBER, 731 .help = "unit number (i.e. lun for scsi)", 732 },{ 733 .name = "index", 734 .type = QEMU_OPT_NUMBER, 735 .help = "index number", 736 },{ 737 .name = "media", 738 .type = QEMU_OPT_STRING, 739 .help = "media type (disk, cdrom)", 740 },{ 741 .name = "if", 742 .type = QEMU_OPT_STRING, 743 .help = "interface (ide, scsi, sd, mtd, floppy, pflash, virtio)", 744 },{ 745 .name = "file", 746 .type = QEMU_OPT_STRING, 747 .help = "file name", 748 }, 749 750 /* Options that are passed on, but have special semantics with -drive */ 751 { 752 .name = BDRV_OPT_READ_ONLY, 753 .type = QEMU_OPT_BOOL, 754 .help = "open drive file as read-only", 755 },{ 756 .name = "rerror", 757 .type = QEMU_OPT_STRING, 758 .help = "read error action", 759 },{ 760 .name = "werror", 761 .type = QEMU_OPT_STRING, 762 .help = "write error action", 763 },{ 764 .name = "copy-on-read", 765 .type = QEMU_OPT_BOOL, 766 .help = "copy read data from backing file into image file", 767 }, 768 769 { /* end of list */ } 770 }, 771 }; 772 773 DriveInfo *drive_new(QemuOpts *all_opts, BlockInterfaceType block_default_type, 774 Error **errp) 775 { 776 const char *value; 777 BlockBackend *blk; 778 DriveInfo *dinfo = NULL; 779 QDict *bs_opts; 780 QemuOpts *legacy_opts; 781 DriveMediaType media = MEDIA_DISK; 782 BlockInterfaceType type; 783 int max_devs, bus_id, unit_id, index; 784 const char *werror, *rerror; 785 bool read_only = false; 786 bool copy_on_read; 787 const char *filename; 788 int i; 789 790 /* Change legacy command line options into QMP ones */ 791 static const struct { 792 const char *from; 793 const char *to; 794 } opt_renames[] = { 795 { "iops", "throttling.iops-total" }, 796 { "iops_rd", "throttling.iops-read" }, 797 { "iops_wr", "throttling.iops-write" }, 798 799 { "bps", "throttling.bps-total" }, 800 { "bps_rd", "throttling.bps-read" }, 801 { "bps_wr", "throttling.bps-write" }, 802 803 { "iops_max", "throttling.iops-total-max" }, 804 { "iops_rd_max", "throttling.iops-read-max" }, 805 { "iops_wr_max", "throttling.iops-write-max" }, 806 807 { "bps_max", "throttling.bps-total-max" }, 808 { "bps_rd_max", "throttling.bps-read-max" }, 809 { "bps_wr_max", "throttling.bps-write-max" }, 810 811 { "iops_size", "throttling.iops-size" }, 812 813 { "group", "throttling.group" }, 814 815 { "readonly", BDRV_OPT_READ_ONLY }, 816 }; 817 818 for (i = 0; i < ARRAY_SIZE(opt_renames); i++) { 819 if (!qemu_opt_rename(all_opts, opt_renames[i].from, 820 opt_renames[i].to, errp)) { 821 return NULL; 822 } 823 } 824 825 value = qemu_opt_get(all_opts, "cache"); 826 if (value) { 827 int flags = 0; 828 bool writethrough; 829 830 if (bdrv_parse_cache_mode(value, &flags, &writethrough) != 0) { 831 error_setg(errp, "invalid cache option"); 832 return NULL; 833 } 834 835 /* Specific options take precedence */ 836 if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_WB)) { 837 qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_WB, 838 !writethrough, &error_abort); 839 } 840 if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_DIRECT)) { 841 qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_DIRECT, 842 !!(flags & BDRV_O_NOCACHE), &error_abort); 843 } 844 if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_NO_FLUSH)) { 845 qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_NO_FLUSH, 846 !!(flags & BDRV_O_NO_FLUSH), &error_abort); 847 } 848 qemu_opt_unset(all_opts, "cache"); 849 } 850 851 /* Get a QDict for processing the options */ 852 bs_opts = qdict_new(); 853 qemu_opts_to_qdict(all_opts, bs_opts); 854 855 legacy_opts = qemu_opts_create(&qemu_legacy_drive_opts, NULL, 0, 856 &error_abort); 857 if (!qemu_opts_absorb_qdict(legacy_opts, bs_opts, errp)) { 858 goto fail; 859 } 860 861 /* Media type */ 862 value = qemu_opt_get(legacy_opts, "media"); 863 if (value) { 864 if (!strcmp(value, "disk")) { 865 media = MEDIA_DISK; 866 } else if (!strcmp(value, "cdrom")) { 867 media = MEDIA_CDROM; 868 read_only = true; 869 } else { 870 error_setg(errp, "'%s' invalid media", value); 871 goto fail; 872 } 873 } 874 875 /* copy-on-read is disabled with a warning for read-only devices */ 876 read_only |= qemu_opt_get_bool(legacy_opts, BDRV_OPT_READ_ONLY, false); 877 copy_on_read = qemu_opt_get_bool(legacy_opts, "copy-on-read", false); 878 879 if (read_only && copy_on_read) { 880 warn_report("disabling copy-on-read on read-only drive"); 881 copy_on_read = false; 882 } 883 884 qdict_put_str(bs_opts, BDRV_OPT_READ_ONLY, read_only ? "on" : "off"); 885 qdict_put_str(bs_opts, "copy-on-read", copy_on_read ? "on" : "off"); 886 887 /* Controller type */ 888 value = qemu_opt_get(legacy_opts, "if"); 889 if (value) { 890 for (type = 0; 891 type < IF_COUNT && strcmp(value, if_name[type]); 892 type++) { 893 } 894 if (type == IF_COUNT) { 895 error_setg(errp, "unsupported bus type '%s'", value); 896 goto fail; 897 } 898 } else { 899 type = block_default_type; 900 } 901 902 /* Device address specified by bus/unit or index. 903 * If none was specified, try to find the first free one. */ 904 bus_id = qemu_opt_get_number(legacy_opts, "bus", 0); 905 unit_id = qemu_opt_get_number(legacy_opts, "unit", -1); 906 index = qemu_opt_get_number(legacy_opts, "index", -1); 907 908 max_devs = if_max_devs[type]; 909 910 if (index != -1) { 911 if (bus_id != 0 || unit_id != -1) { 912 error_setg(errp, "index cannot be used with bus and unit"); 913 goto fail; 914 } 915 bus_id = drive_index_to_bus_id(type, index); 916 unit_id = drive_index_to_unit_id(type, index); 917 } 918 919 if (unit_id == -1) { 920 unit_id = 0; 921 while (drive_get(type, bus_id, unit_id) != NULL) { 922 unit_id++; 923 if (max_devs && unit_id >= max_devs) { 924 unit_id -= max_devs; 925 bus_id++; 926 } 927 } 928 } 929 930 if (max_devs && unit_id >= max_devs) { 931 error_setg(errp, "unit %d too big (max is %d)", unit_id, max_devs - 1); 932 goto fail; 933 } 934 935 if (drive_get(type, bus_id, unit_id) != NULL) { 936 error_setg(errp, "drive with bus=%d, unit=%d (index=%d) exists", 937 bus_id, unit_id, index); 938 goto fail; 939 } 940 941 /* no id supplied -> create one */ 942 if (qemu_opts_id(all_opts) == NULL) { 943 char *new_id; 944 const char *mediastr = ""; 945 if (type == IF_IDE || type == IF_SCSI) { 946 mediastr = (media == MEDIA_CDROM) ? "-cd" : "-hd"; 947 } 948 if (max_devs) { 949 new_id = g_strdup_printf("%s%i%s%i", if_name[type], bus_id, 950 mediastr, unit_id); 951 } else { 952 new_id = g_strdup_printf("%s%s%i", if_name[type], 953 mediastr, unit_id); 954 } 955 qdict_put_str(bs_opts, "id", new_id); 956 g_free(new_id); 957 } 958 959 /* Add virtio block device */ 960 if (type == IF_VIRTIO) { 961 QemuOpts *devopts; 962 devopts = qemu_opts_create(qemu_find_opts("device"), NULL, 0, 963 &error_abort); 964 qemu_opt_set(devopts, "driver", "virtio-blk", &error_abort); 965 qemu_opt_set(devopts, "drive", qdict_get_str(bs_opts, "id"), 966 &error_abort); 967 } 968 969 filename = qemu_opt_get(legacy_opts, "file"); 970 971 /* Check werror/rerror compatibility with if=... */ 972 werror = qemu_opt_get(legacy_opts, "werror"); 973 if (werror != NULL) { 974 if (type != IF_IDE && type != IF_SCSI && type != IF_VIRTIO && 975 type != IF_NONE) { 976 error_setg(errp, "werror is not supported by this bus type"); 977 goto fail; 978 } 979 qdict_put_str(bs_opts, "werror", werror); 980 } 981 982 rerror = qemu_opt_get(legacy_opts, "rerror"); 983 if (rerror != NULL) { 984 if (type != IF_IDE && type != IF_VIRTIO && type != IF_SCSI && 985 type != IF_NONE) { 986 error_setg(errp, "rerror is not supported by this bus type"); 987 goto fail; 988 } 989 qdict_put_str(bs_opts, "rerror", rerror); 990 } 991 992 /* Actual block device init: Functionality shared with blockdev-add */ 993 blk = blockdev_init(filename, bs_opts, errp); 994 bs_opts = NULL; 995 if (!blk) { 996 goto fail; 997 } 998 999 /* Create legacy DriveInfo */ 1000 dinfo = g_malloc0(sizeof(*dinfo)); 1001 dinfo->opts = all_opts; 1002 1003 dinfo->type = type; 1004 dinfo->bus = bus_id; 1005 dinfo->unit = unit_id; 1006 1007 blk_set_legacy_dinfo(blk, dinfo); 1008 1009 switch(type) { 1010 case IF_IDE: 1011 case IF_SCSI: 1012 case IF_XEN: 1013 case IF_NONE: 1014 dinfo->media_cd = media == MEDIA_CDROM; 1015 break; 1016 default: 1017 break; 1018 } 1019 1020 fail: 1021 qemu_opts_del(legacy_opts); 1022 qobject_unref(bs_opts); 1023 return dinfo; 1024 } 1025 1026 static BlockDriverState *qmp_get_root_bs(const char *name, Error **errp) 1027 { 1028 BlockDriverState *bs; 1029 1030 bs = bdrv_lookup_bs(name, name, errp); 1031 if (bs == NULL) { 1032 return NULL; 1033 } 1034 1035 if (!bdrv_is_root_node(bs)) { 1036 error_setg(errp, "Need a root block node"); 1037 return NULL; 1038 } 1039 1040 if (!bdrv_is_inserted(bs)) { 1041 error_setg(errp, "Device has no medium"); 1042 return NULL; 1043 } 1044 1045 return bs; 1046 } 1047 1048 static void blockdev_do_action(TransactionAction *action, Error **errp) 1049 { 1050 TransactionActionList list; 1051 1052 list.value = action; 1053 list.next = NULL; 1054 qmp_transaction(&list, false, NULL, errp); 1055 } 1056 1057 void qmp_blockdev_snapshot_sync(bool has_device, const char *device, 1058 bool has_node_name, const char *node_name, 1059 const char *snapshot_file, 1060 bool has_snapshot_node_name, 1061 const char *snapshot_node_name, 1062 bool has_format, const char *format, 1063 bool has_mode, NewImageMode mode, Error **errp) 1064 { 1065 BlockdevSnapshotSync snapshot = { 1066 .has_device = has_device, 1067 .device = (char *) device, 1068 .has_node_name = has_node_name, 1069 .node_name = (char *) node_name, 1070 .snapshot_file = (char *) snapshot_file, 1071 .has_snapshot_node_name = has_snapshot_node_name, 1072 .snapshot_node_name = (char *) snapshot_node_name, 1073 .has_format = has_format, 1074 .format = (char *) format, 1075 .has_mode = has_mode, 1076 .mode = mode, 1077 }; 1078 TransactionAction action = { 1079 .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC, 1080 .u.blockdev_snapshot_sync.data = &snapshot, 1081 }; 1082 blockdev_do_action(&action, errp); 1083 } 1084 1085 void qmp_blockdev_snapshot(const char *node, const char *overlay, 1086 Error **errp) 1087 { 1088 BlockdevSnapshot snapshot_data = { 1089 .node = (char *) node, 1090 .overlay = (char *) overlay 1091 }; 1092 TransactionAction action = { 1093 .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT, 1094 .u.blockdev_snapshot.data = &snapshot_data, 1095 }; 1096 blockdev_do_action(&action, errp); 1097 } 1098 1099 void qmp_blockdev_snapshot_internal_sync(const char *device, 1100 const char *name, 1101 Error **errp) 1102 { 1103 BlockdevSnapshotInternal snapshot = { 1104 .device = (char *) device, 1105 .name = (char *) name 1106 }; 1107 TransactionAction action = { 1108 .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC, 1109 .u.blockdev_snapshot_internal_sync.data = &snapshot, 1110 }; 1111 blockdev_do_action(&action, errp); 1112 } 1113 1114 SnapshotInfo *qmp_blockdev_snapshot_delete_internal_sync(const char *device, 1115 bool has_id, 1116 const char *id, 1117 bool has_name, 1118 const char *name, 1119 Error **errp) 1120 { 1121 BlockDriverState *bs; 1122 AioContext *aio_context; 1123 QEMUSnapshotInfo sn; 1124 Error *local_err = NULL; 1125 SnapshotInfo *info = NULL; 1126 int ret; 1127 1128 bs = qmp_get_root_bs(device, errp); 1129 if (!bs) { 1130 return NULL; 1131 } 1132 aio_context = bdrv_get_aio_context(bs); 1133 aio_context_acquire(aio_context); 1134 1135 if (!has_id) { 1136 id = NULL; 1137 } 1138 1139 if (!has_name) { 1140 name = NULL; 1141 } 1142 1143 if (!id && !name) { 1144 error_setg(errp, "Name or id must be provided"); 1145 goto out_aio_context; 1146 } 1147 1148 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_INTERNAL_SNAPSHOT_DELETE, errp)) { 1149 goto out_aio_context; 1150 } 1151 1152 ret = bdrv_snapshot_find_by_id_and_name(bs, id, name, &sn, &local_err); 1153 if (local_err) { 1154 error_propagate(errp, local_err); 1155 goto out_aio_context; 1156 } 1157 if (!ret) { 1158 error_setg(errp, 1159 "Snapshot with id '%s' and name '%s' does not exist on " 1160 "device '%s'", 1161 STR_OR_NULL(id), STR_OR_NULL(name), device); 1162 goto out_aio_context; 1163 } 1164 1165 bdrv_snapshot_delete(bs, id, name, &local_err); 1166 if (local_err) { 1167 error_propagate(errp, local_err); 1168 goto out_aio_context; 1169 } 1170 1171 aio_context_release(aio_context); 1172 1173 info = g_new0(SnapshotInfo, 1); 1174 info->id = g_strdup(sn.id_str); 1175 info->name = g_strdup(sn.name); 1176 info->date_nsec = sn.date_nsec; 1177 info->date_sec = sn.date_sec; 1178 info->vm_state_size = sn.vm_state_size; 1179 info->vm_clock_nsec = sn.vm_clock_nsec % 1000000000; 1180 info->vm_clock_sec = sn.vm_clock_nsec / 1000000000; 1181 if (sn.icount != -1ULL) { 1182 info->icount = sn.icount; 1183 info->has_icount = true; 1184 } 1185 1186 return info; 1187 1188 out_aio_context: 1189 aio_context_release(aio_context); 1190 return NULL; 1191 } 1192 1193 /* New and old BlockDriverState structs for atomic group operations */ 1194 1195 typedef struct BlkActionState BlkActionState; 1196 1197 /** 1198 * BlkActionOps: 1199 * Table of operations that define an Action. 1200 * 1201 * @instance_size: Size of state struct, in bytes. 1202 * @prepare: Prepare the work, must NOT be NULL. 1203 * @commit: Commit the changes, can be NULL. 1204 * @abort: Abort the changes on fail, can be NULL. 1205 * @clean: Clean up resources after all transaction actions have called 1206 * commit() or abort(). Can be NULL. 1207 * 1208 * Only prepare() may fail. In a single transaction, only one of commit() or 1209 * abort() will be called. clean() will always be called if it is present. 1210 */ 1211 typedef struct BlkActionOps { 1212 size_t instance_size; 1213 void (*prepare)(BlkActionState *common, Error **errp); 1214 void (*commit)(BlkActionState *common); 1215 void (*abort)(BlkActionState *common); 1216 void (*clean)(BlkActionState *common); 1217 } BlkActionOps; 1218 1219 /** 1220 * BlkActionState: 1221 * Describes one Action's state within a Transaction. 1222 * 1223 * @action: QAPI-defined enum identifying which Action to perform. 1224 * @ops: Table of ActionOps this Action can perform. 1225 * @block_job_txn: Transaction which this action belongs to. 1226 * @entry: List membership for all Actions in this Transaction. 1227 * 1228 * This structure must be arranged as first member in a subclassed type, 1229 * assuming that the compiler will also arrange it to the same offsets as the 1230 * base class. 1231 */ 1232 struct BlkActionState { 1233 TransactionAction *action; 1234 const BlkActionOps *ops; 1235 JobTxn *block_job_txn; 1236 TransactionProperties *txn_props; 1237 QTAILQ_ENTRY(BlkActionState) entry; 1238 }; 1239 1240 /* internal snapshot private data */ 1241 typedef struct InternalSnapshotState { 1242 BlkActionState common; 1243 BlockDriverState *bs; 1244 QEMUSnapshotInfo sn; 1245 bool created; 1246 } InternalSnapshotState; 1247 1248 1249 static int action_check_completion_mode(BlkActionState *s, Error **errp) 1250 { 1251 if (s->txn_props->completion_mode != ACTION_COMPLETION_MODE_INDIVIDUAL) { 1252 error_setg(errp, 1253 "Action '%s' does not support Transaction property " 1254 "completion-mode = %s", 1255 TransactionActionKind_str(s->action->type), 1256 ActionCompletionMode_str(s->txn_props->completion_mode)); 1257 return -1; 1258 } 1259 return 0; 1260 } 1261 1262 static void internal_snapshot_prepare(BlkActionState *common, 1263 Error **errp) 1264 { 1265 Error *local_err = NULL; 1266 const char *device; 1267 const char *name; 1268 BlockDriverState *bs; 1269 QEMUSnapshotInfo old_sn, *sn; 1270 bool ret; 1271 qemu_timeval tv; 1272 BlockdevSnapshotInternal *internal; 1273 InternalSnapshotState *state; 1274 AioContext *aio_context; 1275 int ret1; 1276 1277 g_assert(common->action->type == 1278 TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC); 1279 internal = common->action->u.blockdev_snapshot_internal_sync.data; 1280 state = DO_UPCAST(InternalSnapshotState, common, common); 1281 1282 /* 1. parse input */ 1283 device = internal->device; 1284 name = internal->name; 1285 1286 /* 2. check for validation */ 1287 if (action_check_completion_mode(common, errp) < 0) { 1288 return; 1289 } 1290 1291 bs = qmp_get_root_bs(device, errp); 1292 if (!bs) { 1293 return; 1294 } 1295 1296 aio_context = bdrv_get_aio_context(bs); 1297 aio_context_acquire(aio_context); 1298 1299 state->bs = bs; 1300 1301 /* Paired with .clean() */ 1302 bdrv_drained_begin(bs); 1303 1304 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_INTERNAL_SNAPSHOT, errp)) { 1305 goto out; 1306 } 1307 1308 if (bdrv_is_read_only(bs)) { 1309 error_setg(errp, "Device '%s' is read only", device); 1310 goto out; 1311 } 1312 1313 if (!bdrv_can_snapshot(bs)) { 1314 error_setg(errp, "Block format '%s' used by device '%s' " 1315 "does not support internal snapshots", 1316 bs->drv->format_name, device); 1317 goto out; 1318 } 1319 1320 if (!strlen(name)) { 1321 error_setg(errp, "Name is empty"); 1322 goto out; 1323 } 1324 1325 /* check whether a snapshot with name exist */ 1326 ret = bdrv_snapshot_find_by_id_and_name(bs, NULL, name, &old_sn, 1327 &local_err); 1328 if (local_err) { 1329 error_propagate(errp, local_err); 1330 goto out; 1331 } else if (ret) { 1332 error_setg(errp, 1333 "Snapshot with name '%s' already exists on device '%s'", 1334 name, device); 1335 goto out; 1336 } 1337 1338 /* 3. take the snapshot */ 1339 sn = &state->sn; 1340 pstrcpy(sn->name, sizeof(sn->name), name); 1341 qemu_gettimeofday(&tv); 1342 sn->date_sec = tv.tv_sec; 1343 sn->date_nsec = tv.tv_usec * 1000; 1344 sn->vm_clock_nsec = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL); 1345 if (replay_mode != REPLAY_MODE_NONE) { 1346 sn->icount = replay_get_current_icount(); 1347 } else { 1348 sn->icount = -1ULL; 1349 } 1350 1351 ret1 = bdrv_snapshot_create(bs, sn); 1352 if (ret1 < 0) { 1353 error_setg_errno(errp, -ret1, 1354 "Failed to create snapshot '%s' on device '%s'", 1355 name, device); 1356 goto out; 1357 } 1358 1359 /* 4. succeed, mark a snapshot is created */ 1360 state->created = true; 1361 1362 out: 1363 aio_context_release(aio_context); 1364 } 1365 1366 static void internal_snapshot_abort(BlkActionState *common) 1367 { 1368 InternalSnapshotState *state = 1369 DO_UPCAST(InternalSnapshotState, common, common); 1370 BlockDriverState *bs = state->bs; 1371 QEMUSnapshotInfo *sn = &state->sn; 1372 AioContext *aio_context; 1373 Error *local_error = NULL; 1374 1375 if (!state->created) { 1376 return; 1377 } 1378 1379 aio_context = bdrv_get_aio_context(state->bs); 1380 aio_context_acquire(aio_context); 1381 1382 if (bdrv_snapshot_delete(bs, sn->id_str, sn->name, &local_error) < 0) { 1383 error_reportf_err(local_error, 1384 "Failed to delete snapshot with id '%s' and " 1385 "name '%s' on device '%s' in abort: ", 1386 sn->id_str, sn->name, 1387 bdrv_get_device_name(bs)); 1388 } 1389 1390 aio_context_release(aio_context); 1391 } 1392 1393 static void internal_snapshot_clean(BlkActionState *common) 1394 { 1395 InternalSnapshotState *state = DO_UPCAST(InternalSnapshotState, 1396 common, common); 1397 AioContext *aio_context; 1398 1399 if (!state->bs) { 1400 return; 1401 } 1402 1403 aio_context = bdrv_get_aio_context(state->bs); 1404 aio_context_acquire(aio_context); 1405 1406 bdrv_drained_end(state->bs); 1407 1408 aio_context_release(aio_context); 1409 } 1410 1411 /* external snapshot private data */ 1412 typedef struct ExternalSnapshotState { 1413 BlkActionState common; 1414 BlockDriverState *old_bs; 1415 BlockDriverState *new_bs; 1416 bool overlay_appended; 1417 } ExternalSnapshotState; 1418 1419 static void external_snapshot_prepare(BlkActionState *common, 1420 Error **errp) 1421 { 1422 int ret; 1423 int flags = 0; 1424 QDict *options = NULL; 1425 Error *local_err = NULL; 1426 /* Device and node name of the image to generate the snapshot from */ 1427 const char *device; 1428 const char *node_name; 1429 /* Reference to the new image (for 'blockdev-snapshot') */ 1430 const char *snapshot_ref; 1431 /* File name of the new image (for 'blockdev-snapshot-sync') */ 1432 const char *new_image_file; 1433 ExternalSnapshotState *state = 1434 DO_UPCAST(ExternalSnapshotState, common, common); 1435 TransactionAction *action = common->action; 1436 AioContext *aio_context; 1437 uint64_t perm, shared; 1438 1439 /* 'blockdev-snapshot' and 'blockdev-snapshot-sync' have similar 1440 * purpose but a different set of parameters */ 1441 switch (action->type) { 1442 case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT: 1443 { 1444 BlockdevSnapshot *s = action->u.blockdev_snapshot.data; 1445 device = s->node; 1446 node_name = s->node; 1447 new_image_file = NULL; 1448 snapshot_ref = s->overlay; 1449 } 1450 break; 1451 case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC: 1452 { 1453 BlockdevSnapshotSync *s = action->u.blockdev_snapshot_sync.data; 1454 device = s->has_device ? s->device : NULL; 1455 node_name = s->has_node_name ? s->node_name : NULL; 1456 new_image_file = s->snapshot_file; 1457 snapshot_ref = NULL; 1458 } 1459 break; 1460 default: 1461 g_assert_not_reached(); 1462 } 1463 1464 /* start processing */ 1465 if (action_check_completion_mode(common, errp) < 0) { 1466 return; 1467 } 1468 1469 state->old_bs = bdrv_lookup_bs(device, node_name, errp); 1470 if (!state->old_bs) { 1471 return; 1472 } 1473 1474 aio_context = bdrv_get_aio_context(state->old_bs); 1475 aio_context_acquire(aio_context); 1476 1477 /* Paired with .clean() */ 1478 bdrv_drained_begin(state->old_bs); 1479 1480 if (!bdrv_is_inserted(state->old_bs)) { 1481 error_setg(errp, QERR_DEVICE_HAS_NO_MEDIUM, device); 1482 goto out; 1483 } 1484 1485 if (bdrv_op_is_blocked(state->old_bs, 1486 BLOCK_OP_TYPE_EXTERNAL_SNAPSHOT, errp)) { 1487 goto out; 1488 } 1489 1490 if (!bdrv_is_read_only(state->old_bs)) { 1491 if (bdrv_flush(state->old_bs)) { 1492 error_setg(errp, QERR_IO_ERROR); 1493 goto out; 1494 } 1495 } 1496 1497 if (action->type == TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC) { 1498 BlockdevSnapshotSync *s = action->u.blockdev_snapshot_sync.data; 1499 const char *format = s->has_format ? s->format : "qcow2"; 1500 enum NewImageMode mode; 1501 const char *snapshot_node_name = 1502 s->has_snapshot_node_name ? s->snapshot_node_name : NULL; 1503 1504 if (node_name && !snapshot_node_name) { 1505 error_setg(errp, "New overlay node-name missing"); 1506 goto out; 1507 } 1508 1509 if (snapshot_node_name && 1510 bdrv_lookup_bs(snapshot_node_name, snapshot_node_name, NULL)) { 1511 error_setg(errp, "New overlay node-name already in use"); 1512 goto out; 1513 } 1514 1515 flags = state->old_bs->open_flags; 1516 flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_COPY_ON_READ); 1517 flags |= BDRV_O_NO_BACKING; 1518 1519 /* create new image w/backing file */ 1520 mode = s->has_mode ? s->mode : NEW_IMAGE_MODE_ABSOLUTE_PATHS; 1521 if (mode != NEW_IMAGE_MODE_EXISTING) { 1522 int64_t size = bdrv_getlength(state->old_bs); 1523 if (size < 0) { 1524 error_setg_errno(errp, -size, "bdrv_getlength failed"); 1525 goto out; 1526 } 1527 bdrv_refresh_filename(state->old_bs); 1528 bdrv_img_create(new_image_file, format, 1529 state->old_bs->filename, 1530 state->old_bs->drv->format_name, 1531 NULL, size, flags, false, &local_err); 1532 if (local_err) { 1533 error_propagate(errp, local_err); 1534 goto out; 1535 } 1536 } 1537 1538 options = qdict_new(); 1539 if (snapshot_node_name) { 1540 qdict_put_str(options, "node-name", snapshot_node_name); 1541 } 1542 qdict_put_str(options, "driver", format); 1543 } 1544 1545 state->new_bs = bdrv_open(new_image_file, snapshot_ref, options, flags, 1546 errp); 1547 /* We will manually add the backing_hd field to the bs later */ 1548 if (!state->new_bs) { 1549 goto out; 1550 } 1551 1552 /* 1553 * Allow attaching a backing file to an overlay that's already in use only 1554 * if the parents don't assume that they are already seeing a valid image. 1555 * (Specifically, allow it as a mirror target, which is write-only access.) 1556 */ 1557 bdrv_get_cumulative_perm(state->new_bs, &perm, &shared); 1558 if (perm & BLK_PERM_CONSISTENT_READ) { 1559 error_setg(errp, "The overlay is already in use"); 1560 goto out; 1561 } 1562 1563 if (state->new_bs->drv->is_filter) { 1564 error_setg(errp, "Filters cannot be used as overlays"); 1565 goto out; 1566 } 1567 1568 if (bdrv_cow_child(state->new_bs)) { 1569 error_setg(errp, "The overlay already has a backing image"); 1570 goto out; 1571 } 1572 1573 if (!state->new_bs->drv->supports_backing) { 1574 error_setg(errp, "The overlay does not support backing images"); 1575 goto out; 1576 } 1577 1578 ret = bdrv_append(state->new_bs, state->old_bs, errp); 1579 if (ret < 0) { 1580 goto out; 1581 } 1582 state->overlay_appended = true; 1583 1584 out: 1585 aio_context_release(aio_context); 1586 } 1587 1588 static void external_snapshot_commit(BlkActionState *common) 1589 { 1590 ExternalSnapshotState *state = 1591 DO_UPCAST(ExternalSnapshotState, common, common); 1592 AioContext *aio_context; 1593 1594 aio_context = bdrv_get_aio_context(state->old_bs); 1595 aio_context_acquire(aio_context); 1596 1597 /* We don't need (or want) to use the transactional 1598 * bdrv_reopen_multiple() across all the entries at once, because we 1599 * don't want to abort all of them if one of them fails the reopen */ 1600 if (!qatomic_read(&state->old_bs->copy_on_read)) { 1601 bdrv_reopen_set_read_only(state->old_bs, true, NULL); 1602 } 1603 1604 aio_context_release(aio_context); 1605 } 1606 1607 static void external_snapshot_abort(BlkActionState *common) 1608 { 1609 ExternalSnapshotState *state = 1610 DO_UPCAST(ExternalSnapshotState, common, common); 1611 if (state->new_bs) { 1612 if (state->overlay_appended) { 1613 AioContext *aio_context; 1614 AioContext *tmp_context; 1615 int ret; 1616 1617 aio_context = bdrv_get_aio_context(state->old_bs); 1618 aio_context_acquire(aio_context); 1619 1620 bdrv_ref(state->old_bs); /* we can't let bdrv_set_backind_hd() 1621 close state->old_bs; we need it */ 1622 bdrv_set_backing_hd(state->new_bs, NULL, &error_abort); 1623 1624 /* 1625 * The call to bdrv_set_backing_hd() above returns state->old_bs to 1626 * the main AioContext. As we're still going to be using it, return 1627 * it to the AioContext it was before. 1628 */ 1629 tmp_context = bdrv_get_aio_context(state->old_bs); 1630 if (aio_context != tmp_context) { 1631 aio_context_release(aio_context); 1632 aio_context_acquire(tmp_context); 1633 1634 ret = bdrv_try_set_aio_context(state->old_bs, 1635 aio_context, NULL); 1636 assert(ret == 0); 1637 1638 aio_context_release(tmp_context); 1639 aio_context_acquire(aio_context); 1640 } 1641 1642 bdrv_replace_node(state->new_bs, state->old_bs, &error_abort); 1643 bdrv_unref(state->old_bs); /* bdrv_replace_node() ref'ed old_bs */ 1644 1645 aio_context_release(aio_context); 1646 } 1647 } 1648 } 1649 1650 static void external_snapshot_clean(BlkActionState *common) 1651 { 1652 ExternalSnapshotState *state = 1653 DO_UPCAST(ExternalSnapshotState, common, common); 1654 AioContext *aio_context; 1655 1656 if (!state->old_bs) { 1657 return; 1658 } 1659 1660 aio_context = bdrv_get_aio_context(state->old_bs); 1661 aio_context_acquire(aio_context); 1662 1663 bdrv_drained_end(state->old_bs); 1664 bdrv_unref(state->new_bs); 1665 1666 aio_context_release(aio_context); 1667 } 1668 1669 typedef struct DriveBackupState { 1670 BlkActionState common; 1671 BlockDriverState *bs; 1672 BlockJob *job; 1673 } DriveBackupState; 1674 1675 static BlockJob *do_backup_common(BackupCommon *backup, 1676 BlockDriverState *bs, 1677 BlockDriverState *target_bs, 1678 AioContext *aio_context, 1679 JobTxn *txn, Error **errp); 1680 1681 static void drive_backup_prepare(BlkActionState *common, Error **errp) 1682 { 1683 DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common); 1684 DriveBackup *backup; 1685 BlockDriverState *bs; 1686 BlockDriverState *target_bs; 1687 BlockDriverState *source = NULL; 1688 AioContext *aio_context; 1689 AioContext *old_context; 1690 QDict *options; 1691 Error *local_err = NULL; 1692 int flags; 1693 int64_t size; 1694 bool set_backing_hd = false; 1695 int ret; 1696 1697 assert(common->action->type == TRANSACTION_ACTION_KIND_DRIVE_BACKUP); 1698 backup = common->action->u.drive_backup.data; 1699 1700 if (!backup->has_mode) { 1701 backup->mode = NEW_IMAGE_MODE_ABSOLUTE_PATHS; 1702 } 1703 1704 bs = bdrv_lookup_bs(backup->device, backup->device, errp); 1705 if (!bs) { 1706 return; 1707 } 1708 1709 if (!bs->drv) { 1710 error_setg(errp, "Device has no medium"); 1711 return; 1712 } 1713 1714 aio_context = bdrv_get_aio_context(bs); 1715 aio_context_acquire(aio_context); 1716 1717 state->bs = bs; 1718 /* Paired with .clean() */ 1719 bdrv_drained_begin(bs); 1720 1721 if (!backup->has_format) { 1722 backup->format = backup->mode == NEW_IMAGE_MODE_EXISTING ? 1723 NULL : (char *) bs->drv->format_name; 1724 } 1725 1726 /* Early check to avoid creating target */ 1727 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_BACKUP_SOURCE, errp)) { 1728 goto out; 1729 } 1730 1731 flags = bs->open_flags | BDRV_O_RDWR; 1732 1733 /* 1734 * See if we have a backing HD we can use to create our new image 1735 * on top of. 1736 */ 1737 if (backup->sync == MIRROR_SYNC_MODE_TOP) { 1738 /* 1739 * Backup will not replace the source by the target, so none 1740 * of the filters skipped here will be removed (in contrast to 1741 * mirror). Therefore, we can skip all of them when looking 1742 * for the first COW relationship. 1743 */ 1744 source = bdrv_cow_bs(bdrv_skip_filters(bs)); 1745 if (!source) { 1746 backup->sync = MIRROR_SYNC_MODE_FULL; 1747 } 1748 } 1749 if (backup->sync == MIRROR_SYNC_MODE_NONE) { 1750 source = bs; 1751 flags |= BDRV_O_NO_BACKING; 1752 set_backing_hd = true; 1753 } 1754 1755 size = bdrv_getlength(bs); 1756 if (size < 0) { 1757 error_setg_errno(errp, -size, "bdrv_getlength failed"); 1758 goto out; 1759 } 1760 1761 if (backup->mode != NEW_IMAGE_MODE_EXISTING) { 1762 assert(backup->format); 1763 if (source) { 1764 /* Implicit filters should not appear in the filename */ 1765 BlockDriverState *explicit_backing = 1766 bdrv_skip_implicit_filters(source); 1767 1768 bdrv_refresh_filename(explicit_backing); 1769 bdrv_img_create(backup->target, backup->format, 1770 explicit_backing->filename, 1771 explicit_backing->drv->format_name, NULL, 1772 size, flags, false, &local_err); 1773 } else { 1774 bdrv_img_create(backup->target, backup->format, NULL, NULL, NULL, 1775 size, flags, false, &local_err); 1776 } 1777 } 1778 1779 if (local_err) { 1780 error_propagate(errp, local_err); 1781 goto out; 1782 } 1783 1784 options = qdict_new(); 1785 qdict_put_str(options, "discard", "unmap"); 1786 qdict_put_str(options, "detect-zeroes", "unmap"); 1787 if (backup->format) { 1788 qdict_put_str(options, "driver", backup->format); 1789 } 1790 1791 target_bs = bdrv_open(backup->target, NULL, options, flags, errp); 1792 if (!target_bs) { 1793 goto out; 1794 } 1795 1796 /* Honor bdrv_try_set_aio_context() context acquisition requirements. */ 1797 old_context = bdrv_get_aio_context(target_bs); 1798 aio_context_release(aio_context); 1799 aio_context_acquire(old_context); 1800 1801 ret = bdrv_try_set_aio_context(target_bs, aio_context, errp); 1802 if (ret < 0) { 1803 bdrv_unref(target_bs); 1804 aio_context_release(old_context); 1805 return; 1806 } 1807 1808 aio_context_release(old_context); 1809 aio_context_acquire(aio_context); 1810 1811 if (set_backing_hd) { 1812 if (bdrv_set_backing_hd(target_bs, source, errp) < 0) { 1813 goto unref; 1814 } 1815 } 1816 1817 state->job = do_backup_common(qapi_DriveBackup_base(backup), 1818 bs, target_bs, aio_context, 1819 common->block_job_txn, errp); 1820 1821 unref: 1822 bdrv_unref(target_bs); 1823 out: 1824 aio_context_release(aio_context); 1825 } 1826 1827 static void drive_backup_commit(BlkActionState *common) 1828 { 1829 DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common); 1830 AioContext *aio_context; 1831 1832 aio_context = bdrv_get_aio_context(state->bs); 1833 aio_context_acquire(aio_context); 1834 1835 assert(state->job); 1836 job_start(&state->job->job); 1837 1838 aio_context_release(aio_context); 1839 } 1840 1841 static void drive_backup_abort(BlkActionState *common) 1842 { 1843 DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common); 1844 1845 if (state->job) { 1846 AioContext *aio_context; 1847 1848 aio_context = bdrv_get_aio_context(state->bs); 1849 aio_context_acquire(aio_context); 1850 1851 job_cancel_sync(&state->job->job); 1852 1853 aio_context_release(aio_context); 1854 } 1855 } 1856 1857 static void drive_backup_clean(BlkActionState *common) 1858 { 1859 DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common); 1860 AioContext *aio_context; 1861 1862 if (!state->bs) { 1863 return; 1864 } 1865 1866 aio_context = bdrv_get_aio_context(state->bs); 1867 aio_context_acquire(aio_context); 1868 1869 bdrv_drained_end(state->bs); 1870 1871 aio_context_release(aio_context); 1872 } 1873 1874 typedef struct BlockdevBackupState { 1875 BlkActionState common; 1876 BlockDriverState *bs; 1877 BlockJob *job; 1878 } BlockdevBackupState; 1879 1880 static void blockdev_backup_prepare(BlkActionState *common, Error **errp) 1881 { 1882 BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common); 1883 BlockdevBackup *backup; 1884 BlockDriverState *bs; 1885 BlockDriverState *target_bs; 1886 AioContext *aio_context; 1887 AioContext *old_context; 1888 int ret; 1889 1890 assert(common->action->type == TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP); 1891 backup = common->action->u.blockdev_backup.data; 1892 1893 bs = bdrv_lookup_bs(backup->device, backup->device, errp); 1894 if (!bs) { 1895 return; 1896 } 1897 1898 target_bs = bdrv_lookup_bs(backup->target, backup->target, errp); 1899 if (!target_bs) { 1900 return; 1901 } 1902 1903 /* Honor bdrv_try_set_aio_context() context acquisition requirements. */ 1904 aio_context = bdrv_get_aio_context(bs); 1905 old_context = bdrv_get_aio_context(target_bs); 1906 aio_context_acquire(old_context); 1907 1908 ret = bdrv_try_set_aio_context(target_bs, aio_context, errp); 1909 if (ret < 0) { 1910 aio_context_release(old_context); 1911 return; 1912 } 1913 1914 aio_context_release(old_context); 1915 aio_context_acquire(aio_context); 1916 state->bs = bs; 1917 1918 /* Paired with .clean() */ 1919 bdrv_drained_begin(state->bs); 1920 1921 state->job = do_backup_common(qapi_BlockdevBackup_base(backup), 1922 bs, target_bs, aio_context, 1923 common->block_job_txn, errp); 1924 1925 aio_context_release(aio_context); 1926 } 1927 1928 static void blockdev_backup_commit(BlkActionState *common) 1929 { 1930 BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common); 1931 AioContext *aio_context; 1932 1933 aio_context = bdrv_get_aio_context(state->bs); 1934 aio_context_acquire(aio_context); 1935 1936 assert(state->job); 1937 job_start(&state->job->job); 1938 1939 aio_context_release(aio_context); 1940 } 1941 1942 static void blockdev_backup_abort(BlkActionState *common) 1943 { 1944 BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common); 1945 1946 if (state->job) { 1947 AioContext *aio_context; 1948 1949 aio_context = bdrv_get_aio_context(state->bs); 1950 aio_context_acquire(aio_context); 1951 1952 job_cancel_sync(&state->job->job); 1953 1954 aio_context_release(aio_context); 1955 } 1956 } 1957 1958 static void blockdev_backup_clean(BlkActionState *common) 1959 { 1960 BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common); 1961 AioContext *aio_context; 1962 1963 if (!state->bs) { 1964 return; 1965 } 1966 1967 aio_context = bdrv_get_aio_context(state->bs); 1968 aio_context_acquire(aio_context); 1969 1970 bdrv_drained_end(state->bs); 1971 1972 aio_context_release(aio_context); 1973 } 1974 1975 typedef struct BlockDirtyBitmapState { 1976 BlkActionState common; 1977 BdrvDirtyBitmap *bitmap; 1978 BlockDriverState *bs; 1979 HBitmap *backup; 1980 bool prepared; 1981 bool was_enabled; 1982 } BlockDirtyBitmapState; 1983 1984 static void block_dirty_bitmap_add_prepare(BlkActionState *common, 1985 Error **errp) 1986 { 1987 Error *local_err = NULL; 1988 BlockDirtyBitmapAdd *action; 1989 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 1990 common, common); 1991 1992 if (action_check_completion_mode(common, errp) < 0) { 1993 return; 1994 } 1995 1996 action = common->action->u.block_dirty_bitmap_add.data; 1997 /* AIO context taken and released within qmp_block_dirty_bitmap_add */ 1998 qmp_block_dirty_bitmap_add(action->node, action->name, 1999 action->has_granularity, action->granularity, 2000 action->has_persistent, action->persistent, 2001 action->has_disabled, action->disabled, 2002 &local_err); 2003 2004 if (!local_err) { 2005 state->prepared = true; 2006 } else { 2007 error_propagate(errp, local_err); 2008 } 2009 } 2010 2011 static void block_dirty_bitmap_add_abort(BlkActionState *common) 2012 { 2013 BlockDirtyBitmapAdd *action; 2014 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2015 common, common); 2016 2017 action = common->action->u.block_dirty_bitmap_add.data; 2018 /* Should not be able to fail: IF the bitmap was added via .prepare(), 2019 * then the node reference and bitmap name must have been valid. 2020 */ 2021 if (state->prepared) { 2022 qmp_block_dirty_bitmap_remove(action->node, action->name, &error_abort); 2023 } 2024 } 2025 2026 static void block_dirty_bitmap_clear_prepare(BlkActionState *common, 2027 Error **errp) 2028 { 2029 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2030 common, common); 2031 BlockDirtyBitmap *action; 2032 2033 if (action_check_completion_mode(common, errp) < 0) { 2034 return; 2035 } 2036 2037 action = common->action->u.block_dirty_bitmap_clear.data; 2038 state->bitmap = block_dirty_bitmap_lookup(action->node, 2039 action->name, 2040 &state->bs, 2041 errp); 2042 if (!state->bitmap) { 2043 return; 2044 } 2045 2046 if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_DEFAULT, errp)) { 2047 return; 2048 } 2049 2050 bdrv_clear_dirty_bitmap(state->bitmap, &state->backup); 2051 } 2052 2053 static void block_dirty_bitmap_restore(BlkActionState *common) 2054 { 2055 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2056 common, common); 2057 2058 if (state->backup) { 2059 bdrv_restore_dirty_bitmap(state->bitmap, state->backup); 2060 } 2061 } 2062 2063 static void block_dirty_bitmap_free_backup(BlkActionState *common) 2064 { 2065 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2066 common, common); 2067 2068 hbitmap_free(state->backup); 2069 } 2070 2071 static void block_dirty_bitmap_enable_prepare(BlkActionState *common, 2072 Error **errp) 2073 { 2074 BlockDirtyBitmap *action; 2075 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2076 common, common); 2077 2078 if (action_check_completion_mode(common, errp) < 0) { 2079 return; 2080 } 2081 2082 action = common->action->u.block_dirty_bitmap_enable.data; 2083 state->bitmap = block_dirty_bitmap_lookup(action->node, 2084 action->name, 2085 NULL, 2086 errp); 2087 if (!state->bitmap) { 2088 return; 2089 } 2090 2091 if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_ALLOW_RO, errp)) { 2092 return; 2093 } 2094 2095 state->was_enabled = bdrv_dirty_bitmap_enabled(state->bitmap); 2096 bdrv_enable_dirty_bitmap(state->bitmap); 2097 } 2098 2099 static void block_dirty_bitmap_enable_abort(BlkActionState *common) 2100 { 2101 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2102 common, common); 2103 2104 if (!state->was_enabled) { 2105 bdrv_disable_dirty_bitmap(state->bitmap); 2106 } 2107 } 2108 2109 static void block_dirty_bitmap_disable_prepare(BlkActionState *common, 2110 Error **errp) 2111 { 2112 BlockDirtyBitmap *action; 2113 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2114 common, common); 2115 2116 if (action_check_completion_mode(common, errp) < 0) { 2117 return; 2118 } 2119 2120 action = common->action->u.block_dirty_bitmap_disable.data; 2121 state->bitmap = block_dirty_bitmap_lookup(action->node, 2122 action->name, 2123 NULL, 2124 errp); 2125 if (!state->bitmap) { 2126 return; 2127 } 2128 2129 if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_ALLOW_RO, errp)) { 2130 return; 2131 } 2132 2133 state->was_enabled = bdrv_dirty_bitmap_enabled(state->bitmap); 2134 bdrv_disable_dirty_bitmap(state->bitmap); 2135 } 2136 2137 static void block_dirty_bitmap_disable_abort(BlkActionState *common) 2138 { 2139 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2140 common, common); 2141 2142 if (state->was_enabled) { 2143 bdrv_enable_dirty_bitmap(state->bitmap); 2144 } 2145 } 2146 2147 static void block_dirty_bitmap_merge_prepare(BlkActionState *common, 2148 Error **errp) 2149 { 2150 BlockDirtyBitmapMerge *action; 2151 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2152 common, common); 2153 2154 if (action_check_completion_mode(common, errp) < 0) { 2155 return; 2156 } 2157 2158 action = common->action->u.block_dirty_bitmap_merge.data; 2159 2160 state->bitmap = block_dirty_bitmap_merge(action->node, action->target, 2161 action->bitmaps, &state->backup, 2162 errp); 2163 } 2164 2165 static void block_dirty_bitmap_remove_prepare(BlkActionState *common, 2166 Error **errp) 2167 { 2168 BlockDirtyBitmap *action; 2169 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2170 common, common); 2171 2172 if (action_check_completion_mode(common, errp) < 0) { 2173 return; 2174 } 2175 2176 action = common->action->u.block_dirty_bitmap_remove.data; 2177 2178 state->bitmap = block_dirty_bitmap_remove(action->node, action->name, 2179 false, &state->bs, errp); 2180 if (state->bitmap) { 2181 bdrv_dirty_bitmap_skip_store(state->bitmap, true); 2182 bdrv_dirty_bitmap_set_busy(state->bitmap, true); 2183 } 2184 } 2185 2186 static void block_dirty_bitmap_remove_abort(BlkActionState *common) 2187 { 2188 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2189 common, common); 2190 2191 if (state->bitmap) { 2192 bdrv_dirty_bitmap_skip_store(state->bitmap, false); 2193 bdrv_dirty_bitmap_set_busy(state->bitmap, false); 2194 } 2195 } 2196 2197 static void block_dirty_bitmap_remove_commit(BlkActionState *common) 2198 { 2199 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2200 common, common); 2201 2202 bdrv_dirty_bitmap_set_busy(state->bitmap, false); 2203 bdrv_release_dirty_bitmap(state->bitmap); 2204 } 2205 2206 static void abort_prepare(BlkActionState *common, Error **errp) 2207 { 2208 error_setg(errp, "Transaction aborted using Abort action"); 2209 } 2210 2211 static void abort_commit(BlkActionState *common) 2212 { 2213 g_assert_not_reached(); /* this action never succeeds */ 2214 } 2215 2216 static const BlkActionOps actions[] = { 2217 [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT] = { 2218 .instance_size = sizeof(ExternalSnapshotState), 2219 .prepare = external_snapshot_prepare, 2220 .commit = external_snapshot_commit, 2221 .abort = external_snapshot_abort, 2222 .clean = external_snapshot_clean, 2223 }, 2224 [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC] = { 2225 .instance_size = sizeof(ExternalSnapshotState), 2226 .prepare = external_snapshot_prepare, 2227 .commit = external_snapshot_commit, 2228 .abort = external_snapshot_abort, 2229 .clean = external_snapshot_clean, 2230 }, 2231 [TRANSACTION_ACTION_KIND_DRIVE_BACKUP] = { 2232 .instance_size = sizeof(DriveBackupState), 2233 .prepare = drive_backup_prepare, 2234 .commit = drive_backup_commit, 2235 .abort = drive_backup_abort, 2236 .clean = drive_backup_clean, 2237 }, 2238 [TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP] = { 2239 .instance_size = sizeof(BlockdevBackupState), 2240 .prepare = blockdev_backup_prepare, 2241 .commit = blockdev_backup_commit, 2242 .abort = blockdev_backup_abort, 2243 .clean = blockdev_backup_clean, 2244 }, 2245 [TRANSACTION_ACTION_KIND_ABORT] = { 2246 .instance_size = sizeof(BlkActionState), 2247 .prepare = abort_prepare, 2248 .commit = abort_commit, 2249 }, 2250 [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC] = { 2251 .instance_size = sizeof(InternalSnapshotState), 2252 .prepare = internal_snapshot_prepare, 2253 .abort = internal_snapshot_abort, 2254 .clean = internal_snapshot_clean, 2255 }, 2256 [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_ADD] = { 2257 .instance_size = sizeof(BlockDirtyBitmapState), 2258 .prepare = block_dirty_bitmap_add_prepare, 2259 .abort = block_dirty_bitmap_add_abort, 2260 }, 2261 [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_CLEAR] = { 2262 .instance_size = sizeof(BlockDirtyBitmapState), 2263 .prepare = block_dirty_bitmap_clear_prepare, 2264 .commit = block_dirty_bitmap_free_backup, 2265 .abort = block_dirty_bitmap_restore, 2266 }, 2267 [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_ENABLE] = { 2268 .instance_size = sizeof(BlockDirtyBitmapState), 2269 .prepare = block_dirty_bitmap_enable_prepare, 2270 .abort = block_dirty_bitmap_enable_abort, 2271 }, 2272 [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_DISABLE] = { 2273 .instance_size = sizeof(BlockDirtyBitmapState), 2274 .prepare = block_dirty_bitmap_disable_prepare, 2275 .abort = block_dirty_bitmap_disable_abort, 2276 }, 2277 [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_MERGE] = { 2278 .instance_size = sizeof(BlockDirtyBitmapState), 2279 .prepare = block_dirty_bitmap_merge_prepare, 2280 .commit = block_dirty_bitmap_free_backup, 2281 .abort = block_dirty_bitmap_restore, 2282 }, 2283 [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_REMOVE] = { 2284 .instance_size = sizeof(BlockDirtyBitmapState), 2285 .prepare = block_dirty_bitmap_remove_prepare, 2286 .commit = block_dirty_bitmap_remove_commit, 2287 .abort = block_dirty_bitmap_remove_abort, 2288 }, 2289 /* Where are transactions for MIRROR, COMMIT and STREAM? 2290 * Although these blockjobs use transaction callbacks like the backup job, 2291 * these jobs do not necessarily adhere to transaction semantics. 2292 * These jobs may not fully undo all of their actions on abort, nor do they 2293 * necessarily work in transactions with more than one job in them. 2294 */ 2295 }; 2296 2297 /** 2298 * Allocate a TransactionProperties structure if necessary, and fill 2299 * that structure with desired defaults if they are unset. 2300 */ 2301 static TransactionProperties *get_transaction_properties( 2302 TransactionProperties *props) 2303 { 2304 if (!props) { 2305 props = g_new0(TransactionProperties, 1); 2306 } 2307 2308 if (!props->has_completion_mode) { 2309 props->has_completion_mode = true; 2310 props->completion_mode = ACTION_COMPLETION_MODE_INDIVIDUAL; 2311 } 2312 2313 return props; 2314 } 2315 2316 /* 2317 * 'Atomic' group operations. The operations are performed as a set, and if 2318 * any fail then we roll back all operations in the group. 2319 */ 2320 void qmp_transaction(TransactionActionList *dev_list, 2321 bool has_props, 2322 struct TransactionProperties *props, 2323 Error **errp) 2324 { 2325 TransactionActionList *dev_entry = dev_list; 2326 JobTxn *block_job_txn = NULL; 2327 BlkActionState *state, *next; 2328 Error *local_err = NULL; 2329 2330 QTAILQ_HEAD(, BlkActionState) snap_bdrv_states; 2331 QTAILQ_INIT(&snap_bdrv_states); 2332 2333 /* Does this transaction get canceled as a group on failure? 2334 * If not, we don't really need to make a JobTxn. 2335 */ 2336 props = get_transaction_properties(props); 2337 if (props->completion_mode != ACTION_COMPLETION_MODE_INDIVIDUAL) { 2338 block_job_txn = job_txn_new(); 2339 } 2340 2341 /* drain all i/o before any operations */ 2342 bdrv_drain_all(); 2343 2344 /* We don't do anything in this loop that commits us to the operations */ 2345 while (NULL != dev_entry) { 2346 TransactionAction *dev_info = NULL; 2347 const BlkActionOps *ops; 2348 2349 dev_info = dev_entry->value; 2350 dev_entry = dev_entry->next; 2351 2352 assert(dev_info->type < ARRAY_SIZE(actions)); 2353 2354 ops = &actions[dev_info->type]; 2355 assert(ops->instance_size > 0); 2356 2357 state = g_malloc0(ops->instance_size); 2358 state->ops = ops; 2359 state->action = dev_info; 2360 state->block_job_txn = block_job_txn; 2361 state->txn_props = props; 2362 QTAILQ_INSERT_TAIL(&snap_bdrv_states, state, entry); 2363 2364 state->ops->prepare(state, &local_err); 2365 if (local_err) { 2366 error_propagate(errp, local_err); 2367 goto delete_and_fail; 2368 } 2369 } 2370 2371 QTAILQ_FOREACH(state, &snap_bdrv_states, entry) { 2372 if (state->ops->commit) { 2373 state->ops->commit(state); 2374 } 2375 } 2376 2377 /* success */ 2378 goto exit; 2379 2380 delete_and_fail: 2381 /* failure, and it is all-or-none; roll back all operations */ 2382 QTAILQ_FOREACH_REVERSE(state, &snap_bdrv_states, entry) { 2383 if (state->ops->abort) { 2384 state->ops->abort(state); 2385 } 2386 } 2387 exit: 2388 QTAILQ_FOREACH_SAFE(state, &snap_bdrv_states, entry, next) { 2389 if (state->ops->clean) { 2390 state->ops->clean(state); 2391 } 2392 g_free(state); 2393 } 2394 if (!has_props) { 2395 qapi_free_TransactionProperties(props); 2396 } 2397 job_txn_unref(block_job_txn); 2398 } 2399 2400 BlockDirtyBitmapSha256 *qmp_x_debug_block_dirty_bitmap_sha256(const char *node, 2401 const char *name, 2402 Error **errp) 2403 { 2404 BdrvDirtyBitmap *bitmap; 2405 BlockDriverState *bs; 2406 BlockDirtyBitmapSha256 *ret = NULL; 2407 char *sha256; 2408 2409 bitmap = block_dirty_bitmap_lookup(node, name, &bs, errp); 2410 if (!bitmap || !bs) { 2411 return NULL; 2412 } 2413 2414 sha256 = bdrv_dirty_bitmap_sha256(bitmap, errp); 2415 if (sha256 == NULL) { 2416 return NULL; 2417 } 2418 2419 ret = g_new(BlockDirtyBitmapSha256, 1); 2420 ret->sha256 = sha256; 2421 2422 return ret; 2423 } 2424 2425 void coroutine_fn qmp_block_resize(bool has_device, const char *device, 2426 bool has_node_name, const char *node_name, 2427 int64_t size, Error **errp) 2428 { 2429 Error *local_err = NULL; 2430 BlockBackend *blk; 2431 BlockDriverState *bs; 2432 AioContext *old_ctx; 2433 2434 bs = bdrv_lookup_bs(has_device ? device : NULL, 2435 has_node_name ? node_name : NULL, 2436 &local_err); 2437 if (local_err) { 2438 error_propagate(errp, local_err); 2439 return; 2440 } 2441 2442 if (size < 0) { 2443 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "size", "a >0 size"); 2444 return; 2445 } 2446 2447 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_RESIZE, NULL)) { 2448 error_setg(errp, QERR_DEVICE_IN_USE, device); 2449 return; 2450 } 2451 2452 blk = blk_new_with_bs(bs, BLK_PERM_RESIZE, BLK_PERM_ALL, errp); 2453 if (!blk) { 2454 return; 2455 } 2456 2457 bdrv_co_lock(bs); 2458 bdrv_drained_begin(bs); 2459 bdrv_co_unlock(bs); 2460 2461 old_ctx = bdrv_co_enter(bs); 2462 blk_truncate(blk, size, false, PREALLOC_MODE_OFF, 0, errp); 2463 bdrv_co_leave(bs, old_ctx); 2464 2465 bdrv_co_lock(bs); 2466 bdrv_drained_end(bs); 2467 blk_unref(blk); 2468 bdrv_co_unlock(bs); 2469 } 2470 2471 void qmp_block_stream(bool has_job_id, const char *job_id, const char *device, 2472 bool has_base, const char *base, 2473 bool has_base_node, const char *base_node, 2474 bool has_backing_file, const char *backing_file, 2475 bool has_bottom, const char *bottom, 2476 bool has_speed, int64_t speed, 2477 bool has_on_error, BlockdevOnError on_error, 2478 bool has_filter_node_name, const char *filter_node_name, 2479 bool has_auto_finalize, bool auto_finalize, 2480 bool has_auto_dismiss, bool auto_dismiss, 2481 Error **errp) 2482 { 2483 BlockDriverState *bs, *iter, *iter_end; 2484 BlockDriverState *base_bs = NULL; 2485 BlockDriverState *bottom_bs = NULL; 2486 AioContext *aio_context; 2487 Error *local_err = NULL; 2488 int job_flags = JOB_DEFAULT; 2489 2490 if (has_base && has_base_node) { 2491 error_setg(errp, "'base' and 'base-node' cannot be specified " 2492 "at the same time"); 2493 return; 2494 } 2495 2496 if (has_base && has_bottom) { 2497 error_setg(errp, "'base' and 'bottom' cannot be specified " 2498 "at the same time"); 2499 return; 2500 } 2501 2502 if (has_bottom && has_base_node) { 2503 error_setg(errp, "'bottom' and 'base-node' cannot be specified " 2504 "at the same time"); 2505 return; 2506 } 2507 2508 if (!has_on_error) { 2509 on_error = BLOCKDEV_ON_ERROR_REPORT; 2510 } 2511 2512 bs = bdrv_lookup_bs(device, device, errp); 2513 if (!bs) { 2514 return; 2515 } 2516 2517 aio_context = bdrv_get_aio_context(bs); 2518 aio_context_acquire(aio_context); 2519 2520 if (has_base) { 2521 base_bs = bdrv_find_backing_image(bs, base); 2522 if (base_bs == NULL) { 2523 error_setg(errp, "Can't find '%s' in the backing chain", base); 2524 goto out; 2525 } 2526 assert(bdrv_get_aio_context(base_bs) == aio_context); 2527 } 2528 2529 if (has_base_node) { 2530 base_bs = bdrv_lookup_bs(NULL, base_node, errp); 2531 if (!base_bs) { 2532 goto out; 2533 } 2534 if (bs == base_bs || !bdrv_chain_contains(bs, base_bs)) { 2535 error_setg(errp, "Node '%s' is not a backing image of '%s'", 2536 base_node, device); 2537 goto out; 2538 } 2539 assert(bdrv_get_aio_context(base_bs) == aio_context); 2540 bdrv_refresh_filename(base_bs); 2541 } 2542 2543 if (has_bottom) { 2544 bottom_bs = bdrv_lookup_bs(NULL, bottom, errp); 2545 if (!bottom_bs) { 2546 goto out; 2547 } 2548 if (!bottom_bs->drv) { 2549 error_setg(errp, "Node '%s' is not open", bottom); 2550 goto out; 2551 } 2552 if (bottom_bs->drv->is_filter) { 2553 error_setg(errp, "Node '%s' is a filter, use a non-filter node " 2554 "as 'bottom'", bottom); 2555 goto out; 2556 } 2557 if (!bdrv_chain_contains(bs, bottom_bs)) { 2558 error_setg(errp, "Node '%s' is not in a chain starting from '%s'", 2559 bottom, device); 2560 goto out; 2561 } 2562 assert(bdrv_get_aio_context(bottom_bs) == aio_context); 2563 } 2564 2565 /* 2566 * Check for op blockers in the whole chain between bs and base (or bottom) 2567 */ 2568 iter_end = has_bottom ? bdrv_filter_or_cow_bs(bottom_bs) : base_bs; 2569 for (iter = bs; iter && iter != iter_end; 2570 iter = bdrv_filter_or_cow_bs(iter)) 2571 { 2572 if (bdrv_op_is_blocked(iter, BLOCK_OP_TYPE_STREAM, errp)) { 2573 goto out; 2574 } 2575 } 2576 2577 /* if we are streaming the entire chain, the result will have no backing 2578 * file, and specifying one is therefore an error */ 2579 if (base_bs == NULL && has_backing_file) { 2580 error_setg(errp, "backing file specified, but streaming the " 2581 "entire chain"); 2582 goto out; 2583 } 2584 2585 if (has_auto_finalize && !auto_finalize) { 2586 job_flags |= JOB_MANUAL_FINALIZE; 2587 } 2588 if (has_auto_dismiss && !auto_dismiss) { 2589 job_flags |= JOB_MANUAL_DISMISS; 2590 } 2591 2592 stream_start(has_job_id ? job_id : NULL, bs, base_bs, backing_file, 2593 bottom_bs, job_flags, has_speed ? speed : 0, on_error, 2594 filter_node_name, &local_err); 2595 if (local_err) { 2596 error_propagate(errp, local_err); 2597 goto out; 2598 } 2599 2600 trace_qmp_block_stream(bs); 2601 2602 out: 2603 aio_context_release(aio_context); 2604 } 2605 2606 void qmp_block_commit(bool has_job_id, const char *job_id, const char *device, 2607 bool has_base_node, const char *base_node, 2608 bool has_base, const char *base, 2609 bool has_top_node, const char *top_node, 2610 bool has_top, const char *top, 2611 bool has_backing_file, const char *backing_file, 2612 bool has_speed, int64_t speed, 2613 bool has_on_error, BlockdevOnError on_error, 2614 bool has_filter_node_name, const char *filter_node_name, 2615 bool has_auto_finalize, bool auto_finalize, 2616 bool has_auto_dismiss, bool auto_dismiss, 2617 Error **errp) 2618 { 2619 BlockDriverState *bs; 2620 BlockDriverState *iter; 2621 BlockDriverState *base_bs, *top_bs; 2622 AioContext *aio_context; 2623 Error *local_err = NULL; 2624 int job_flags = JOB_DEFAULT; 2625 uint64_t top_perm, top_shared; 2626 2627 if (!has_speed) { 2628 speed = 0; 2629 } 2630 if (!has_on_error) { 2631 on_error = BLOCKDEV_ON_ERROR_REPORT; 2632 } 2633 if (!has_filter_node_name) { 2634 filter_node_name = NULL; 2635 } 2636 if (has_auto_finalize && !auto_finalize) { 2637 job_flags |= JOB_MANUAL_FINALIZE; 2638 } 2639 if (has_auto_dismiss && !auto_dismiss) { 2640 job_flags |= JOB_MANUAL_DISMISS; 2641 } 2642 2643 /* Important Note: 2644 * libvirt relies on the DeviceNotFound error class in order to probe for 2645 * live commit feature versions; for this to work, we must make sure to 2646 * perform the device lookup before any generic errors that may occur in a 2647 * scenario in which all optional arguments are omitted. */ 2648 bs = qmp_get_root_bs(device, &local_err); 2649 if (!bs) { 2650 bs = bdrv_lookup_bs(device, device, NULL); 2651 if (!bs) { 2652 error_free(local_err); 2653 error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND, 2654 "Device '%s' not found", device); 2655 } else { 2656 error_propagate(errp, local_err); 2657 } 2658 return; 2659 } 2660 2661 aio_context = bdrv_get_aio_context(bs); 2662 aio_context_acquire(aio_context); 2663 2664 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, errp)) { 2665 goto out; 2666 } 2667 2668 /* default top_bs is the active layer */ 2669 top_bs = bs; 2670 2671 if (has_top_node && has_top) { 2672 error_setg(errp, "'top-node' and 'top' are mutually exclusive"); 2673 goto out; 2674 } else if (has_top_node) { 2675 top_bs = bdrv_lookup_bs(NULL, top_node, errp); 2676 if (top_bs == NULL) { 2677 goto out; 2678 } 2679 if (!bdrv_chain_contains(bs, top_bs)) { 2680 error_setg(errp, "'%s' is not in this backing file chain", 2681 top_node); 2682 goto out; 2683 } 2684 } else if (has_top && top) { 2685 /* This strcmp() is just a shortcut, there is no need to 2686 * refresh @bs's filename. If it mismatches, 2687 * bdrv_find_backing_image() will do the refresh and may still 2688 * return @bs. */ 2689 if (strcmp(bs->filename, top) != 0) { 2690 top_bs = bdrv_find_backing_image(bs, top); 2691 } 2692 } 2693 2694 if (top_bs == NULL) { 2695 error_setg(errp, "Top image file %s not found", top ? top : "NULL"); 2696 goto out; 2697 } 2698 2699 assert(bdrv_get_aio_context(top_bs) == aio_context); 2700 2701 if (has_base_node && has_base) { 2702 error_setg(errp, "'base-node' and 'base' are mutually exclusive"); 2703 goto out; 2704 } else if (has_base_node) { 2705 base_bs = bdrv_lookup_bs(NULL, base_node, errp); 2706 if (base_bs == NULL) { 2707 goto out; 2708 } 2709 if (!bdrv_chain_contains(top_bs, base_bs)) { 2710 error_setg(errp, "'%s' is not in this backing file chain", 2711 base_node); 2712 goto out; 2713 } 2714 } else if (has_base && base) { 2715 base_bs = bdrv_find_backing_image(top_bs, base); 2716 if (base_bs == NULL) { 2717 error_setg(errp, "Can't find '%s' in the backing chain", base); 2718 goto out; 2719 } 2720 } else { 2721 base_bs = bdrv_find_base(top_bs); 2722 if (base_bs == NULL) { 2723 error_setg(errp, "There is no backimg image"); 2724 goto out; 2725 } 2726 } 2727 2728 assert(bdrv_get_aio_context(base_bs) == aio_context); 2729 2730 for (iter = top_bs; iter != bdrv_filter_or_cow_bs(base_bs); 2731 iter = bdrv_filter_or_cow_bs(iter)) 2732 { 2733 if (bdrv_op_is_blocked(iter, BLOCK_OP_TYPE_COMMIT_TARGET, errp)) { 2734 goto out; 2735 } 2736 } 2737 2738 /* Do not allow attempts to commit an image into itself */ 2739 if (top_bs == base_bs) { 2740 error_setg(errp, "cannot commit an image into itself"); 2741 goto out; 2742 } 2743 2744 /* 2745 * Active commit is required if and only if someone has taken a 2746 * WRITE permission on the top node. Historically, we have always 2747 * used active commit for top nodes, so continue that practice 2748 * lest we possibly break clients that rely on this behavior, e.g. 2749 * to later attach this node to a writing parent. 2750 * (Active commit is never really wrong.) 2751 */ 2752 bdrv_get_cumulative_perm(top_bs, &top_perm, &top_shared); 2753 if (top_perm & BLK_PERM_WRITE || 2754 bdrv_skip_filters(top_bs) == bdrv_skip_filters(bs)) 2755 { 2756 if (has_backing_file) { 2757 if (bdrv_skip_filters(top_bs) == bdrv_skip_filters(bs)) { 2758 error_setg(errp, "'backing-file' specified," 2759 " but 'top' is the active layer"); 2760 } else { 2761 error_setg(errp, "'backing-file' specified, but 'top' has a " 2762 "writer on it"); 2763 } 2764 goto out; 2765 } 2766 if (!has_job_id) { 2767 /* 2768 * Emulate here what block_job_create() does, because it 2769 * is possible that @bs != @top_bs (the block job should 2770 * be named after @bs, even if @top_bs is the actual 2771 * source) 2772 */ 2773 job_id = bdrv_get_device_name(bs); 2774 } 2775 commit_active_start(job_id, top_bs, base_bs, job_flags, speed, on_error, 2776 filter_node_name, NULL, NULL, false, &local_err); 2777 } else { 2778 BlockDriverState *overlay_bs = bdrv_find_overlay(bs, top_bs); 2779 if (bdrv_op_is_blocked(overlay_bs, BLOCK_OP_TYPE_COMMIT_TARGET, errp)) { 2780 goto out; 2781 } 2782 commit_start(has_job_id ? job_id : NULL, bs, base_bs, top_bs, job_flags, 2783 speed, on_error, has_backing_file ? backing_file : NULL, 2784 filter_node_name, &local_err); 2785 } 2786 if (local_err != NULL) { 2787 error_propagate(errp, local_err); 2788 goto out; 2789 } 2790 2791 out: 2792 aio_context_release(aio_context); 2793 } 2794 2795 /* Common QMP interface for drive-backup and blockdev-backup */ 2796 static BlockJob *do_backup_common(BackupCommon *backup, 2797 BlockDriverState *bs, 2798 BlockDriverState *target_bs, 2799 AioContext *aio_context, 2800 JobTxn *txn, Error **errp) 2801 { 2802 BlockJob *job = NULL; 2803 BdrvDirtyBitmap *bmap = NULL; 2804 BackupPerf perf = { .max_workers = 64 }; 2805 int job_flags = JOB_DEFAULT; 2806 2807 if (!backup->has_speed) { 2808 backup->speed = 0; 2809 } 2810 if (!backup->has_on_source_error) { 2811 backup->on_source_error = BLOCKDEV_ON_ERROR_REPORT; 2812 } 2813 if (!backup->has_on_target_error) { 2814 backup->on_target_error = BLOCKDEV_ON_ERROR_REPORT; 2815 } 2816 if (!backup->has_job_id) { 2817 backup->job_id = NULL; 2818 } 2819 if (!backup->has_auto_finalize) { 2820 backup->auto_finalize = true; 2821 } 2822 if (!backup->has_auto_dismiss) { 2823 backup->auto_dismiss = true; 2824 } 2825 if (!backup->has_compress) { 2826 backup->compress = false; 2827 } 2828 2829 if (backup->x_perf) { 2830 if (backup->x_perf->has_use_copy_range) { 2831 perf.use_copy_range = backup->x_perf->use_copy_range; 2832 } 2833 if (backup->x_perf->has_max_workers) { 2834 perf.max_workers = backup->x_perf->max_workers; 2835 } 2836 if (backup->x_perf->has_max_chunk) { 2837 perf.max_chunk = backup->x_perf->max_chunk; 2838 } 2839 } 2840 2841 if ((backup->sync == MIRROR_SYNC_MODE_BITMAP) || 2842 (backup->sync == MIRROR_SYNC_MODE_INCREMENTAL)) { 2843 /* done before desugaring 'incremental' to print the right message */ 2844 if (!backup->has_bitmap) { 2845 error_setg(errp, "must provide a valid bitmap name for " 2846 "'%s' sync mode", MirrorSyncMode_str(backup->sync)); 2847 return NULL; 2848 } 2849 } 2850 2851 if (backup->sync == MIRROR_SYNC_MODE_INCREMENTAL) { 2852 if (backup->has_bitmap_mode && 2853 backup->bitmap_mode != BITMAP_SYNC_MODE_ON_SUCCESS) { 2854 error_setg(errp, "Bitmap sync mode must be '%s' " 2855 "when using sync mode '%s'", 2856 BitmapSyncMode_str(BITMAP_SYNC_MODE_ON_SUCCESS), 2857 MirrorSyncMode_str(backup->sync)); 2858 return NULL; 2859 } 2860 backup->has_bitmap_mode = true; 2861 backup->sync = MIRROR_SYNC_MODE_BITMAP; 2862 backup->bitmap_mode = BITMAP_SYNC_MODE_ON_SUCCESS; 2863 } 2864 2865 if (backup->has_bitmap) { 2866 bmap = bdrv_find_dirty_bitmap(bs, backup->bitmap); 2867 if (!bmap) { 2868 error_setg(errp, "Bitmap '%s' could not be found", backup->bitmap); 2869 return NULL; 2870 } 2871 if (!backup->has_bitmap_mode) { 2872 error_setg(errp, "Bitmap sync mode must be given " 2873 "when providing a bitmap"); 2874 return NULL; 2875 } 2876 if (bdrv_dirty_bitmap_check(bmap, BDRV_BITMAP_ALLOW_RO, errp)) { 2877 return NULL; 2878 } 2879 2880 /* This does not produce a useful bitmap artifact: */ 2881 if (backup->sync == MIRROR_SYNC_MODE_NONE) { 2882 error_setg(errp, "sync mode '%s' does not produce meaningful bitmap" 2883 " outputs", MirrorSyncMode_str(backup->sync)); 2884 return NULL; 2885 } 2886 2887 /* If the bitmap isn't used for input or output, this is useless: */ 2888 if (backup->bitmap_mode == BITMAP_SYNC_MODE_NEVER && 2889 backup->sync != MIRROR_SYNC_MODE_BITMAP) { 2890 error_setg(errp, "Bitmap sync mode '%s' has no meaningful effect" 2891 " when combined with sync mode '%s'", 2892 BitmapSyncMode_str(backup->bitmap_mode), 2893 MirrorSyncMode_str(backup->sync)); 2894 return NULL; 2895 } 2896 } 2897 2898 if (!backup->has_bitmap && backup->has_bitmap_mode) { 2899 error_setg(errp, "Cannot specify bitmap sync mode without a bitmap"); 2900 return NULL; 2901 } 2902 2903 if (!backup->auto_finalize) { 2904 job_flags |= JOB_MANUAL_FINALIZE; 2905 } 2906 if (!backup->auto_dismiss) { 2907 job_flags |= JOB_MANUAL_DISMISS; 2908 } 2909 2910 job = backup_job_create(backup->job_id, bs, target_bs, backup->speed, 2911 backup->sync, bmap, backup->bitmap_mode, 2912 backup->compress, 2913 backup->filter_node_name, 2914 &perf, 2915 backup->on_source_error, 2916 backup->on_target_error, 2917 job_flags, NULL, NULL, txn, errp); 2918 return job; 2919 } 2920 2921 void qmp_drive_backup(DriveBackup *backup, Error **errp) 2922 { 2923 TransactionAction action = { 2924 .type = TRANSACTION_ACTION_KIND_DRIVE_BACKUP, 2925 .u.drive_backup.data = backup, 2926 }; 2927 blockdev_do_action(&action, errp); 2928 } 2929 2930 BlockDeviceInfoList *qmp_query_named_block_nodes(bool has_flat, 2931 bool flat, 2932 Error **errp) 2933 { 2934 bool return_flat = has_flat && flat; 2935 2936 return bdrv_named_nodes_list(return_flat, errp); 2937 } 2938 2939 XDbgBlockGraph *qmp_x_debug_query_block_graph(Error **errp) 2940 { 2941 return bdrv_get_xdbg_block_graph(errp); 2942 } 2943 2944 void qmp_blockdev_backup(BlockdevBackup *backup, Error **errp) 2945 { 2946 TransactionAction action = { 2947 .type = TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP, 2948 .u.blockdev_backup.data = backup, 2949 }; 2950 blockdev_do_action(&action, errp); 2951 } 2952 2953 /* Parameter check and block job starting for drive mirroring. 2954 * Caller should hold @device and @target's aio context (must be the same). 2955 **/ 2956 static void blockdev_mirror_common(const char *job_id, BlockDriverState *bs, 2957 BlockDriverState *target, 2958 bool has_replaces, const char *replaces, 2959 enum MirrorSyncMode sync, 2960 BlockMirrorBackingMode backing_mode, 2961 bool zero_target, 2962 bool has_speed, int64_t speed, 2963 bool has_granularity, uint32_t granularity, 2964 bool has_buf_size, int64_t buf_size, 2965 bool has_on_source_error, 2966 BlockdevOnError on_source_error, 2967 bool has_on_target_error, 2968 BlockdevOnError on_target_error, 2969 bool has_unmap, bool unmap, 2970 bool has_filter_node_name, 2971 const char *filter_node_name, 2972 bool has_copy_mode, MirrorCopyMode copy_mode, 2973 bool has_auto_finalize, bool auto_finalize, 2974 bool has_auto_dismiss, bool auto_dismiss, 2975 Error **errp) 2976 { 2977 BlockDriverState *unfiltered_bs; 2978 int job_flags = JOB_DEFAULT; 2979 2980 if (!has_speed) { 2981 speed = 0; 2982 } 2983 if (!has_on_source_error) { 2984 on_source_error = BLOCKDEV_ON_ERROR_REPORT; 2985 } 2986 if (!has_on_target_error) { 2987 on_target_error = BLOCKDEV_ON_ERROR_REPORT; 2988 } 2989 if (!has_granularity) { 2990 granularity = 0; 2991 } 2992 if (!has_buf_size) { 2993 buf_size = 0; 2994 } 2995 if (!has_unmap) { 2996 unmap = true; 2997 } 2998 if (!has_filter_node_name) { 2999 filter_node_name = NULL; 3000 } 3001 if (!has_copy_mode) { 3002 copy_mode = MIRROR_COPY_MODE_BACKGROUND; 3003 } 3004 if (has_auto_finalize && !auto_finalize) { 3005 job_flags |= JOB_MANUAL_FINALIZE; 3006 } 3007 if (has_auto_dismiss && !auto_dismiss) { 3008 job_flags |= JOB_MANUAL_DISMISS; 3009 } 3010 3011 if (granularity != 0 && (granularity < 512 || granularity > 1048576 * 64)) { 3012 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "granularity", 3013 "a value in range [512B, 64MB]"); 3014 return; 3015 } 3016 if (granularity & (granularity - 1)) { 3017 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "granularity", 3018 "a power of 2"); 3019 return; 3020 } 3021 3022 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_MIRROR_SOURCE, errp)) { 3023 return; 3024 } 3025 if (bdrv_op_is_blocked(target, BLOCK_OP_TYPE_MIRROR_TARGET, errp)) { 3026 return; 3027 } 3028 3029 if (!bdrv_backing_chain_next(bs) && sync == MIRROR_SYNC_MODE_TOP) { 3030 sync = MIRROR_SYNC_MODE_FULL; 3031 } 3032 3033 if (!has_replaces) { 3034 /* We want to mirror from @bs, but keep implicit filters on top */ 3035 unfiltered_bs = bdrv_skip_implicit_filters(bs); 3036 if (unfiltered_bs != bs) { 3037 replaces = unfiltered_bs->node_name; 3038 has_replaces = true; 3039 } 3040 } 3041 3042 if (has_replaces) { 3043 BlockDriverState *to_replace_bs; 3044 AioContext *replace_aio_context; 3045 int64_t bs_size, replace_size; 3046 3047 bs_size = bdrv_getlength(bs); 3048 if (bs_size < 0) { 3049 error_setg_errno(errp, -bs_size, "Failed to query device's size"); 3050 return; 3051 } 3052 3053 to_replace_bs = check_to_replace_node(bs, replaces, errp); 3054 if (!to_replace_bs) { 3055 return; 3056 } 3057 3058 replace_aio_context = bdrv_get_aio_context(to_replace_bs); 3059 aio_context_acquire(replace_aio_context); 3060 replace_size = bdrv_getlength(to_replace_bs); 3061 aio_context_release(replace_aio_context); 3062 3063 if (replace_size < 0) { 3064 error_setg_errno(errp, -replace_size, 3065 "Failed to query the replacement node's size"); 3066 return; 3067 } 3068 if (bs_size != replace_size) { 3069 error_setg(errp, "cannot replace image with a mirror image of " 3070 "different size"); 3071 return; 3072 } 3073 } 3074 3075 /* pass the node name to replace to mirror start since it's loose coupling 3076 * and will allow to check whether the node still exist at mirror completion 3077 */ 3078 mirror_start(job_id, bs, target, 3079 has_replaces ? replaces : NULL, job_flags, 3080 speed, granularity, buf_size, sync, backing_mode, zero_target, 3081 on_source_error, on_target_error, unmap, filter_node_name, 3082 copy_mode, errp); 3083 } 3084 3085 void qmp_drive_mirror(DriveMirror *arg, Error **errp) 3086 { 3087 BlockDriverState *bs; 3088 BlockDriverState *target_backing_bs, *target_bs; 3089 AioContext *aio_context; 3090 AioContext *old_context; 3091 BlockMirrorBackingMode backing_mode; 3092 Error *local_err = NULL; 3093 QDict *options = NULL; 3094 int flags; 3095 int64_t size; 3096 const char *format = arg->format; 3097 bool zero_target; 3098 int ret; 3099 3100 bs = qmp_get_root_bs(arg->device, errp); 3101 if (!bs) { 3102 return; 3103 } 3104 3105 /* Early check to avoid creating target */ 3106 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_MIRROR_SOURCE, errp)) { 3107 return; 3108 } 3109 3110 aio_context = bdrv_get_aio_context(bs); 3111 aio_context_acquire(aio_context); 3112 3113 if (!arg->has_mode) { 3114 arg->mode = NEW_IMAGE_MODE_ABSOLUTE_PATHS; 3115 } 3116 3117 if (!arg->has_format) { 3118 format = (arg->mode == NEW_IMAGE_MODE_EXISTING 3119 ? NULL : bs->drv->format_name); 3120 } 3121 3122 flags = bs->open_flags | BDRV_O_RDWR; 3123 target_backing_bs = bdrv_cow_bs(bdrv_skip_filters(bs)); 3124 if (!target_backing_bs && arg->sync == MIRROR_SYNC_MODE_TOP) { 3125 arg->sync = MIRROR_SYNC_MODE_FULL; 3126 } 3127 if (arg->sync == MIRROR_SYNC_MODE_NONE) { 3128 target_backing_bs = bs; 3129 } 3130 3131 size = bdrv_getlength(bs); 3132 if (size < 0) { 3133 error_setg_errno(errp, -size, "bdrv_getlength failed"); 3134 goto out; 3135 } 3136 3137 if (arg->has_replaces) { 3138 if (!arg->has_node_name) { 3139 error_setg(errp, "a node-name must be provided when replacing a" 3140 " named node of the graph"); 3141 goto out; 3142 } 3143 } 3144 3145 if (arg->mode == NEW_IMAGE_MODE_ABSOLUTE_PATHS) { 3146 backing_mode = MIRROR_SOURCE_BACKING_CHAIN; 3147 } else { 3148 backing_mode = MIRROR_OPEN_BACKING_CHAIN; 3149 } 3150 3151 /* Don't open backing image in create() */ 3152 flags |= BDRV_O_NO_BACKING; 3153 3154 if ((arg->sync == MIRROR_SYNC_MODE_FULL || !target_backing_bs) 3155 && arg->mode != NEW_IMAGE_MODE_EXISTING) 3156 { 3157 /* create new image w/o backing file */ 3158 assert(format); 3159 bdrv_img_create(arg->target, format, 3160 NULL, NULL, NULL, size, flags, false, &local_err); 3161 } else { 3162 /* Implicit filters should not appear in the filename */ 3163 BlockDriverState *explicit_backing = 3164 bdrv_skip_implicit_filters(target_backing_bs); 3165 3166 switch (arg->mode) { 3167 case NEW_IMAGE_MODE_EXISTING: 3168 break; 3169 case NEW_IMAGE_MODE_ABSOLUTE_PATHS: 3170 /* create new image with backing file */ 3171 bdrv_refresh_filename(explicit_backing); 3172 bdrv_img_create(arg->target, format, 3173 explicit_backing->filename, 3174 explicit_backing->drv->format_name, 3175 NULL, size, flags, false, &local_err); 3176 break; 3177 default: 3178 abort(); 3179 } 3180 } 3181 3182 if (local_err) { 3183 error_propagate(errp, local_err); 3184 goto out; 3185 } 3186 3187 options = qdict_new(); 3188 if (arg->has_node_name) { 3189 qdict_put_str(options, "node-name", arg->node_name); 3190 } 3191 if (format) { 3192 qdict_put_str(options, "driver", format); 3193 } 3194 3195 /* Mirroring takes care of copy-on-write using the source's backing 3196 * file. 3197 */ 3198 target_bs = bdrv_open(arg->target, NULL, options, flags, errp); 3199 if (!target_bs) { 3200 goto out; 3201 } 3202 3203 zero_target = (arg->sync == MIRROR_SYNC_MODE_FULL && 3204 (arg->mode == NEW_IMAGE_MODE_EXISTING || 3205 !bdrv_has_zero_init(target_bs))); 3206 3207 3208 /* Honor bdrv_try_set_aio_context() context acquisition requirements. */ 3209 old_context = bdrv_get_aio_context(target_bs); 3210 aio_context_release(aio_context); 3211 aio_context_acquire(old_context); 3212 3213 ret = bdrv_try_set_aio_context(target_bs, aio_context, errp); 3214 if (ret < 0) { 3215 bdrv_unref(target_bs); 3216 aio_context_release(old_context); 3217 return; 3218 } 3219 3220 aio_context_release(old_context); 3221 aio_context_acquire(aio_context); 3222 3223 blockdev_mirror_common(arg->has_job_id ? arg->job_id : NULL, bs, target_bs, 3224 arg->has_replaces, arg->replaces, arg->sync, 3225 backing_mode, zero_target, 3226 arg->has_speed, arg->speed, 3227 arg->has_granularity, arg->granularity, 3228 arg->has_buf_size, arg->buf_size, 3229 arg->has_on_source_error, arg->on_source_error, 3230 arg->has_on_target_error, arg->on_target_error, 3231 arg->has_unmap, arg->unmap, 3232 false, NULL, 3233 arg->has_copy_mode, arg->copy_mode, 3234 arg->has_auto_finalize, arg->auto_finalize, 3235 arg->has_auto_dismiss, arg->auto_dismiss, 3236 errp); 3237 bdrv_unref(target_bs); 3238 out: 3239 aio_context_release(aio_context); 3240 } 3241 3242 void qmp_blockdev_mirror(bool has_job_id, const char *job_id, 3243 const char *device, const char *target, 3244 bool has_replaces, const char *replaces, 3245 MirrorSyncMode sync, 3246 bool has_speed, int64_t speed, 3247 bool has_granularity, uint32_t granularity, 3248 bool has_buf_size, int64_t buf_size, 3249 bool has_on_source_error, 3250 BlockdevOnError on_source_error, 3251 bool has_on_target_error, 3252 BlockdevOnError on_target_error, 3253 bool has_filter_node_name, 3254 const char *filter_node_name, 3255 bool has_copy_mode, MirrorCopyMode copy_mode, 3256 bool has_auto_finalize, bool auto_finalize, 3257 bool has_auto_dismiss, bool auto_dismiss, 3258 Error **errp) 3259 { 3260 BlockDriverState *bs; 3261 BlockDriverState *target_bs; 3262 AioContext *aio_context; 3263 AioContext *old_context; 3264 BlockMirrorBackingMode backing_mode = MIRROR_LEAVE_BACKING_CHAIN; 3265 bool zero_target; 3266 int ret; 3267 3268 bs = qmp_get_root_bs(device, errp); 3269 if (!bs) { 3270 return; 3271 } 3272 3273 target_bs = bdrv_lookup_bs(target, target, errp); 3274 if (!target_bs) { 3275 return; 3276 } 3277 3278 zero_target = (sync == MIRROR_SYNC_MODE_FULL); 3279 3280 /* Honor bdrv_try_set_aio_context() context acquisition requirements. */ 3281 old_context = bdrv_get_aio_context(target_bs); 3282 aio_context = bdrv_get_aio_context(bs); 3283 aio_context_acquire(old_context); 3284 3285 ret = bdrv_try_set_aio_context(target_bs, aio_context, errp); 3286 3287 aio_context_release(old_context); 3288 aio_context_acquire(aio_context); 3289 3290 if (ret < 0) { 3291 goto out; 3292 } 3293 3294 blockdev_mirror_common(has_job_id ? job_id : NULL, bs, target_bs, 3295 has_replaces, replaces, sync, backing_mode, 3296 zero_target, has_speed, speed, 3297 has_granularity, granularity, 3298 has_buf_size, buf_size, 3299 has_on_source_error, on_source_error, 3300 has_on_target_error, on_target_error, 3301 true, true, 3302 has_filter_node_name, filter_node_name, 3303 has_copy_mode, copy_mode, 3304 has_auto_finalize, auto_finalize, 3305 has_auto_dismiss, auto_dismiss, 3306 errp); 3307 out: 3308 aio_context_release(aio_context); 3309 } 3310 3311 /* Get a block job using its ID and acquire its AioContext */ 3312 static BlockJob *find_block_job(const char *id, AioContext **aio_context, 3313 Error **errp) 3314 { 3315 BlockJob *job; 3316 3317 assert(id != NULL); 3318 3319 *aio_context = NULL; 3320 3321 job = block_job_get(id); 3322 3323 if (!job) { 3324 error_set(errp, ERROR_CLASS_DEVICE_NOT_ACTIVE, 3325 "Block job '%s' not found", id); 3326 return NULL; 3327 } 3328 3329 *aio_context = blk_get_aio_context(job->blk); 3330 aio_context_acquire(*aio_context); 3331 3332 return job; 3333 } 3334 3335 void qmp_block_job_set_speed(const char *device, int64_t speed, Error **errp) 3336 { 3337 AioContext *aio_context; 3338 BlockJob *job = find_block_job(device, &aio_context, errp); 3339 3340 if (!job) { 3341 return; 3342 } 3343 3344 block_job_set_speed(job, speed, errp); 3345 aio_context_release(aio_context); 3346 } 3347 3348 void qmp_block_job_cancel(const char *device, 3349 bool has_force, bool force, Error **errp) 3350 { 3351 AioContext *aio_context; 3352 BlockJob *job = find_block_job(device, &aio_context, errp); 3353 3354 if (!job) { 3355 return; 3356 } 3357 3358 if (!has_force) { 3359 force = false; 3360 } 3361 3362 if (job_user_paused(&job->job) && !force) { 3363 error_setg(errp, "The block job for device '%s' is currently paused", 3364 device); 3365 goto out; 3366 } 3367 3368 trace_qmp_block_job_cancel(job); 3369 job_user_cancel(&job->job, force, errp); 3370 out: 3371 aio_context_release(aio_context); 3372 } 3373 3374 void qmp_block_job_pause(const char *device, Error **errp) 3375 { 3376 AioContext *aio_context; 3377 BlockJob *job = find_block_job(device, &aio_context, errp); 3378 3379 if (!job) { 3380 return; 3381 } 3382 3383 trace_qmp_block_job_pause(job); 3384 job_user_pause(&job->job, errp); 3385 aio_context_release(aio_context); 3386 } 3387 3388 void qmp_block_job_resume(const char *device, Error **errp) 3389 { 3390 AioContext *aio_context; 3391 BlockJob *job = find_block_job(device, &aio_context, errp); 3392 3393 if (!job) { 3394 return; 3395 } 3396 3397 trace_qmp_block_job_resume(job); 3398 job_user_resume(&job->job, errp); 3399 aio_context_release(aio_context); 3400 } 3401 3402 void qmp_block_job_complete(const char *device, Error **errp) 3403 { 3404 AioContext *aio_context; 3405 BlockJob *job = find_block_job(device, &aio_context, errp); 3406 3407 if (!job) { 3408 return; 3409 } 3410 3411 trace_qmp_block_job_complete(job); 3412 job_complete(&job->job, errp); 3413 aio_context_release(aio_context); 3414 } 3415 3416 void qmp_block_job_finalize(const char *id, Error **errp) 3417 { 3418 AioContext *aio_context; 3419 BlockJob *job = find_block_job(id, &aio_context, errp); 3420 3421 if (!job) { 3422 return; 3423 } 3424 3425 trace_qmp_block_job_finalize(job); 3426 job_ref(&job->job); 3427 job_finalize(&job->job, errp); 3428 3429 /* 3430 * Job's context might have changed via job_finalize (and job_txn_apply 3431 * automatically acquires the new one), so make sure we release the correct 3432 * one. 3433 */ 3434 aio_context = blk_get_aio_context(job->blk); 3435 job_unref(&job->job); 3436 aio_context_release(aio_context); 3437 } 3438 3439 void qmp_block_job_dismiss(const char *id, Error **errp) 3440 { 3441 AioContext *aio_context; 3442 BlockJob *bjob = find_block_job(id, &aio_context, errp); 3443 Job *job; 3444 3445 if (!bjob) { 3446 return; 3447 } 3448 3449 trace_qmp_block_job_dismiss(bjob); 3450 job = &bjob->job; 3451 job_dismiss(&job, errp); 3452 aio_context_release(aio_context); 3453 } 3454 3455 void qmp_change_backing_file(const char *device, 3456 const char *image_node_name, 3457 const char *backing_file, 3458 Error **errp) 3459 { 3460 BlockDriverState *bs = NULL; 3461 AioContext *aio_context; 3462 BlockDriverState *image_bs = NULL; 3463 Error *local_err = NULL; 3464 bool ro; 3465 int ret; 3466 3467 bs = qmp_get_root_bs(device, errp); 3468 if (!bs) { 3469 return; 3470 } 3471 3472 aio_context = bdrv_get_aio_context(bs); 3473 aio_context_acquire(aio_context); 3474 3475 image_bs = bdrv_lookup_bs(NULL, image_node_name, &local_err); 3476 if (local_err) { 3477 error_propagate(errp, local_err); 3478 goto out; 3479 } 3480 3481 if (!image_bs) { 3482 error_setg(errp, "image file not found"); 3483 goto out; 3484 } 3485 3486 if (bdrv_find_base(image_bs) == image_bs) { 3487 error_setg(errp, "not allowing backing file change on an image " 3488 "without a backing file"); 3489 goto out; 3490 } 3491 3492 /* even though we are not necessarily operating on bs, we need it to 3493 * determine if block ops are currently prohibited on the chain */ 3494 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_CHANGE, errp)) { 3495 goto out; 3496 } 3497 3498 /* final sanity check */ 3499 if (!bdrv_chain_contains(bs, image_bs)) { 3500 error_setg(errp, "'%s' and image file are not in the same chain", 3501 device); 3502 goto out; 3503 } 3504 3505 /* if not r/w, reopen to make r/w */ 3506 ro = bdrv_is_read_only(image_bs); 3507 3508 if (ro) { 3509 if (bdrv_reopen_set_read_only(image_bs, false, errp) != 0) { 3510 goto out; 3511 } 3512 } 3513 3514 ret = bdrv_change_backing_file(image_bs, backing_file, 3515 image_bs->drv ? image_bs->drv->format_name : "", 3516 false); 3517 3518 if (ret < 0) { 3519 error_setg_errno(errp, -ret, "Could not change backing file to '%s'", 3520 backing_file); 3521 /* don't exit here, so we can try to restore open flags if 3522 * appropriate */ 3523 } 3524 3525 if (ro) { 3526 bdrv_reopen_set_read_only(image_bs, true, errp); 3527 } 3528 3529 out: 3530 aio_context_release(aio_context); 3531 } 3532 3533 void qmp_blockdev_add(BlockdevOptions *options, Error **errp) 3534 { 3535 BlockDriverState *bs; 3536 QObject *obj; 3537 Visitor *v = qobject_output_visitor_new(&obj); 3538 QDict *qdict; 3539 3540 visit_type_BlockdevOptions(v, NULL, &options, &error_abort); 3541 visit_complete(v, &obj); 3542 qdict = qobject_to(QDict, obj); 3543 3544 qdict_flatten(qdict); 3545 3546 if (!qdict_get_try_str(qdict, "node-name")) { 3547 error_setg(errp, "'node-name' must be specified for the root node"); 3548 goto fail; 3549 } 3550 3551 bs = bds_tree_init(qdict, errp); 3552 if (!bs) { 3553 goto fail; 3554 } 3555 3556 bdrv_set_monitor_owned(bs); 3557 3558 fail: 3559 visit_free(v); 3560 } 3561 3562 void qmp_blockdev_reopen(BlockdevOptionsList *reopen_list, Error **errp) 3563 { 3564 BlockReopenQueue *queue = NULL; 3565 GSList *drained = NULL; 3566 3567 /* Add each one of the BDS that we want to reopen to the queue */ 3568 for (; reopen_list != NULL; reopen_list = reopen_list->next) { 3569 BlockdevOptions *options = reopen_list->value; 3570 BlockDriverState *bs; 3571 AioContext *ctx; 3572 QObject *obj; 3573 Visitor *v; 3574 QDict *qdict; 3575 3576 /* Check for the selected node name */ 3577 if (!options->has_node_name) { 3578 error_setg(errp, "node-name not specified"); 3579 goto fail; 3580 } 3581 3582 bs = bdrv_find_node(options->node_name); 3583 if (!bs) { 3584 error_setg(errp, "Failed to find node with node-name='%s'", 3585 options->node_name); 3586 goto fail; 3587 } 3588 3589 /* Put all options in a QDict and flatten it */ 3590 v = qobject_output_visitor_new(&obj); 3591 visit_type_BlockdevOptions(v, NULL, &options, &error_abort); 3592 visit_complete(v, &obj); 3593 visit_free(v); 3594 3595 qdict = qobject_to(QDict, obj); 3596 3597 qdict_flatten(qdict); 3598 3599 ctx = bdrv_get_aio_context(bs); 3600 aio_context_acquire(ctx); 3601 3602 bdrv_subtree_drained_begin(bs); 3603 queue = bdrv_reopen_queue(queue, bs, qdict, false); 3604 drained = g_slist_prepend(drained, bs); 3605 3606 aio_context_release(ctx); 3607 } 3608 3609 /* Perform the reopen operation */ 3610 bdrv_reopen_multiple(queue, errp); 3611 queue = NULL; 3612 3613 fail: 3614 bdrv_reopen_queue_free(queue); 3615 g_slist_free_full(drained, (GDestroyNotify) bdrv_subtree_drained_end); 3616 } 3617 3618 void qmp_blockdev_del(const char *node_name, Error **errp) 3619 { 3620 AioContext *aio_context; 3621 BlockDriverState *bs; 3622 3623 bs = bdrv_find_node(node_name); 3624 if (!bs) { 3625 error_setg(errp, "Failed to find node with node-name='%s'", node_name); 3626 return; 3627 } 3628 if (bdrv_has_blk(bs)) { 3629 error_setg(errp, "Node %s is in use", node_name); 3630 return; 3631 } 3632 aio_context = bdrv_get_aio_context(bs); 3633 aio_context_acquire(aio_context); 3634 3635 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_DRIVE_DEL, errp)) { 3636 goto out; 3637 } 3638 3639 if (!QTAILQ_IN_USE(bs, monitor_list)) { 3640 error_setg(errp, "Node %s is not owned by the monitor", 3641 bs->node_name); 3642 goto out; 3643 } 3644 3645 if (bs->refcnt > 1) { 3646 error_setg(errp, "Block device %s is in use", 3647 bdrv_get_device_or_node_name(bs)); 3648 goto out; 3649 } 3650 3651 QTAILQ_REMOVE(&monitor_bdrv_states, bs, monitor_list); 3652 bdrv_unref(bs); 3653 3654 out: 3655 aio_context_release(aio_context); 3656 } 3657 3658 static BdrvChild *bdrv_find_child(BlockDriverState *parent_bs, 3659 const char *child_name) 3660 { 3661 BdrvChild *child; 3662 3663 QLIST_FOREACH(child, &parent_bs->children, next) { 3664 if (strcmp(child->name, child_name) == 0) { 3665 return child; 3666 } 3667 } 3668 3669 return NULL; 3670 } 3671 3672 void qmp_x_blockdev_change(const char *parent, bool has_child, 3673 const char *child, bool has_node, 3674 const char *node, Error **errp) 3675 { 3676 BlockDriverState *parent_bs, *new_bs = NULL; 3677 BdrvChild *p_child; 3678 3679 parent_bs = bdrv_lookup_bs(parent, parent, errp); 3680 if (!parent_bs) { 3681 return; 3682 } 3683 3684 if (has_child == has_node) { 3685 if (has_child) { 3686 error_setg(errp, "The parameters child and node are in conflict"); 3687 } else { 3688 error_setg(errp, "Either child or node must be specified"); 3689 } 3690 return; 3691 } 3692 3693 if (has_child) { 3694 p_child = bdrv_find_child(parent_bs, child); 3695 if (!p_child) { 3696 error_setg(errp, "Node '%s' does not have child '%s'", 3697 parent, child); 3698 return; 3699 } 3700 bdrv_del_child(parent_bs, p_child, errp); 3701 } 3702 3703 if (has_node) { 3704 new_bs = bdrv_find_node(node); 3705 if (!new_bs) { 3706 error_setg(errp, "Node '%s' not found", node); 3707 return; 3708 } 3709 bdrv_add_child(parent_bs, new_bs, errp); 3710 } 3711 } 3712 3713 BlockJobInfoList *qmp_query_block_jobs(Error **errp) 3714 { 3715 BlockJobInfoList *head = NULL, **tail = &head; 3716 BlockJob *job; 3717 3718 for (job = block_job_next(NULL); job; job = block_job_next(job)) { 3719 BlockJobInfo *value; 3720 AioContext *aio_context; 3721 3722 if (block_job_is_internal(job)) { 3723 continue; 3724 } 3725 aio_context = blk_get_aio_context(job->blk); 3726 aio_context_acquire(aio_context); 3727 value = block_job_query(job, errp); 3728 aio_context_release(aio_context); 3729 if (!value) { 3730 qapi_free_BlockJobInfoList(head); 3731 return NULL; 3732 } 3733 QAPI_LIST_APPEND(tail, value); 3734 } 3735 3736 return head; 3737 } 3738 3739 void qmp_x_blockdev_set_iothread(const char *node_name, StrOrNull *iothread, 3740 bool has_force, bool force, Error **errp) 3741 { 3742 AioContext *old_context; 3743 AioContext *new_context; 3744 BlockDriverState *bs; 3745 3746 bs = bdrv_find_node(node_name); 3747 if (!bs) { 3748 error_setg(errp, "Failed to find node with node-name='%s'", node_name); 3749 return; 3750 } 3751 3752 /* Protects against accidents. */ 3753 if (!(has_force && force) && bdrv_has_blk(bs)) { 3754 error_setg(errp, "Node %s is associated with a BlockBackend and could " 3755 "be in use (use force=true to override this check)", 3756 node_name); 3757 return; 3758 } 3759 3760 if (iothread->type == QTYPE_QSTRING) { 3761 IOThread *obj = iothread_by_id(iothread->u.s); 3762 if (!obj) { 3763 error_setg(errp, "Cannot find iothread %s", iothread->u.s); 3764 return; 3765 } 3766 3767 new_context = iothread_get_aio_context(obj); 3768 } else { 3769 new_context = qemu_get_aio_context(); 3770 } 3771 3772 old_context = bdrv_get_aio_context(bs); 3773 aio_context_acquire(old_context); 3774 3775 bdrv_try_set_aio_context(bs, new_context, errp); 3776 3777 aio_context_release(old_context); 3778 } 3779 3780 QemuOptsList qemu_common_drive_opts = { 3781 .name = "drive", 3782 .head = QTAILQ_HEAD_INITIALIZER(qemu_common_drive_opts.head), 3783 .desc = { 3784 { 3785 .name = "snapshot", 3786 .type = QEMU_OPT_BOOL, 3787 .help = "enable/disable snapshot mode", 3788 },{ 3789 .name = "aio", 3790 .type = QEMU_OPT_STRING, 3791 .help = "host AIO implementation (threads, native, io_uring)", 3792 },{ 3793 .name = BDRV_OPT_CACHE_WB, 3794 .type = QEMU_OPT_BOOL, 3795 .help = "Enable writeback mode", 3796 },{ 3797 .name = "format", 3798 .type = QEMU_OPT_STRING, 3799 .help = "disk format (raw, qcow2, ...)", 3800 },{ 3801 .name = "rerror", 3802 .type = QEMU_OPT_STRING, 3803 .help = "read error action", 3804 },{ 3805 .name = "werror", 3806 .type = QEMU_OPT_STRING, 3807 .help = "write error action", 3808 },{ 3809 .name = BDRV_OPT_READ_ONLY, 3810 .type = QEMU_OPT_BOOL, 3811 .help = "open drive file as read-only", 3812 }, 3813 3814 THROTTLE_OPTS, 3815 3816 { 3817 .name = "throttling.group", 3818 .type = QEMU_OPT_STRING, 3819 .help = "name of the block throttling group", 3820 },{ 3821 .name = "copy-on-read", 3822 .type = QEMU_OPT_BOOL, 3823 .help = "copy read data from backing file into image file", 3824 },{ 3825 .name = "detect-zeroes", 3826 .type = QEMU_OPT_STRING, 3827 .help = "try to optimize zero writes (off, on, unmap)", 3828 },{ 3829 .name = "stats-account-invalid", 3830 .type = QEMU_OPT_BOOL, 3831 .help = "whether to account for invalid I/O operations " 3832 "in the statistics", 3833 },{ 3834 .name = "stats-account-failed", 3835 .type = QEMU_OPT_BOOL, 3836 .help = "whether to account for failed I/O operations " 3837 "in the statistics", 3838 }, 3839 { /* end of list */ } 3840 }, 3841 }; 3842 3843 QemuOptsList qemu_drive_opts = { 3844 .name = "drive", 3845 .head = QTAILQ_HEAD_INITIALIZER(qemu_drive_opts.head), 3846 .desc = { 3847 /* 3848 * no elements => accept any params 3849 * validation will happen later 3850 */ 3851 { /* end of list */ } 3852 }, 3853 }; 3854