1 /* 2 * QEMU host block devices 3 * 4 * Copyright (c) 2003-2008 Fabrice Bellard 5 * 6 * This work is licensed under the terms of the GNU GPL, version 2 or 7 * later. See the COPYING file in the top-level directory. 8 * 9 * This file incorporates work covered by the following copyright and 10 * permission notice: 11 * 12 * Copyright (c) 2003-2008 Fabrice Bellard 13 * 14 * Permission is hereby granted, free of charge, to any person obtaining a copy 15 * of this software and associated documentation files (the "Software"), to deal 16 * in the Software without restriction, including without limitation the rights 17 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 18 * copies of the Software, and to permit persons to whom the Software is 19 * furnished to do so, subject to the following conditions: 20 * 21 * The above copyright notice and this permission notice shall be included in 22 * all copies or substantial portions of the Software. 23 * 24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 25 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 26 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 27 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 28 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 29 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 30 * THE SOFTWARE. 
31 */ 32 33 #include "qemu/osdep.h" 34 #include "sysemu/block-backend.h" 35 #include "sysemu/blockdev.h" 36 #include "hw/block/block.h" 37 #include "block/blockjob.h" 38 #include "block/qdict.h" 39 #include "block/throttle-groups.h" 40 #include "monitor/monitor.h" 41 #include "qemu/error-report.h" 42 #include "qemu/option.h" 43 #include "qemu/qemu-print.h" 44 #include "qemu/config-file.h" 45 #include "qapi/qapi-commands-block.h" 46 #include "qapi/qapi-commands-transaction.h" 47 #include "qapi/qapi-visit-block-core.h" 48 #include "qapi/qmp/qdict.h" 49 #include "qapi/qmp/qnum.h" 50 #include "qapi/qmp/qstring.h" 51 #include "qapi/error.h" 52 #include "qapi/qmp/qerror.h" 53 #include "qapi/qmp/qlist.h" 54 #include "qapi/qobject-output-visitor.h" 55 #include "sysemu/sysemu.h" 56 #include "sysemu/iothread.h" 57 #include "block/block_int.h" 58 #include "block/trace.h" 59 #include "sysemu/runstate.h" 60 #include "sysemu/replay.h" 61 #include "qemu/cutils.h" 62 #include "qemu/help_option.h" 63 #include "qemu/main-loop.h" 64 #include "qemu/throttle-options.h" 65 66 /* Protected by BQL */ 67 QTAILQ_HEAD(, BlockDriverState) monitor_bdrv_states = 68 QTAILQ_HEAD_INITIALIZER(monitor_bdrv_states); 69 70 void bdrv_set_monitor_owned(BlockDriverState *bs) 71 { 72 GLOBAL_STATE_CODE(); 73 QTAILQ_INSERT_TAIL(&monitor_bdrv_states, bs, monitor_list); 74 } 75 76 static const char *const if_name[IF_COUNT] = { 77 [IF_NONE] = "none", 78 [IF_IDE] = "ide", 79 [IF_SCSI] = "scsi", 80 [IF_FLOPPY] = "floppy", 81 [IF_PFLASH] = "pflash", 82 [IF_MTD] = "mtd", 83 [IF_SD] = "sd", 84 [IF_VIRTIO] = "virtio", 85 [IF_XEN] = "xen", 86 }; 87 88 static int if_max_devs[IF_COUNT] = { 89 /* 90 * Do not change these numbers! They govern how drive option 91 * index maps to unit and bus. That mapping is ABI. 92 * 93 * All controllers used to implement if=T drives need to support 94 * if_max_devs[T] units, for any T with if_max_devs[T] != 0. 95 * Otherwise, some index values map to "impossible" bus, unit 96 * values. 
97 * 98 * For instance, if you change [IF_SCSI] to 255, -drive 99 * if=scsi,index=12 no longer means bus=1,unit=5, but 100 * bus=0,unit=12. With an lsi53c895a controller (7 units max), 101 * the drive can't be set up. Regression. 102 */ 103 [IF_IDE] = 2, 104 [IF_SCSI] = 7, 105 }; 106 107 /** 108 * Boards may call this to offer board-by-board overrides 109 * of the default, global values. 110 */ 111 void override_max_devs(BlockInterfaceType type, int max_devs) 112 { 113 BlockBackend *blk; 114 DriveInfo *dinfo; 115 116 GLOBAL_STATE_CODE(); 117 118 if (max_devs <= 0) { 119 return; 120 } 121 122 for (blk = blk_next(NULL); blk; blk = blk_next(blk)) { 123 dinfo = blk_legacy_dinfo(blk); 124 if (dinfo->type == type) { 125 fprintf(stderr, "Cannot override units-per-bus property of" 126 " the %s interface, because a drive of that type has" 127 " already been added.\n", if_name[type]); 128 g_assert_not_reached(); 129 } 130 } 131 132 if_max_devs[type] = max_devs; 133 } 134 135 /* 136 * We automatically delete the drive when a device using it gets 137 * unplugged. Questionable feature, but we can't just drop it. 138 * Device models call blockdev_mark_auto_del() to schedule the 139 * automatic deletion, and generic qdev code calls blockdev_auto_del() 140 * when deletion is actually safe. 
141 */ 142 void blockdev_mark_auto_del(BlockBackend *blk) 143 { 144 DriveInfo *dinfo = blk_legacy_dinfo(blk); 145 BlockJob *job; 146 147 GLOBAL_STATE_CODE(); 148 149 if (!dinfo) { 150 return; 151 } 152 153 JOB_LOCK_GUARD(); 154 155 for (job = block_job_next_locked(NULL); job; 156 job = block_job_next_locked(job)) { 157 if (block_job_has_bdrv(job, blk_bs(blk))) { 158 job_cancel_locked(&job->job, false); 159 } 160 } 161 162 dinfo->auto_del = 1; 163 } 164 165 void blockdev_auto_del(BlockBackend *blk) 166 { 167 DriveInfo *dinfo = blk_legacy_dinfo(blk); 168 GLOBAL_STATE_CODE(); 169 170 if (dinfo && dinfo->auto_del) { 171 monitor_remove_blk(blk); 172 blk_unref(blk); 173 } 174 } 175 176 static int drive_index_to_bus_id(BlockInterfaceType type, int index) 177 { 178 int max_devs = if_max_devs[type]; 179 return max_devs ? index / max_devs : 0; 180 } 181 182 static int drive_index_to_unit_id(BlockInterfaceType type, int index) 183 { 184 int max_devs = if_max_devs[type]; 185 return max_devs ? index % max_devs : index; 186 } 187 188 QemuOpts *drive_add(BlockInterfaceType type, int index, const char *file, 189 const char *optstr) 190 { 191 QemuOpts *opts; 192 193 GLOBAL_STATE_CODE(); 194 195 opts = qemu_opts_parse_noisily(qemu_find_opts("drive"), optstr, false); 196 if (!opts) { 197 return NULL; 198 } 199 if (type != IF_DEFAULT) { 200 qemu_opt_set(opts, "if", if_name[type], &error_abort); 201 } 202 if (index >= 0) { 203 qemu_opt_set_number(opts, "index", index, &error_abort); 204 } 205 if (file) 206 qemu_opt_set(opts, "file", file, &error_abort); 207 return opts; 208 } 209 210 DriveInfo *drive_get(BlockInterfaceType type, int bus, int unit) 211 { 212 BlockBackend *blk; 213 DriveInfo *dinfo; 214 215 GLOBAL_STATE_CODE(); 216 217 for (blk = blk_next(NULL); blk; blk = blk_next(blk)) { 218 dinfo = blk_legacy_dinfo(blk); 219 if (dinfo && dinfo->type == type 220 && dinfo->bus == bus && dinfo->unit == unit) { 221 return dinfo; 222 } 223 } 224 225 return NULL; 226 } 227 228 /* 229 * 
Check board claimed all -drive that are meant to be claimed. 230 * Fatal error if any remain unclaimed. 231 */ 232 void drive_check_orphaned(void) 233 { 234 BlockBackend *blk; 235 DriveInfo *dinfo; 236 Location loc; 237 bool orphans = false; 238 239 GLOBAL_STATE_CODE(); 240 241 for (blk = blk_next(NULL); blk; blk = blk_next(blk)) { 242 dinfo = blk_legacy_dinfo(blk); 243 /* 244 * Ignore default drives, because we create certain default 245 * drives unconditionally, then leave them unclaimed. Not the 246 * users fault. 247 * Ignore IF_VIRTIO, because it gets desugared into -device, 248 * so we can leave failing to -device. 249 * Ignore IF_NONE, because leaving unclaimed IF_NONE remains 250 * available for device_add is a feature. 251 */ 252 if (dinfo->is_default || dinfo->type == IF_VIRTIO 253 || dinfo->type == IF_NONE) { 254 continue; 255 } 256 if (!blk_get_attached_dev(blk)) { 257 loc_push_none(&loc); 258 qemu_opts_loc_restore(dinfo->opts); 259 error_report("machine type does not support" 260 " if=%s,bus=%d,unit=%d", 261 if_name[dinfo->type], dinfo->bus, dinfo->unit); 262 loc_pop(&loc); 263 orphans = true; 264 } 265 } 266 267 if (orphans) { 268 exit(1); 269 } 270 } 271 272 DriveInfo *drive_get_by_index(BlockInterfaceType type, int index) 273 { 274 GLOBAL_STATE_CODE(); 275 return drive_get(type, 276 drive_index_to_bus_id(type, index), 277 drive_index_to_unit_id(type, index)); 278 } 279 280 int drive_get_max_bus(BlockInterfaceType type) 281 { 282 int max_bus; 283 BlockBackend *blk; 284 DriveInfo *dinfo; 285 286 GLOBAL_STATE_CODE(); 287 288 max_bus = -1; 289 for (blk = blk_next(NULL); blk; blk = blk_next(blk)) { 290 dinfo = blk_legacy_dinfo(blk); 291 if (dinfo && dinfo->type == type && dinfo->bus > max_bus) { 292 max_bus = dinfo->bus; 293 } 294 } 295 return max_bus; 296 } 297 298 static void bdrv_format_print(void *opaque, const char *name) 299 { 300 qemu_printf(" %s", name); 301 } 302 303 typedef struct { 304 QEMUBH *bh; 305 BlockDriverState *bs; 306 } BDRVPutRefBH; 
307 308 static int parse_block_error_action(const char *buf, bool is_read, Error **errp) 309 { 310 if (!strcmp(buf, "ignore")) { 311 return BLOCKDEV_ON_ERROR_IGNORE; 312 } else if (!is_read && !strcmp(buf, "enospc")) { 313 return BLOCKDEV_ON_ERROR_ENOSPC; 314 } else if (!strcmp(buf, "stop")) { 315 return BLOCKDEV_ON_ERROR_STOP; 316 } else if (!strcmp(buf, "report")) { 317 return BLOCKDEV_ON_ERROR_REPORT; 318 } else { 319 error_setg(errp, "'%s' invalid %s error action", 320 buf, is_read ? "read" : "write"); 321 return -1; 322 } 323 } 324 325 static bool parse_stats_intervals(BlockAcctStats *stats, QList *intervals, 326 Error **errp) 327 { 328 const QListEntry *entry; 329 for (entry = qlist_first(intervals); entry; entry = qlist_next(entry)) { 330 switch (qobject_type(entry->value)) { 331 332 case QTYPE_QSTRING: { 333 unsigned long long length; 334 const char *str = qstring_get_str(qobject_to(QString, 335 entry->value)); 336 if (parse_uint_full(str, &length, 10) == 0 && 337 length > 0 && length <= UINT_MAX) { 338 block_acct_add_interval(stats, (unsigned) length); 339 } else { 340 error_setg(errp, "Invalid interval length: %s", str); 341 return false; 342 } 343 break; 344 } 345 346 case QTYPE_QNUM: { 347 int64_t length = qnum_get_int(qobject_to(QNum, entry->value)); 348 349 if (length > 0 && length <= UINT_MAX) { 350 block_acct_add_interval(stats, (unsigned) length); 351 } else { 352 error_setg(errp, "Invalid interval length: %" PRId64, length); 353 return false; 354 } 355 break; 356 } 357 358 default: 359 error_setg(errp, "The specification of stats-intervals is invalid"); 360 return false; 361 } 362 } 363 return true; 364 } 365 366 typedef enum { MEDIA_DISK, MEDIA_CDROM } DriveMediaType; 367 368 /* All parameters but @opts are optional and may be set to NULL. 
*/ 369 static void extract_common_blockdev_options(QemuOpts *opts, int *bdrv_flags, 370 const char **throttling_group, ThrottleConfig *throttle_cfg, 371 BlockdevDetectZeroesOptions *detect_zeroes, Error **errp) 372 { 373 Error *local_error = NULL; 374 const char *aio; 375 376 if (bdrv_flags) { 377 if (qemu_opt_get_bool(opts, "copy-on-read", false)) { 378 *bdrv_flags |= BDRV_O_COPY_ON_READ; 379 } 380 381 if ((aio = qemu_opt_get(opts, "aio")) != NULL) { 382 if (bdrv_parse_aio(aio, bdrv_flags) < 0) { 383 error_setg(errp, "invalid aio option"); 384 return; 385 } 386 } 387 } 388 389 /* disk I/O throttling */ 390 if (throttling_group) { 391 *throttling_group = qemu_opt_get(opts, "throttling.group"); 392 } 393 394 if (throttle_cfg) { 395 throttle_config_init(throttle_cfg); 396 throttle_cfg->buckets[THROTTLE_BPS_TOTAL].avg = 397 qemu_opt_get_number(opts, "throttling.bps-total", 0); 398 throttle_cfg->buckets[THROTTLE_BPS_READ].avg = 399 qemu_opt_get_number(opts, "throttling.bps-read", 0); 400 throttle_cfg->buckets[THROTTLE_BPS_WRITE].avg = 401 qemu_opt_get_number(opts, "throttling.bps-write", 0); 402 throttle_cfg->buckets[THROTTLE_OPS_TOTAL].avg = 403 qemu_opt_get_number(opts, "throttling.iops-total", 0); 404 throttle_cfg->buckets[THROTTLE_OPS_READ].avg = 405 qemu_opt_get_number(opts, "throttling.iops-read", 0); 406 throttle_cfg->buckets[THROTTLE_OPS_WRITE].avg = 407 qemu_opt_get_number(opts, "throttling.iops-write", 0); 408 409 throttle_cfg->buckets[THROTTLE_BPS_TOTAL].max = 410 qemu_opt_get_number(opts, "throttling.bps-total-max", 0); 411 throttle_cfg->buckets[THROTTLE_BPS_READ].max = 412 qemu_opt_get_number(opts, "throttling.bps-read-max", 0); 413 throttle_cfg->buckets[THROTTLE_BPS_WRITE].max = 414 qemu_opt_get_number(opts, "throttling.bps-write-max", 0); 415 throttle_cfg->buckets[THROTTLE_OPS_TOTAL].max = 416 qemu_opt_get_number(opts, "throttling.iops-total-max", 0); 417 throttle_cfg->buckets[THROTTLE_OPS_READ].max = 418 qemu_opt_get_number(opts, 
"throttling.iops-read-max", 0); 419 throttle_cfg->buckets[THROTTLE_OPS_WRITE].max = 420 qemu_opt_get_number(opts, "throttling.iops-write-max", 0); 421 422 throttle_cfg->buckets[THROTTLE_BPS_TOTAL].burst_length = 423 qemu_opt_get_number(opts, "throttling.bps-total-max-length", 1); 424 throttle_cfg->buckets[THROTTLE_BPS_READ].burst_length = 425 qemu_opt_get_number(opts, "throttling.bps-read-max-length", 1); 426 throttle_cfg->buckets[THROTTLE_BPS_WRITE].burst_length = 427 qemu_opt_get_number(opts, "throttling.bps-write-max-length", 1); 428 throttle_cfg->buckets[THROTTLE_OPS_TOTAL].burst_length = 429 qemu_opt_get_number(opts, "throttling.iops-total-max-length", 1); 430 throttle_cfg->buckets[THROTTLE_OPS_READ].burst_length = 431 qemu_opt_get_number(opts, "throttling.iops-read-max-length", 1); 432 throttle_cfg->buckets[THROTTLE_OPS_WRITE].burst_length = 433 qemu_opt_get_number(opts, "throttling.iops-write-max-length", 1); 434 435 throttle_cfg->op_size = 436 qemu_opt_get_number(opts, "throttling.iops-size", 0); 437 438 if (!throttle_is_valid(throttle_cfg, errp)) { 439 return; 440 } 441 } 442 443 if (detect_zeroes) { 444 *detect_zeroes = 445 qapi_enum_parse(&BlockdevDetectZeroesOptions_lookup, 446 qemu_opt_get(opts, "detect-zeroes"), 447 BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF, 448 &local_error); 449 if (local_error) { 450 error_propagate(errp, local_error); 451 return; 452 } 453 } 454 } 455 456 static OnOffAuto account_get_opt(QemuOpts *opts, const char *name) 457 { 458 if (!qemu_opt_find(opts, name)) { 459 return ON_OFF_AUTO_AUTO; 460 } 461 if (qemu_opt_get_bool(opts, name, true)) { 462 return ON_OFF_AUTO_ON; 463 } 464 return ON_OFF_AUTO_OFF; 465 } 466 467 /* Takes the ownership of bs_opts */ 468 static BlockBackend *blockdev_init(const char *file, QDict *bs_opts, 469 Error **errp) 470 { 471 const char *buf; 472 int bdrv_flags = 0; 473 int on_read_error, on_write_error; 474 OnOffAuto account_invalid, account_failed; 475 bool writethrough, read_only; 476 BlockBackend *blk; 477 
BlockDriverState *bs; 478 ThrottleConfig cfg; 479 int snapshot = 0; 480 Error *error = NULL; 481 QemuOpts *opts; 482 QDict *interval_dict = NULL; 483 QList *interval_list = NULL; 484 const char *id; 485 BlockdevDetectZeroesOptions detect_zeroes = 486 BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF; 487 const char *throttling_group = NULL; 488 489 /* Check common options by copying from bs_opts to opts, all other options 490 * stay in bs_opts for processing by bdrv_open(). */ 491 id = qdict_get_try_str(bs_opts, "id"); 492 opts = qemu_opts_create(&qemu_common_drive_opts, id, 1, errp); 493 if (!opts) { 494 goto err_no_opts; 495 } 496 497 if (!qemu_opts_absorb_qdict(opts, bs_opts, errp)) { 498 goto early_err; 499 } 500 501 if (id) { 502 qdict_del(bs_opts, "id"); 503 } 504 505 /* extract parameters */ 506 snapshot = qemu_opt_get_bool(opts, "snapshot", 0); 507 508 account_invalid = account_get_opt(opts, "stats-account-invalid"); 509 account_failed = account_get_opt(opts, "stats-account-failed"); 510 511 writethrough = !qemu_opt_get_bool(opts, BDRV_OPT_CACHE_WB, true); 512 513 id = qemu_opts_id(opts); 514 515 qdict_extract_subqdict(bs_opts, &interval_dict, "stats-intervals."); 516 qdict_array_split(interval_dict, &interval_list); 517 518 if (qdict_size(interval_dict) != 0) { 519 error_setg(errp, "Invalid option stats-intervals.%s", 520 qdict_first(interval_dict)->key); 521 goto early_err; 522 } 523 524 extract_common_blockdev_options(opts, &bdrv_flags, &throttling_group, &cfg, 525 &detect_zeroes, &error); 526 if (error) { 527 error_propagate(errp, error); 528 goto early_err; 529 } 530 531 if ((buf = qemu_opt_get(opts, "format")) != NULL) { 532 if (is_help_option(buf)) { 533 qemu_printf("Supported formats:"); 534 bdrv_iterate_format(bdrv_format_print, NULL, false); 535 qemu_printf("\nSupported formats (read-only):"); 536 bdrv_iterate_format(bdrv_format_print, NULL, true); 537 qemu_printf("\n"); 538 goto early_err; 539 } 540 541 if (qdict_haskey(bs_opts, "driver")) { 542 
error_setg(errp, "Cannot specify both 'driver' and 'format'"); 543 goto early_err; 544 } 545 qdict_put_str(bs_opts, "driver", buf); 546 } 547 548 on_write_error = BLOCKDEV_ON_ERROR_ENOSPC; 549 if ((buf = qemu_opt_get(opts, "werror")) != NULL) { 550 on_write_error = parse_block_error_action(buf, 0, &error); 551 if (error) { 552 error_propagate(errp, error); 553 goto early_err; 554 } 555 } 556 557 on_read_error = BLOCKDEV_ON_ERROR_REPORT; 558 if ((buf = qemu_opt_get(opts, "rerror")) != NULL) { 559 on_read_error = parse_block_error_action(buf, 1, &error); 560 if (error) { 561 error_propagate(errp, error); 562 goto early_err; 563 } 564 } 565 566 if (snapshot) { 567 bdrv_flags |= BDRV_O_SNAPSHOT; 568 } 569 570 read_only = qemu_opt_get_bool(opts, BDRV_OPT_READ_ONLY, false); 571 572 /* init */ 573 if ((!file || !*file) && !qdict_size(bs_opts)) { 574 BlockBackendRootState *blk_rs; 575 576 blk = blk_new(qemu_get_aio_context(), 0, BLK_PERM_ALL); 577 blk_rs = blk_get_root_state(blk); 578 blk_rs->open_flags = bdrv_flags | (read_only ? 0 : BDRV_O_RDWR); 579 blk_rs->detect_zeroes = detect_zeroes; 580 581 qobject_unref(bs_opts); 582 } else { 583 if (file && !*file) { 584 file = NULL; 585 } 586 587 /* bdrv_open() defaults to the values in bdrv_flags (for compatibility 588 * with other callers) rather than what we want as the real defaults. 589 * Apply the defaults here instead. */ 590 qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_DIRECT, "off"); 591 qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_NO_FLUSH, "off"); 592 qdict_set_default_str(bs_opts, BDRV_OPT_READ_ONLY, 593 read_only ? 
"on" : "off"); 594 qdict_set_default_str(bs_opts, BDRV_OPT_AUTO_READ_ONLY, "on"); 595 assert((bdrv_flags & BDRV_O_CACHE_MASK) == 0); 596 597 if (runstate_check(RUN_STATE_INMIGRATE)) { 598 bdrv_flags |= BDRV_O_INACTIVE; 599 } 600 601 blk = blk_new_open(file, NULL, bs_opts, bdrv_flags, errp); 602 if (!blk) { 603 goto err_no_bs_opts; 604 } 605 bs = blk_bs(blk); 606 607 bs->detect_zeroes = detect_zeroes; 608 609 block_acct_setup(blk_get_stats(blk), account_invalid, account_failed); 610 611 if (!parse_stats_intervals(blk_get_stats(blk), interval_list, errp)) { 612 blk_unref(blk); 613 blk = NULL; 614 goto err_no_bs_opts; 615 } 616 } 617 618 /* disk I/O throttling */ 619 if (throttle_enabled(&cfg)) { 620 if (!throttling_group) { 621 throttling_group = id; 622 } 623 blk_io_limits_enable(blk, throttling_group); 624 blk_set_io_limits(blk, &cfg); 625 } 626 627 blk_set_enable_write_cache(blk, !writethrough); 628 blk_set_on_error(blk, on_read_error, on_write_error); 629 630 if (!monitor_add_blk(blk, id, errp)) { 631 blk_unref(blk); 632 blk = NULL; 633 goto err_no_bs_opts; 634 } 635 636 err_no_bs_opts: 637 qemu_opts_del(opts); 638 qobject_unref(interval_dict); 639 qobject_unref(interval_list); 640 return blk; 641 642 early_err: 643 qemu_opts_del(opts); 644 qobject_unref(interval_dict); 645 qobject_unref(interval_list); 646 err_no_opts: 647 qobject_unref(bs_opts); 648 return NULL; 649 } 650 651 /* Takes the ownership of bs_opts */ 652 BlockDriverState *bds_tree_init(QDict *bs_opts, Error **errp) 653 { 654 int bdrv_flags = 0; 655 656 GLOBAL_STATE_CODE(); 657 /* bdrv_open() defaults to the values in bdrv_flags (for compatibility 658 * with other callers) rather than what we want as the real defaults. 659 * Apply the defaults here instead. 
*/ 660 qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_DIRECT, "off"); 661 qdict_set_default_str(bs_opts, BDRV_OPT_CACHE_NO_FLUSH, "off"); 662 qdict_set_default_str(bs_opts, BDRV_OPT_READ_ONLY, "off"); 663 664 if (runstate_check(RUN_STATE_INMIGRATE)) { 665 bdrv_flags |= BDRV_O_INACTIVE; 666 } 667 668 return bdrv_open(NULL, NULL, bs_opts, bdrv_flags, errp); 669 } 670 671 void blockdev_close_all_bdrv_states(void) 672 { 673 BlockDriverState *bs, *next_bs; 674 675 GLOBAL_STATE_CODE(); 676 QTAILQ_FOREACH_SAFE(bs, &monitor_bdrv_states, monitor_list, next_bs) { 677 AioContext *ctx = bdrv_get_aio_context(bs); 678 679 aio_context_acquire(ctx); 680 bdrv_unref(bs); 681 aio_context_release(ctx); 682 } 683 } 684 685 /* Iterates over the list of monitor-owned BlockDriverStates */ 686 BlockDriverState *bdrv_next_monitor_owned(BlockDriverState *bs) 687 { 688 GLOBAL_STATE_CODE(); 689 return bs ? QTAILQ_NEXT(bs, monitor_list) 690 : QTAILQ_FIRST(&monitor_bdrv_states); 691 } 692 693 static bool qemu_opt_rename(QemuOpts *opts, const char *from, const char *to, 694 Error **errp) 695 { 696 const char *value; 697 698 value = qemu_opt_get(opts, from); 699 if (value) { 700 if (qemu_opt_find(opts, to)) { 701 error_setg(errp, "'%s' and its alias '%s' can't be used at the " 702 "same time", to, from); 703 return false; 704 } 705 } 706 707 /* rename all items in opts */ 708 while ((value = qemu_opt_get(opts, from))) { 709 qemu_opt_set(opts, to, value, &error_abort); 710 qemu_opt_unset(opts, from); 711 } 712 return true; 713 } 714 715 QemuOptsList qemu_legacy_drive_opts = { 716 .name = "drive", 717 .head = QTAILQ_HEAD_INITIALIZER(qemu_legacy_drive_opts.head), 718 .desc = { 719 { 720 .name = "bus", 721 .type = QEMU_OPT_NUMBER, 722 .help = "bus number", 723 },{ 724 .name = "unit", 725 .type = QEMU_OPT_NUMBER, 726 .help = "unit number (i.e. 
lun for scsi)", 727 },{ 728 .name = "index", 729 .type = QEMU_OPT_NUMBER, 730 .help = "index number", 731 },{ 732 .name = "media", 733 .type = QEMU_OPT_STRING, 734 .help = "media type (disk, cdrom)", 735 },{ 736 .name = "if", 737 .type = QEMU_OPT_STRING, 738 .help = "interface (ide, scsi, sd, mtd, floppy, pflash, virtio)", 739 },{ 740 .name = "file", 741 .type = QEMU_OPT_STRING, 742 .help = "file name", 743 }, 744 745 /* Options that are passed on, but have special semantics with -drive */ 746 { 747 .name = BDRV_OPT_READ_ONLY, 748 .type = QEMU_OPT_BOOL, 749 .help = "open drive file as read-only", 750 },{ 751 .name = "rerror", 752 .type = QEMU_OPT_STRING, 753 .help = "read error action", 754 },{ 755 .name = "werror", 756 .type = QEMU_OPT_STRING, 757 .help = "write error action", 758 },{ 759 .name = "copy-on-read", 760 .type = QEMU_OPT_BOOL, 761 .help = "copy read data from backing file into image file", 762 }, 763 764 { /* end of list */ } 765 }, 766 }; 767 768 DriveInfo *drive_new(QemuOpts *all_opts, BlockInterfaceType block_default_type, 769 Error **errp) 770 { 771 const char *value; 772 BlockBackend *blk; 773 DriveInfo *dinfo = NULL; 774 QDict *bs_opts; 775 QemuOpts *legacy_opts; 776 DriveMediaType media = MEDIA_DISK; 777 BlockInterfaceType type; 778 int max_devs, bus_id, unit_id, index; 779 const char *werror, *rerror; 780 bool read_only = false; 781 bool copy_on_read; 782 const char *filename; 783 int i; 784 785 GLOBAL_STATE_CODE(); 786 787 /* Change legacy command line options into QMP ones */ 788 static const struct { 789 const char *from; 790 const char *to; 791 } opt_renames[] = { 792 { "iops", "throttling.iops-total" }, 793 { "iops_rd", "throttling.iops-read" }, 794 { "iops_wr", "throttling.iops-write" }, 795 796 { "bps", "throttling.bps-total" }, 797 { "bps_rd", "throttling.bps-read" }, 798 { "bps_wr", "throttling.bps-write" }, 799 800 { "iops_max", "throttling.iops-total-max" }, 801 { "iops_rd_max", "throttling.iops-read-max" }, 802 { "iops_wr_max", 
"throttling.iops-write-max" }, 803 804 { "bps_max", "throttling.bps-total-max" }, 805 { "bps_rd_max", "throttling.bps-read-max" }, 806 { "bps_wr_max", "throttling.bps-write-max" }, 807 808 { "iops_size", "throttling.iops-size" }, 809 810 { "group", "throttling.group" }, 811 812 { "readonly", BDRV_OPT_READ_ONLY }, 813 }; 814 815 for (i = 0; i < ARRAY_SIZE(opt_renames); i++) { 816 if (!qemu_opt_rename(all_opts, opt_renames[i].from, 817 opt_renames[i].to, errp)) { 818 return NULL; 819 } 820 } 821 822 value = qemu_opt_get(all_opts, "cache"); 823 if (value) { 824 int flags = 0; 825 bool writethrough; 826 827 if (bdrv_parse_cache_mode(value, &flags, &writethrough) != 0) { 828 error_setg(errp, "invalid cache option"); 829 return NULL; 830 } 831 832 /* Specific options take precedence */ 833 if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_WB)) { 834 qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_WB, 835 !writethrough, &error_abort); 836 } 837 if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_DIRECT)) { 838 qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_DIRECT, 839 !!(flags & BDRV_O_NOCACHE), &error_abort); 840 } 841 if (!qemu_opt_get(all_opts, BDRV_OPT_CACHE_NO_FLUSH)) { 842 qemu_opt_set_bool(all_opts, BDRV_OPT_CACHE_NO_FLUSH, 843 !!(flags & BDRV_O_NO_FLUSH), &error_abort); 844 } 845 qemu_opt_unset(all_opts, "cache"); 846 } 847 848 /* Get a QDict for processing the options */ 849 bs_opts = qdict_new(); 850 qemu_opts_to_qdict(all_opts, bs_opts); 851 852 legacy_opts = qemu_opts_create(&qemu_legacy_drive_opts, NULL, 0, 853 &error_abort); 854 if (!qemu_opts_absorb_qdict(legacy_opts, bs_opts, errp)) { 855 goto fail; 856 } 857 858 /* Media type */ 859 value = qemu_opt_get(legacy_opts, "media"); 860 if (value) { 861 if (!strcmp(value, "disk")) { 862 media = MEDIA_DISK; 863 } else if (!strcmp(value, "cdrom")) { 864 media = MEDIA_CDROM; 865 read_only = true; 866 } else { 867 error_setg(errp, "'%s' invalid media", value); 868 goto fail; 869 } 870 } 871 872 /* copy-on-read is disabled with a warning for 
read-only devices */ 873 read_only |= qemu_opt_get_bool(legacy_opts, BDRV_OPT_READ_ONLY, false); 874 copy_on_read = qemu_opt_get_bool(legacy_opts, "copy-on-read", false); 875 876 if (read_only && copy_on_read) { 877 warn_report("disabling copy-on-read on read-only drive"); 878 copy_on_read = false; 879 } 880 881 qdict_put_str(bs_opts, BDRV_OPT_READ_ONLY, read_only ? "on" : "off"); 882 qdict_put_str(bs_opts, "copy-on-read", copy_on_read ? "on" : "off"); 883 884 /* Controller type */ 885 value = qemu_opt_get(legacy_opts, "if"); 886 if (value) { 887 for (type = 0; 888 type < IF_COUNT && strcmp(value, if_name[type]); 889 type++) { 890 } 891 if (type == IF_COUNT) { 892 error_setg(errp, "unsupported bus type '%s'", value); 893 goto fail; 894 } 895 } else { 896 type = block_default_type; 897 } 898 899 /* Device address specified by bus/unit or index. 900 * If none was specified, try to find the first free one. */ 901 bus_id = qemu_opt_get_number(legacy_opts, "bus", 0); 902 unit_id = qemu_opt_get_number(legacy_opts, "unit", -1); 903 index = qemu_opt_get_number(legacy_opts, "index", -1); 904 905 max_devs = if_max_devs[type]; 906 907 if (index != -1) { 908 if (bus_id != 0 || unit_id != -1) { 909 error_setg(errp, "index cannot be used with bus and unit"); 910 goto fail; 911 } 912 bus_id = drive_index_to_bus_id(type, index); 913 unit_id = drive_index_to_unit_id(type, index); 914 } 915 916 if (unit_id == -1) { 917 unit_id = 0; 918 while (drive_get(type, bus_id, unit_id) != NULL) { 919 unit_id++; 920 if (max_devs && unit_id >= max_devs) { 921 unit_id -= max_devs; 922 bus_id++; 923 } 924 } 925 } 926 927 if (max_devs && unit_id >= max_devs) { 928 error_setg(errp, "unit %d too big (max is %d)", unit_id, max_devs - 1); 929 goto fail; 930 } 931 932 if (drive_get(type, bus_id, unit_id) != NULL) { 933 error_setg(errp, "drive with bus=%d, unit=%d (index=%d) exists", 934 bus_id, unit_id, index); 935 goto fail; 936 } 937 938 /* no id supplied -> create one */ 939 if 
(qemu_opts_id(all_opts) == NULL) { 940 char *new_id; 941 const char *mediastr = ""; 942 if (type == IF_IDE || type == IF_SCSI) { 943 mediastr = (media == MEDIA_CDROM) ? "-cd" : "-hd"; 944 } 945 if (max_devs) { 946 new_id = g_strdup_printf("%s%i%s%i", if_name[type], bus_id, 947 mediastr, unit_id); 948 } else { 949 new_id = g_strdup_printf("%s%s%i", if_name[type], 950 mediastr, unit_id); 951 } 952 qdict_put_str(bs_opts, "id", new_id); 953 g_free(new_id); 954 } 955 956 /* Add virtio block device */ 957 if (type == IF_VIRTIO) { 958 QemuOpts *devopts; 959 devopts = qemu_opts_create(qemu_find_opts("device"), NULL, 0, 960 &error_abort); 961 qemu_opt_set(devopts, "driver", "virtio-blk", &error_abort); 962 qemu_opt_set(devopts, "drive", qdict_get_str(bs_opts, "id"), 963 &error_abort); 964 } 965 966 filename = qemu_opt_get(legacy_opts, "file"); 967 968 /* Check werror/rerror compatibility with if=... */ 969 werror = qemu_opt_get(legacy_opts, "werror"); 970 if (werror != NULL) { 971 if (type != IF_IDE && type != IF_SCSI && type != IF_VIRTIO && 972 type != IF_NONE) { 973 error_setg(errp, "werror is not supported by this bus type"); 974 goto fail; 975 } 976 qdict_put_str(bs_opts, "werror", werror); 977 } 978 979 rerror = qemu_opt_get(legacy_opts, "rerror"); 980 if (rerror != NULL) { 981 if (type != IF_IDE && type != IF_VIRTIO && type != IF_SCSI && 982 type != IF_NONE) { 983 error_setg(errp, "rerror is not supported by this bus type"); 984 goto fail; 985 } 986 qdict_put_str(bs_opts, "rerror", rerror); 987 } 988 989 /* Actual block device init: Functionality shared with blockdev-add */ 990 blk = blockdev_init(filename, bs_opts, errp); 991 bs_opts = NULL; 992 if (!blk) { 993 goto fail; 994 } 995 996 /* Create legacy DriveInfo */ 997 dinfo = g_malloc0(sizeof(*dinfo)); 998 dinfo->opts = all_opts; 999 1000 dinfo->type = type; 1001 dinfo->bus = bus_id; 1002 dinfo->unit = unit_id; 1003 1004 blk_set_legacy_dinfo(blk, dinfo); 1005 1006 switch(type) { 1007 case IF_IDE: 1008 case IF_SCSI: 
case IF_XEN:
    case IF_NONE:
        dinfo->media_cd = media == MEDIA_CDROM;
        break;
    default:
        break;
    }

fail:
    qemu_opts_del(legacy_opts);
    qobject_unref(bs_opts);
    return dinfo;
}

/*
 * Look up @name (tried both as device name and as node name) and return the
 * matching BlockDriverState.
 *
 * Returns NULL with @errp set when the lookup fails, when
 * bdrv_is_root_node() rejects the node, or when bdrv_is_inserted() reports
 * that no medium is present.
 */
static BlockDriverState *qmp_get_root_bs(const char *name, Error **errp)
{
    BlockDriverState *bs;

    bs = bdrv_lookup_bs(name, name, errp);
    if (bs == NULL) {
        return NULL;
    }

    if (!bdrv_is_root_node(bs)) {
        error_setg(errp, "Need a root block node");
        return NULL;
    }

    if (!bdrv_is_inserted(bs)) {
        error_setg(errp, "Device has no medium");
        return NULL;
    }

    return bs;
}

/*
 * Run a single @action as a one-element transaction with default
 * (NULL) transaction properties.  Errors are reported through @errp.
 */
static void blockdev_do_action(TransactionAction *action, Error **errp)
{
    TransactionActionList list;

    /* The list node lives on the stack; it is only used during the call */
    list.value = action;
    list.next = NULL;
    qmp_transaction(&list, NULL, errp);
}

/*
 * QMP 'blockdev-snapshot-sync': package the arguments into a
 * BlockdevSnapshotSync action and execute it as a single-action transaction.
 *
 * The const qualifiers are cast away only to fit the generated QAPI struct;
 * the struct lives on the stack for the duration of the call.
 */
void qmp_blockdev_snapshot_sync(const char *device, const char *node_name,
                                const char *snapshot_file,
                                const char *snapshot_node_name,
                                const char *format,
                                bool has_mode, NewImageMode mode, Error **errp)
{
    BlockdevSnapshotSync snapshot = {
        .device = (char *) device,
        .node_name = (char *) node_name,
        .snapshot_file = (char *) snapshot_file,
        .snapshot_node_name = (char *) snapshot_node_name,
        .format = (char *) format,
        .has_mode = has_mode,
        .mode = mode,
    };
    TransactionAction action = {
        .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC,
        .u.blockdev_snapshot_sync.data = &snapshot,
    };
    blockdev_do_action(&action, errp);
}

/*
 * QMP 'blockdev-snapshot': package @node and @overlay into a
 * BlockdevSnapshot action and execute it as a single-action transaction.
 */
void qmp_blockdev_snapshot(const char *node, const char *overlay,
                           Error **errp)
{
    BlockdevSnapshot snapshot_data = {
        .node = (char *) node,
        .overlay = (char *) overlay
    };
    TransactionAction action = {
        .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT,
        .u.blockdev_snapshot.data = &snapshot_data,
    };
    blockdev_do_action(&action, errp);
}

/*
 * QMP 'blockdev-snapshot-internal-sync': package @device and @name into a
 * BlockdevSnapshotInternal action and execute it as a single-action
 * transaction.
 */
void qmp_blockdev_snapshot_internal_sync(const char *device,
                                         const char *name,
                                         Error **errp)
{
    BlockdevSnapshotInternal snapshot = {
        .device = (char *) device,
        .name = (char *) name
    };
    TransactionAction action = {
        .type = TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC,
        .u.blockdev_snapshot_internal_sync.data = &snapshot,
    };
    blockdev_do_action(&action, errp);
}

/*
 * Delete the internal snapshot identified by @id and/or @name from the root
 * node @device and return a newly allocated description of what was deleted.
 *
 * At least one of @id and @name must be non-NULL.  Returns NULL with @errp
 * set on any failure (node lookup, blocked operation, snapshot not found,
 * deletion error).
 */
SnapshotInfo *qmp_blockdev_snapshot_delete_internal_sync(const char *device,
                                                         const char *id,
                                                         const char *name,
                                                         Error **errp)
{
    BlockDriverState *bs;
    AioContext *aio_context;
    QEMUSnapshotInfo sn;
    Error *local_err = NULL;
    SnapshotInfo *info = NULL;
    int ret;

    bs = qmp_get_root_bs(device, errp);
    if (!bs) {
        return NULL;
    }
    aio_context = bdrv_get_aio_context(bs);
    aio_context_acquire(aio_context);

    if (!id && !name) {
        error_setg(errp, "Name or id must be provided");
        goto out_aio_context;
    }

    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_INTERNAL_SNAPSHOT_DELETE, errp)) {
        goto out_aio_context;
    }

    /* Fetch the snapshot's metadata into sn before it is deleted */
    ret = bdrv_snapshot_find_by_id_and_name(bs, id, name, &sn, &local_err);
    if (local_err) {
        error_propagate(errp, local_err);
        goto out_aio_context;
    }
    if (!ret) {
        error_setg(errp,
                   "Snapshot with id '%s' and name '%s' does not exist on "
                   "device '%s'",
                   STR_OR_NULL(id), STR_OR_NULL(name), device);
        goto out_aio_context;
    }

    /* Failure is detected through local_err; the return value is unused */
    bdrv_snapshot_delete(bs, id, name, &local_err);
    if (local_err) {
        error_propagate(errp, local_err);
        goto out_aio_context;
    }

    aio_context_release(aio_context);

    /* Build the reply from the metadata captured above; caller owns it */
    info = g_new0(SnapshotInfo, 1);
    info->id = g_strdup(sn.id_str);
    info->name = g_strdup(sn.name);
    info->date_nsec = sn.date_nsec;
    info->date_sec = sn.date_sec;
    info->vm_state_size = sn.vm_state_size;
    /* Split the nanosecond VM clock into a seconds part and a remainder */
    info->vm_clock_nsec = sn.vm_clock_nsec % 1000000000;
    info->vm_clock_sec = sn.vm_clock_nsec / 1000000000;
    /* -1ULL is the "no icount recorded" marker (see internal_snapshot_prepare) */
    if (sn.icount != -1ULL) {
        info->icount = sn.icount;
        info->has_icount = true;
    }

    return info;

out_aio_context:
    aio_context_release(aio_context);
    return NULL;
}

/* New and old BlockDriverState structs for atomic group operations */

typedef struct BlkActionState BlkActionState;

/**
 * BlkActionOps:
 * Table of operations that define an Action.
 *
 * @instance_size: Size of state struct, in bytes.
 * @prepare: Prepare the work, must NOT be NULL.
 * @commit: Commit the changes, can be NULL.
 * @abort: Abort the changes on fail, can be NULL.
 * @clean: Clean up resources after all transaction actions have called
 *         commit() or abort(). Can be NULL.
 *
 * Only prepare() may fail. In a single transaction, only one of commit() or
 * abort() will be called. clean() will always be called if it is present.
 *
 * Always run under BQL.
 */
typedef struct BlkActionOps {
    size_t instance_size;
    void (*prepare)(BlkActionState *common, Error **errp);
    void (*commit)(BlkActionState *common);
    void (*abort)(BlkActionState *common);
    void (*clean)(BlkActionState *common);
} BlkActionOps;

/**
 * BlkActionState:
 * Describes one Action's state within a Transaction.
 *
 * @action: QAPI-defined TransactionAction describing which Action to perform.
 * @ops: Table of ActionOps this Action can perform.
 * @block_job_txn: Transaction which this action belongs to.
 * @txn_props: Properties of the Transaction this action belongs to.
 * @entry: List membership for all Actions in this Transaction.
 *
 * This structure must be arranged as first member in a subclassed type,
 * assuming that the compiler will also arrange it to the same offsets as the
 * base class.
*/
struct BlkActionState {
    TransactionAction *action;
    const BlkActionOps *ops;
    JobTxn *block_job_txn;
    TransactionProperties *txn_props; /* read by action_check_completion_mode() */
    QTAILQ_ENTRY(BlkActionState) entry;
};

/* internal snapshot private data */
typedef struct InternalSnapshotState {
    BlkActionState common;
    BlockDriverState *bs;   /* node being snapshotted; set once drained */
    QEMUSnapshotInfo sn;    /* metadata of the snapshot taken by .prepare() */
    bool created;           /* true once bdrv_snapshot_create() succeeded */
} InternalSnapshotState;


/*
 * Reject the action unless the transaction uses completion-mode
 * 'individual'.
 *
 * Returns 0 if the mode is acceptable, -1 with @errp set otherwise.
 */
static int action_check_completion_mode(BlkActionState *s, Error **errp)
{
    if (s->txn_props->completion_mode != ACTION_COMPLETION_MODE_INDIVIDUAL) {
        error_setg(errp,
                   "Action '%s' does not support Transaction property "
                   "completion-mode = %s",
                   TransactionActionKind_str(s->action->type),
                   ActionCompletionMode_str(s->txn_props->completion_mode));
        return -1;
    }
    return 0;
}

/*
 * .prepare() for 'blockdev-snapshot-internal-sync': validate the request and
 * create the internal snapshot.
 *
 * On success state->created is set so that .abort() knows there is a
 * snapshot to delete.  Once state->bs is set the node is inside a drained
 * section that is only left in .clean(), on success and failure alike.
 */
static void internal_snapshot_prepare(BlkActionState *common,
                                      Error **errp)
{
    Error *local_err = NULL;
    const char *device;
    const char *name;
    BlockDriverState *bs;
    QEMUSnapshotInfo old_sn, *sn;
    bool ret;
    int64_t rt;
    BlockdevSnapshotInternal *internal;
    InternalSnapshotState *state;
    AioContext *aio_context;
    int ret1;

    g_assert(common->action->type ==
             TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC);
    internal = common->action->u.blockdev_snapshot_internal_sync.data;
    state = DO_UPCAST(InternalSnapshotState, common, common);

    /* 1. parse input */
    device = internal->device;
    name = internal->name;

    /* 2. validate the request */
    if (action_check_completion_mode(common, errp) < 0) {
        return;
    }

    bs = qmp_get_root_bs(device, errp);
    if (!bs) {
        return;
    }

    aio_context = bdrv_get_aio_context(bs);
    aio_context_acquire(aio_context);

    /* Recorded before draining so that .clean() ends the drained section */
    state->bs = bs;

    /* Paired with .clean() */
    bdrv_drained_begin(bs);

    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_INTERNAL_SNAPSHOT, errp)) {
        goto out;
    }

    if (bdrv_is_read_only(bs)) {
        error_setg(errp, "Device '%s' is read only", device);
        goto out;
    }

    if (!bdrv_can_snapshot(bs)) {
        error_setg(errp, "Block format '%s' used by device '%s' "
                   "does not support internal snapshots",
                   bs->drv->format_name, device);
        goto out;
    }

    if (!strlen(name)) {
        error_setg(errp, "Name is empty");
        goto out;
    }

    /* check whether a snapshot with this name already exists */
    ret = bdrv_snapshot_find_by_id_and_name(bs, NULL, name, &old_sn,
                                            &local_err);
    if (local_err) {
        error_propagate(errp, local_err);
        goto out;
    } else if (ret) {
        error_setg(errp,
                   "Snapshot with name '%s' already exists on device '%s'",
                   name, device);
        goto out;
    }

    /* 3. take the snapshot */
    sn = &state->sn;
    pstrcpy(sn->name, sizeof(sn->name), name);
    /* g_get_real_time() is in microseconds: split into sec + nsec */
    rt = g_get_real_time();
    sn->date_sec = rt / G_USEC_PER_SEC;
    sn->date_nsec = (rt % G_USEC_PER_SEC) * 1000;
    sn->vm_clock_nsec = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
    if (replay_mode != REPLAY_MODE_NONE) {
        sn->icount = replay_get_current_icount();
    } else {
        /* -1ULL marks "no icount available" */
        sn->icount = -1ULL;
    }

    ret1 = bdrv_snapshot_create(bs, sn);
    if (ret1 < 0) {
        error_setg_errno(errp, -ret1,
                         "Failed to create snapshot '%s' on device '%s'",
                         name, device);
        goto out;
    }

    /* 4. success: remember that a snapshot was created */
    state->created = true;

out:
    aio_context_release(aio_context);
}

/*
 * .abort() for internal snapshots: delete the snapshot again if .prepare()
 * got as far as creating it.  A failed deletion is only reported, since
 * abort callbacks cannot fail.
 */
static void internal_snapshot_abort(BlkActionState *common)
{
    InternalSnapshotState *state =
                             DO_UPCAST(InternalSnapshotState, common, common);
    BlockDriverState *bs = state->bs;
    QEMUSnapshotInfo *sn = &state->sn;
    AioContext *aio_context;
    Error *local_error = NULL;

    if (!state->created) {
        return;
    }

    aio_context = bdrv_get_aio_context(state->bs);
    aio_context_acquire(aio_context);

    if (bdrv_snapshot_delete(bs, sn->id_str, sn->name, &local_error) < 0) {
        error_reportf_err(local_error,
                          "Failed to delete snapshot with id '%s' and "
                          "name '%s' on device '%s' in abort: ",
                          sn->id_str, sn->name,
                          bdrv_get_device_name(bs));
    }

    aio_context_release(aio_context);
}

/*
 * .clean() for internal snapshots: end the drained section begun in
 * .prepare().  state->bs is NULL when .prepare() failed before draining.
 */
static void internal_snapshot_clean(BlkActionState *common)
{
    InternalSnapshotState *state = DO_UPCAST(InternalSnapshotState,
                                             common, common);
    AioContext *aio_context;

    if (!state->bs) {
        return;
    }

    aio_context = bdrv_get_aio_context(state->bs);
    aio_context_acquire(aio_context);

    bdrv_drained_end(state->bs);

    aio_context_release(aio_context);
}

/* external snapshot private data */
typedef struct ExternalSnapshotState {
    BlkActionState common;
    BlockDriverState *old_bs;   /* node the snapshot is taken of */
    BlockDriverState *new_bs;   /* overlay opened by .prepare() */
    bool overlay_appended;      /* true once bdrv_append() succeeded */
} ExternalSnapshotState;

/*
 * .prepare() shared by 'blockdev-snapshot' and 'blockdev-snapshot-sync':
 * open (and for the -sync variant, unless mode is 'existing', create) the
 * overlay and append it on top of the snapshotted node.
 *
 * Once state->old_bs is set the node is inside a drained section that is
 * only left in .clean().  state->overlay_appended tells .abort() whether
 * there is a graph change to revert.
 */
static void external_snapshot_prepare(BlkActionState *common,
                                      Error **errp)
{
    int ret;
    int flags = 0;
    QDict *options = NULL;
    Error *local_err = NULL;
    /* Device and node name of the image to generate the snapshot from */
    const char *device;
    const char *node_name;
    /* Reference to the new image (for 'blockdev-snapshot') */
    const char *snapshot_ref;
    /* File name of the new image (for 'blockdev-snapshot-sync') */
    const char *new_image_file;
    ExternalSnapshotState *state =
                             DO_UPCAST(ExternalSnapshotState, common, common);
    TransactionAction *action = common->action;
    AioContext *aio_context;
    uint64_t perm, shared;

    /* 'blockdev-snapshot' and 'blockdev-snapshot-sync' have similar
     * purpose but a different set of parameters */
    switch (action->type) {
    case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT:
        {
            BlockdevSnapshot *s = action->u.blockdev_snapshot.data;
            device = s->node;
            node_name = s->node;
            new_image_file = NULL;
            snapshot_ref = s->overlay;
        }
        break;
    case TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC:
        {
            BlockdevSnapshotSync *s = action->u.blockdev_snapshot_sync.data;
            device = s->device;
            node_name = s->node_name;
            new_image_file = s->snapshot_file;
            snapshot_ref = NULL;
        }
        break;
    default:
        g_assert_not_reached();
    }

    /* start processing */
    if (action_check_completion_mode(common, errp) < 0) {
        return;
    }

    state->old_bs = bdrv_lookup_bs(device, node_name, errp);
    if (!state->old_bs) {
        return;
    }

    aio_context = bdrv_get_aio_context(state->old_bs);
    aio_context_acquire(aio_context);

    /* Paired with .clean() */
    bdrv_drained_begin(state->old_bs);

    if (!bdrv_is_inserted(state->old_bs)) {
        error_setg(errp, QERR_DEVICE_HAS_NO_MEDIUM, device);
        goto out;
    }

    if (bdrv_op_is_blocked(state->old_bs,
                           BLOCK_OP_TYPE_EXTERNAL_SNAPSHOT, errp)) {
        goto out;
    }

    /* Flush a writable source before it gets an overlay */
    if (!bdrv_is_read_only(state->old_bs)) {
        if (bdrv_flush(state->old_bs)) {
            error_setg(errp, QERR_IO_ERROR);
            goto out;
        }
    }

    if (action->type == TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC) {
        BlockdevSnapshotSync *s = action->u.blockdev_snapshot_sync.data;
        const char *format = s->format ?: "qcow2";
        enum NewImageMode mode;
        const char *snapshot_node_name = s->snapshot_node_name;

        if (node_name && !snapshot_node_name) {
            error_setg(errp, "New overlay node-name missing");
            goto out;
        }

        if (snapshot_node_name &&
            bdrv_lookup_bs(snapshot_node_name, snapshot_node_name, NULL)) {
            error_setg(errp, "New overlay node-name already in use");
            goto out;
        }

        /* Inherit the source's open flags, minus the ones cleared below */
        flags = state->old_bs->open_flags;
        flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_COPY_ON_READ);
        flags |= BDRV_O_NO_BACKING;

        /* create new image w/backing file */
        mode = s->has_mode ? s->mode : NEW_IMAGE_MODE_ABSOLUTE_PATHS;
        if (mode != NEW_IMAGE_MODE_EXISTING) {
            int64_t size = bdrv_getlength(state->old_bs);
            if (size < 0) {
                error_setg_errno(errp, -size, "bdrv_getlength failed");
                goto out;
            }
            bdrv_refresh_filename(state->old_bs);
            bdrv_img_create(new_image_file, format,
                            state->old_bs->filename,
                            state->old_bs->drv->format_name,
                            NULL, size, flags, false, &local_err);
            if (local_err) {
                error_propagate(errp, local_err);
                goto out;
            }
        }

        options = qdict_new();
        if (snapshot_node_name) {
            qdict_put_str(options, "node-name", snapshot_node_name);
        }
        qdict_put_str(options, "driver", format);
    }

    state->new_bs = bdrv_open(new_image_file, snapshot_ref, options, flags,
                              errp);
    /* We will manually add the backing_hd field to the bs later */
    if (!state->new_bs) {
        goto out;
    }

    /*
     * Allow attaching a backing file to an overlay that's already in use only
     * if the parents don't assume that they are already seeing a valid image.
     * (Specifically, allow it as a mirror target, which is write-only access.)
     */
    bdrv_get_cumulative_perm(state->new_bs, &perm, &shared);
    if (perm & BLK_PERM_CONSISTENT_READ) {
        error_setg(errp, "The overlay is already in use");
        goto out;
    }

    if (state->new_bs->drv->is_filter) {
        error_setg(errp, "Filters cannot be used as overlays");
        goto out;
    }

    if (bdrv_cow_child(state->new_bs)) {
        error_setg(errp, "The overlay already has a backing image");
        goto out;
    }

    if (!state->new_bs->drv->supports_backing) {
        error_setg(errp, "The overlay does not support backing images");
        goto out;
    }

    ret = bdrv_append(state->new_bs, state->old_bs, errp);
    if (ret < 0) {
        goto out;
    }
    state->overlay_appended = true;

out:
    aio_context_release(aio_context);
}

/*
 * .commit() for external snapshots: try to reopen the snapshotted node
 * read-only unless copy-on-read is active on it.  A reopen failure is
 * deliberately ignored (NULL errp).
 */
static void external_snapshot_commit(BlkActionState *common)
{
    ExternalSnapshotState *state =
                             DO_UPCAST(ExternalSnapshotState, common, common);
    AioContext *aio_context;

    aio_context = bdrv_get_aio_context(state->old_bs);
    aio_context_acquire(aio_context);

    /* We don't need (or want) to use the transactional
     * bdrv_reopen_multiple() across all the entries at once, because we
     * don't want to abort all of them if one of them fails the reopen */
    if (!qatomic_read(&state->old_bs->copy_on_read)) {
        bdrv_reopen_set_read_only(state->old_bs, true, NULL);
    }

    aio_context_release(aio_context);
}

/*
 * .abort() for external snapshots: if the overlay was appended, detach it
 * and put old_bs back in its place.  Nothing to do when .prepare() failed
 * before bdrv_append() succeeded.
 */
static void external_snapshot_abort(BlkActionState *common)
{
    ExternalSnapshotState *state =
                             DO_UPCAST(ExternalSnapshotState, common, common);
    if (state->new_bs) {
        if (state->overlay_appended) {
            AioContext *aio_context;
            AioContext *tmp_context;
            int ret;

            aio_context = bdrv_get_aio_context(state->old_bs);
            aio_context_acquire(aio_context);

            bdrv_ref(state->old_bs);   /* we can't let bdrv_set_backing_hd()
                                          close state->old_bs; we need it */
            bdrv_set_backing_hd(state->new_bs, NULL, &error_abort);

            /*
             * The call to bdrv_set_backing_hd() above returns state->old_bs to
             * the main AioContext. As we're still going to be using it, return
             * it to the AioContext it was before.
             */
            tmp_context = bdrv_get_aio_context(state->old_bs);
            if (aio_context != tmp_context) {
                /* Swap locks: hold old_bs's current context while moving it */
                aio_context_release(aio_context);
                aio_context_acquire(tmp_context);

                ret = bdrv_try_change_aio_context(state->old_bs,
                                                  aio_context, NULL, NULL);
                assert(ret == 0);

                aio_context_release(tmp_context);
                aio_context_acquire(aio_context);
            }

            bdrv_replace_node(state->new_bs, state->old_bs, &error_abort);
            bdrv_unref(state->old_bs); /* bdrv_replace_node() ref'ed old_bs */

            aio_context_release(aio_context);
        }
    }
}

/*
 * .clean() for external snapshots: end the drained section begun in
 * .prepare() and drop the reference on the overlay taken by bdrv_open().
 * state->old_bs is NULL when .prepare() failed before draining.
 */
static void external_snapshot_clean(BlkActionState *common)
{
    ExternalSnapshotState *state =
                             DO_UPCAST(ExternalSnapshotState, common, common);
    AioContext *aio_context;

    if (!state->old_bs) {
        return;
    }

    aio_context = bdrv_get_aio_context(state->old_bs);
    aio_context_acquire(aio_context);

    bdrv_drained_end(state->old_bs);
    /* new_bs is still NULL here if .prepare() failed before opening it */
    bdrv_unref(state->new_bs);

    aio_context_release(aio_context);
}

/* drive-backup private data */
typedef struct DriveBackupState {
    BlkActionState common;
    BlockDriverState *bs;   /* backup source; set once drained */
    BlockJob *job;          /* job created by .prepare(), NULL on failure */
} DriveBackupState;

static BlockJob *do_backup_common(BackupCommon *backup,
                                  BlockDriverState *bs,
                                  BlockDriverState *target_bs,
                                  AioContext *aio_context,
                                  JobTxn *txn, Error **errp);

/*
 * .prepare() for 'drive-backup': create (unless mode is 'existing') and open
 * the target image, move it into the source's AioContext and create the
 * backup job.  The job is only started in .commit().
 *
 * Once state->bs is set the source is inside a drained section that is only
 * left in .clean().
 */
static void drive_backup_prepare(BlkActionState *common, Error **errp)
{
    DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common);
    DriveBackup *backup;
    BlockDriverState *bs;
    BlockDriverState *target_bs;
    BlockDriverState *source = NULL;
    AioContext *aio_context;
    AioContext *old_context;
    const char *format;
    QDict *options;
    Error *local_err = NULL;
    int flags;
    int64_t size;
    bool set_backing_hd = false;
    int ret;

    assert(common->action->type == TRANSACTION_ACTION_KIND_DRIVE_BACKUP);
    backup = common->action->u.drive_backup.data;

    if (!backup->has_mode) {
        backup->mode = NEW_IMAGE_MODE_ABSOLUTE_PATHS;
    }

    bs = bdrv_lookup_bs(backup->device, backup->device, errp);
    if (!bs) {
        return;
    }

    if (!bs->drv) {
        error_setg(errp, "Device has no medium");
        return;
    }

    aio_context = bdrv_get_aio_context(bs);
    aio_context_acquire(aio_context);

    state->bs = bs;
    /* Paired with .clean() */
    bdrv_drained_begin(bs);

    /* A new image defaults to the source's format; an existing one is probed */
    format = backup->format;
    if (!format && backup->mode != NEW_IMAGE_MODE_EXISTING) {
        format = bs->drv->format_name;
    }

    /* Early check to avoid creating target */
    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_BACKUP_SOURCE, errp)) {
        goto out;
    }

    flags = bs->open_flags | BDRV_O_RDWR;

    /*
     * See if we have a backing HD we can use to create our new image
     * on top of.
     */
    if (backup->sync == MIRROR_SYNC_MODE_TOP) {
        /*
         * Backup will not replace the source by the target, so none
         * of the filters skipped here will be removed (in contrast to
         * mirror).  Therefore, we can skip all of them when looking
         * for the first COW relationship.
         */
        source = bdrv_cow_bs(bdrv_skip_filters(bs));
        if (!source) {
            /* No backing image: 'top' degenerates to a full backup */
            backup->sync = MIRROR_SYNC_MODE_FULL;
        }
    }
    if (backup->sync == MIRROR_SYNC_MODE_NONE) {
        /* The target gets the source itself as backing file further down */
        source = bs;
        flags |= BDRV_O_NO_BACKING;
        set_backing_hd = true;
    }

    size = bdrv_getlength(bs);
    if (size < 0) {
        error_setg_errno(errp, -size, "bdrv_getlength failed");
        goto out;
    }

    if (backup->mode != NEW_IMAGE_MODE_EXISTING) {
        assert(format);
        if (source) {
            /* Implicit filters should not appear in the filename */
            BlockDriverState *explicit_backing =
                bdrv_skip_implicit_filters(source);

            bdrv_refresh_filename(explicit_backing);
            bdrv_img_create(backup->target, format,
                            explicit_backing->filename,
                            explicit_backing->drv->format_name, NULL,
                            size, flags, false, &local_err);
        } else {
            bdrv_img_create(backup->target, format, NULL, NULL, NULL,
                            size, flags, false, &local_err);
        }
    }

    /* local_err can only have been set by bdrv_img_create() above */
    if (local_err) {
        error_propagate(errp, local_err);
        goto out;
    }

    options = qdict_new();
    qdict_put_str(options, "discard", "unmap");
    qdict_put_str(options, "detect-zeroes", "unmap");
    if (format) {
        qdict_put_str(options, "driver", format);
    }

    target_bs = bdrv_open(backup->target, NULL, options, flags, errp);
    if (!target_bs) {
        goto out;
    }

    /* Honor bdrv_try_change_aio_context() context acquisition requirements. */
    old_context = bdrv_get_aio_context(target_bs);
    aio_context_release(aio_context);
    aio_context_acquire(old_context);

    ret = bdrv_try_change_aio_context(target_bs, aio_context, NULL, errp);
    if (ret < 0) {
        /* aio_context is not held here, so return instead of goto out */
        bdrv_unref(target_bs);
        aio_context_release(old_context);
        return;
    }

    aio_context_release(old_context);
    aio_context_acquire(aio_context);

    if (set_backing_hd) {
        if (bdrv_set_backing_hd(target_bs, source, errp) < 0) {
            goto unref;
        }
    }

    state->job = do_backup_common(qapi_DriveBackup_base(backup),
                                  bs, target_bs, aio_context,
                                  common->block_job_txn, errp);

unref:
    /* Drop the reference from bdrv_open() on success and failure alike */
    bdrv_unref(target_bs);
out:
    aio_context_release(aio_context);
}

/* .commit() for 'drive-backup': start the job created by .prepare(). */
static void drive_backup_commit(BlkActionState *common)
{
    DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common);
    AioContext *aio_context;

    aio_context = bdrv_get_aio_context(state->bs);
    aio_context_acquire(aio_context);

    assert(state->job);
    job_start(&state->job->job);

    aio_context_release(aio_context);
}

/* .abort() for 'drive-backup': cancel the job if .prepare() created one. */
static void drive_backup_abort(BlkActionState *common)
{
    DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common);

    if (state->job) {
        job_cancel_sync(&state->job->job, true);
    }
}

/*
 * .clean() for 'drive-backup': end the drained section begun in .prepare().
 * state->bs is NULL when .prepare() failed before draining.
 */
static void drive_backup_clean(BlkActionState *common)
{
    DriveBackupState *state = DO_UPCAST(DriveBackupState, common, common);
    AioContext *aio_context;

    if (!state->bs) {
        return;
    }

    aio_context = bdrv_get_aio_context(state->bs);
    aio_context_acquire(aio_context);

    bdrv_drained_end(state->bs);

    aio_context_release(aio_context);
}

/* blockdev-backup private data */
typedef struct BlockdevBackupState {
    BlkActionState common;
    BlockDriverState *bs;   /* backup source; set once drained */
    BlockJob *job;          /* job created by .prepare(), NULL on failure */
} BlockdevBackupState;

static void
blockdev_backup_prepare(BlkActionState *common, Error **errp) 1857 { 1858 BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common); 1859 BlockdevBackup *backup; 1860 BlockDriverState *bs; 1861 BlockDriverState *target_bs; 1862 AioContext *aio_context; 1863 AioContext *old_context; 1864 int ret; 1865 1866 assert(common->action->type == TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP); 1867 backup = common->action->u.blockdev_backup.data; 1868 1869 bs = bdrv_lookup_bs(backup->device, backup->device, errp); 1870 if (!bs) { 1871 return; 1872 } 1873 1874 target_bs = bdrv_lookup_bs(backup->target, backup->target, errp); 1875 if (!target_bs) { 1876 return; 1877 } 1878 1879 /* Honor bdrv_try_change_aio_context() context acquisition requirements. */ 1880 aio_context = bdrv_get_aio_context(bs); 1881 old_context = bdrv_get_aio_context(target_bs); 1882 aio_context_acquire(old_context); 1883 1884 ret = bdrv_try_change_aio_context(target_bs, aio_context, NULL, errp); 1885 if (ret < 0) { 1886 aio_context_release(old_context); 1887 return; 1888 } 1889 1890 aio_context_release(old_context); 1891 aio_context_acquire(aio_context); 1892 state->bs = bs; 1893 1894 /* Paired with .clean() */ 1895 bdrv_drained_begin(state->bs); 1896 1897 state->job = do_backup_common(qapi_BlockdevBackup_base(backup), 1898 bs, target_bs, aio_context, 1899 common->block_job_txn, errp); 1900 1901 aio_context_release(aio_context); 1902 } 1903 1904 static void blockdev_backup_commit(BlkActionState *common) 1905 { 1906 BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common); 1907 AioContext *aio_context; 1908 1909 aio_context = bdrv_get_aio_context(state->bs); 1910 aio_context_acquire(aio_context); 1911 1912 assert(state->job); 1913 job_start(&state->job->job); 1914 1915 aio_context_release(aio_context); 1916 } 1917 1918 static void blockdev_backup_abort(BlkActionState *common) 1919 { 1920 BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common); 1921 1922 if 
(state->job) { 1923 job_cancel_sync(&state->job->job, true); 1924 } 1925 } 1926 1927 static void blockdev_backup_clean(BlkActionState *common) 1928 { 1929 BlockdevBackupState *state = DO_UPCAST(BlockdevBackupState, common, common); 1930 AioContext *aio_context; 1931 1932 if (!state->bs) { 1933 return; 1934 } 1935 1936 aio_context = bdrv_get_aio_context(state->bs); 1937 aio_context_acquire(aio_context); 1938 1939 bdrv_drained_end(state->bs); 1940 1941 aio_context_release(aio_context); 1942 } 1943 1944 typedef struct BlockDirtyBitmapState { 1945 BlkActionState common; 1946 BdrvDirtyBitmap *bitmap; 1947 BlockDriverState *bs; 1948 HBitmap *backup; 1949 bool prepared; 1950 bool was_enabled; 1951 } BlockDirtyBitmapState; 1952 1953 static void block_dirty_bitmap_add_prepare(BlkActionState *common, 1954 Error **errp) 1955 { 1956 Error *local_err = NULL; 1957 BlockDirtyBitmapAdd *action; 1958 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 1959 common, common); 1960 1961 if (action_check_completion_mode(common, errp) < 0) { 1962 return; 1963 } 1964 1965 action = common->action->u.block_dirty_bitmap_add.data; 1966 /* AIO context taken and released within qmp_block_dirty_bitmap_add */ 1967 qmp_block_dirty_bitmap_add(action->node, action->name, 1968 action->has_granularity, action->granularity, 1969 action->has_persistent, action->persistent, 1970 action->has_disabled, action->disabled, 1971 &local_err); 1972 1973 if (!local_err) { 1974 state->prepared = true; 1975 } else { 1976 error_propagate(errp, local_err); 1977 } 1978 } 1979 1980 static void block_dirty_bitmap_add_abort(BlkActionState *common) 1981 { 1982 BlockDirtyBitmapAdd *action; 1983 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 1984 common, common); 1985 1986 action = common->action->u.block_dirty_bitmap_add.data; 1987 /* Should not be able to fail: IF the bitmap was added via .prepare(), 1988 * then the node reference and bitmap name must have been valid. 
1989 */ 1990 if (state->prepared) { 1991 qmp_block_dirty_bitmap_remove(action->node, action->name, &error_abort); 1992 } 1993 } 1994 1995 static void block_dirty_bitmap_clear_prepare(BlkActionState *common, 1996 Error **errp) 1997 { 1998 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 1999 common, common); 2000 BlockDirtyBitmap *action; 2001 2002 if (action_check_completion_mode(common, errp) < 0) { 2003 return; 2004 } 2005 2006 action = common->action->u.block_dirty_bitmap_clear.data; 2007 state->bitmap = block_dirty_bitmap_lookup(action->node, 2008 action->name, 2009 &state->bs, 2010 errp); 2011 if (!state->bitmap) { 2012 return; 2013 } 2014 2015 if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_DEFAULT, errp)) { 2016 return; 2017 } 2018 2019 bdrv_clear_dirty_bitmap(state->bitmap, &state->backup); 2020 } 2021 2022 static void block_dirty_bitmap_restore(BlkActionState *common) 2023 { 2024 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2025 common, common); 2026 2027 if (state->backup) { 2028 bdrv_restore_dirty_bitmap(state->bitmap, state->backup); 2029 } 2030 } 2031 2032 static void block_dirty_bitmap_free_backup(BlkActionState *common) 2033 { 2034 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2035 common, common); 2036 2037 hbitmap_free(state->backup); 2038 } 2039 2040 static void block_dirty_bitmap_enable_prepare(BlkActionState *common, 2041 Error **errp) 2042 { 2043 BlockDirtyBitmap *action; 2044 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2045 common, common); 2046 2047 if (action_check_completion_mode(common, errp) < 0) { 2048 return; 2049 } 2050 2051 action = common->action->u.block_dirty_bitmap_enable.data; 2052 state->bitmap = block_dirty_bitmap_lookup(action->node, 2053 action->name, 2054 NULL, 2055 errp); 2056 if (!state->bitmap) { 2057 return; 2058 } 2059 2060 if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_ALLOW_RO, errp)) { 2061 return; 2062 } 2063 2064 
state->was_enabled = bdrv_dirty_bitmap_enabled(state->bitmap); 2065 bdrv_enable_dirty_bitmap(state->bitmap); 2066 } 2067 2068 static void block_dirty_bitmap_enable_abort(BlkActionState *common) 2069 { 2070 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2071 common, common); 2072 2073 if (!state->was_enabled) { 2074 bdrv_disable_dirty_bitmap(state->bitmap); 2075 } 2076 } 2077 2078 static void block_dirty_bitmap_disable_prepare(BlkActionState *common, 2079 Error **errp) 2080 { 2081 BlockDirtyBitmap *action; 2082 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2083 common, common); 2084 2085 if (action_check_completion_mode(common, errp) < 0) { 2086 return; 2087 } 2088 2089 action = common->action->u.block_dirty_bitmap_disable.data; 2090 state->bitmap = block_dirty_bitmap_lookup(action->node, 2091 action->name, 2092 NULL, 2093 errp); 2094 if (!state->bitmap) { 2095 return; 2096 } 2097 2098 if (bdrv_dirty_bitmap_check(state->bitmap, BDRV_BITMAP_ALLOW_RO, errp)) { 2099 return; 2100 } 2101 2102 state->was_enabled = bdrv_dirty_bitmap_enabled(state->bitmap); 2103 bdrv_disable_dirty_bitmap(state->bitmap); 2104 } 2105 2106 static void block_dirty_bitmap_disable_abort(BlkActionState *common) 2107 { 2108 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2109 common, common); 2110 2111 if (state->was_enabled) { 2112 bdrv_enable_dirty_bitmap(state->bitmap); 2113 } 2114 } 2115 2116 static void block_dirty_bitmap_merge_prepare(BlkActionState *common, 2117 Error **errp) 2118 { 2119 BlockDirtyBitmapMerge *action; 2120 BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState, 2121 common, common); 2122 2123 if (action_check_completion_mode(common, errp) < 0) { 2124 return; 2125 } 2126 2127 action = common->action->u.block_dirty_bitmap_merge.data; 2128 2129 state->bitmap = block_dirty_bitmap_merge(action->node, action->target, 2130 action->bitmaps, &state->backup, 2131 errp); 2132 } 2133 2134 static void 
block_dirty_bitmap_remove_prepare(BlkActionState *common,
                                  Error **errp)
{
    /*
     * .prepare() for 'block-dirty-bitmap-remove': look the bitmap up without
     * releasing it yet, and mark it busy and skip-store until the
     * transaction is decided.  The actual release happens in .commit().
     */
    BlockDirtyBitmap *action;
    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
                                             common, common);

    if (action_check_completion_mode(common, errp) < 0) {
        return;
    }

    action = common->action->u.block_dirty_bitmap_remove.data;

    state->bitmap = block_dirty_bitmap_remove(action->node, action->name,
                                              false, &state->bs, errp);
    if (state->bitmap) {
        bdrv_dirty_bitmap_skip_store(state->bitmap, true);
        bdrv_dirty_bitmap_set_busy(state->bitmap, true);
    }
}

/*
 * .abort() for 'block-dirty-bitmap-remove': undo the skip-store and busy
 * marks set by .prepare().  state->bitmap is NULL when .prepare() failed.
 */
static void block_dirty_bitmap_remove_abort(BlkActionState *common)
{
    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
                                             common, common);

    if (state->bitmap) {
        bdrv_dirty_bitmap_skip_store(state->bitmap, false);
        bdrv_dirty_bitmap_set_busy(state->bitmap, false);
    }
}

/*
 * .commit() for 'block-dirty-bitmap-remove': clear the busy mark and
 * release the bitmap.
 */
static void block_dirty_bitmap_remove_commit(BlkActionState *common)
{
    BlockDirtyBitmapState *state = DO_UPCAST(BlockDirtyBitmapState,
                                             common, common);

    bdrv_dirty_bitmap_set_busy(state->bitmap, false);
    bdrv_release_dirty_bitmap(state->bitmap);
}

/* .prepare() for the 'abort' action: always fails, forcing a rollback. */
static void abort_prepare(BlkActionState *common, Error **errp)
{
    error_setg(errp, "Transaction aborted using Abort action");
}

static void abort_commit(BlkActionState *common)
{
    g_assert_not_reached(); /* this action never succeeds */
}

/*
 * Dispatch table indexed by TransactionActionKind.  Callbacks that are left
 * out are NULL; per the BlkActionOps contract only .prepare is mandatory.
 */
static const BlkActionOps actions[] = {
    [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT] = {
        .instance_size = sizeof(ExternalSnapshotState),
        .prepare  = external_snapshot_prepare,
        .commit   = external_snapshot_commit,
        .abort = external_snapshot_abort,
        .clean = external_snapshot_clean,
    },
    [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_SYNC] = {
        .instance_size = sizeof(ExternalSnapshotState),
        .prepare  = external_snapshot_prepare,
        .commit   = external_snapshot_commit,
        .abort = external_snapshot_abort,
        .clean = external_snapshot_clean,
    },
    [TRANSACTION_ACTION_KIND_DRIVE_BACKUP] = {
        .instance_size = sizeof(DriveBackupState),
        .prepare = drive_backup_prepare,
        .commit = drive_backup_commit,
        .abort = drive_backup_abort,
        .clean = drive_backup_clean,
    },
    [TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP] = {
        .instance_size = sizeof(BlockdevBackupState),
        .prepare = blockdev_backup_prepare,
        .commit = blockdev_backup_commit,
        .abort = blockdev_backup_abort,
        .clean = blockdev_backup_clean,
    },
    [TRANSACTION_ACTION_KIND_ABORT] = {
        .instance_size = sizeof(BlkActionState),
        .prepare = abort_prepare,
        .commit = abort_commit,
    },
    [TRANSACTION_ACTION_KIND_BLOCKDEV_SNAPSHOT_INTERNAL_SYNC] = {
        .instance_size = sizeof(InternalSnapshotState),
        .prepare  = internal_snapshot_prepare,
        .abort = internal_snapshot_abort,
        .clean = internal_snapshot_clean,
    },
    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_ADD] = {
        .instance_size = sizeof(BlockDirtyBitmapState),
        .prepare = block_dirty_bitmap_add_prepare,
        .abort = block_dirty_bitmap_add_abort,
    },
    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_CLEAR] = {
        .instance_size = sizeof(BlockDirtyBitmapState),
        .prepare = block_dirty_bitmap_clear_prepare,
        .commit = block_dirty_bitmap_free_backup,
        .abort = block_dirty_bitmap_restore,
    },
    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_ENABLE] = {
        .instance_size = sizeof(BlockDirtyBitmapState),
        .prepare = block_dirty_bitmap_enable_prepare,
        .abort = block_dirty_bitmap_enable_abort,
    },
    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_DISABLE] = {
        .instance_size = sizeof(BlockDirtyBitmapState),
        .prepare = block_dirty_bitmap_disable_prepare,
        .abort = block_dirty_bitmap_disable_abort,
    },
    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_MERGE] = {
        .instance_size = sizeof(BlockDirtyBitmapState),
        .prepare = block_dirty_bitmap_merge_prepare,
        .commit = block_dirty_bitmap_free_backup,
        .abort = block_dirty_bitmap_restore,
    },
    [TRANSACTION_ACTION_KIND_BLOCK_DIRTY_BITMAP_REMOVE] = {
        .instance_size = sizeof(BlockDirtyBitmapState),
        .prepare = block_dirty_bitmap_remove_prepare,
        .commit = block_dirty_bitmap_remove_commit,
        .abort = block_dirty_bitmap_remove_abort,
    },
    /* Where are transactions for MIRROR, COMMIT and STREAM?
     * Although these blockjobs use transaction callbacks like the backup job,
     * these jobs do not necessarily adhere to transaction semantics.
     * These jobs may not fully undo all of their actions on abort, nor do they
     * necessarily work in transactions with more than one job in them.
     */
};

/**
 * Allocate a TransactionProperties structure if necessary, and fill
 * that structure with desired defaults if they are unset.
 *
 * Returns @props itself when it is non-NULL, otherwise a newly allocated
 * structure.  In both cases completion-mode defaults to 'individual'.
 */
static TransactionProperties *get_transaction_properties(
    TransactionProperties *props)
{
    if (!props) {
        props = g_new0(TransactionProperties, 1);
    }

    if (!props->has_completion_mode) {
        props->has_completion_mode = true;
        props->completion_mode = ACTION_COMPLETION_MODE_INDIVIDUAL;
    }

    return props;
}

/*
 * 'Atomic' group operations.  The operations are performed as a set, and if
 * any fail then we roll back all operations in the group.
 *
 * Always run under BQL.
2290 */ 2291 void qmp_transaction(TransactionActionList *dev_list, 2292 struct TransactionProperties *props, 2293 Error **errp) 2294 { 2295 TransactionActionList *dev_entry = dev_list; 2296 bool has_props = !!props; 2297 JobTxn *block_job_txn = NULL; 2298 BlkActionState *state, *next; 2299 Error *local_err = NULL; 2300 2301 GLOBAL_STATE_CODE(); 2302 2303 QTAILQ_HEAD(, BlkActionState) snap_bdrv_states; 2304 QTAILQ_INIT(&snap_bdrv_states); 2305 2306 /* Does this transaction get canceled as a group on failure? 2307 * If not, we don't really need to make a JobTxn. 2308 */ 2309 props = get_transaction_properties(props); 2310 if (props->completion_mode != ACTION_COMPLETION_MODE_INDIVIDUAL) { 2311 block_job_txn = job_txn_new(); 2312 } 2313 2314 /* drain all i/o before any operations */ 2315 bdrv_drain_all(); 2316 2317 /* We don't do anything in this loop that commits us to the operations */ 2318 while (NULL != dev_entry) { 2319 TransactionAction *dev_info = NULL; 2320 const BlkActionOps *ops; 2321 2322 dev_info = dev_entry->value; 2323 dev_entry = dev_entry->next; 2324 2325 assert(dev_info->type < ARRAY_SIZE(actions)); 2326 2327 ops = &actions[dev_info->type]; 2328 assert(ops->instance_size > 0); 2329 2330 state = g_malloc0(ops->instance_size); 2331 state->ops = ops; 2332 state->action = dev_info; 2333 state->block_job_txn = block_job_txn; 2334 state->txn_props = props; 2335 QTAILQ_INSERT_TAIL(&snap_bdrv_states, state, entry); 2336 2337 state->ops->prepare(state, &local_err); 2338 if (local_err) { 2339 error_propagate(errp, local_err); 2340 goto delete_and_fail; 2341 } 2342 } 2343 2344 QTAILQ_FOREACH(state, &snap_bdrv_states, entry) { 2345 if (state->ops->commit) { 2346 state->ops->commit(state); 2347 } 2348 } 2349 2350 /* success */ 2351 goto exit; 2352 2353 delete_and_fail: 2354 /* failure, and it is all-or-none; roll back all operations */ 2355 QTAILQ_FOREACH_REVERSE(state, &snap_bdrv_states, entry) { 2356 if (state->ops->abort) { 2357 state->ops->abort(state); 2358 } 
2359 } 2360 exit: 2361 QTAILQ_FOREACH_SAFE(state, &snap_bdrv_states, entry, next) { 2362 if (state->ops->clean) { 2363 state->ops->clean(state); 2364 } 2365 g_free(state); 2366 } 2367 if (!has_props) { 2368 qapi_free_TransactionProperties(props); 2369 } 2370 job_txn_unref(block_job_txn); 2371 } 2372 2373 BlockDirtyBitmapSha256 *qmp_x_debug_block_dirty_bitmap_sha256(const char *node, 2374 const char *name, 2375 Error **errp) 2376 { 2377 BdrvDirtyBitmap *bitmap; 2378 BlockDriverState *bs; 2379 BlockDirtyBitmapSha256 *ret = NULL; 2380 char *sha256; 2381 2382 bitmap = block_dirty_bitmap_lookup(node, name, &bs, errp); 2383 if (!bitmap || !bs) { 2384 return NULL; 2385 } 2386 2387 sha256 = bdrv_dirty_bitmap_sha256(bitmap, errp); 2388 if (sha256 == NULL) { 2389 return NULL; 2390 } 2391 2392 ret = g_new(BlockDirtyBitmapSha256, 1); 2393 ret->sha256 = sha256; 2394 2395 return ret; 2396 } 2397 2398 void coroutine_fn qmp_block_resize(const char *device, const char *node_name, 2399 int64_t size, Error **errp) 2400 { 2401 Error *local_err = NULL; 2402 BlockBackend *blk; 2403 BlockDriverState *bs; 2404 AioContext *old_ctx; 2405 2406 bs = bdrv_lookup_bs(device, node_name, &local_err); 2407 if (local_err) { 2408 error_propagate(errp, local_err); 2409 return; 2410 } 2411 2412 if (size < 0) { 2413 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "size", "a >0 size"); 2414 return; 2415 } 2416 2417 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_RESIZE, NULL)) { 2418 error_setg(errp, QERR_DEVICE_IN_USE, device); 2419 return; 2420 } 2421 2422 blk = blk_new_with_bs(bs, BLK_PERM_RESIZE, BLK_PERM_ALL, errp); 2423 if (!blk) { 2424 return; 2425 } 2426 2427 bdrv_co_lock(bs); 2428 bdrv_drained_begin(bs); 2429 bdrv_co_unlock(bs); 2430 2431 old_ctx = bdrv_co_enter(bs); 2432 blk_co_truncate(blk, size, false, PREALLOC_MODE_OFF, 0, errp); 2433 bdrv_co_leave(bs, old_ctx); 2434 2435 bdrv_co_lock(bs); 2436 bdrv_drained_end(bs); 2437 blk_unref(blk); 2438 bdrv_co_unlock(bs); 2439 } 2440 2441 void 
qmp_block_stream(const char *job_id, const char *device, 2442 const char *base, 2443 const char *base_node, 2444 const char *backing_file, 2445 const char *bottom, 2446 bool has_speed, int64_t speed, 2447 bool has_on_error, BlockdevOnError on_error, 2448 const char *filter_node_name, 2449 bool has_auto_finalize, bool auto_finalize, 2450 bool has_auto_dismiss, bool auto_dismiss, 2451 Error **errp) 2452 { 2453 BlockDriverState *bs, *iter, *iter_end; 2454 BlockDriverState *base_bs = NULL; 2455 BlockDriverState *bottom_bs = NULL; 2456 AioContext *aio_context; 2457 Error *local_err = NULL; 2458 int job_flags = JOB_DEFAULT; 2459 2460 if (base && base_node) { 2461 error_setg(errp, "'base' and 'base-node' cannot be specified " 2462 "at the same time"); 2463 return; 2464 } 2465 2466 if (base && bottom) { 2467 error_setg(errp, "'base' and 'bottom' cannot be specified " 2468 "at the same time"); 2469 return; 2470 } 2471 2472 if (bottom && base_node) { 2473 error_setg(errp, "'bottom' and 'base-node' cannot be specified " 2474 "at the same time"); 2475 return; 2476 } 2477 2478 if (!has_on_error) { 2479 on_error = BLOCKDEV_ON_ERROR_REPORT; 2480 } 2481 2482 bs = bdrv_lookup_bs(device, device, errp); 2483 if (!bs) { 2484 return; 2485 } 2486 2487 aio_context = bdrv_get_aio_context(bs); 2488 aio_context_acquire(aio_context); 2489 2490 if (base) { 2491 base_bs = bdrv_find_backing_image(bs, base); 2492 if (base_bs == NULL) { 2493 error_setg(errp, "Can't find '%s' in the backing chain", base); 2494 goto out; 2495 } 2496 assert(bdrv_get_aio_context(base_bs) == aio_context); 2497 } 2498 2499 if (base_node) { 2500 base_bs = bdrv_lookup_bs(NULL, base_node, errp); 2501 if (!base_bs) { 2502 goto out; 2503 } 2504 if (bs == base_bs || !bdrv_chain_contains(bs, base_bs)) { 2505 error_setg(errp, "Node '%s' is not a backing image of '%s'", 2506 base_node, device); 2507 goto out; 2508 } 2509 assert(bdrv_get_aio_context(base_bs) == aio_context); 2510 bdrv_refresh_filename(base_bs); 2511 } 2512 2513 
if (bottom) { 2514 bottom_bs = bdrv_lookup_bs(NULL, bottom, errp); 2515 if (!bottom_bs) { 2516 goto out; 2517 } 2518 if (!bottom_bs->drv) { 2519 error_setg(errp, "Node '%s' is not open", bottom); 2520 goto out; 2521 } 2522 if (bottom_bs->drv->is_filter) { 2523 error_setg(errp, "Node '%s' is a filter, use a non-filter node " 2524 "as 'bottom'", bottom); 2525 goto out; 2526 } 2527 if (!bdrv_chain_contains(bs, bottom_bs)) { 2528 error_setg(errp, "Node '%s' is not in a chain starting from '%s'", 2529 bottom, device); 2530 goto out; 2531 } 2532 assert(bdrv_get_aio_context(bottom_bs) == aio_context); 2533 } 2534 2535 /* 2536 * Check for op blockers in the whole chain between bs and base (or bottom) 2537 */ 2538 iter_end = bottom ? bdrv_filter_or_cow_bs(bottom_bs) : base_bs; 2539 for (iter = bs; iter && iter != iter_end; 2540 iter = bdrv_filter_or_cow_bs(iter)) 2541 { 2542 if (bdrv_op_is_blocked(iter, BLOCK_OP_TYPE_STREAM, errp)) { 2543 goto out; 2544 } 2545 } 2546 2547 /* if we are streaming the entire chain, the result will have no backing 2548 * file, and specifying one is therefore an error */ 2549 if (!base_bs && backing_file) { 2550 error_setg(errp, "backing file specified, but streaming the " 2551 "entire chain"); 2552 goto out; 2553 } 2554 2555 if (has_auto_finalize && !auto_finalize) { 2556 job_flags |= JOB_MANUAL_FINALIZE; 2557 } 2558 if (has_auto_dismiss && !auto_dismiss) { 2559 job_flags |= JOB_MANUAL_DISMISS; 2560 } 2561 2562 stream_start(job_id, bs, base_bs, backing_file, 2563 bottom_bs, job_flags, has_speed ? 
speed : 0, on_error, 2564 filter_node_name, &local_err); 2565 if (local_err) { 2566 error_propagate(errp, local_err); 2567 goto out; 2568 } 2569 2570 trace_qmp_block_stream(bs); 2571 2572 out: 2573 aio_context_release(aio_context); 2574 } 2575 2576 void qmp_block_commit(const char *job_id, const char *device, 2577 const char *base_node, 2578 const char *base, 2579 const char *top_node, 2580 const char *top, 2581 const char *backing_file, 2582 bool has_speed, int64_t speed, 2583 bool has_on_error, BlockdevOnError on_error, 2584 const char *filter_node_name, 2585 bool has_auto_finalize, bool auto_finalize, 2586 bool has_auto_dismiss, bool auto_dismiss, 2587 Error **errp) 2588 { 2589 BlockDriverState *bs; 2590 BlockDriverState *iter; 2591 BlockDriverState *base_bs, *top_bs; 2592 AioContext *aio_context; 2593 Error *local_err = NULL; 2594 int job_flags = JOB_DEFAULT; 2595 uint64_t top_perm, top_shared; 2596 2597 if (!has_speed) { 2598 speed = 0; 2599 } 2600 if (!has_on_error) { 2601 on_error = BLOCKDEV_ON_ERROR_REPORT; 2602 } 2603 if (has_auto_finalize && !auto_finalize) { 2604 job_flags |= JOB_MANUAL_FINALIZE; 2605 } 2606 if (has_auto_dismiss && !auto_dismiss) { 2607 job_flags |= JOB_MANUAL_DISMISS; 2608 } 2609 2610 /* Important Note: 2611 * libvirt relies on the DeviceNotFound error class in order to probe for 2612 * live commit feature versions; for this to work, we must make sure to 2613 * perform the device lookup before any generic errors that may occur in a 2614 * scenario in which all optional arguments are omitted. 
*/ 2615 bs = qmp_get_root_bs(device, &local_err); 2616 if (!bs) { 2617 bs = bdrv_lookup_bs(device, device, NULL); 2618 if (!bs) { 2619 error_free(local_err); 2620 error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND, 2621 "Device '%s' not found", device); 2622 } else { 2623 error_propagate(errp, local_err); 2624 } 2625 return; 2626 } 2627 2628 aio_context = bdrv_get_aio_context(bs); 2629 aio_context_acquire(aio_context); 2630 2631 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, errp)) { 2632 goto out; 2633 } 2634 2635 /* default top_bs is the active layer */ 2636 top_bs = bs; 2637 2638 if (top_node && top) { 2639 error_setg(errp, "'top-node' and 'top' are mutually exclusive"); 2640 goto out; 2641 } else if (top_node) { 2642 top_bs = bdrv_lookup_bs(NULL, top_node, errp); 2643 if (top_bs == NULL) { 2644 goto out; 2645 } 2646 if (!bdrv_chain_contains(bs, top_bs)) { 2647 error_setg(errp, "'%s' is not in this backing file chain", 2648 top_node); 2649 goto out; 2650 } 2651 } else if (top) { 2652 /* This strcmp() is just a shortcut, there is no need to 2653 * refresh @bs's filename. If it mismatches, 2654 * bdrv_find_backing_image() will do the refresh and may still 2655 * return @bs. */ 2656 if (strcmp(bs->filename, top) != 0) { 2657 top_bs = bdrv_find_backing_image(bs, top); 2658 } 2659 } 2660 2661 if (top_bs == NULL) { 2662 error_setg(errp, "Top image file %s not found", top ? 
top : "NULL"); 2663 goto out; 2664 } 2665 2666 assert(bdrv_get_aio_context(top_bs) == aio_context); 2667 2668 if (base_node && base) { 2669 error_setg(errp, "'base-node' and 'base' are mutually exclusive"); 2670 goto out; 2671 } else if (base_node) { 2672 base_bs = bdrv_lookup_bs(NULL, base_node, errp); 2673 if (base_bs == NULL) { 2674 goto out; 2675 } 2676 if (!bdrv_chain_contains(top_bs, base_bs)) { 2677 error_setg(errp, "'%s' is not in this backing file chain", 2678 base_node); 2679 goto out; 2680 } 2681 } else if (base) { 2682 base_bs = bdrv_find_backing_image(top_bs, base); 2683 if (base_bs == NULL) { 2684 error_setg(errp, "Can't find '%s' in the backing chain", base); 2685 goto out; 2686 } 2687 } else { 2688 base_bs = bdrv_find_base(top_bs); 2689 if (base_bs == NULL) { 2690 error_setg(errp, "There is no backimg image"); 2691 goto out; 2692 } 2693 } 2694 2695 assert(bdrv_get_aio_context(base_bs) == aio_context); 2696 2697 for (iter = top_bs; iter != bdrv_filter_or_cow_bs(base_bs); 2698 iter = bdrv_filter_or_cow_bs(iter)) 2699 { 2700 if (bdrv_op_is_blocked(iter, BLOCK_OP_TYPE_COMMIT_TARGET, errp)) { 2701 goto out; 2702 } 2703 } 2704 2705 /* Do not allow attempts to commit an image into itself */ 2706 if (top_bs == base_bs) { 2707 error_setg(errp, "cannot commit an image into itself"); 2708 goto out; 2709 } 2710 2711 /* 2712 * Active commit is required if and only if someone has taken a 2713 * WRITE permission on the top node. Historically, we have always 2714 * used active commit for top nodes, so continue that practice 2715 * lest we possibly break clients that rely on this behavior, e.g. 2716 * to later attach this node to a writing parent. 2717 * (Active commit is never really wrong.) 
2718 */ 2719 bdrv_get_cumulative_perm(top_bs, &top_perm, &top_shared); 2720 if (top_perm & BLK_PERM_WRITE || 2721 bdrv_skip_filters(top_bs) == bdrv_skip_filters(bs)) 2722 { 2723 if (backing_file) { 2724 if (bdrv_skip_filters(top_bs) == bdrv_skip_filters(bs)) { 2725 error_setg(errp, "'backing-file' specified," 2726 " but 'top' is the active layer"); 2727 } else { 2728 error_setg(errp, "'backing-file' specified, but 'top' has a " 2729 "writer on it"); 2730 } 2731 goto out; 2732 } 2733 if (!job_id) { 2734 /* 2735 * Emulate here what block_job_create() does, because it 2736 * is possible that @bs != @top_bs (the block job should 2737 * be named after @bs, even if @top_bs is the actual 2738 * source) 2739 */ 2740 job_id = bdrv_get_device_name(bs); 2741 } 2742 commit_active_start(job_id, top_bs, base_bs, job_flags, speed, on_error, 2743 filter_node_name, NULL, NULL, false, &local_err); 2744 } else { 2745 BlockDriverState *overlay_bs = bdrv_find_overlay(bs, top_bs); 2746 if (bdrv_op_is_blocked(overlay_bs, BLOCK_OP_TYPE_COMMIT_TARGET, errp)) { 2747 goto out; 2748 } 2749 commit_start(job_id, bs, base_bs, top_bs, job_flags, 2750 speed, on_error, backing_file, 2751 filter_node_name, &local_err); 2752 } 2753 if (local_err != NULL) { 2754 error_propagate(errp, local_err); 2755 goto out; 2756 } 2757 2758 out: 2759 aio_context_release(aio_context); 2760 } 2761 2762 /* Common QMP interface for drive-backup and blockdev-backup */ 2763 static BlockJob *do_backup_common(BackupCommon *backup, 2764 BlockDriverState *bs, 2765 BlockDriverState *target_bs, 2766 AioContext *aio_context, 2767 JobTxn *txn, Error **errp) 2768 { 2769 BlockJob *job = NULL; 2770 BdrvDirtyBitmap *bmap = NULL; 2771 BackupPerf perf = { .max_workers = 64 }; 2772 int job_flags = JOB_DEFAULT; 2773 2774 if (!backup->has_speed) { 2775 backup->speed = 0; 2776 } 2777 if (!backup->has_on_source_error) { 2778 backup->on_source_error = BLOCKDEV_ON_ERROR_REPORT; 2779 } 2780 if (!backup->has_on_target_error) { 2781 
backup->on_target_error = BLOCKDEV_ON_ERROR_REPORT; 2782 } 2783 if (!backup->has_auto_finalize) { 2784 backup->auto_finalize = true; 2785 } 2786 if (!backup->has_auto_dismiss) { 2787 backup->auto_dismiss = true; 2788 } 2789 if (!backup->has_compress) { 2790 backup->compress = false; 2791 } 2792 2793 if (backup->x_perf) { 2794 if (backup->x_perf->has_use_copy_range) { 2795 perf.use_copy_range = backup->x_perf->use_copy_range; 2796 } 2797 if (backup->x_perf->has_max_workers) { 2798 perf.max_workers = backup->x_perf->max_workers; 2799 } 2800 if (backup->x_perf->has_max_chunk) { 2801 perf.max_chunk = backup->x_perf->max_chunk; 2802 } 2803 } 2804 2805 if ((backup->sync == MIRROR_SYNC_MODE_BITMAP) || 2806 (backup->sync == MIRROR_SYNC_MODE_INCREMENTAL)) { 2807 /* done before desugaring 'incremental' to print the right message */ 2808 if (!backup->bitmap) { 2809 error_setg(errp, "must provide a valid bitmap name for " 2810 "'%s' sync mode", MirrorSyncMode_str(backup->sync)); 2811 return NULL; 2812 } 2813 } 2814 2815 if (backup->sync == MIRROR_SYNC_MODE_INCREMENTAL) { 2816 if (backup->has_bitmap_mode && 2817 backup->bitmap_mode != BITMAP_SYNC_MODE_ON_SUCCESS) { 2818 error_setg(errp, "Bitmap sync mode must be '%s' " 2819 "when using sync mode '%s'", 2820 BitmapSyncMode_str(BITMAP_SYNC_MODE_ON_SUCCESS), 2821 MirrorSyncMode_str(backup->sync)); 2822 return NULL; 2823 } 2824 backup->has_bitmap_mode = true; 2825 backup->sync = MIRROR_SYNC_MODE_BITMAP; 2826 backup->bitmap_mode = BITMAP_SYNC_MODE_ON_SUCCESS; 2827 } 2828 2829 if (backup->bitmap) { 2830 bmap = bdrv_find_dirty_bitmap(bs, backup->bitmap); 2831 if (!bmap) { 2832 error_setg(errp, "Bitmap '%s' could not be found", backup->bitmap); 2833 return NULL; 2834 } 2835 if (!backup->has_bitmap_mode) { 2836 error_setg(errp, "Bitmap sync mode must be given " 2837 "when providing a bitmap"); 2838 return NULL; 2839 } 2840 if (bdrv_dirty_bitmap_check(bmap, BDRV_BITMAP_ALLOW_RO, errp)) { 2841 return NULL; 2842 } 2843 2844 /* This does 
not produce a useful bitmap artifact: */ 2845 if (backup->sync == MIRROR_SYNC_MODE_NONE) { 2846 error_setg(errp, "sync mode '%s' does not produce meaningful bitmap" 2847 " outputs", MirrorSyncMode_str(backup->sync)); 2848 return NULL; 2849 } 2850 2851 /* If the bitmap isn't used for input or output, this is useless: */ 2852 if (backup->bitmap_mode == BITMAP_SYNC_MODE_NEVER && 2853 backup->sync != MIRROR_SYNC_MODE_BITMAP) { 2854 error_setg(errp, "Bitmap sync mode '%s' has no meaningful effect" 2855 " when combined with sync mode '%s'", 2856 BitmapSyncMode_str(backup->bitmap_mode), 2857 MirrorSyncMode_str(backup->sync)); 2858 return NULL; 2859 } 2860 } 2861 2862 if (!backup->bitmap && backup->has_bitmap_mode) { 2863 error_setg(errp, "Cannot specify bitmap sync mode without a bitmap"); 2864 return NULL; 2865 } 2866 2867 if (!backup->auto_finalize) { 2868 job_flags |= JOB_MANUAL_FINALIZE; 2869 } 2870 if (!backup->auto_dismiss) { 2871 job_flags |= JOB_MANUAL_DISMISS; 2872 } 2873 2874 job = backup_job_create(backup->job_id, bs, target_bs, backup->speed, 2875 backup->sync, bmap, backup->bitmap_mode, 2876 backup->compress, 2877 backup->filter_node_name, 2878 &perf, 2879 backup->on_source_error, 2880 backup->on_target_error, 2881 job_flags, NULL, NULL, txn, errp); 2882 return job; 2883 } 2884 2885 void qmp_drive_backup(DriveBackup *backup, Error **errp) 2886 { 2887 TransactionAction action = { 2888 .type = TRANSACTION_ACTION_KIND_DRIVE_BACKUP, 2889 .u.drive_backup.data = backup, 2890 }; 2891 blockdev_do_action(&action, errp); 2892 } 2893 2894 BlockDeviceInfoList *qmp_query_named_block_nodes(bool has_flat, 2895 bool flat, 2896 Error **errp) 2897 { 2898 bool return_flat = has_flat && flat; 2899 2900 return bdrv_named_nodes_list(return_flat, errp); 2901 } 2902 2903 XDbgBlockGraph *qmp_x_debug_query_block_graph(Error **errp) 2904 { 2905 return bdrv_get_xdbg_block_graph(errp); 2906 } 2907 2908 void qmp_blockdev_backup(BlockdevBackup *backup, Error **errp) 2909 { 2910 
TransactionAction action = { 2911 .type = TRANSACTION_ACTION_KIND_BLOCKDEV_BACKUP, 2912 .u.blockdev_backup.data = backup, 2913 }; 2914 blockdev_do_action(&action, errp); 2915 } 2916 2917 /* Parameter check and block job starting for drive mirroring. 2918 * Caller should hold @device and @target's aio context (must be the same). 2919 **/ 2920 static void blockdev_mirror_common(const char *job_id, BlockDriverState *bs, 2921 BlockDriverState *target, 2922 const char *replaces, 2923 enum MirrorSyncMode sync, 2924 BlockMirrorBackingMode backing_mode, 2925 bool zero_target, 2926 bool has_speed, int64_t speed, 2927 bool has_granularity, uint32_t granularity, 2928 bool has_buf_size, int64_t buf_size, 2929 bool has_on_source_error, 2930 BlockdevOnError on_source_error, 2931 bool has_on_target_error, 2932 BlockdevOnError on_target_error, 2933 bool has_unmap, bool unmap, 2934 const char *filter_node_name, 2935 bool has_copy_mode, MirrorCopyMode copy_mode, 2936 bool has_auto_finalize, bool auto_finalize, 2937 bool has_auto_dismiss, bool auto_dismiss, 2938 Error **errp) 2939 { 2940 BlockDriverState *unfiltered_bs; 2941 int job_flags = JOB_DEFAULT; 2942 2943 if (!has_speed) { 2944 speed = 0; 2945 } 2946 if (!has_on_source_error) { 2947 on_source_error = BLOCKDEV_ON_ERROR_REPORT; 2948 } 2949 if (!has_on_target_error) { 2950 on_target_error = BLOCKDEV_ON_ERROR_REPORT; 2951 } 2952 if (!has_granularity) { 2953 granularity = 0; 2954 } 2955 if (!has_buf_size) { 2956 buf_size = 0; 2957 } 2958 if (!has_unmap) { 2959 unmap = true; 2960 } 2961 if (!has_copy_mode) { 2962 copy_mode = MIRROR_COPY_MODE_BACKGROUND; 2963 } 2964 if (has_auto_finalize && !auto_finalize) { 2965 job_flags |= JOB_MANUAL_FINALIZE; 2966 } 2967 if (has_auto_dismiss && !auto_dismiss) { 2968 job_flags |= JOB_MANUAL_DISMISS; 2969 } 2970 2971 if (granularity != 0 && (granularity < 512 || granularity > 1048576 * 64)) { 2972 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "granularity", 2973 "a value in range [512B, 64MB]"); 
2974 return; 2975 } 2976 if (granularity & (granularity - 1)) { 2977 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "granularity", 2978 "a power of 2"); 2979 return; 2980 } 2981 2982 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_MIRROR_SOURCE, errp)) { 2983 return; 2984 } 2985 if (bdrv_op_is_blocked(target, BLOCK_OP_TYPE_MIRROR_TARGET, errp)) { 2986 return; 2987 } 2988 2989 if (!bdrv_backing_chain_next(bs) && sync == MIRROR_SYNC_MODE_TOP) { 2990 sync = MIRROR_SYNC_MODE_FULL; 2991 } 2992 2993 if (!replaces) { 2994 /* We want to mirror from @bs, but keep implicit filters on top */ 2995 unfiltered_bs = bdrv_skip_implicit_filters(bs); 2996 if (unfiltered_bs != bs) { 2997 replaces = unfiltered_bs->node_name; 2998 } 2999 } 3000 3001 if (replaces) { 3002 BlockDriverState *to_replace_bs; 3003 AioContext *replace_aio_context; 3004 int64_t bs_size, replace_size; 3005 3006 bs_size = bdrv_getlength(bs); 3007 if (bs_size < 0) { 3008 error_setg_errno(errp, -bs_size, "Failed to query device's size"); 3009 return; 3010 } 3011 3012 to_replace_bs = check_to_replace_node(bs, replaces, errp); 3013 if (!to_replace_bs) { 3014 return; 3015 } 3016 3017 replace_aio_context = bdrv_get_aio_context(to_replace_bs); 3018 aio_context_acquire(replace_aio_context); 3019 replace_size = bdrv_getlength(to_replace_bs); 3020 aio_context_release(replace_aio_context); 3021 3022 if (replace_size < 0) { 3023 error_setg_errno(errp, -replace_size, 3024 "Failed to query the replacement node's size"); 3025 return; 3026 } 3027 if (bs_size != replace_size) { 3028 error_setg(errp, "cannot replace image with a mirror image of " 3029 "different size"); 3030 return; 3031 } 3032 } 3033 3034 /* pass the node name to replace to mirror start since it's loose coupling 3035 * and will allow to check whether the node still exist at mirror completion 3036 */ 3037 mirror_start(job_id, bs, target, 3038 replaces, job_flags, 3039 speed, granularity, buf_size, sync, backing_mode, zero_target, 3040 on_source_error, on_target_error, 
unmap, filter_node_name, 3041 copy_mode, errp); 3042 } 3043 3044 void qmp_drive_mirror(DriveMirror *arg, Error **errp) 3045 { 3046 BlockDriverState *bs; 3047 BlockDriverState *target_backing_bs, *target_bs; 3048 AioContext *aio_context; 3049 AioContext *old_context; 3050 BlockMirrorBackingMode backing_mode; 3051 Error *local_err = NULL; 3052 QDict *options = NULL; 3053 int flags; 3054 int64_t size; 3055 const char *format = arg->format; 3056 bool zero_target; 3057 int ret; 3058 3059 bs = qmp_get_root_bs(arg->device, errp); 3060 if (!bs) { 3061 return; 3062 } 3063 3064 /* Early check to avoid creating target */ 3065 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_MIRROR_SOURCE, errp)) { 3066 return; 3067 } 3068 3069 aio_context = bdrv_get_aio_context(bs); 3070 aio_context_acquire(aio_context); 3071 3072 if (!arg->has_mode) { 3073 arg->mode = NEW_IMAGE_MODE_ABSOLUTE_PATHS; 3074 } 3075 3076 if (!arg->format) { 3077 format = (arg->mode == NEW_IMAGE_MODE_EXISTING 3078 ? NULL : bs->drv->format_name); 3079 } 3080 3081 flags = bs->open_flags | BDRV_O_RDWR; 3082 target_backing_bs = bdrv_cow_bs(bdrv_skip_filters(bs)); 3083 if (!target_backing_bs && arg->sync == MIRROR_SYNC_MODE_TOP) { 3084 arg->sync = MIRROR_SYNC_MODE_FULL; 3085 } 3086 if (arg->sync == MIRROR_SYNC_MODE_NONE) { 3087 target_backing_bs = bs; 3088 } 3089 3090 size = bdrv_getlength(bs); 3091 if (size < 0) { 3092 error_setg_errno(errp, -size, "bdrv_getlength failed"); 3093 goto out; 3094 } 3095 3096 if (arg->replaces) { 3097 if (!arg->node_name) { 3098 error_setg(errp, "a node-name must be provided when replacing a" 3099 " named node of the graph"); 3100 goto out; 3101 } 3102 } 3103 3104 if (arg->mode == NEW_IMAGE_MODE_ABSOLUTE_PATHS) { 3105 backing_mode = MIRROR_SOURCE_BACKING_CHAIN; 3106 } else { 3107 backing_mode = MIRROR_OPEN_BACKING_CHAIN; 3108 } 3109 3110 /* Don't open backing image in create() */ 3111 flags |= BDRV_O_NO_BACKING; 3112 3113 if ((arg->sync == MIRROR_SYNC_MODE_FULL || !target_backing_bs) 3114 && 
arg->mode != NEW_IMAGE_MODE_EXISTING) 3115 { 3116 /* create new image w/o backing file */ 3117 assert(format); 3118 bdrv_img_create(arg->target, format, 3119 NULL, NULL, NULL, size, flags, false, &local_err); 3120 } else { 3121 /* Implicit filters should not appear in the filename */ 3122 BlockDriverState *explicit_backing = 3123 bdrv_skip_implicit_filters(target_backing_bs); 3124 3125 switch (arg->mode) { 3126 case NEW_IMAGE_MODE_EXISTING: 3127 break; 3128 case NEW_IMAGE_MODE_ABSOLUTE_PATHS: 3129 /* create new image with backing file */ 3130 bdrv_refresh_filename(explicit_backing); 3131 bdrv_img_create(arg->target, format, 3132 explicit_backing->filename, 3133 explicit_backing->drv->format_name, 3134 NULL, size, flags, false, &local_err); 3135 break; 3136 default: 3137 abort(); 3138 } 3139 } 3140 3141 if (local_err) { 3142 error_propagate(errp, local_err); 3143 goto out; 3144 } 3145 3146 options = qdict_new(); 3147 if (arg->node_name) { 3148 qdict_put_str(options, "node-name", arg->node_name); 3149 } 3150 if (format) { 3151 qdict_put_str(options, "driver", format); 3152 } 3153 3154 /* Mirroring takes care of copy-on-write using the source's backing 3155 * file. 3156 */ 3157 target_bs = bdrv_open(arg->target, NULL, options, flags, errp); 3158 if (!target_bs) { 3159 goto out; 3160 } 3161 3162 zero_target = (arg->sync == MIRROR_SYNC_MODE_FULL && 3163 (arg->mode == NEW_IMAGE_MODE_EXISTING || 3164 !bdrv_has_zero_init(target_bs))); 3165 3166 3167 /* Honor bdrv_try_change_aio_context() context acquisition requirements. 
*/ 3168 old_context = bdrv_get_aio_context(target_bs); 3169 aio_context_release(aio_context); 3170 aio_context_acquire(old_context); 3171 3172 ret = bdrv_try_change_aio_context(target_bs, aio_context, NULL, errp); 3173 if (ret < 0) { 3174 bdrv_unref(target_bs); 3175 aio_context_release(old_context); 3176 return; 3177 } 3178 3179 aio_context_release(old_context); 3180 aio_context_acquire(aio_context); 3181 3182 blockdev_mirror_common(arg->job_id, bs, target_bs, 3183 arg->replaces, arg->sync, 3184 backing_mode, zero_target, 3185 arg->has_speed, arg->speed, 3186 arg->has_granularity, arg->granularity, 3187 arg->has_buf_size, arg->buf_size, 3188 arg->has_on_source_error, arg->on_source_error, 3189 arg->has_on_target_error, arg->on_target_error, 3190 arg->has_unmap, arg->unmap, 3191 NULL, 3192 arg->has_copy_mode, arg->copy_mode, 3193 arg->has_auto_finalize, arg->auto_finalize, 3194 arg->has_auto_dismiss, arg->auto_dismiss, 3195 errp); 3196 bdrv_unref(target_bs); 3197 out: 3198 aio_context_release(aio_context); 3199 } 3200 3201 void qmp_blockdev_mirror(const char *job_id, 3202 const char *device, const char *target, 3203 const char *replaces, 3204 MirrorSyncMode sync, 3205 bool has_speed, int64_t speed, 3206 bool has_granularity, uint32_t granularity, 3207 bool has_buf_size, int64_t buf_size, 3208 bool has_on_source_error, 3209 BlockdevOnError on_source_error, 3210 bool has_on_target_error, 3211 BlockdevOnError on_target_error, 3212 const char *filter_node_name, 3213 bool has_copy_mode, MirrorCopyMode copy_mode, 3214 bool has_auto_finalize, bool auto_finalize, 3215 bool has_auto_dismiss, bool auto_dismiss, 3216 Error **errp) 3217 { 3218 BlockDriverState *bs; 3219 BlockDriverState *target_bs; 3220 AioContext *aio_context; 3221 AioContext *old_context; 3222 BlockMirrorBackingMode backing_mode = MIRROR_LEAVE_BACKING_CHAIN; 3223 bool zero_target; 3224 int ret; 3225 3226 bs = qmp_get_root_bs(device, errp); 3227 if (!bs) { 3228 return; 3229 } 3230 3231 target_bs = 
bdrv_lookup_bs(target, target, errp); 3232 if (!target_bs) { 3233 return; 3234 } 3235 3236 zero_target = (sync == MIRROR_SYNC_MODE_FULL); 3237 3238 /* Honor bdrv_try_change_aio_context() context acquisition requirements. */ 3239 old_context = bdrv_get_aio_context(target_bs); 3240 aio_context = bdrv_get_aio_context(bs); 3241 aio_context_acquire(old_context); 3242 3243 ret = bdrv_try_change_aio_context(target_bs, aio_context, NULL, errp); 3244 3245 aio_context_release(old_context); 3246 aio_context_acquire(aio_context); 3247 3248 if (ret < 0) { 3249 goto out; 3250 } 3251 3252 blockdev_mirror_common(job_id, bs, target_bs, 3253 replaces, sync, backing_mode, 3254 zero_target, has_speed, speed, 3255 has_granularity, granularity, 3256 has_buf_size, buf_size, 3257 has_on_source_error, on_source_error, 3258 has_on_target_error, on_target_error, 3259 true, true, filter_node_name, 3260 has_copy_mode, copy_mode, 3261 has_auto_finalize, auto_finalize, 3262 has_auto_dismiss, auto_dismiss, 3263 errp); 3264 out: 3265 aio_context_release(aio_context); 3266 } 3267 3268 /* 3269 * Get a block job using its ID. Called with job_mutex held. 
3270 */ 3271 static BlockJob *find_block_job_locked(const char *id, Error **errp) 3272 { 3273 BlockJob *job; 3274 3275 assert(id != NULL); 3276 3277 job = block_job_get_locked(id); 3278 3279 if (!job) { 3280 error_set(errp, ERROR_CLASS_DEVICE_NOT_ACTIVE, 3281 "Block job '%s' not found", id); 3282 return NULL; 3283 } 3284 3285 return job; 3286 } 3287 3288 void qmp_block_job_set_speed(const char *device, int64_t speed, Error **errp) 3289 { 3290 BlockJob *job; 3291 3292 JOB_LOCK_GUARD(); 3293 job = find_block_job_locked(device, errp); 3294 3295 if (!job) { 3296 return; 3297 } 3298 3299 block_job_set_speed_locked(job, speed, errp); 3300 } 3301 3302 void qmp_block_job_cancel(const char *device, 3303 bool has_force, bool force, Error **errp) 3304 { 3305 BlockJob *job; 3306 3307 JOB_LOCK_GUARD(); 3308 job = find_block_job_locked(device, errp); 3309 3310 if (!job) { 3311 return; 3312 } 3313 3314 if (!has_force) { 3315 force = false; 3316 } 3317 3318 if (job_user_paused_locked(&job->job) && !force) { 3319 error_setg(errp, "The block job for device '%s' is currently paused", 3320 device); 3321 return; 3322 } 3323 3324 trace_qmp_block_job_cancel(job); 3325 job_user_cancel_locked(&job->job, force, errp); 3326 } 3327 3328 void qmp_block_job_pause(const char *device, Error **errp) 3329 { 3330 BlockJob *job; 3331 3332 JOB_LOCK_GUARD(); 3333 job = find_block_job_locked(device, errp); 3334 3335 if (!job) { 3336 return; 3337 } 3338 3339 trace_qmp_block_job_pause(job); 3340 job_user_pause_locked(&job->job, errp); 3341 } 3342 3343 void qmp_block_job_resume(const char *device, Error **errp) 3344 { 3345 BlockJob *job; 3346 3347 JOB_LOCK_GUARD(); 3348 job = find_block_job_locked(device, errp); 3349 3350 if (!job) { 3351 return; 3352 } 3353 3354 trace_qmp_block_job_resume(job); 3355 job_user_resume_locked(&job->job, errp); 3356 } 3357 3358 void qmp_block_job_complete(const char *device, Error **errp) 3359 { 3360 BlockJob *job; 3361 3362 JOB_LOCK_GUARD(); 3363 job = 
find_block_job_locked(device, errp); 3364 3365 if (!job) { 3366 return; 3367 } 3368 3369 trace_qmp_block_job_complete(job); 3370 job_complete_locked(&job->job, errp); 3371 } 3372 3373 void qmp_block_job_finalize(const char *id, Error **errp) 3374 { 3375 BlockJob *job; 3376 3377 JOB_LOCK_GUARD(); 3378 job = find_block_job_locked(id, errp); 3379 3380 if (!job) { 3381 return; 3382 } 3383 3384 trace_qmp_block_job_finalize(job); 3385 job_ref_locked(&job->job); 3386 job_finalize_locked(&job->job, errp); 3387 3388 job_unref_locked(&job->job); 3389 } 3390 3391 void qmp_block_job_dismiss(const char *id, Error **errp) 3392 { 3393 BlockJob *bjob; 3394 Job *job; 3395 3396 JOB_LOCK_GUARD(); 3397 bjob = find_block_job_locked(id, errp); 3398 3399 if (!bjob) { 3400 return; 3401 } 3402 3403 trace_qmp_block_job_dismiss(bjob); 3404 job = &bjob->job; 3405 job_dismiss_locked(&job, errp); 3406 } 3407 3408 void qmp_change_backing_file(const char *device, 3409 const char *image_node_name, 3410 const char *backing_file, 3411 Error **errp) 3412 { 3413 BlockDriverState *bs = NULL; 3414 AioContext *aio_context; 3415 BlockDriverState *image_bs = NULL; 3416 Error *local_err = NULL; 3417 bool ro; 3418 int ret; 3419 3420 bs = qmp_get_root_bs(device, errp); 3421 if (!bs) { 3422 return; 3423 } 3424 3425 aio_context = bdrv_get_aio_context(bs); 3426 aio_context_acquire(aio_context); 3427 3428 image_bs = bdrv_lookup_bs(NULL, image_node_name, &local_err); 3429 if (local_err) { 3430 error_propagate(errp, local_err); 3431 goto out; 3432 } 3433 3434 if (!image_bs) { 3435 error_setg(errp, "image file not found"); 3436 goto out; 3437 } 3438 3439 if (bdrv_find_base(image_bs) == image_bs) { 3440 error_setg(errp, "not allowing backing file change on an image " 3441 "without a backing file"); 3442 goto out; 3443 } 3444 3445 /* even though we are not necessarily operating on bs, we need it to 3446 * determine if block ops are currently prohibited on the chain */ 3447 if (bdrv_op_is_blocked(bs, 
BLOCK_OP_TYPE_CHANGE, errp)) { 3448 goto out; 3449 } 3450 3451 /* final sanity check */ 3452 if (!bdrv_chain_contains(bs, image_bs)) { 3453 error_setg(errp, "'%s' and image file are not in the same chain", 3454 device); 3455 goto out; 3456 } 3457 3458 /* if not r/w, reopen to make r/w */ 3459 ro = bdrv_is_read_only(image_bs); 3460 3461 if (ro) { 3462 if (bdrv_reopen_set_read_only(image_bs, false, errp) != 0) { 3463 goto out; 3464 } 3465 } 3466 3467 ret = bdrv_change_backing_file(image_bs, backing_file, 3468 image_bs->drv ? image_bs->drv->format_name : "", 3469 false); 3470 3471 if (ret < 0) { 3472 error_setg_errno(errp, -ret, "Could not change backing file to '%s'", 3473 backing_file); 3474 /* don't exit here, so we can try to restore open flags if 3475 * appropriate */ 3476 } 3477 3478 if (ro) { 3479 bdrv_reopen_set_read_only(image_bs, true, errp); 3480 } 3481 3482 out: 3483 aio_context_release(aio_context); 3484 } 3485 3486 void qmp_blockdev_add(BlockdevOptions *options, Error **errp) 3487 { 3488 BlockDriverState *bs; 3489 QObject *obj; 3490 Visitor *v = qobject_output_visitor_new(&obj); 3491 QDict *qdict; 3492 3493 visit_type_BlockdevOptions(v, NULL, &options, &error_abort); 3494 visit_complete(v, &obj); 3495 qdict = qobject_to(QDict, obj); 3496 3497 qdict_flatten(qdict); 3498 3499 if (!qdict_get_try_str(qdict, "node-name")) { 3500 error_setg(errp, "'node-name' must be specified for the root node"); 3501 goto fail; 3502 } 3503 3504 bs = bds_tree_init(qdict, errp); 3505 if (!bs) { 3506 goto fail; 3507 } 3508 3509 bdrv_set_monitor_owned(bs); 3510 3511 fail: 3512 visit_free(v); 3513 } 3514 3515 void qmp_blockdev_reopen(BlockdevOptionsList *reopen_list, Error **errp) 3516 { 3517 BlockReopenQueue *queue = NULL; 3518 GSList *drained = NULL; 3519 GSList *p; 3520 3521 /* Add each one of the BDS that we want to reopen to the queue */ 3522 for (; reopen_list != NULL; reopen_list = reopen_list->next) { 3523 BlockdevOptions *options = reopen_list->value; 3524 
BlockDriverState *bs; 3525 AioContext *ctx; 3526 QObject *obj; 3527 Visitor *v; 3528 QDict *qdict; 3529 3530 /* Check for the selected node name */ 3531 if (!options->node_name) { 3532 error_setg(errp, "node-name not specified"); 3533 goto fail; 3534 } 3535 3536 bs = bdrv_find_node(options->node_name); 3537 if (!bs) { 3538 error_setg(errp, "Failed to find node with node-name='%s'", 3539 options->node_name); 3540 goto fail; 3541 } 3542 3543 /* Put all options in a QDict and flatten it */ 3544 v = qobject_output_visitor_new(&obj); 3545 visit_type_BlockdevOptions(v, NULL, &options, &error_abort); 3546 visit_complete(v, &obj); 3547 visit_free(v); 3548 3549 qdict = qobject_to(QDict, obj); 3550 3551 qdict_flatten(qdict); 3552 3553 ctx = bdrv_get_aio_context(bs); 3554 aio_context_acquire(ctx); 3555 3556 bdrv_subtree_drained_begin(bs); 3557 queue = bdrv_reopen_queue(queue, bs, qdict, false); 3558 drained = g_slist_prepend(drained, bs); 3559 3560 aio_context_release(ctx); 3561 } 3562 3563 /* Perform the reopen operation */ 3564 bdrv_reopen_multiple(queue, errp); 3565 queue = NULL; 3566 3567 fail: 3568 bdrv_reopen_queue_free(queue); 3569 for (p = drained; p; p = p->next) { 3570 BlockDriverState *bs = p->data; 3571 AioContext *ctx = bdrv_get_aio_context(bs); 3572 3573 aio_context_acquire(ctx); 3574 bdrv_subtree_drained_end(bs); 3575 aio_context_release(ctx); 3576 } 3577 g_slist_free(drained); 3578 } 3579 3580 void qmp_blockdev_del(const char *node_name, Error **errp) 3581 { 3582 AioContext *aio_context; 3583 BlockDriverState *bs; 3584 3585 GLOBAL_STATE_CODE(); 3586 3587 bs = bdrv_find_node(node_name); 3588 if (!bs) { 3589 error_setg(errp, "Failed to find node with node-name='%s'", node_name); 3590 return; 3591 } 3592 if (bdrv_has_blk(bs)) { 3593 error_setg(errp, "Node %s is in use", node_name); 3594 return; 3595 } 3596 aio_context = bdrv_get_aio_context(bs); 3597 aio_context_acquire(aio_context); 3598 3599 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_DRIVE_DEL, errp)) { 3600 goto 
out; 3601 } 3602 3603 if (!QTAILQ_IN_USE(bs, monitor_list)) { 3604 error_setg(errp, "Node %s is not owned by the monitor", 3605 bs->node_name); 3606 goto out; 3607 } 3608 3609 if (bs->refcnt > 1) { 3610 error_setg(errp, "Block device %s is in use", 3611 bdrv_get_device_or_node_name(bs)); 3612 goto out; 3613 } 3614 3615 QTAILQ_REMOVE(&monitor_bdrv_states, bs, monitor_list); 3616 bdrv_unref(bs); 3617 3618 out: 3619 aio_context_release(aio_context); 3620 } 3621 3622 static BdrvChild *bdrv_find_child(BlockDriverState *parent_bs, 3623 const char *child_name) 3624 { 3625 BdrvChild *child; 3626 3627 QLIST_FOREACH(child, &parent_bs->children, next) { 3628 if (strcmp(child->name, child_name) == 0) { 3629 return child; 3630 } 3631 } 3632 3633 return NULL; 3634 } 3635 3636 void qmp_x_blockdev_change(const char *parent, const char *child, 3637 const char *node, Error **errp) 3638 { 3639 BlockDriverState *parent_bs, *new_bs = NULL; 3640 BdrvChild *p_child; 3641 3642 parent_bs = bdrv_lookup_bs(parent, parent, errp); 3643 if (!parent_bs) { 3644 return; 3645 } 3646 3647 if (!child == !node) { 3648 if (child) { 3649 error_setg(errp, "The parameters child and node are in conflict"); 3650 } else { 3651 error_setg(errp, "Either child or node must be specified"); 3652 } 3653 return; 3654 } 3655 3656 if (child) { 3657 p_child = bdrv_find_child(parent_bs, child); 3658 if (!p_child) { 3659 error_setg(errp, "Node '%s' does not have child '%s'", 3660 parent, child); 3661 return; 3662 } 3663 bdrv_del_child(parent_bs, p_child, errp); 3664 } 3665 3666 if (node) { 3667 new_bs = bdrv_find_node(node); 3668 if (!new_bs) { 3669 error_setg(errp, "Node '%s' not found", node); 3670 return; 3671 } 3672 bdrv_add_child(parent_bs, new_bs, errp); 3673 } 3674 } 3675 3676 BlockJobInfoList *qmp_query_block_jobs(Error **errp) 3677 { 3678 BlockJobInfoList *head = NULL, **tail = &head; 3679 BlockJob *job; 3680 3681 JOB_LOCK_GUARD(); 3682 3683 for (job = block_job_next_locked(NULL); job; 3684 job = 
block_job_next_locked(job)) { 3685 BlockJobInfo *value; 3686 3687 if (block_job_is_internal(job)) { 3688 continue; 3689 } 3690 value = block_job_query_locked(job, errp); 3691 if (!value) { 3692 qapi_free_BlockJobInfoList(head); 3693 return NULL; 3694 } 3695 QAPI_LIST_APPEND(tail, value); 3696 } 3697 3698 return head; 3699 } 3700 3701 void qmp_x_blockdev_set_iothread(const char *node_name, StrOrNull *iothread, 3702 bool has_force, bool force, Error **errp) 3703 { 3704 AioContext *old_context; 3705 AioContext *new_context; 3706 BlockDriverState *bs; 3707 3708 bs = bdrv_find_node(node_name); 3709 if (!bs) { 3710 error_setg(errp, "Failed to find node with node-name='%s'", node_name); 3711 return; 3712 } 3713 3714 /* Protects against accidents. */ 3715 if (!(has_force && force) && bdrv_has_blk(bs)) { 3716 error_setg(errp, "Node %s is associated with a BlockBackend and could " 3717 "be in use (use force=true to override this check)", 3718 node_name); 3719 return; 3720 } 3721 3722 if (iothread->type == QTYPE_QSTRING) { 3723 IOThread *obj = iothread_by_id(iothread->u.s); 3724 if (!obj) { 3725 error_setg(errp, "Cannot find iothread %s", iothread->u.s); 3726 return; 3727 } 3728 3729 new_context = iothread_get_aio_context(obj); 3730 } else { 3731 new_context = qemu_get_aio_context(); 3732 } 3733 3734 old_context = bdrv_get_aio_context(bs); 3735 aio_context_acquire(old_context); 3736 3737 bdrv_try_change_aio_context(bs, new_context, NULL, errp); 3738 3739 aio_context_release(old_context); 3740 } 3741 3742 QemuOptsList qemu_common_drive_opts = { 3743 .name = "drive", 3744 .head = QTAILQ_HEAD_INITIALIZER(qemu_common_drive_opts.head), 3745 .desc = { 3746 { 3747 .name = "snapshot", 3748 .type = QEMU_OPT_BOOL, 3749 .help = "enable/disable snapshot mode", 3750 },{ 3751 .name = "aio", 3752 .type = QEMU_OPT_STRING, 3753 .help = "host AIO implementation (threads, native, io_uring)", 3754 },{ 3755 .name = BDRV_OPT_CACHE_WB, 3756 .type = QEMU_OPT_BOOL, 3757 .help = "Enable writeback 
mode", 3758 },{ 3759 .name = "format", 3760 .type = QEMU_OPT_STRING, 3761 .help = "disk format (raw, qcow2, ...)", 3762 },{ 3763 .name = "rerror", 3764 .type = QEMU_OPT_STRING, 3765 .help = "read error action", 3766 },{ 3767 .name = "werror", 3768 .type = QEMU_OPT_STRING, 3769 .help = "write error action", 3770 },{ 3771 .name = BDRV_OPT_READ_ONLY, 3772 .type = QEMU_OPT_BOOL, 3773 .help = "open drive file as read-only", 3774 }, 3775 3776 THROTTLE_OPTS, 3777 3778 { 3779 .name = "throttling.group", 3780 .type = QEMU_OPT_STRING, 3781 .help = "name of the block throttling group", 3782 },{ 3783 .name = "copy-on-read", 3784 .type = QEMU_OPT_BOOL, 3785 .help = "copy read data from backing file into image file", 3786 },{ 3787 .name = "detect-zeroes", 3788 .type = QEMU_OPT_STRING, 3789 .help = "try to optimize zero writes (off, on, unmap)", 3790 },{ 3791 .name = "stats-account-invalid", 3792 .type = QEMU_OPT_BOOL, 3793 .help = "whether to account for invalid I/O operations " 3794 "in the statistics", 3795 },{ 3796 .name = "stats-account-failed", 3797 .type = QEMU_OPT_BOOL, 3798 .help = "whether to account for failed I/O operations " 3799 "in the statistics", 3800 }, 3801 { /* end of list */ } 3802 }, 3803 }; 3804 3805 QemuOptsList qemu_drive_opts = { 3806 .name = "drive", 3807 .head = QTAILQ_HEAD_INITIALIZER(qemu_drive_opts.head), 3808 .desc = { 3809 /* 3810 * no elements => accept any params 3811 * validation will happen later 3812 */ 3813 { /* end of list */ } 3814 }, 3815 }; 3816