156ee8626SKevin Wolf /* 256ee8626SKevin Wolf * Common block export infrastructure 356ee8626SKevin Wolf * 456ee8626SKevin Wolf * Copyright (c) 2012, 2020 Red Hat, Inc. 556ee8626SKevin Wolf * 656ee8626SKevin Wolf * Authors: 756ee8626SKevin Wolf * Paolo Bonzini <pbonzini@redhat.com> 856ee8626SKevin Wolf * Kevin Wolf <kwolf@redhat.com> 956ee8626SKevin Wolf * 1056ee8626SKevin Wolf * This work is licensed under the terms of the GNU GPL, version 2 or 1156ee8626SKevin Wolf * later. See the COPYING file in the top-level directory. 1256ee8626SKevin Wolf */ 1356ee8626SKevin Wolf 1456ee8626SKevin Wolf #include "qemu/osdep.h" 1556ee8626SKevin Wolf 169b562c64SKevin Wolf #include "block/block.h" 179b562c64SKevin Wolf #include "sysemu/block-backend.h" 18f51d23c8SStefan Hajnoczi #include "sysemu/iothread.h" 1956ee8626SKevin Wolf #include "block/export.h" 200c9b70d5SMax Reitz #include "block/fuse.h" 2156ee8626SKevin Wolf #include "block/nbd.h" 2256ee8626SKevin Wolf #include "qapi/error.h" 2356ee8626SKevin Wolf #include "qapi/qapi-commands-block-export.h" 241a9f7a80SKevin Wolf #include "qapi/qapi-events-block-export.h" 25d53be9ceSKevin Wolf #include "qemu/id.h" 26bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER 273a213f83SStefan Hajnoczi #include "vhost-user-blk-server.h" 283a213f83SStefan Hajnoczi #endif 292a2359b8SXie Yongji #ifdef CONFIG_VDUSE_BLK_EXPORT 302a2359b8SXie Yongji #include "vduse-blk.h" 312a2359b8SXie Yongji #endif 3256ee8626SKevin Wolf 3356ee8626SKevin Wolf static const BlockExportDriver *blk_exp_drivers[] = { 3456ee8626SKevin Wolf &blk_exp_nbd, 35bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER 3690fc91d5SStefan Hajnoczi &blk_exp_vhost_user_blk, 3790fc91d5SStefan Hajnoczi #endif 380c9b70d5SMax Reitz #ifdef CONFIG_FUSE 390c9b70d5SMax Reitz &blk_exp_fuse, 400c9b70d5SMax Reitz #endif 412a2359b8SXie Yongji #ifdef CONFIG_VDUSE_BLK_EXPORT 422a2359b8SXie Yongji &blk_exp_vduse_blk, 432a2359b8SXie Yongji #endif 4456ee8626SKevin Wolf }; 4556ee8626SKevin Wolf 46bc4ee65bSKevin Wolf /* Only accessed from the main thread */ 47bc4ee65bSKevin Wolf static QLIST_HEAD(, BlockExport) block_exports = 48bc4ee65bSKevin Wolf QLIST_HEAD_INITIALIZER(block_exports); 49bc4ee65bSKevin Wolf 503c3bc462SKevin Wolf BlockExport *blk_exp_find(const char *id) 51d53be9ceSKevin Wolf { 52d53be9ceSKevin Wolf BlockExport *exp; 53d53be9ceSKevin Wolf 54d53be9ceSKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 55d53be9ceSKevin Wolf if (strcmp(id, exp->id) == 0) { 56d53be9ceSKevin Wolf return exp; 57d53be9ceSKevin Wolf } 58d53be9ceSKevin Wolf } 59d53be9ceSKevin Wolf 60d53be9ceSKevin Wolf return NULL; 61d53be9ceSKevin Wolf } 62d53be9ceSKevin Wolf 6356ee8626SKevin Wolf static const BlockExportDriver *blk_exp_find_driver(BlockExportType type) 6456ee8626SKevin Wolf { 6556ee8626SKevin Wolf int i; 6656ee8626SKevin Wolf 6756ee8626SKevin Wolf for (i = 0; i < ARRAY_SIZE(blk_exp_drivers); i++) { 6856ee8626SKevin Wolf if (blk_exp_drivers[i]->type == type) { 6956ee8626SKevin Wolf return blk_exp_drivers[i]; 7056ee8626SKevin Wolf } 7156ee8626SKevin Wolf } 7256ee8626SKevin Wolf return NULL; 7356ee8626SKevin Wolf } 7456ee8626SKevin Wolf 759b562c64SKevin Wolf BlockExport *blk_exp_add(BlockExportOptions *export, Error **errp) 7656ee8626SKevin Wolf { 77f51d23c8SStefan Hajnoczi bool fixed_iothread = export->has_fixed_iothread && export->fixed_iothread; 7856ee8626SKevin Wolf const BlockExportDriver *drv; 79331170e0SKevin Wolf BlockExport *exp = NULL; 80331170e0SKevin Wolf BlockDriverState *bs; 81f51d23c8SStefan Hajnoczi BlockBackend *blk = NULL; 82331170e0SKevin Wolf AioContext *ctx; 8330dbc81dSKevin Wolf uint64_t perm; 84a6ff7989SKevin Wolf int ret; 8556ee8626SKevin Wolf 862b3912f1SKevin Wolf GLOBAL_STATE_CODE(); 872b3912f1SKevin Wolf 88d53be9ceSKevin Wolf if (!id_wellformed(export->id)) { 89d53be9ceSKevin Wolf error_setg(errp, "Invalid block export id"); 90d53be9ceSKevin Wolf return NULL; 91d53be9ceSKevin Wolf } 92d53be9ceSKevin Wolf if (blk_exp_find(export->id)) { 93d53be9ceSKevin Wolf error_setg(errp, "Block export id '%s' is already in use", export->id); 94d53be9ceSKevin Wolf return NULL; 95d53be9ceSKevin Wolf } 96d53be9ceSKevin Wolf 9756ee8626SKevin Wolf drv = blk_exp_find_driver(export->type); 9856ee8626SKevin Wolf if (!drv) { 9956ee8626SKevin Wolf error_setg(errp, "No driver found for the requested export type"); 1009b562c64SKevin Wolf return NULL; 10156ee8626SKevin Wolf } 10256ee8626SKevin Wolf 103331170e0SKevin Wolf bs = bdrv_lookup_bs(NULL, export->node_name, errp); 104331170e0SKevin Wolf if (!bs) { 105331170e0SKevin Wolf return NULL; 106331170e0SKevin Wolf } 107331170e0SKevin Wolf 10830dbc81dSKevin Wolf if (!export->has_writable) { 10930dbc81dSKevin Wolf export->writable = false; 11030dbc81dSKevin Wolf } 11130dbc81dSKevin Wolf if (bdrv_is_read_only(bs) && export->writable) { 11230dbc81dSKevin Wolf error_setg(errp, "Cannot export read-only node as writable"); 11330dbc81dSKevin Wolf return NULL; 11430dbc81dSKevin Wolf } 11530dbc81dSKevin Wolf 116331170e0SKevin Wolf ctx = bdrv_get_aio_context(bs); 117331170e0SKevin Wolf 11854fde4ffSMarkus Armbruster if (export->iothread) { 119f51d23c8SStefan Hajnoczi IOThread *iothread; 120f51d23c8SStefan Hajnoczi AioContext *new_ctx; 1218573823fSMax Reitz Error **set_context_errp; 122f51d23c8SStefan Hajnoczi 123f51d23c8SStefan Hajnoczi iothread = iothread_by_id(export->iothread); 124f51d23c8SStefan Hajnoczi if (!iothread) { 125f51d23c8SStefan Hajnoczi error_setg(errp, "iothread \"%s\" not found", export->iothread); 126f51d23c8SStefan Hajnoczi goto fail; 127f51d23c8SStefan Hajnoczi } 128f51d23c8SStefan Hajnoczi 129f51d23c8SStefan Hajnoczi new_ctx = iothread_get_aio_context(iothread); 130f51d23c8SStefan Hajnoczi 1318573823fSMax Reitz /* Ignore errors with fixed-iothread=false */ 1328573823fSMax Reitz set_context_errp = fixed_iothread ? errp : NULL; 133142e6907SEmanuele Giuseppe Esposito ret = bdrv_try_change_aio_context(bs, new_ctx, NULL, set_context_errp); 134f51d23c8SStefan Hajnoczi if (ret == 0) { 135f51d23c8SStefan Hajnoczi ctx = new_ctx; 136f51d23c8SStefan Hajnoczi } else if (fixed_iothread) { 137f51d23c8SStefan Hajnoczi goto fail; 138f51d23c8SStefan Hajnoczi } 139f51d23c8SStefan Hajnoczi } 140f51d23c8SStefan Hajnoczi 141331170e0SKevin Wolf /* 142331170e0SKevin Wolf * Block exports are used for non-shared storage migration. Make sure 143331170e0SKevin Wolf * that BDRV_O_INACTIVE is cleared and the image is ready for write 144331170e0SKevin Wolf * access since the export could be available before migration handover. 145331170e0SKevin Wolf * ctx was acquired in the caller. 146331170e0SKevin Wolf */ 1472b3912f1SKevin Wolf bdrv_graph_rdlock_main_loop(); 148a94750d9SEmanuele Giuseppe Esposito bdrv_activate(bs, NULL); 1492b3912f1SKevin Wolf bdrv_graph_rdunlock_main_loop(); 150331170e0SKevin Wolf 15130dbc81dSKevin Wolf perm = BLK_PERM_CONSISTENT_READ; 15230dbc81dSKevin Wolf if (export->writable) { 15330dbc81dSKevin Wolf perm |= BLK_PERM_WRITE; 15430dbc81dSKevin Wolf } 15530dbc81dSKevin Wolf 15630dbc81dSKevin Wolf blk = blk_new(ctx, perm, BLK_PERM_ALL); 157f51d23c8SStefan Hajnoczi 158f51d23c8SStefan Hajnoczi if (!fixed_iothread) { 159f51d23c8SStefan Hajnoczi blk_set_allow_aio_context_change(blk, true); 160f51d23c8SStefan Hajnoczi } 161f51d23c8SStefan Hajnoczi 162331170e0SKevin Wolf ret = blk_insert_bs(blk, bs, errp); 163331170e0SKevin Wolf if (ret < 0) { 164331170e0SKevin Wolf goto fail; 165331170e0SKevin Wolf } 166331170e0SKevin Wolf 167331170e0SKevin Wolf if (!export->has_writethrough) { 168331170e0SKevin Wolf export->writethrough = false; 169331170e0SKevin Wolf } 170331170e0SKevin Wolf blk_set_enable_write_cache(blk, !export->writethrough); 171331170e0SKevin Wolf 172a6ff7989SKevin Wolf assert(drv->instance_size >= sizeof(BlockExport)); 173a6ff7989SKevin Wolf exp = g_malloc0(drv->instance_size); 174a6ff7989SKevin Wolf *exp = (BlockExport) { 175a6ff7989SKevin Wolf .drv = drv, 176a6ff7989SKevin Wolf .refcount = 1, 1773859ad36SKevin Wolf .user_owned = true, 178d53be9ceSKevin Wolf .id = g_strdup(export->id), 179331170e0SKevin Wolf .ctx = ctx, 180331170e0SKevin Wolf .blk = blk, 181a6ff7989SKevin Wolf }; 182a6ff7989SKevin Wolf 183a6ff7989SKevin Wolf ret = drv->create(exp, export, errp); 184a6ff7989SKevin Wolf if (ret < 0) { 185331170e0SKevin Wolf goto fail; 186a6ff7989SKevin Wolf } 187a6ff7989SKevin Wolf 18837a4f70cSKevin Wolf assert(exp->blk != NULL); 18937a4f70cSKevin Wolf 190bc4ee65bSKevin Wolf QLIST_INSERT_HEAD(&block_exports, exp, next); 191a6ff7989SKevin Wolf return exp; 192331170e0SKevin Wolf 193331170e0SKevin Wolf fail: 194a1845637SKevin Wolf if (blk) { 195a1845637SKevin Wolf blk_set_dev_ops(blk, NULL, NULL); 196331170e0SKevin Wolf blk_unref(blk); 197a1845637SKevin Wolf } 198331170e0SKevin Wolf if (exp) { 199331170e0SKevin Wolf g_free(exp->id); 200331170e0SKevin Wolf g_free(exp); 201331170e0SKevin Wolf } 202331170e0SKevin Wolf return NULL; 2039b562c64SKevin Wolf } 2049b562c64SKevin Wolf 205c69de1beSKevin Wolf void blk_exp_ref(BlockExport *exp) 206c69de1beSKevin Wolf { 2073d499a43SStefan Hajnoczi assert(qatomic_read(&exp->refcount) > 0); 2083d499a43SStefan Hajnoczi qatomic_inc(&exp->refcount); 209c69de1beSKevin Wolf } 210c69de1beSKevin Wolf 211bc4ee65bSKevin Wolf /* Runs in the main thread */ 212bc4ee65bSKevin Wolf static void blk_exp_delete_bh(void *opaque) 213bc4ee65bSKevin Wolf { 214bc4ee65bSKevin Wolf BlockExport *exp = opaque; 215bc4ee65bSKevin Wolf 216bc4ee65bSKevin Wolf assert(exp->refcount == 0); 217bc4ee65bSKevin Wolf QLIST_REMOVE(exp, next); 218bc4ee65bSKevin Wolf exp->drv->delete(exp); 219de79b526SStefan Hajnoczi blk_set_dev_ops(exp->blk, NULL, NULL); 22037a4f70cSKevin Wolf blk_unref(exp->blk); 2211a9f7a80SKevin Wolf qapi_event_send_block_export_deleted(exp->id); 222d53be9ceSKevin Wolf g_free(exp->id); 223bc4ee65bSKevin Wolf g_free(exp); 224bc4ee65bSKevin Wolf } 225bc4ee65bSKevin Wolf 226c69de1beSKevin Wolf void blk_exp_unref(BlockExport *exp) 227c69de1beSKevin Wolf { 2283d499a43SStefan Hajnoczi assert(qatomic_read(&exp->refcount) > 0); 2293d499a43SStefan Hajnoczi if (qatomic_fetch_dec(&exp->refcount) == 1) { 230bc4ee65bSKevin Wolf /* Touch the block_exports list only in the main thread */ 231bc4ee65bSKevin Wolf aio_bh_schedule_oneshot(qemu_get_aio_context(), blk_exp_delete_bh, 232bc4ee65bSKevin Wolf exp); 233c69de1beSKevin Wolf } 234c69de1beSKevin Wolf } 235c69de1beSKevin Wolf 236bc4ee65bSKevin Wolf /* 237bc4ee65bSKevin Wolf * Drops the user reference to the export and requests that all client 238bc4ee65bSKevin Wolf * connections and other internally held references start to shut down. When 239bc4ee65bSKevin Wolf * the function returns, there may still be active references while the export 240bc4ee65bSKevin Wolf * is in the process of shutting down. 241bc4ee65bSKevin Wolf */ 242bc4ee65bSKevin Wolf void blk_exp_request_shutdown(BlockExport *exp) 243bc4ee65bSKevin Wolf { 2443c3bc462SKevin Wolf /* 2453c3bc462SKevin Wolf * If the user doesn't own the export any more, it is already shutting 2463c3bc462SKevin Wolf * down. We must not call .request_shutdown and decrease the refcount a 2473c3bc462SKevin Wolf * second time. 2483c3bc462SKevin Wolf */ 2493c3bc462SKevin Wolf if (!exp->user_owned) { 250*b49f4755SStefan Hajnoczi return; 2513c3bc462SKevin Wolf } 2523c3bc462SKevin Wolf 253bc4ee65bSKevin Wolf exp->drv->request_shutdown(exp); 2543859ad36SKevin Wolf 2553859ad36SKevin Wolf assert(exp->user_owned); 2563859ad36SKevin Wolf exp->user_owned = false; 2573859ad36SKevin Wolf blk_exp_unref(exp); 258bc4ee65bSKevin Wolf } 259bc4ee65bSKevin Wolf 260bc4ee65bSKevin Wolf /* 261bc4ee65bSKevin Wolf * Returns whether a block export of the given type exists. 262bc4ee65bSKevin Wolf * type == BLOCK_EXPORT_TYPE__MAX checks for an export of any type. 263bc4ee65bSKevin Wolf */ 264bc4ee65bSKevin Wolf static bool blk_exp_has_type(BlockExportType type) 265bc4ee65bSKevin Wolf { 266bc4ee65bSKevin Wolf BlockExport *exp; 267bc4ee65bSKevin Wolf 268bc4ee65bSKevin Wolf if (type == BLOCK_EXPORT_TYPE__MAX) { 269bc4ee65bSKevin Wolf return !QLIST_EMPTY(&block_exports); 270bc4ee65bSKevin Wolf } 271bc4ee65bSKevin Wolf 272bc4ee65bSKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 273bc4ee65bSKevin Wolf if (exp->drv->type == type) { 274bc4ee65bSKevin Wolf return true; 275bc4ee65bSKevin Wolf } 276bc4ee65bSKevin Wolf } 277bc4ee65bSKevin Wolf 278bc4ee65bSKevin Wolf return false; 279bc4ee65bSKevin Wolf } 280bc4ee65bSKevin Wolf 281bc4ee65bSKevin Wolf /* type == BLOCK_EXPORT_TYPE__MAX for all types */ 282bc4ee65bSKevin Wolf void blk_exp_close_all_type(BlockExportType type) 283bc4ee65bSKevin Wolf { 284bc4ee65bSKevin Wolf BlockExport *exp, *next; 285bc4ee65bSKevin Wolf 286bc4ee65bSKevin Wolf assert(in_aio_context_home_thread(qemu_get_aio_context())); 287bc4ee65bSKevin Wolf 288bc4ee65bSKevin Wolf QLIST_FOREACH_SAFE(exp, &block_exports, next, next) { 289bc4ee65bSKevin Wolf if (type != BLOCK_EXPORT_TYPE__MAX && exp->drv->type != type) { 290bc4ee65bSKevin Wolf continue; 291bc4ee65bSKevin Wolf } 292bc4ee65bSKevin Wolf blk_exp_request_shutdown(exp); 293bc4ee65bSKevin Wolf } 294bc4ee65bSKevin Wolf 295e5568a66SStefan Hajnoczi AIO_WAIT_WHILE_UNLOCKED(NULL, blk_exp_has_type(type)); 296bc4ee65bSKevin Wolf } 297bc4ee65bSKevin Wolf 298bc4ee65bSKevin Wolf void blk_exp_close_all(void) 299bc4ee65bSKevin Wolf { 300bc4ee65bSKevin Wolf blk_exp_close_all_type(BLOCK_EXPORT_TYPE__MAX); 301bc4ee65bSKevin Wolf } 302bc4ee65bSKevin Wolf 3039b562c64SKevin Wolf void qmp_block_export_add(BlockExportOptions *export, Error **errp) 3049b562c64SKevin Wolf { 3059b562c64SKevin Wolf blk_exp_add(export, errp); 30656ee8626SKevin Wolf } 3073c3bc462SKevin Wolf 3083c3bc462SKevin Wolf void qmp_block_export_del(const char *id, 3093c3bc462SKevin Wolf bool has_mode, BlockExportRemoveMode mode, 3103c3bc462SKevin Wolf Error **errp) 3113c3bc462SKevin Wolf { 3123c3bc462SKevin Wolf ERRP_GUARD(); 3133c3bc462SKevin Wolf BlockExport *exp; 3143c3bc462SKevin Wolf 3153c3bc462SKevin Wolf exp = blk_exp_find(id); 3163c3bc462SKevin Wolf if (exp == NULL) { 3173c3bc462SKevin Wolf error_setg(errp, "Export '%s' is not found", id); 3183c3bc462SKevin Wolf return; 3193c3bc462SKevin Wolf } 3203c3bc462SKevin Wolf if (!exp->user_owned) { 3213c3bc462SKevin Wolf error_setg(errp, "Export '%s' is already shutting down", id); 3223c3bc462SKevin Wolf return; 3233c3bc462SKevin Wolf } 3243c3bc462SKevin Wolf 3253c3bc462SKevin Wolf if (!has_mode) { 3263c3bc462SKevin Wolf mode = BLOCK_EXPORT_REMOVE_MODE_SAFE; 3273c3bc462SKevin Wolf } 3283d499a43SStefan Hajnoczi if (mode == BLOCK_EXPORT_REMOVE_MODE_SAFE && 3293d499a43SStefan Hajnoczi qatomic_read(&exp->refcount) > 1) { 3303c3bc462SKevin Wolf error_setg(errp, "export '%s' still in use", exp->id); 3313c3bc462SKevin Wolf error_append_hint(errp, "Use mode='hard' to force client " 3323c3bc462SKevin Wolf "disconnect\n"); 3333c3bc462SKevin Wolf return; 3343c3bc462SKevin Wolf } 3353c3bc462SKevin Wolf 3363c3bc462SKevin Wolf blk_exp_request_shutdown(exp); 3373c3bc462SKevin Wolf } 3388cade320SKevin Wolf 3398cade320SKevin Wolf BlockExportInfoList *qmp_query_block_exports(Error **errp) 3408cade320SKevin Wolf { 341c3033fd3SEric Blake BlockExportInfoList *head = NULL, **tail = &head; 3428cade320SKevin Wolf BlockExport *exp; 3438cade320SKevin Wolf 3448cade320SKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 3458cade320SKevin Wolf BlockExportInfo *info = g_new(BlockExportInfo, 1); 3468cade320SKevin Wolf *info = (BlockExportInfo) { 3478cade320SKevin Wolf .id = g_strdup(exp->id), 3488cade320SKevin Wolf .type = exp->drv->type, 3498cade320SKevin Wolf .node_name = g_strdup(bdrv_get_node_name(blk_bs(exp->blk))), 3508cade320SKevin Wolf .shutting_down = !exp->user_owned, 3518cade320SKevin Wolf }; 3528cade320SKevin Wolf 353c3033fd3SEric Blake QAPI_LIST_APPEND(tail, info); 3548cade320SKevin Wolf } 3558cade320SKevin Wolf 3568cade320SKevin Wolf return head; 3578cade320SKevin Wolf } 358