156ee8626SKevin Wolf /* 256ee8626SKevin Wolf * Common block export infrastructure 356ee8626SKevin Wolf * 456ee8626SKevin Wolf * Copyright (c) 2012, 2020 Red Hat, Inc. 556ee8626SKevin Wolf * 656ee8626SKevin Wolf * Authors: 756ee8626SKevin Wolf * Paolo Bonzini <pbonzini@redhat.com> 856ee8626SKevin Wolf * Kevin Wolf <kwolf@redhat.com> 956ee8626SKevin Wolf * 1056ee8626SKevin Wolf * This work is licensed under the terms of the GNU GPL, version 2 or 1156ee8626SKevin Wolf * later. See the COPYING file in the top-level directory. 1256ee8626SKevin Wolf */ 1356ee8626SKevin Wolf 1456ee8626SKevin Wolf #include "qemu/osdep.h" 1556ee8626SKevin Wolf 169b562c64SKevin Wolf #include "block/block.h" 179b562c64SKevin Wolf #include "sysemu/block-backend.h" 18f51d23c8SStefan Hajnoczi #include "sysemu/iothread.h" 1956ee8626SKevin Wolf #include "block/export.h" 200c9b70d5SMax Reitz #include "block/fuse.h" 2156ee8626SKevin Wolf #include "block/nbd.h" 2256ee8626SKevin Wolf #include "qapi/error.h" 2356ee8626SKevin Wolf #include "qapi/qapi-commands-block-export.h" 241a9f7a80SKevin Wolf #include "qapi/qapi-events-block-export.h" 25d53be9ceSKevin Wolf #include "qemu/id.h" 26bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER 273a213f83SStefan Hajnoczi #include "vhost-user-blk-server.h" 283a213f83SStefan Hajnoczi #endif 2956ee8626SKevin Wolf 3056ee8626SKevin Wolf static const BlockExportDriver *blk_exp_drivers[] = { 3156ee8626SKevin Wolf &blk_exp_nbd, 32bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER 3390fc91d5SStefan Hajnoczi &blk_exp_vhost_user_blk, 3490fc91d5SStefan Hajnoczi #endif 350c9b70d5SMax Reitz #ifdef CONFIG_FUSE 360c9b70d5SMax Reitz &blk_exp_fuse, 370c9b70d5SMax Reitz #endif 3856ee8626SKevin Wolf }; 3956ee8626SKevin Wolf 40bc4ee65bSKevin Wolf /* Only accessed from the main thread */ 41bc4ee65bSKevin Wolf static QLIST_HEAD(, BlockExport) block_exports = 42bc4ee65bSKevin Wolf QLIST_HEAD_INITIALIZER(block_exports); 43bc4ee65bSKevin Wolf 443c3bc462SKevin Wolf BlockExport *blk_exp_find(const char *id) 45d53be9ceSKevin Wolf { 46d53be9ceSKevin Wolf BlockExport *exp; 47d53be9ceSKevin Wolf 48d53be9ceSKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 49d53be9ceSKevin Wolf if (strcmp(id, exp->id) == 0) { 50d53be9ceSKevin Wolf return exp; 51d53be9ceSKevin Wolf } 52d53be9ceSKevin Wolf } 53d53be9ceSKevin Wolf 54d53be9ceSKevin Wolf return NULL; 55d53be9ceSKevin Wolf } 56d53be9ceSKevin Wolf 5756ee8626SKevin Wolf static const BlockExportDriver *blk_exp_find_driver(BlockExportType type) 5856ee8626SKevin Wolf { 5956ee8626SKevin Wolf int i; 6056ee8626SKevin Wolf 6156ee8626SKevin Wolf for (i = 0; i < ARRAY_SIZE(blk_exp_drivers); i++) { 6256ee8626SKevin Wolf if (blk_exp_drivers[i]->type == type) { 6356ee8626SKevin Wolf return blk_exp_drivers[i]; 6456ee8626SKevin Wolf } 6556ee8626SKevin Wolf } 6656ee8626SKevin Wolf return NULL; 6756ee8626SKevin Wolf } 6856ee8626SKevin Wolf 699b562c64SKevin Wolf BlockExport *blk_exp_add(BlockExportOptions *export, Error **errp) 7056ee8626SKevin Wolf { 71f51d23c8SStefan Hajnoczi bool fixed_iothread = export->has_fixed_iothread && export->fixed_iothread; 7256ee8626SKevin Wolf const BlockExportDriver *drv; 73331170e0SKevin Wolf BlockExport *exp = NULL; 74331170e0SKevin Wolf BlockDriverState *bs; 75f51d23c8SStefan Hajnoczi BlockBackend *blk = NULL; 76331170e0SKevin Wolf AioContext *ctx; 7730dbc81dSKevin Wolf uint64_t perm; 78a6ff7989SKevin Wolf int ret; 7956ee8626SKevin Wolf 80d53be9ceSKevin Wolf if (!id_wellformed(export->id)) { 81d53be9ceSKevin Wolf error_setg(errp, "Invalid block export id"); 82d53be9ceSKevin Wolf return NULL; 83d53be9ceSKevin Wolf } 84d53be9ceSKevin Wolf if (blk_exp_find(export->id)) { 85d53be9ceSKevin Wolf error_setg(errp, "Block export id '%s' is already in use", export->id); 86d53be9ceSKevin Wolf return NULL; 87d53be9ceSKevin Wolf } 88d53be9ceSKevin Wolf 8956ee8626SKevin Wolf drv = blk_exp_find_driver(export->type); 9056ee8626SKevin Wolf if (!drv) { 9156ee8626SKevin Wolf error_setg(errp, "No driver found for the requested export type"); 929b562c64SKevin Wolf return NULL; 9356ee8626SKevin Wolf } 9456ee8626SKevin Wolf 95331170e0SKevin Wolf bs = bdrv_lookup_bs(NULL, export->node_name, errp); 96331170e0SKevin Wolf if (!bs) { 97331170e0SKevin Wolf return NULL; 98331170e0SKevin Wolf } 99331170e0SKevin Wolf 10030dbc81dSKevin Wolf if (!export->has_writable) { 10130dbc81dSKevin Wolf export->writable = false; 10230dbc81dSKevin Wolf } 10330dbc81dSKevin Wolf if (bdrv_is_read_only(bs) && export->writable) { 10430dbc81dSKevin Wolf error_setg(errp, "Cannot export read-only node as writable"); 10530dbc81dSKevin Wolf return NULL; 10630dbc81dSKevin Wolf } 10730dbc81dSKevin Wolf 108331170e0SKevin Wolf ctx = bdrv_get_aio_context(bs); 109331170e0SKevin Wolf aio_context_acquire(ctx); 110331170e0SKevin Wolf 111f51d23c8SStefan Hajnoczi if (export->has_iothread) { 112f51d23c8SStefan Hajnoczi IOThread *iothread; 113f51d23c8SStefan Hajnoczi AioContext *new_ctx; 114*8573823fSMax Reitz Error **set_context_errp; 115f51d23c8SStefan Hajnoczi 116f51d23c8SStefan Hajnoczi iothread = iothread_by_id(export->iothread); 117f51d23c8SStefan Hajnoczi if (!iothread) { 118f51d23c8SStefan Hajnoczi error_setg(errp, "iothread \"%s\" not found", export->iothread); 119f51d23c8SStefan Hajnoczi goto fail; 120f51d23c8SStefan Hajnoczi } 121f51d23c8SStefan Hajnoczi 122f51d23c8SStefan Hajnoczi new_ctx = iothread_get_aio_context(iothread); 123f51d23c8SStefan Hajnoczi 124*8573823fSMax Reitz /* Ignore errors with fixed-iothread=false */ 125*8573823fSMax Reitz set_context_errp = fixed_iothread ? errp : NULL; 126*8573823fSMax Reitz ret = bdrv_try_set_aio_context(bs, new_ctx, set_context_errp); 127f51d23c8SStefan Hajnoczi if (ret == 0) { 128f51d23c8SStefan Hajnoczi aio_context_release(ctx); 129f51d23c8SStefan Hajnoczi aio_context_acquire(new_ctx); 130f51d23c8SStefan Hajnoczi ctx = new_ctx; 131f51d23c8SStefan Hajnoczi } else if (fixed_iothread) { 132f51d23c8SStefan Hajnoczi goto fail; 133f51d23c8SStefan Hajnoczi } 134f51d23c8SStefan Hajnoczi } 135f51d23c8SStefan Hajnoczi 136331170e0SKevin Wolf /* 137331170e0SKevin Wolf * Block exports are used for non-shared storage migration. Make sure 138331170e0SKevin Wolf * that BDRV_O_INACTIVE is cleared and the image is ready for write 139331170e0SKevin Wolf * access since the export could be available before migration handover. 140331170e0SKevin Wolf * ctx was acquired in the caller. 141331170e0SKevin Wolf */ 142331170e0SKevin Wolf bdrv_invalidate_cache(bs, NULL); 143331170e0SKevin Wolf 14430dbc81dSKevin Wolf perm = BLK_PERM_CONSISTENT_READ; 14530dbc81dSKevin Wolf if (export->writable) { 14630dbc81dSKevin Wolf perm |= BLK_PERM_WRITE; 14730dbc81dSKevin Wolf } 14830dbc81dSKevin Wolf 14930dbc81dSKevin Wolf blk = blk_new(ctx, perm, BLK_PERM_ALL); 150f51d23c8SStefan Hajnoczi 151f51d23c8SStefan Hajnoczi if (!fixed_iothread) { 152f51d23c8SStefan Hajnoczi blk_set_allow_aio_context_change(blk, true); 153f51d23c8SStefan Hajnoczi } 154f51d23c8SStefan Hajnoczi 155331170e0SKevin Wolf ret = blk_insert_bs(blk, bs, errp); 156331170e0SKevin Wolf if (ret < 0) { 157331170e0SKevin Wolf goto fail; 158331170e0SKevin Wolf } 159331170e0SKevin Wolf 160331170e0SKevin Wolf if (!export->has_writethrough) { 161331170e0SKevin Wolf export->writethrough = false; 162331170e0SKevin Wolf } 163331170e0SKevin Wolf blk_set_enable_write_cache(blk, !export->writethrough); 164331170e0SKevin Wolf 165a6ff7989SKevin Wolf assert(drv->instance_size >= sizeof(BlockExport)); 166a6ff7989SKevin Wolf exp = g_malloc0(drv->instance_size); 167a6ff7989SKevin Wolf *exp = (BlockExport) { 168a6ff7989SKevin Wolf .drv = drv, 169a6ff7989SKevin Wolf .refcount = 1, 1703859ad36SKevin Wolf .user_owned = true, 171d53be9ceSKevin Wolf .id = g_strdup(export->id), 172331170e0SKevin Wolf .ctx = ctx, 173331170e0SKevin Wolf .blk = blk, 174a6ff7989SKevin Wolf }; 175a6ff7989SKevin Wolf 176a6ff7989SKevin Wolf ret = drv->create(exp, export, errp); 177a6ff7989SKevin Wolf if (ret < 0) { 178331170e0SKevin Wolf goto fail; 179a6ff7989SKevin Wolf } 180a6ff7989SKevin Wolf 18137a4f70cSKevin Wolf assert(exp->blk != NULL); 18237a4f70cSKevin Wolf 183bc4ee65bSKevin Wolf QLIST_INSERT_HEAD(&block_exports, exp, next); 184331170e0SKevin Wolf 185331170e0SKevin Wolf aio_context_release(ctx); 186a6ff7989SKevin Wolf return exp; 187331170e0SKevin Wolf 188331170e0SKevin Wolf fail: 189331170e0SKevin Wolf blk_unref(blk); 190331170e0SKevin Wolf aio_context_release(ctx); 191331170e0SKevin Wolf if (exp) { 192331170e0SKevin Wolf g_free(exp->id); 193331170e0SKevin Wolf g_free(exp); 194331170e0SKevin Wolf } 195331170e0SKevin Wolf return NULL; 1969b562c64SKevin Wolf } 1979b562c64SKevin Wolf 1988612c686SKevin Wolf /* Callers must hold exp->ctx lock */ 199c69de1beSKevin Wolf void blk_exp_ref(BlockExport *exp) 200c69de1beSKevin Wolf { 201c69de1beSKevin Wolf assert(exp->refcount > 0); 202c69de1beSKevin Wolf exp->refcount++; 203c69de1beSKevin Wolf } 204c69de1beSKevin Wolf 205bc4ee65bSKevin Wolf /* Runs in the main thread */ 206bc4ee65bSKevin Wolf static void blk_exp_delete_bh(void *opaque) 207bc4ee65bSKevin Wolf { 208bc4ee65bSKevin Wolf BlockExport *exp = opaque; 209bc4ee65bSKevin Wolf AioContext *aio_context = exp->ctx; 210bc4ee65bSKevin Wolf 211bc4ee65bSKevin Wolf aio_context_acquire(aio_context); 212bc4ee65bSKevin Wolf 213bc4ee65bSKevin Wolf assert(exp->refcount == 0); 214bc4ee65bSKevin Wolf QLIST_REMOVE(exp, next); 215bc4ee65bSKevin Wolf exp->drv->delete(exp); 21637a4f70cSKevin Wolf blk_unref(exp->blk); 2171a9f7a80SKevin Wolf qapi_event_send_block_export_deleted(exp->id); 218d53be9ceSKevin Wolf g_free(exp->id); 219bc4ee65bSKevin Wolf g_free(exp); 220bc4ee65bSKevin Wolf 221bc4ee65bSKevin Wolf aio_context_release(aio_context); 222bc4ee65bSKevin Wolf } 223bc4ee65bSKevin Wolf 2248612c686SKevin Wolf /* Callers must hold exp->ctx lock */ 225c69de1beSKevin Wolf void blk_exp_unref(BlockExport *exp) 226c69de1beSKevin Wolf { 227c69de1beSKevin Wolf assert(exp->refcount > 0); 228c69de1beSKevin Wolf if (--exp->refcount == 0) { 229bc4ee65bSKevin Wolf /* Touch the block_exports list only in the main thread */ 230bc4ee65bSKevin Wolf aio_bh_schedule_oneshot(qemu_get_aio_context(), blk_exp_delete_bh, 231bc4ee65bSKevin Wolf exp); 232c69de1beSKevin Wolf } 233c69de1beSKevin Wolf } 234c69de1beSKevin Wolf 235bc4ee65bSKevin Wolf /* 236bc4ee65bSKevin Wolf * Drops the user reference to the export and requests that all client 237bc4ee65bSKevin Wolf * connections and other internally held references start to shut down. When 238bc4ee65bSKevin Wolf * the function returns, there may still be active references while the export 239bc4ee65bSKevin Wolf * is in the process of shutting down. 240bc4ee65bSKevin Wolf * 241bc4ee65bSKevin Wolf * Acquires exp->ctx internally. Callers must *not* hold the lock. 242bc4ee65bSKevin Wolf */ 243bc4ee65bSKevin Wolf void blk_exp_request_shutdown(BlockExport *exp) 244bc4ee65bSKevin Wolf { 245bc4ee65bSKevin Wolf AioContext *aio_context = exp->ctx; 246bc4ee65bSKevin Wolf 247bc4ee65bSKevin Wolf aio_context_acquire(aio_context); 2483c3bc462SKevin Wolf 2493c3bc462SKevin Wolf /* 2503c3bc462SKevin Wolf * If the user doesn't own the export any more, it is already shutting 2513c3bc462SKevin Wolf * down. We must not call .request_shutdown and decrease the refcount a 2523c3bc462SKevin Wolf * second time. 2533c3bc462SKevin Wolf */ 2543c3bc462SKevin Wolf if (!exp->user_owned) { 2553c3bc462SKevin Wolf goto out; 2563c3bc462SKevin Wolf } 2573c3bc462SKevin Wolf 258bc4ee65bSKevin Wolf exp->drv->request_shutdown(exp); 2593859ad36SKevin Wolf 2603859ad36SKevin Wolf assert(exp->user_owned); 2613859ad36SKevin Wolf exp->user_owned = false; 2623859ad36SKevin Wolf blk_exp_unref(exp); 2633859ad36SKevin Wolf 2643c3bc462SKevin Wolf out: 265bc4ee65bSKevin Wolf aio_context_release(aio_context); 266bc4ee65bSKevin Wolf } 267bc4ee65bSKevin Wolf 268bc4ee65bSKevin Wolf /* 269bc4ee65bSKevin Wolf * Returns whether a block export of the given type exists. 270bc4ee65bSKevin Wolf * type == BLOCK_EXPORT_TYPE__MAX checks for an export of any type. 271bc4ee65bSKevin Wolf */ 272bc4ee65bSKevin Wolf static bool blk_exp_has_type(BlockExportType type) 273bc4ee65bSKevin Wolf { 274bc4ee65bSKevin Wolf BlockExport *exp; 275bc4ee65bSKevin Wolf 276bc4ee65bSKevin Wolf if (type == BLOCK_EXPORT_TYPE__MAX) { 277bc4ee65bSKevin Wolf return !QLIST_EMPTY(&block_exports); 278bc4ee65bSKevin Wolf } 279bc4ee65bSKevin Wolf 280bc4ee65bSKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 281bc4ee65bSKevin Wolf if (exp->drv->type == type) { 282bc4ee65bSKevin Wolf return true; 283bc4ee65bSKevin Wolf } 284bc4ee65bSKevin Wolf } 285bc4ee65bSKevin Wolf 286bc4ee65bSKevin Wolf return false; 287bc4ee65bSKevin Wolf } 288bc4ee65bSKevin Wolf 289bc4ee65bSKevin Wolf /* type == BLOCK_EXPORT_TYPE__MAX for all types */ 290bc4ee65bSKevin Wolf void blk_exp_close_all_type(BlockExportType type) 291bc4ee65bSKevin Wolf { 292bc4ee65bSKevin Wolf BlockExport *exp, *next; 293bc4ee65bSKevin Wolf 294bc4ee65bSKevin Wolf assert(in_aio_context_home_thread(qemu_get_aio_context())); 295bc4ee65bSKevin Wolf 296bc4ee65bSKevin Wolf QLIST_FOREACH_SAFE(exp, &block_exports, next, next) { 297bc4ee65bSKevin Wolf if (type != BLOCK_EXPORT_TYPE__MAX && exp->drv->type != type) { 298bc4ee65bSKevin Wolf continue; 299bc4ee65bSKevin Wolf } 300bc4ee65bSKevin Wolf blk_exp_request_shutdown(exp); 301bc4ee65bSKevin Wolf } 302bc4ee65bSKevin Wolf 303bc4ee65bSKevin Wolf AIO_WAIT_WHILE(NULL, blk_exp_has_type(type)); 304bc4ee65bSKevin Wolf } 305bc4ee65bSKevin Wolf 306bc4ee65bSKevin Wolf void blk_exp_close_all(void) 307bc4ee65bSKevin Wolf { 308bc4ee65bSKevin Wolf blk_exp_close_all_type(BLOCK_EXPORT_TYPE__MAX); 309bc4ee65bSKevin Wolf } 310bc4ee65bSKevin Wolf 3119b562c64SKevin Wolf void qmp_block_export_add(BlockExportOptions *export, Error **errp) 3129b562c64SKevin Wolf { 3139b562c64SKevin Wolf blk_exp_add(export, errp); 31456ee8626SKevin Wolf } 3153c3bc462SKevin Wolf 3163c3bc462SKevin Wolf void qmp_block_export_del(const char *id, 3173c3bc462SKevin Wolf bool has_mode, BlockExportRemoveMode mode, 3183c3bc462SKevin Wolf Error **errp) 3193c3bc462SKevin Wolf { 3203c3bc462SKevin Wolf ERRP_GUARD(); 3213c3bc462SKevin Wolf BlockExport *exp; 3223c3bc462SKevin Wolf 3233c3bc462SKevin Wolf exp = blk_exp_find(id); 3243c3bc462SKevin Wolf if (exp == NULL) { 3253c3bc462SKevin Wolf error_setg(errp, "Export '%s' is not found", id); 3263c3bc462SKevin Wolf return; 3273c3bc462SKevin Wolf } 3283c3bc462SKevin Wolf if (!exp->user_owned) { 3293c3bc462SKevin Wolf error_setg(errp, "Export '%s' is already shutting down", id); 3303c3bc462SKevin Wolf return; 3313c3bc462SKevin Wolf } 3323c3bc462SKevin Wolf 3333c3bc462SKevin Wolf if (!has_mode) { 3343c3bc462SKevin Wolf mode = BLOCK_EXPORT_REMOVE_MODE_SAFE; 3353c3bc462SKevin Wolf } 3363c3bc462SKevin Wolf if (mode == BLOCK_EXPORT_REMOVE_MODE_SAFE && exp->refcount > 1) { 3373c3bc462SKevin Wolf error_setg(errp, "export '%s' still in use", exp->id); 3383c3bc462SKevin Wolf error_append_hint(errp, "Use mode='hard' to force client " 3393c3bc462SKevin Wolf "disconnect\n"); 3403c3bc462SKevin Wolf return; 3413c3bc462SKevin Wolf } 3423c3bc462SKevin Wolf 3433c3bc462SKevin Wolf blk_exp_request_shutdown(exp); 3443c3bc462SKevin Wolf } 3458cade320SKevin Wolf 3468cade320SKevin Wolf BlockExportInfoList *qmp_query_block_exports(Error **errp) 3478cade320SKevin Wolf { 348c3033fd3SEric Blake BlockExportInfoList *head = NULL, **tail = &head; 3498cade320SKevin Wolf BlockExport *exp; 3508cade320SKevin Wolf 3518cade320SKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 3528cade320SKevin Wolf BlockExportInfo *info = g_new(BlockExportInfo, 1); 3538cade320SKevin Wolf *info = (BlockExportInfo) { 3548cade320SKevin Wolf .id = g_strdup(exp->id), 3558cade320SKevin Wolf .type = exp->drv->type, 3568cade320SKevin Wolf .node_name = g_strdup(bdrv_get_node_name(blk_bs(exp->blk))), 3578cade320SKevin Wolf .shutting_down = !exp->user_owned, 3588cade320SKevin Wolf }; 3598cade320SKevin Wolf 360c3033fd3SEric Blake QAPI_LIST_APPEND(tail, info); 3618cade320SKevin Wolf } 3628cade320SKevin Wolf 3638cade320SKevin Wolf return head; 3648cade320SKevin Wolf } 365