156ee8626SKevin Wolf /* 256ee8626SKevin Wolf * Common block export infrastructure 356ee8626SKevin Wolf * 456ee8626SKevin Wolf * Copyright (c) 2012, 2020 Red Hat, Inc. 556ee8626SKevin Wolf * 656ee8626SKevin Wolf * Authors: 756ee8626SKevin Wolf * Paolo Bonzini <pbonzini@redhat.com> 856ee8626SKevin Wolf * Kevin Wolf <kwolf@redhat.com> 956ee8626SKevin Wolf * 1056ee8626SKevin Wolf * This work is licensed under the terms of the GNU GPL, version 2 or 1156ee8626SKevin Wolf * later. See the COPYING file in the top-level directory. 1256ee8626SKevin Wolf */ 1356ee8626SKevin Wolf 1456ee8626SKevin Wolf #include "qemu/osdep.h" 1556ee8626SKevin Wolf 169b562c64SKevin Wolf #include "block/block.h" 179b562c64SKevin Wolf #include "sysemu/block-backend.h" 18f51d23c8SStefan Hajnoczi #include "sysemu/iothread.h" 1956ee8626SKevin Wolf #include "block/export.h" 2056ee8626SKevin Wolf #include "block/nbd.h" 2156ee8626SKevin Wolf #include "qapi/error.h" 2256ee8626SKevin Wolf #include "qapi/qapi-commands-block-export.h" 231a9f7a80SKevin Wolf #include "qapi/qapi-events-block-export.h" 24d53be9ceSKevin Wolf #include "qemu/id.h" 25*bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER 263a213f83SStefan Hajnoczi #include "vhost-user-blk-server.h" 273a213f83SStefan Hajnoczi #endif 2856ee8626SKevin Wolf 2956ee8626SKevin Wolf static const BlockExportDriver *blk_exp_drivers[] = { 3056ee8626SKevin Wolf &blk_exp_nbd, 31*bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER 3290fc91d5SStefan Hajnoczi &blk_exp_vhost_user_blk, 3390fc91d5SStefan Hajnoczi #endif 3456ee8626SKevin Wolf }; 3556ee8626SKevin Wolf 36bc4ee65bSKevin Wolf /* Only accessed from the main thread */ 37bc4ee65bSKevin Wolf static QLIST_HEAD(, BlockExport) block_exports = 38bc4ee65bSKevin Wolf QLIST_HEAD_INITIALIZER(block_exports); 39bc4ee65bSKevin Wolf 403c3bc462SKevin Wolf BlockExport *blk_exp_find(const char *id) 41d53be9ceSKevin Wolf { 42d53be9ceSKevin Wolf BlockExport *exp; 43d53be9ceSKevin Wolf 44d53be9ceSKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 45d53be9ceSKevin Wolf if (strcmp(id, exp->id) == 0) { 46d53be9ceSKevin Wolf return exp; 47d53be9ceSKevin Wolf } 48d53be9ceSKevin Wolf } 49d53be9ceSKevin Wolf 50d53be9ceSKevin Wolf return NULL; 51d53be9ceSKevin Wolf } 52d53be9ceSKevin Wolf 5356ee8626SKevin Wolf static const BlockExportDriver *blk_exp_find_driver(BlockExportType type) 5456ee8626SKevin Wolf { 5556ee8626SKevin Wolf int i; 5656ee8626SKevin Wolf 5756ee8626SKevin Wolf for (i = 0; i < ARRAY_SIZE(blk_exp_drivers); i++) { 5856ee8626SKevin Wolf if (blk_exp_drivers[i]->type == type) { 5956ee8626SKevin Wolf return blk_exp_drivers[i]; 6056ee8626SKevin Wolf } 6156ee8626SKevin Wolf } 6256ee8626SKevin Wolf return NULL; 6356ee8626SKevin Wolf } 6456ee8626SKevin Wolf 659b562c64SKevin Wolf BlockExport *blk_exp_add(BlockExportOptions *export, Error **errp) 6656ee8626SKevin Wolf { 67f51d23c8SStefan Hajnoczi bool fixed_iothread = export->has_fixed_iothread && export->fixed_iothread; 6856ee8626SKevin Wolf const BlockExportDriver *drv; 69331170e0SKevin Wolf BlockExport *exp = NULL; 70331170e0SKevin Wolf BlockDriverState *bs; 71f51d23c8SStefan Hajnoczi BlockBackend *blk = NULL; 72331170e0SKevin Wolf AioContext *ctx; 7330dbc81dSKevin Wolf uint64_t perm; 74a6ff7989SKevin Wolf int ret; 7556ee8626SKevin Wolf 76d53be9ceSKevin Wolf if (!id_wellformed(export->id)) { 77d53be9ceSKevin Wolf error_setg(errp, "Invalid block export id"); 78d53be9ceSKevin Wolf return NULL; 79d53be9ceSKevin Wolf } 80d53be9ceSKevin Wolf if (blk_exp_find(export->id)) { 81d53be9ceSKevin Wolf error_setg(errp, "Block export id '%s' is already in use", export->id); 82d53be9ceSKevin Wolf return NULL; 83d53be9ceSKevin Wolf } 84d53be9ceSKevin Wolf 8556ee8626SKevin Wolf drv = blk_exp_find_driver(export->type); 8656ee8626SKevin Wolf if (!drv) { 8756ee8626SKevin Wolf error_setg(errp, "No driver found for the requested export type"); 889b562c64SKevin Wolf return NULL; 8956ee8626SKevin Wolf } 9056ee8626SKevin Wolf 91331170e0SKevin Wolf bs = bdrv_lookup_bs(NULL, export->node_name, errp); 92331170e0SKevin Wolf if (!bs) { 93331170e0SKevin Wolf return NULL; 94331170e0SKevin Wolf } 95331170e0SKevin Wolf 9630dbc81dSKevin Wolf if (!export->has_writable) { 9730dbc81dSKevin Wolf export->writable = false; 9830dbc81dSKevin Wolf } 9930dbc81dSKevin Wolf if (bdrv_is_read_only(bs) && export->writable) { 10030dbc81dSKevin Wolf error_setg(errp, "Cannot export read-only node as writable"); 10130dbc81dSKevin Wolf return NULL; 10230dbc81dSKevin Wolf } 10330dbc81dSKevin Wolf 104331170e0SKevin Wolf ctx = bdrv_get_aio_context(bs); 105331170e0SKevin Wolf aio_context_acquire(ctx); 106331170e0SKevin Wolf 107f51d23c8SStefan Hajnoczi if (export->has_iothread) { 108f51d23c8SStefan Hajnoczi IOThread *iothread; 109f51d23c8SStefan Hajnoczi AioContext *new_ctx; 110f51d23c8SStefan Hajnoczi 111f51d23c8SStefan Hajnoczi iothread = iothread_by_id(export->iothread); 112f51d23c8SStefan Hajnoczi if (!iothread) { 113f51d23c8SStefan Hajnoczi error_setg(errp, "iothread \"%s\" not found", export->iothread); 114f51d23c8SStefan Hajnoczi goto fail; 115f51d23c8SStefan Hajnoczi } 116f51d23c8SStefan Hajnoczi 117f51d23c8SStefan Hajnoczi new_ctx = iothread_get_aio_context(iothread); 118f51d23c8SStefan Hajnoczi 119f51d23c8SStefan Hajnoczi ret = bdrv_try_set_aio_context(bs, new_ctx, errp); 120f51d23c8SStefan Hajnoczi if (ret == 0) { 121f51d23c8SStefan Hajnoczi aio_context_release(ctx); 122f51d23c8SStefan Hajnoczi aio_context_acquire(new_ctx); 123f51d23c8SStefan Hajnoczi ctx = new_ctx; 124f51d23c8SStefan Hajnoczi } else if (fixed_iothread) { 125f51d23c8SStefan Hajnoczi goto fail; 126f51d23c8SStefan Hajnoczi } 127f51d23c8SStefan Hajnoczi } 128f51d23c8SStefan Hajnoczi 129331170e0SKevin Wolf /* 130331170e0SKevin Wolf * Block exports are used for non-shared storage migration. Make sure 131331170e0SKevin Wolf * that BDRV_O_INACTIVE is cleared and the image is ready for write 132331170e0SKevin Wolf * access since the export could be available before migration handover. 133331170e0SKevin Wolf * ctx was acquired in the caller. 134331170e0SKevin Wolf */ 135331170e0SKevin Wolf bdrv_invalidate_cache(bs, NULL); 136331170e0SKevin Wolf 13730dbc81dSKevin Wolf perm = BLK_PERM_CONSISTENT_READ; 13830dbc81dSKevin Wolf if (export->writable) { 13930dbc81dSKevin Wolf perm |= BLK_PERM_WRITE; 14030dbc81dSKevin Wolf } 14130dbc81dSKevin Wolf 14230dbc81dSKevin Wolf blk = blk_new(ctx, perm, BLK_PERM_ALL); 143f51d23c8SStefan Hajnoczi 144f51d23c8SStefan Hajnoczi if (!fixed_iothread) { 145f51d23c8SStefan Hajnoczi blk_set_allow_aio_context_change(blk, true); 146f51d23c8SStefan Hajnoczi } 147f51d23c8SStefan Hajnoczi 148331170e0SKevin Wolf ret = blk_insert_bs(blk, bs, errp); 149331170e0SKevin Wolf if (ret < 0) { 150331170e0SKevin Wolf goto fail; 151331170e0SKevin Wolf } 152331170e0SKevin Wolf 153331170e0SKevin Wolf if (!export->has_writethrough) { 154331170e0SKevin Wolf export->writethrough = false; 155331170e0SKevin Wolf } 156331170e0SKevin Wolf blk_set_enable_write_cache(blk, !export->writethrough); 157331170e0SKevin Wolf 158a6ff7989SKevin Wolf assert(drv->instance_size >= sizeof(BlockExport)); 159a6ff7989SKevin Wolf exp = g_malloc0(drv->instance_size); 160a6ff7989SKevin Wolf *exp = (BlockExport) { 161a6ff7989SKevin Wolf .drv = drv, 162a6ff7989SKevin Wolf .refcount = 1, 1633859ad36SKevin Wolf .user_owned = true, 164d53be9ceSKevin Wolf .id = g_strdup(export->id), 165331170e0SKevin Wolf .ctx = ctx, 166331170e0SKevin Wolf .blk = blk, 167a6ff7989SKevin Wolf }; 168a6ff7989SKevin Wolf 169a6ff7989SKevin Wolf ret = drv->create(exp, export, errp); 170a6ff7989SKevin Wolf if (ret < 0) { 171331170e0SKevin Wolf goto fail; 172a6ff7989SKevin Wolf } 173a6ff7989SKevin Wolf 17437a4f70cSKevin Wolf assert(exp->blk != NULL); 17537a4f70cSKevin Wolf 176bc4ee65bSKevin Wolf QLIST_INSERT_HEAD(&block_exports, exp, next); 177331170e0SKevin Wolf 178331170e0SKevin Wolf aio_context_release(ctx); 179a6ff7989SKevin Wolf return exp; 180331170e0SKevin Wolf 181331170e0SKevin Wolf fail: 182331170e0SKevin Wolf blk_unref(blk); 183331170e0SKevin Wolf aio_context_release(ctx); 184331170e0SKevin Wolf if (exp) { 185331170e0SKevin Wolf g_free(exp->id); 186331170e0SKevin Wolf g_free(exp); 187331170e0SKevin Wolf } 188331170e0SKevin Wolf return NULL; 1899b562c64SKevin Wolf } 1909b562c64SKevin Wolf 1918612c686SKevin Wolf /* Callers must hold exp->ctx lock */ 192c69de1beSKevin Wolf void blk_exp_ref(BlockExport *exp) 193c69de1beSKevin Wolf { 194c69de1beSKevin Wolf assert(exp->refcount > 0); 195c69de1beSKevin Wolf exp->refcount++; 196c69de1beSKevin Wolf } 197c69de1beSKevin Wolf 198bc4ee65bSKevin Wolf /* Runs in the main thread */ 199bc4ee65bSKevin Wolf static void blk_exp_delete_bh(void *opaque) 200bc4ee65bSKevin Wolf { 201bc4ee65bSKevin Wolf BlockExport *exp = opaque; 202bc4ee65bSKevin Wolf AioContext *aio_context = exp->ctx; 203bc4ee65bSKevin Wolf 204bc4ee65bSKevin Wolf aio_context_acquire(aio_context); 205bc4ee65bSKevin Wolf 206bc4ee65bSKevin Wolf assert(exp->refcount == 0); 207bc4ee65bSKevin Wolf QLIST_REMOVE(exp, next); 208bc4ee65bSKevin Wolf exp->drv->delete(exp); 20937a4f70cSKevin Wolf blk_unref(exp->blk); 2101a9f7a80SKevin Wolf qapi_event_send_block_export_deleted(exp->id); 211d53be9ceSKevin Wolf g_free(exp->id); 212bc4ee65bSKevin Wolf g_free(exp); 213bc4ee65bSKevin Wolf 214bc4ee65bSKevin Wolf aio_context_release(aio_context); 215bc4ee65bSKevin Wolf } 216bc4ee65bSKevin Wolf 2178612c686SKevin Wolf /* Callers must hold exp->ctx lock */ 218c69de1beSKevin Wolf void blk_exp_unref(BlockExport *exp) 219c69de1beSKevin Wolf { 220c69de1beSKevin Wolf assert(exp->refcount > 0); 221c69de1beSKevin Wolf if (--exp->refcount == 0) { 222bc4ee65bSKevin Wolf /* Touch the block_exports list only in the main thread */ 223bc4ee65bSKevin Wolf aio_bh_schedule_oneshot(qemu_get_aio_context(), blk_exp_delete_bh, 224bc4ee65bSKevin Wolf exp); 225c69de1beSKevin Wolf } 226c69de1beSKevin Wolf } 227c69de1beSKevin Wolf 228bc4ee65bSKevin Wolf /* 229bc4ee65bSKevin Wolf * Drops the user reference to the export and requests that all client 230bc4ee65bSKevin Wolf * connections and other internally held references start to shut down. When 231bc4ee65bSKevin Wolf * the function returns, there may still be active references while the export 232bc4ee65bSKevin Wolf * is in the process of shutting down. 233bc4ee65bSKevin Wolf * 234bc4ee65bSKevin Wolf * Acquires exp->ctx internally. Callers must *not* hold the lock. 235bc4ee65bSKevin Wolf */ 236bc4ee65bSKevin Wolf void blk_exp_request_shutdown(BlockExport *exp) 237bc4ee65bSKevin Wolf { 238bc4ee65bSKevin Wolf AioContext *aio_context = exp->ctx; 239bc4ee65bSKevin Wolf 240bc4ee65bSKevin Wolf aio_context_acquire(aio_context); 2413c3bc462SKevin Wolf 2423c3bc462SKevin Wolf /* 2433c3bc462SKevin Wolf * If the user doesn't own the export any more, it is already shutting 2443c3bc462SKevin Wolf * down. We must not call .request_shutdown and decrease the refcount a 2453c3bc462SKevin Wolf * second time. 2463c3bc462SKevin Wolf */ 2473c3bc462SKevin Wolf if (!exp->user_owned) { 2483c3bc462SKevin Wolf goto out; 2493c3bc462SKevin Wolf } 2503c3bc462SKevin Wolf 251bc4ee65bSKevin Wolf exp->drv->request_shutdown(exp); 2523859ad36SKevin Wolf 2533859ad36SKevin Wolf assert(exp->user_owned); 2543859ad36SKevin Wolf exp->user_owned = false; 2553859ad36SKevin Wolf blk_exp_unref(exp); 2563859ad36SKevin Wolf 2573c3bc462SKevin Wolf out: 258bc4ee65bSKevin Wolf aio_context_release(aio_context); 259bc4ee65bSKevin Wolf } 260bc4ee65bSKevin Wolf 261bc4ee65bSKevin Wolf /* 262bc4ee65bSKevin Wolf * Returns whether a block export of the given type exists. 263bc4ee65bSKevin Wolf * type == BLOCK_EXPORT_TYPE__MAX checks for an export of any type. 264bc4ee65bSKevin Wolf */ 265bc4ee65bSKevin Wolf static bool blk_exp_has_type(BlockExportType type) 266bc4ee65bSKevin Wolf { 267bc4ee65bSKevin Wolf BlockExport *exp; 268bc4ee65bSKevin Wolf 269bc4ee65bSKevin Wolf if (type == BLOCK_EXPORT_TYPE__MAX) { 270bc4ee65bSKevin Wolf return !QLIST_EMPTY(&block_exports); 271bc4ee65bSKevin Wolf } 272bc4ee65bSKevin Wolf 273bc4ee65bSKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 274bc4ee65bSKevin Wolf if (exp->drv->type == type) { 275bc4ee65bSKevin Wolf return true; 276bc4ee65bSKevin Wolf } 277bc4ee65bSKevin Wolf } 278bc4ee65bSKevin Wolf 279bc4ee65bSKevin Wolf return false; 280bc4ee65bSKevin Wolf } 281bc4ee65bSKevin Wolf 282bc4ee65bSKevin Wolf /* type == BLOCK_EXPORT_TYPE__MAX for all types */ 283bc4ee65bSKevin Wolf void blk_exp_close_all_type(BlockExportType type) 284bc4ee65bSKevin Wolf { 285bc4ee65bSKevin Wolf BlockExport *exp, *next; 286bc4ee65bSKevin Wolf 287bc4ee65bSKevin Wolf assert(in_aio_context_home_thread(qemu_get_aio_context())); 288bc4ee65bSKevin Wolf 289bc4ee65bSKevin Wolf QLIST_FOREACH_SAFE(exp, &block_exports, next, next) { 290bc4ee65bSKevin Wolf if (type != BLOCK_EXPORT_TYPE__MAX && exp->drv->type != type) { 291bc4ee65bSKevin Wolf continue; 292bc4ee65bSKevin Wolf } 293bc4ee65bSKevin Wolf blk_exp_request_shutdown(exp); 294bc4ee65bSKevin Wolf } 295bc4ee65bSKevin Wolf 296bc4ee65bSKevin Wolf AIO_WAIT_WHILE(NULL, blk_exp_has_type(type)); 297bc4ee65bSKevin Wolf } 298bc4ee65bSKevin Wolf 299bc4ee65bSKevin Wolf void blk_exp_close_all(void) 300bc4ee65bSKevin Wolf { 301bc4ee65bSKevin Wolf blk_exp_close_all_type(BLOCK_EXPORT_TYPE__MAX); 302bc4ee65bSKevin Wolf } 303bc4ee65bSKevin Wolf 3049b562c64SKevin Wolf void qmp_block_export_add(BlockExportOptions *export, Error **errp) 3059b562c64SKevin Wolf { 3069b562c64SKevin Wolf blk_exp_add(export, errp); 30756ee8626SKevin Wolf } 3083c3bc462SKevin Wolf 3093c3bc462SKevin Wolf void qmp_block_export_del(const char *id, 3103c3bc462SKevin Wolf bool has_mode, BlockExportRemoveMode mode, 3113c3bc462SKevin Wolf Error **errp) 3123c3bc462SKevin Wolf { 3133c3bc462SKevin Wolf ERRP_GUARD(); 3143c3bc462SKevin Wolf BlockExport *exp; 3153c3bc462SKevin Wolf 3163c3bc462SKevin Wolf exp = blk_exp_find(id); 3173c3bc462SKevin Wolf if (exp == NULL) { 3183c3bc462SKevin Wolf error_setg(errp, "Export '%s' is not found", id); 3193c3bc462SKevin Wolf return; 3203c3bc462SKevin Wolf } 3213c3bc462SKevin Wolf if (!exp->user_owned) { 3223c3bc462SKevin Wolf error_setg(errp, "Export '%s' is already shutting down", id); 3233c3bc462SKevin Wolf return; 3243c3bc462SKevin Wolf } 3253c3bc462SKevin Wolf 3263c3bc462SKevin Wolf if (!has_mode) { 3273c3bc462SKevin Wolf mode = BLOCK_EXPORT_REMOVE_MODE_SAFE; 3283c3bc462SKevin Wolf } 3293c3bc462SKevin Wolf if (mode == BLOCK_EXPORT_REMOVE_MODE_SAFE && exp->refcount > 1) { 3303c3bc462SKevin Wolf error_setg(errp, "export '%s' still in use", exp->id); 3313c3bc462SKevin Wolf error_append_hint(errp, "Use mode='hard' to force client " 3323c3bc462SKevin Wolf "disconnect\n"); 3333c3bc462SKevin Wolf return; 3343c3bc462SKevin Wolf } 3353c3bc462SKevin Wolf 3363c3bc462SKevin Wolf blk_exp_request_shutdown(exp); 3373c3bc462SKevin Wolf } 3388cade320SKevin Wolf 3398cade320SKevin Wolf BlockExportInfoList *qmp_query_block_exports(Error **errp) 3408cade320SKevin Wolf { 3418cade320SKevin Wolf BlockExportInfoList *head = NULL, **p_next = &head; 3428cade320SKevin Wolf BlockExport *exp; 3438cade320SKevin Wolf 3448cade320SKevin Wolf QLIST_FOREACH(exp, &block_exports, next) { 3458cade320SKevin Wolf BlockExportInfoList *entry = g_new0(BlockExportInfoList, 1); 3468cade320SKevin Wolf BlockExportInfo *info = g_new(BlockExportInfo, 1); 3478cade320SKevin Wolf *info = (BlockExportInfo) { 3488cade320SKevin Wolf .id = g_strdup(exp->id), 3498cade320SKevin Wolf .type = exp->drv->type, 3508cade320SKevin Wolf .node_name = g_strdup(bdrv_get_node_name(blk_bs(exp->blk))), 3518cade320SKevin Wolf .shutting_down = !exp->user_owned, 3528cade320SKevin Wolf }; 3538cade320SKevin Wolf 3548cade320SKevin Wolf entry->value = info; 3558cade320SKevin Wolf *p_next = entry; 3568cade320SKevin Wolf p_next = &entry->next; 3578cade320SKevin Wolf } 3588cade320SKevin Wolf 3598cade320SKevin Wolf return head; 3608cade320SKevin Wolf } 361