/*
 * Common block export infrastructure
 *
 * Copyright (c) 2012, 2020 Red Hat, Inc.
 *
 * Authors:
 * Paolo Bonzini <pbonzini@redhat.com>
 * Kevin Wolf <kwolf@redhat.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2 or
 * later. See the COPYING file in the top-level directory.
 */
1356ee8626SKevin Wolf
1456ee8626SKevin Wolf #include "qemu/osdep.h"
1556ee8626SKevin Wolf
169b562c64SKevin Wolf #include "block/block.h"
179b562c64SKevin Wolf #include "sysemu/block-backend.h"
18f51d23c8SStefan Hajnoczi #include "sysemu/iothread.h"
1956ee8626SKevin Wolf #include "block/export.h"
200c9b70d5SMax Reitz #include "block/fuse.h"
2156ee8626SKevin Wolf #include "block/nbd.h"
2256ee8626SKevin Wolf #include "qapi/error.h"
2356ee8626SKevin Wolf #include "qapi/qapi-commands-block-export.h"
241a9f7a80SKevin Wolf #include "qapi/qapi-events-block-export.h"
25d53be9ceSKevin Wolf #include "qemu/id.h"
26bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER
273a213f83SStefan Hajnoczi #include "vhost-user-blk-server.h"
283a213f83SStefan Hajnoczi #endif
292a2359b8SXie Yongji #ifdef CONFIG_VDUSE_BLK_EXPORT
302a2359b8SXie Yongji #include "vduse-blk.h"
312a2359b8SXie Yongji #endif
3256ee8626SKevin Wolf
3356ee8626SKevin Wolf static const BlockExportDriver *blk_exp_drivers[] = {
3456ee8626SKevin Wolf &blk_exp_nbd,
35bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER
3690fc91d5SStefan Hajnoczi &blk_exp_vhost_user_blk,
3790fc91d5SStefan Hajnoczi #endif
380c9b70d5SMax Reitz #ifdef CONFIG_FUSE
390c9b70d5SMax Reitz &blk_exp_fuse,
400c9b70d5SMax Reitz #endif
412a2359b8SXie Yongji #ifdef CONFIG_VDUSE_BLK_EXPORT
422a2359b8SXie Yongji &blk_exp_vduse_blk,
432a2359b8SXie Yongji #endif
4456ee8626SKevin Wolf };
4556ee8626SKevin Wolf
46bc4ee65bSKevin Wolf /* Only accessed from the main thread */
47bc4ee65bSKevin Wolf static QLIST_HEAD(, BlockExport) block_exports =
48bc4ee65bSKevin Wolf QLIST_HEAD_INITIALIZER(block_exports);
49bc4ee65bSKevin Wolf
blk_exp_find(const char * id)503c3bc462SKevin Wolf BlockExport *blk_exp_find(const char *id)
51d53be9ceSKevin Wolf {
52d53be9ceSKevin Wolf BlockExport *exp;
53d53be9ceSKevin Wolf
54d53be9ceSKevin Wolf QLIST_FOREACH(exp, &block_exports, next) {
55d53be9ceSKevin Wolf if (strcmp(id, exp->id) == 0) {
56d53be9ceSKevin Wolf return exp;
57d53be9ceSKevin Wolf }
58d53be9ceSKevin Wolf }
59d53be9ceSKevin Wolf
60d53be9ceSKevin Wolf return NULL;
61d53be9ceSKevin Wolf }
62d53be9ceSKevin Wolf
blk_exp_find_driver(BlockExportType type)6356ee8626SKevin Wolf static const BlockExportDriver *blk_exp_find_driver(BlockExportType type)
6456ee8626SKevin Wolf {
6556ee8626SKevin Wolf int i;
6656ee8626SKevin Wolf
6756ee8626SKevin Wolf for (i = 0; i < ARRAY_SIZE(blk_exp_drivers); i++) {
6856ee8626SKevin Wolf if (blk_exp_drivers[i]->type == type) {
6956ee8626SKevin Wolf return blk_exp_drivers[i];
7056ee8626SKevin Wolf }
7156ee8626SKevin Wolf }
7256ee8626SKevin Wolf return NULL;
7356ee8626SKevin Wolf }
7456ee8626SKevin Wolf
blk_exp_add(BlockExportOptions * export,Error ** errp)759b562c64SKevin Wolf BlockExport *blk_exp_add(BlockExportOptions *export, Error **errp)
7656ee8626SKevin Wolf {
77f51d23c8SStefan Hajnoczi bool fixed_iothread = export->has_fixed_iothread && export->fixed_iothread;
7856ee8626SKevin Wolf const BlockExportDriver *drv;
79331170e0SKevin Wolf BlockExport *exp = NULL;
80331170e0SKevin Wolf BlockDriverState *bs;
81f51d23c8SStefan Hajnoczi BlockBackend *blk = NULL;
82331170e0SKevin Wolf AioContext *ctx;
8330dbc81dSKevin Wolf uint64_t perm;
84a6ff7989SKevin Wolf int ret;
8556ee8626SKevin Wolf
862b3912f1SKevin Wolf GLOBAL_STATE_CODE();
872b3912f1SKevin Wolf
88d53be9ceSKevin Wolf if (!id_wellformed(export->id)) {
89d53be9ceSKevin Wolf error_setg(errp, "Invalid block export id");
90d53be9ceSKevin Wolf return NULL;
91d53be9ceSKevin Wolf }
92d53be9ceSKevin Wolf if (blk_exp_find(export->id)) {
93d53be9ceSKevin Wolf error_setg(errp, "Block export id '%s' is already in use", export->id);
94d53be9ceSKevin Wolf return NULL;
95d53be9ceSKevin Wolf }
96d53be9ceSKevin Wolf
9756ee8626SKevin Wolf drv = blk_exp_find_driver(export->type);
9856ee8626SKevin Wolf if (!drv) {
9956ee8626SKevin Wolf error_setg(errp, "No driver found for the requested export type");
1009b562c64SKevin Wolf return NULL;
10156ee8626SKevin Wolf }
10256ee8626SKevin Wolf
103331170e0SKevin Wolf bs = bdrv_lookup_bs(NULL, export->node_name, errp);
104331170e0SKevin Wolf if (!bs) {
105331170e0SKevin Wolf return NULL;
106331170e0SKevin Wolf }
107331170e0SKevin Wolf
10830dbc81dSKevin Wolf if (!export->has_writable) {
10930dbc81dSKevin Wolf export->writable = false;
11030dbc81dSKevin Wolf }
11130dbc81dSKevin Wolf if (bdrv_is_read_only(bs) && export->writable) {
11230dbc81dSKevin Wolf error_setg(errp, "Cannot export read-only node as writable");
11330dbc81dSKevin Wolf return NULL;
11430dbc81dSKevin Wolf }
11530dbc81dSKevin Wolf
116331170e0SKevin Wolf ctx = bdrv_get_aio_context(bs);
117331170e0SKevin Wolf
11854fde4ffSMarkus Armbruster if (export->iothread) {
119f51d23c8SStefan Hajnoczi IOThread *iothread;
120f51d23c8SStefan Hajnoczi AioContext *new_ctx;
1218573823fSMax Reitz Error **set_context_errp;
122f51d23c8SStefan Hajnoczi
123f51d23c8SStefan Hajnoczi iothread = iothread_by_id(export->iothread);
124f51d23c8SStefan Hajnoczi if (!iothread) {
125f51d23c8SStefan Hajnoczi error_setg(errp, "iothread \"%s\" not found", export->iothread);
126f51d23c8SStefan Hajnoczi goto fail;
127f51d23c8SStefan Hajnoczi }
128f51d23c8SStefan Hajnoczi
129f51d23c8SStefan Hajnoczi new_ctx = iothread_get_aio_context(iothread);
130f51d23c8SStefan Hajnoczi
1318573823fSMax Reitz /* Ignore errors with fixed-iothread=false */
1328573823fSMax Reitz set_context_errp = fixed_iothread ? errp : NULL;
133142e6907SEmanuele Giuseppe Esposito ret = bdrv_try_change_aio_context(bs, new_ctx, NULL, set_context_errp);
134f51d23c8SStefan Hajnoczi if (ret == 0) {
135f51d23c8SStefan Hajnoczi ctx = new_ctx;
136f51d23c8SStefan Hajnoczi } else if (fixed_iothread) {
137f51d23c8SStefan Hajnoczi goto fail;
138f51d23c8SStefan Hajnoczi }
139f51d23c8SStefan Hajnoczi }
140f51d23c8SStefan Hajnoczi
141331170e0SKevin Wolf /*
142331170e0SKevin Wolf * Block exports are used for non-shared storage migration. Make sure
143331170e0SKevin Wolf * that BDRV_O_INACTIVE is cleared and the image is ready for write
144331170e0SKevin Wolf * access since the export could be available before migration handover.
145331170e0SKevin Wolf * ctx was acquired in the caller.
146331170e0SKevin Wolf */
1472b3912f1SKevin Wolf bdrv_graph_rdlock_main_loop();
148a94750d9SEmanuele Giuseppe Esposito bdrv_activate(bs, NULL);
1492b3912f1SKevin Wolf bdrv_graph_rdunlock_main_loop();
150331170e0SKevin Wolf
15130dbc81dSKevin Wolf perm = BLK_PERM_CONSISTENT_READ;
15230dbc81dSKevin Wolf if (export->writable) {
15330dbc81dSKevin Wolf perm |= BLK_PERM_WRITE;
15430dbc81dSKevin Wolf }
15530dbc81dSKevin Wolf
15630dbc81dSKevin Wolf blk = blk_new(ctx, perm, BLK_PERM_ALL);
157f51d23c8SStefan Hajnoczi
158f51d23c8SStefan Hajnoczi if (!fixed_iothread) {
159f51d23c8SStefan Hajnoczi blk_set_allow_aio_context_change(blk, true);
160f51d23c8SStefan Hajnoczi }
161f51d23c8SStefan Hajnoczi
162331170e0SKevin Wolf ret = blk_insert_bs(blk, bs, errp);
163331170e0SKevin Wolf if (ret < 0) {
164331170e0SKevin Wolf goto fail;
165331170e0SKevin Wolf }
166331170e0SKevin Wolf
167331170e0SKevin Wolf if (!export->has_writethrough) {
168331170e0SKevin Wolf export->writethrough = false;
169331170e0SKevin Wolf }
170331170e0SKevin Wolf blk_set_enable_write_cache(blk, !export->writethrough);
171331170e0SKevin Wolf
172a6ff7989SKevin Wolf assert(drv->instance_size >= sizeof(BlockExport));
173a6ff7989SKevin Wolf exp = g_malloc0(drv->instance_size);
174a6ff7989SKevin Wolf *exp = (BlockExport) {
175a6ff7989SKevin Wolf .drv = drv,
176a6ff7989SKevin Wolf .refcount = 1,
1773859ad36SKevin Wolf .user_owned = true,
178d53be9ceSKevin Wolf .id = g_strdup(export->id),
179331170e0SKevin Wolf .ctx = ctx,
180331170e0SKevin Wolf .blk = blk,
181a6ff7989SKevin Wolf };
182a6ff7989SKevin Wolf
183a6ff7989SKevin Wolf ret = drv->create(exp, export, errp);
184a6ff7989SKevin Wolf if (ret < 0) {
185331170e0SKevin Wolf goto fail;
186a6ff7989SKevin Wolf }
187a6ff7989SKevin Wolf
18837a4f70cSKevin Wolf assert(exp->blk != NULL);
18937a4f70cSKevin Wolf
190bc4ee65bSKevin Wolf QLIST_INSERT_HEAD(&block_exports, exp, next);
191a6ff7989SKevin Wolf return exp;
192331170e0SKevin Wolf
193331170e0SKevin Wolf fail:
194a1845637SKevin Wolf if (blk) {
195a1845637SKevin Wolf blk_set_dev_ops(blk, NULL, NULL);
196331170e0SKevin Wolf blk_unref(blk);
197a1845637SKevin Wolf }
198331170e0SKevin Wolf if (exp) {
199331170e0SKevin Wolf g_free(exp->id);
200331170e0SKevin Wolf g_free(exp);
201331170e0SKevin Wolf }
202331170e0SKevin Wolf return NULL;
2039b562c64SKevin Wolf }
2049b562c64SKevin Wolf
/*
 * Takes an additional reference to @exp.
 *
 * The caller must already hold a reference: the refcount is asserted to be
 * positive before it is atomically incremented.
 */
void blk_exp_ref(BlockExport *exp)
{
    assert(0 < qatomic_read(&exp->refcount));

    qatomic_inc(&exp->refcount);
}
210c69de1beSKevin Wolf
211bc4ee65bSKevin Wolf /* Runs in the main thread */
blk_exp_delete_bh(void * opaque)212bc4ee65bSKevin Wolf static void blk_exp_delete_bh(void *opaque)
213bc4ee65bSKevin Wolf {
214bc4ee65bSKevin Wolf BlockExport *exp = opaque;
215bc4ee65bSKevin Wolf
216bc4ee65bSKevin Wolf assert(exp->refcount == 0);
217bc4ee65bSKevin Wolf QLIST_REMOVE(exp, next);
218bc4ee65bSKevin Wolf exp->drv->delete(exp);
219de79b526SStefan Hajnoczi blk_set_dev_ops(exp->blk, NULL, NULL);
22037a4f70cSKevin Wolf blk_unref(exp->blk);
2211a9f7a80SKevin Wolf qapi_event_send_block_export_deleted(exp->id);
222d53be9ceSKevin Wolf g_free(exp->id);
223bc4ee65bSKevin Wolf g_free(exp);
224bc4ee65bSKevin Wolf }
225bc4ee65bSKevin Wolf
/*
 * Drops one reference to @exp.
 *
 * When the last reference is dropped, the export is not freed here;
 * instead blk_exp_delete_bh() is scheduled as a one-shot bottom half on the
 * main AioContext.
 */
void blk_exp_unref(BlockExport *exp)
{
    assert(qatomic_read(&exp->refcount) > 0);

    if (qatomic_fetch_dec(&exp->refcount) != 1) {
        /* Other references remain */
        return;
    }

    /* Touch the block_exports list only in the main thread */
    aio_bh_schedule_oneshot(qemu_get_aio_context(), blk_exp_delete_bh, exp);
}
235c69de1beSKevin Wolf
236bc4ee65bSKevin Wolf /*
237bc4ee65bSKevin Wolf * Drops the user reference to the export and requests that all client
238bc4ee65bSKevin Wolf * connections and other internally held references start to shut down. When
239bc4ee65bSKevin Wolf * the function returns, there may still be active references while the export
240bc4ee65bSKevin Wolf * is in the process of shutting down.
241bc4ee65bSKevin Wolf */
blk_exp_request_shutdown(BlockExport * exp)242bc4ee65bSKevin Wolf void blk_exp_request_shutdown(BlockExport *exp)
243bc4ee65bSKevin Wolf {
2443c3bc462SKevin Wolf /*
2453c3bc462SKevin Wolf * If the user doesn't own the export any more, it is already shutting
2463c3bc462SKevin Wolf * down. We must not call .request_shutdown and decrease the refcount a
2473c3bc462SKevin Wolf * second time.
2483c3bc462SKevin Wolf */
2493c3bc462SKevin Wolf if (!exp->user_owned) {
250*b49f4755SStefan Hajnoczi return;
2513c3bc462SKevin Wolf }
2523c3bc462SKevin Wolf
253bc4ee65bSKevin Wolf exp->drv->request_shutdown(exp);
2543859ad36SKevin Wolf
2553859ad36SKevin Wolf assert(exp->user_owned);
2563859ad36SKevin Wolf exp->user_owned = false;
2573859ad36SKevin Wolf blk_exp_unref(exp);
258bc4ee65bSKevin Wolf }
259bc4ee65bSKevin Wolf
260bc4ee65bSKevin Wolf /*
261bc4ee65bSKevin Wolf * Returns whether a block export of the given type exists.
262bc4ee65bSKevin Wolf * type == BLOCK_EXPORT_TYPE__MAX checks for an export of any type.
263bc4ee65bSKevin Wolf */
blk_exp_has_type(BlockExportType type)264bc4ee65bSKevin Wolf static bool blk_exp_has_type(BlockExportType type)
265bc4ee65bSKevin Wolf {
266bc4ee65bSKevin Wolf BlockExport *exp;
267bc4ee65bSKevin Wolf
268bc4ee65bSKevin Wolf if (type == BLOCK_EXPORT_TYPE__MAX) {
269bc4ee65bSKevin Wolf return !QLIST_EMPTY(&block_exports);
270bc4ee65bSKevin Wolf }
271bc4ee65bSKevin Wolf
272bc4ee65bSKevin Wolf QLIST_FOREACH(exp, &block_exports, next) {
273bc4ee65bSKevin Wolf if (exp->drv->type == type) {
274bc4ee65bSKevin Wolf return true;
275bc4ee65bSKevin Wolf }
276bc4ee65bSKevin Wolf }
277bc4ee65bSKevin Wolf
278bc4ee65bSKevin Wolf return false;
279bc4ee65bSKevin Wolf }
280bc4ee65bSKevin Wolf
281bc4ee65bSKevin Wolf /* type == BLOCK_EXPORT_TYPE__MAX for all types */
blk_exp_close_all_type(BlockExportType type)282bc4ee65bSKevin Wolf void blk_exp_close_all_type(BlockExportType type)
283bc4ee65bSKevin Wolf {
284bc4ee65bSKevin Wolf BlockExport *exp, *next;
285bc4ee65bSKevin Wolf
286bc4ee65bSKevin Wolf assert(in_aio_context_home_thread(qemu_get_aio_context()));
287bc4ee65bSKevin Wolf
288bc4ee65bSKevin Wolf QLIST_FOREACH_SAFE(exp, &block_exports, next, next) {
289bc4ee65bSKevin Wolf if (type != BLOCK_EXPORT_TYPE__MAX && exp->drv->type != type) {
290bc4ee65bSKevin Wolf continue;
291bc4ee65bSKevin Wolf }
292bc4ee65bSKevin Wolf blk_exp_request_shutdown(exp);
293bc4ee65bSKevin Wolf }
294bc4ee65bSKevin Wolf
295e5568a66SStefan Hajnoczi AIO_WAIT_WHILE_UNLOCKED(NULL, blk_exp_has_type(type));
296bc4ee65bSKevin Wolf }
297bc4ee65bSKevin Wolf
blk_exp_close_all(void)298bc4ee65bSKevin Wolf void blk_exp_close_all(void)
299bc4ee65bSKevin Wolf {
300bc4ee65bSKevin Wolf blk_exp_close_all_type(BLOCK_EXPORT_TYPE__MAX);
301bc4ee65bSKevin Wolf }
302bc4ee65bSKevin Wolf
qmp_block_export_add(BlockExportOptions * export,Error ** errp)3039b562c64SKevin Wolf void qmp_block_export_add(BlockExportOptions *export, Error **errp)
3049b562c64SKevin Wolf {
3059b562c64SKevin Wolf blk_exp_add(export, errp);
30656ee8626SKevin Wolf }
3073c3bc462SKevin Wolf
qmp_block_export_del(const char * id,bool has_mode,BlockExportRemoveMode mode,Error ** errp)3083c3bc462SKevin Wolf void qmp_block_export_del(const char *id,
3093c3bc462SKevin Wolf bool has_mode, BlockExportRemoveMode mode,
3103c3bc462SKevin Wolf Error **errp)
3113c3bc462SKevin Wolf {
3123c3bc462SKevin Wolf ERRP_GUARD();
3133c3bc462SKevin Wolf BlockExport *exp;
3143c3bc462SKevin Wolf
3153c3bc462SKevin Wolf exp = blk_exp_find(id);
3163c3bc462SKevin Wolf if (exp == NULL) {
3173c3bc462SKevin Wolf error_setg(errp, "Export '%s' is not found", id);
3183c3bc462SKevin Wolf return;
3193c3bc462SKevin Wolf }
3203c3bc462SKevin Wolf if (!exp->user_owned) {
3213c3bc462SKevin Wolf error_setg(errp, "Export '%s' is already shutting down", id);
3223c3bc462SKevin Wolf return;
3233c3bc462SKevin Wolf }
3243c3bc462SKevin Wolf
3253c3bc462SKevin Wolf if (!has_mode) {
3263c3bc462SKevin Wolf mode = BLOCK_EXPORT_REMOVE_MODE_SAFE;
3273c3bc462SKevin Wolf }
3283d499a43SStefan Hajnoczi if (mode == BLOCK_EXPORT_REMOVE_MODE_SAFE &&
3293d499a43SStefan Hajnoczi qatomic_read(&exp->refcount) > 1) {
3303c3bc462SKevin Wolf error_setg(errp, "export '%s' still in use", exp->id);
3313c3bc462SKevin Wolf error_append_hint(errp, "Use mode='hard' to force client "
3323c3bc462SKevin Wolf "disconnect\n");
3333c3bc462SKevin Wolf return;
3343c3bc462SKevin Wolf }
3353c3bc462SKevin Wolf
3363c3bc462SKevin Wolf blk_exp_request_shutdown(exp);
3373c3bc462SKevin Wolf }
3388cade320SKevin Wolf
qmp_query_block_exports(Error ** errp)3398cade320SKevin Wolf BlockExportInfoList *qmp_query_block_exports(Error **errp)
3408cade320SKevin Wolf {
341c3033fd3SEric Blake BlockExportInfoList *head = NULL, **tail = &head;
3428cade320SKevin Wolf BlockExport *exp;
3438cade320SKevin Wolf
3448cade320SKevin Wolf QLIST_FOREACH(exp, &block_exports, next) {
3458cade320SKevin Wolf BlockExportInfo *info = g_new(BlockExportInfo, 1);
3468cade320SKevin Wolf *info = (BlockExportInfo) {
3478cade320SKevin Wolf .id = g_strdup(exp->id),
3488cade320SKevin Wolf .type = exp->drv->type,
3498cade320SKevin Wolf .node_name = g_strdup(bdrv_get_node_name(blk_bs(exp->blk))),
3508cade320SKevin Wolf .shutting_down = !exp->user_owned,
3518cade320SKevin Wolf };
3528cade320SKevin Wolf
353c3033fd3SEric Blake QAPI_LIST_APPEND(tail, info);
3548cade320SKevin Wolf }
3558cade320SKevin Wolf
3568cade320SKevin Wolf return head;
3578cade320SKevin Wolf }
358