xref: /openbmc/qemu/block/export/export.c (revision 8573823f3ba2b63926f82d5732473e0cd73c1213)
156ee8626SKevin Wolf /*
256ee8626SKevin Wolf  * Common block export infrastructure
356ee8626SKevin Wolf  *
456ee8626SKevin Wolf  * Copyright (c) 2012, 2020 Red Hat, Inc.
556ee8626SKevin Wolf  *
656ee8626SKevin Wolf  * Authors:
756ee8626SKevin Wolf  * Paolo Bonzini <pbonzini@redhat.com>
856ee8626SKevin Wolf  * Kevin Wolf <kwolf@redhat.com>
956ee8626SKevin Wolf  *
1056ee8626SKevin Wolf  * This work is licensed under the terms of the GNU GPL, version 2 or
1156ee8626SKevin Wolf  * later.  See the COPYING file in the top-level directory.
1256ee8626SKevin Wolf  */
1356ee8626SKevin Wolf 
1456ee8626SKevin Wolf #include "qemu/osdep.h"
1556ee8626SKevin Wolf 
169b562c64SKevin Wolf #include "block/block.h"
179b562c64SKevin Wolf #include "sysemu/block-backend.h"
18f51d23c8SStefan Hajnoczi #include "sysemu/iothread.h"
1956ee8626SKevin Wolf #include "block/export.h"
200c9b70d5SMax Reitz #include "block/fuse.h"
2156ee8626SKevin Wolf #include "block/nbd.h"
2256ee8626SKevin Wolf #include "qapi/error.h"
2356ee8626SKevin Wolf #include "qapi/qapi-commands-block-export.h"
241a9f7a80SKevin Wolf #include "qapi/qapi-events-block-export.h"
25d53be9ceSKevin Wolf #include "qemu/id.h"
26bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER
273a213f83SStefan Hajnoczi #include "vhost-user-blk-server.h"
283a213f83SStefan Hajnoczi #endif
2956ee8626SKevin Wolf 
3056ee8626SKevin Wolf static const BlockExportDriver *blk_exp_drivers[] = {
3156ee8626SKevin Wolf     &blk_exp_nbd,
32bc15e44cSStefan Hajnoczi #ifdef CONFIG_VHOST_USER_BLK_SERVER
3390fc91d5SStefan Hajnoczi     &blk_exp_vhost_user_blk,
3490fc91d5SStefan Hajnoczi #endif
350c9b70d5SMax Reitz #ifdef CONFIG_FUSE
360c9b70d5SMax Reitz     &blk_exp_fuse,
370c9b70d5SMax Reitz #endif
3856ee8626SKevin Wolf };
3956ee8626SKevin Wolf 
40bc4ee65bSKevin Wolf /* Only accessed from the main thread */
41bc4ee65bSKevin Wolf static QLIST_HEAD(, BlockExport) block_exports =
42bc4ee65bSKevin Wolf     QLIST_HEAD_INITIALIZER(block_exports);
43bc4ee65bSKevin Wolf 
443c3bc462SKevin Wolf BlockExport *blk_exp_find(const char *id)
45d53be9ceSKevin Wolf {
46d53be9ceSKevin Wolf     BlockExport *exp;
47d53be9ceSKevin Wolf 
48d53be9ceSKevin Wolf     QLIST_FOREACH(exp, &block_exports, next) {
49d53be9ceSKevin Wolf         if (strcmp(id, exp->id) == 0) {
50d53be9ceSKevin Wolf             return exp;
51d53be9ceSKevin Wolf         }
52d53be9ceSKevin Wolf     }
53d53be9ceSKevin Wolf 
54d53be9ceSKevin Wolf     return NULL;
55d53be9ceSKevin Wolf }
56d53be9ceSKevin Wolf 
5756ee8626SKevin Wolf static const BlockExportDriver *blk_exp_find_driver(BlockExportType type)
5856ee8626SKevin Wolf {
5956ee8626SKevin Wolf     int i;
6056ee8626SKevin Wolf 
6156ee8626SKevin Wolf     for (i = 0; i < ARRAY_SIZE(blk_exp_drivers); i++) {
6256ee8626SKevin Wolf         if (blk_exp_drivers[i]->type == type) {
6356ee8626SKevin Wolf             return blk_exp_drivers[i];
6456ee8626SKevin Wolf         }
6556ee8626SKevin Wolf     }
6656ee8626SKevin Wolf     return NULL;
6756ee8626SKevin Wolf }
6856ee8626SKevin Wolf 
699b562c64SKevin Wolf BlockExport *blk_exp_add(BlockExportOptions *export, Error **errp)
7056ee8626SKevin Wolf {
71f51d23c8SStefan Hajnoczi     bool fixed_iothread = export->has_fixed_iothread && export->fixed_iothread;
7256ee8626SKevin Wolf     const BlockExportDriver *drv;
73331170e0SKevin Wolf     BlockExport *exp = NULL;
74331170e0SKevin Wolf     BlockDriverState *bs;
75f51d23c8SStefan Hajnoczi     BlockBackend *blk = NULL;
76331170e0SKevin Wolf     AioContext *ctx;
7730dbc81dSKevin Wolf     uint64_t perm;
78a6ff7989SKevin Wolf     int ret;
7956ee8626SKevin Wolf 
80d53be9ceSKevin Wolf     if (!id_wellformed(export->id)) {
81d53be9ceSKevin Wolf         error_setg(errp, "Invalid block export id");
82d53be9ceSKevin Wolf         return NULL;
83d53be9ceSKevin Wolf     }
84d53be9ceSKevin Wolf     if (blk_exp_find(export->id)) {
85d53be9ceSKevin Wolf         error_setg(errp, "Block export id '%s' is already in use", export->id);
86d53be9ceSKevin Wolf         return NULL;
87d53be9ceSKevin Wolf     }
88d53be9ceSKevin Wolf 
8956ee8626SKevin Wolf     drv = blk_exp_find_driver(export->type);
9056ee8626SKevin Wolf     if (!drv) {
9156ee8626SKevin Wolf         error_setg(errp, "No driver found for the requested export type");
929b562c64SKevin Wolf         return NULL;
9356ee8626SKevin Wolf     }
9456ee8626SKevin Wolf 
95331170e0SKevin Wolf     bs = bdrv_lookup_bs(NULL, export->node_name, errp);
96331170e0SKevin Wolf     if (!bs) {
97331170e0SKevin Wolf         return NULL;
98331170e0SKevin Wolf     }
99331170e0SKevin Wolf 
10030dbc81dSKevin Wolf     if (!export->has_writable) {
10130dbc81dSKevin Wolf         export->writable = false;
10230dbc81dSKevin Wolf     }
10330dbc81dSKevin Wolf     if (bdrv_is_read_only(bs) && export->writable) {
10430dbc81dSKevin Wolf         error_setg(errp, "Cannot export read-only node as writable");
10530dbc81dSKevin Wolf         return NULL;
10630dbc81dSKevin Wolf     }
10730dbc81dSKevin Wolf 
108331170e0SKevin Wolf     ctx = bdrv_get_aio_context(bs);
109331170e0SKevin Wolf     aio_context_acquire(ctx);
110331170e0SKevin Wolf 
111f51d23c8SStefan Hajnoczi     if (export->has_iothread) {
112f51d23c8SStefan Hajnoczi         IOThread *iothread;
113f51d23c8SStefan Hajnoczi         AioContext *new_ctx;
114*8573823fSMax Reitz         Error **set_context_errp;
115f51d23c8SStefan Hajnoczi 
116f51d23c8SStefan Hajnoczi         iothread = iothread_by_id(export->iothread);
117f51d23c8SStefan Hajnoczi         if (!iothread) {
118f51d23c8SStefan Hajnoczi             error_setg(errp, "iothread \"%s\" not found", export->iothread);
119f51d23c8SStefan Hajnoczi             goto fail;
120f51d23c8SStefan Hajnoczi         }
121f51d23c8SStefan Hajnoczi 
122f51d23c8SStefan Hajnoczi         new_ctx = iothread_get_aio_context(iothread);
123f51d23c8SStefan Hajnoczi 
124*8573823fSMax Reitz         /* Ignore errors with fixed-iothread=false */
125*8573823fSMax Reitz         set_context_errp = fixed_iothread ? errp : NULL;
126*8573823fSMax Reitz         ret = bdrv_try_set_aio_context(bs, new_ctx, set_context_errp);
127f51d23c8SStefan Hajnoczi         if (ret == 0) {
128f51d23c8SStefan Hajnoczi             aio_context_release(ctx);
129f51d23c8SStefan Hajnoczi             aio_context_acquire(new_ctx);
130f51d23c8SStefan Hajnoczi             ctx = new_ctx;
131f51d23c8SStefan Hajnoczi         } else if (fixed_iothread) {
132f51d23c8SStefan Hajnoczi             goto fail;
133f51d23c8SStefan Hajnoczi         }
134f51d23c8SStefan Hajnoczi     }
135f51d23c8SStefan Hajnoczi 
136331170e0SKevin Wolf     /*
137331170e0SKevin Wolf      * Block exports are used for non-shared storage migration. Make sure
138331170e0SKevin Wolf      * that BDRV_O_INACTIVE is cleared and the image is ready for write
139331170e0SKevin Wolf      * access since the export could be available before migration handover.
140331170e0SKevin Wolf      * ctx was acquired in the caller.
141331170e0SKevin Wolf      */
142331170e0SKevin Wolf     bdrv_invalidate_cache(bs, NULL);
143331170e0SKevin Wolf 
14430dbc81dSKevin Wolf     perm = BLK_PERM_CONSISTENT_READ;
14530dbc81dSKevin Wolf     if (export->writable) {
14630dbc81dSKevin Wolf         perm |= BLK_PERM_WRITE;
14730dbc81dSKevin Wolf     }
14830dbc81dSKevin Wolf 
14930dbc81dSKevin Wolf     blk = blk_new(ctx, perm, BLK_PERM_ALL);
150f51d23c8SStefan Hajnoczi 
151f51d23c8SStefan Hajnoczi     if (!fixed_iothread) {
152f51d23c8SStefan Hajnoczi         blk_set_allow_aio_context_change(blk, true);
153f51d23c8SStefan Hajnoczi     }
154f51d23c8SStefan Hajnoczi 
155331170e0SKevin Wolf     ret = blk_insert_bs(blk, bs, errp);
156331170e0SKevin Wolf     if (ret < 0) {
157331170e0SKevin Wolf         goto fail;
158331170e0SKevin Wolf     }
159331170e0SKevin Wolf 
160331170e0SKevin Wolf     if (!export->has_writethrough) {
161331170e0SKevin Wolf         export->writethrough = false;
162331170e0SKevin Wolf     }
163331170e0SKevin Wolf     blk_set_enable_write_cache(blk, !export->writethrough);
164331170e0SKevin Wolf 
165a6ff7989SKevin Wolf     assert(drv->instance_size >= sizeof(BlockExport));
166a6ff7989SKevin Wolf     exp = g_malloc0(drv->instance_size);
167a6ff7989SKevin Wolf     *exp = (BlockExport) {
168a6ff7989SKevin Wolf         .drv        = drv,
169a6ff7989SKevin Wolf         .refcount   = 1,
1703859ad36SKevin Wolf         .user_owned = true,
171d53be9ceSKevin Wolf         .id         = g_strdup(export->id),
172331170e0SKevin Wolf         .ctx        = ctx,
173331170e0SKevin Wolf         .blk        = blk,
174a6ff7989SKevin Wolf     };
175a6ff7989SKevin Wolf 
176a6ff7989SKevin Wolf     ret = drv->create(exp, export, errp);
177a6ff7989SKevin Wolf     if (ret < 0) {
178331170e0SKevin Wolf         goto fail;
179a6ff7989SKevin Wolf     }
180a6ff7989SKevin Wolf 
18137a4f70cSKevin Wolf     assert(exp->blk != NULL);
18237a4f70cSKevin Wolf 
183bc4ee65bSKevin Wolf     QLIST_INSERT_HEAD(&block_exports, exp, next);
184331170e0SKevin Wolf 
185331170e0SKevin Wolf     aio_context_release(ctx);
186a6ff7989SKevin Wolf     return exp;
187331170e0SKevin Wolf 
188331170e0SKevin Wolf fail:
189331170e0SKevin Wolf     blk_unref(blk);
190331170e0SKevin Wolf     aio_context_release(ctx);
191331170e0SKevin Wolf     if (exp) {
192331170e0SKevin Wolf         g_free(exp->id);
193331170e0SKevin Wolf         g_free(exp);
194331170e0SKevin Wolf     }
195331170e0SKevin Wolf     return NULL;
1969b562c64SKevin Wolf }
1979b562c64SKevin Wolf 
1988612c686SKevin Wolf /* Callers must hold exp->ctx lock */
199c69de1beSKevin Wolf void blk_exp_ref(BlockExport *exp)
200c69de1beSKevin Wolf {
201c69de1beSKevin Wolf     assert(exp->refcount > 0);
202c69de1beSKevin Wolf     exp->refcount++;
203c69de1beSKevin Wolf }
204c69de1beSKevin Wolf 
205bc4ee65bSKevin Wolf /* Runs in the main thread */
206bc4ee65bSKevin Wolf static void blk_exp_delete_bh(void *opaque)
207bc4ee65bSKevin Wolf {
208bc4ee65bSKevin Wolf     BlockExport *exp = opaque;
209bc4ee65bSKevin Wolf     AioContext *aio_context = exp->ctx;
210bc4ee65bSKevin Wolf 
211bc4ee65bSKevin Wolf     aio_context_acquire(aio_context);
212bc4ee65bSKevin Wolf 
213bc4ee65bSKevin Wolf     assert(exp->refcount == 0);
214bc4ee65bSKevin Wolf     QLIST_REMOVE(exp, next);
215bc4ee65bSKevin Wolf     exp->drv->delete(exp);
21637a4f70cSKevin Wolf     blk_unref(exp->blk);
2171a9f7a80SKevin Wolf     qapi_event_send_block_export_deleted(exp->id);
218d53be9ceSKevin Wolf     g_free(exp->id);
219bc4ee65bSKevin Wolf     g_free(exp);
220bc4ee65bSKevin Wolf 
221bc4ee65bSKevin Wolf     aio_context_release(aio_context);
222bc4ee65bSKevin Wolf }
223bc4ee65bSKevin Wolf 
2248612c686SKevin Wolf /* Callers must hold exp->ctx lock */
225c69de1beSKevin Wolf void blk_exp_unref(BlockExport *exp)
226c69de1beSKevin Wolf {
227c69de1beSKevin Wolf     assert(exp->refcount > 0);
228c69de1beSKevin Wolf     if (--exp->refcount == 0) {
229bc4ee65bSKevin Wolf         /* Touch the block_exports list only in the main thread */
230bc4ee65bSKevin Wolf         aio_bh_schedule_oneshot(qemu_get_aio_context(), blk_exp_delete_bh,
231bc4ee65bSKevin Wolf                                 exp);
232c69de1beSKevin Wolf     }
233c69de1beSKevin Wolf }
234c69de1beSKevin Wolf 
235bc4ee65bSKevin Wolf /*
236bc4ee65bSKevin Wolf  * Drops the user reference to the export and requests that all client
237bc4ee65bSKevin Wolf  * connections and other internally held references start to shut down. When
238bc4ee65bSKevin Wolf  * the function returns, there may still be active references while the export
239bc4ee65bSKevin Wolf  * is in the process of shutting down.
240bc4ee65bSKevin Wolf  *
241bc4ee65bSKevin Wolf  * Acquires exp->ctx internally. Callers must *not* hold the lock.
242bc4ee65bSKevin Wolf  */
243bc4ee65bSKevin Wolf void blk_exp_request_shutdown(BlockExport *exp)
244bc4ee65bSKevin Wolf {
245bc4ee65bSKevin Wolf     AioContext *aio_context = exp->ctx;
246bc4ee65bSKevin Wolf 
247bc4ee65bSKevin Wolf     aio_context_acquire(aio_context);
2483c3bc462SKevin Wolf 
2493c3bc462SKevin Wolf     /*
2503c3bc462SKevin Wolf      * If the user doesn't own the export any more, it is already shutting
2513c3bc462SKevin Wolf      * down. We must not call .request_shutdown and decrease the refcount a
2523c3bc462SKevin Wolf      * second time.
2533c3bc462SKevin Wolf      */
2543c3bc462SKevin Wolf     if (!exp->user_owned) {
2553c3bc462SKevin Wolf         goto out;
2563c3bc462SKevin Wolf     }
2573c3bc462SKevin Wolf 
258bc4ee65bSKevin Wolf     exp->drv->request_shutdown(exp);
2593859ad36SKevin Wolf 
2603859ad36SKevin Wolf     assert(exp->user_owned);
2613859ad36SKevin Wolf     exp->user_owned = false;
2623859ad36SKevin Wolf     blk_exp_unref(exp);
2633859ad36SKevin Wolf 
2643c3bc462SKevin Wolf out:
265bc4ee65bSKevin Wolf     aio_context_release(aio_context);
266bc4ee65bSKevin Wolf }
267bc4ee65bSKevin Wolf 
268bc4ee65bSKevin Wolf /*
269bc4ee65bSKevin Wolf  * Returns whether a block export of the given type exists.
270bc4ee65bSKevin Wolf  * type == BLOCK_EXPORT_TYPE__MAX checks for an export of any type.
271bc4ee65bSKevin Wolf  */
272bc4ee65bSKevin Wolf static bool blk_exp_has_type(BlockExportType type)
273bc4ee65bSKevin Wolf {
274bc4ee65bSKevin Wolf     BlockExport *exp;
275bc4ee65bSKevin Wolf 
276bc4ee65bSKevin Wolf     if (type == BLOCK_EXPORT_TYPE__MAX) {
277bc4ee65bSKevin Wolf         return !QLIST_EMPTY(&block_exports);
278bc4ee65bSKevin Wolf     }
279bc4ee65bSKevin Wolf 
280bc4ee65bSKevin Wolf     QLIST_FOREACH(exp, &block_exports, next) {
281bc4ee65bSKevin Wolf         if (exp->drv->type == type) {
282bc4ee65bSKevin Wolf             return true;
283bc4ee65bSKevin Wolf         }
284bc4ee65bSKevin Wolf     }
285bc4ee65bSKevin Wolf 
286bc4ee65bSKevin Wolf     return false;
287bc4ee65bSKevin Wolf }
288bc4ee65bSKevin Wolf 
289bc4ee65bSKevin Wolf /* type == BLOCK_EXPORT_TYPE__MAX for all types */
290bc4ee65bSKevin Wolf void blk_exp_close_all_type(BlockExportType type)
291bc4ee65bSKevin Wolf {
292bc4ee65bSKevin Wolf     BlockExport *exp, *next;
293bc4ee65bSKevin Wolf 
294bc4ee65bSKevin Wolf     assert(in_aio_context_home_thread(qemu_get_aio_context()));
295bc4ee65bSKevin Wolf 
296bc4ee65bSKevin Wolf     QLIST_FOREACH_SAFE(exp, &block_exports, next, next) {
297bc4ee65bSKevin Wolf         if (type != BLOCK_EXPORT_TYPE__MAX && exp->drv->type != type) {
298bc4ee65bSKevin Wolf             continue;
299bc4ee65bSKevin Wolf         }
300bc4ee65bSKevin Wolf         blk_exp_request_shutdown(exp);
301bc4ee65bSKevin Wolf     }
302bc4ee65bSKevin Wolf 
303bc4ee65bSKevin Wolf     AIO_WAIT_WHILE(NULL, blk_exp_has_type(type));
304bc4ee65bSKevin Wolf }
305bc4ee65bSKevin Wolf 
306bc4ee65bSKevin Wolf void blk_exp_close_all(void)
307bc4ee65bSKevin Wolf {
308bc4ee65bSKevin Wolf     blk_exp_close_all_type(BLOCK_EXPORT_TYPE__MAX);
309bc4ee65bSKevin Wolf }
310bc4ee65bSKevin Wolf 
3119b562c64SKevin Wolf void qmp_block_export_add(BlockExportOptions *export, Error **errp)
3129b562c64SKevin Wolf {
3139b562c64SKevin Wolf     blk_exp_add(export, errp);
31456ee8626SKevin Wolf }
3153c3bc462SKevin Wolf 
3163c3bc462SKevin Wolf void qmp_block_export_del(const char *id,
3173c3bc462SKevin Wolf                           bool has_mode, BlockExportRemoveMode mode,
3183c3bc462SKevin Wolf                           Error **errp)
3193c3bc462SKevin Wolf {
3203c3bc462SKevin Wolf     ERRP_GUARD();
3213c3bc462SKevin Wolf     BlockExport *exp;
3223c3bc462SKevin Wolf 
3233c3bc462SKevin Wolf     exp = blk_exp_find(id);
3243c3bc462SKevin Wolf     if (exp == NULL) {
3253c3bc462SKevin Wolf         error_setg(errp, "Export '%s' is not found", id);
3263c3bc462SKevin Wolf         return;
3273c3bc462SKevin Wolf     }
3283c3bc462SKevin Wolf     if (!exp->user_owned) {
3293c3bc462SKevin Wolf         error_setg(errp, "Export '%s' is already shutting down", id);
3303c3bc462SKevin Wolf         return;
3313c3bc462SKevin Wolf     }
3323c3bc462SKevin Wolf 
3333c3bc462SKevin Wolf     if (!has_mode) {
3343c3bc462SKevin Wolf         mode = BLOCK_EXPORT_REMOVE_MODE_SAFE;
3353c3bc462SKevin Wolf     }
3363c3bc462SKevin Wolf     if (mode == BLOCK_EXPORT_REMOVE_MODE_SAFE && exp->refcount > 1) {
3373c3bc462SKevin Wolf         error_setg(errp, "export '%s' still in use", exp->id);
3383c3bc462SKevin Wolf         error_append_hint(errp, "Use mode='hard' to force client "
3393c3bc462SKevin Wolf                           "disconnect\n");
3403c3bc462SKevin Wolf         return;
3413c3bc462SKevin Wolf     }
3423c3bc462SKevin Wolf 
3433c3bc462SKevin Wolf     blk_exp_request_shutdown(exp);
3443c3bc462SKevin Wolf }
3458cade320SKevin Wolf 
3468cade320SKevin Wolf BlockExportInfoList *qmp_query_block_exports(Error **errp)
3478cade320SKevin Wolf {
348c3033fd3SEric Blake     BlockExportInfoList *head = NULL, **tail = &head;
3498cade320SKevin Wolf     BlockExport *exp;
3508cade320SKevin Wolf 
3518cade320SKevin Wolf     QLIST_FOREACH(exp, &block_exports, next) {
3528cade320SKevin Wolf         BlockExportInfo *info = g_new(BlockExportInfo, 1);
3538cade320SKevin Wolf         *info = (BlockExportInfo) {
3548cade320SKevin Wolf             .id             = g_strdup(exp->id),
3558cade320SKevin Wolf             .type           = exp->drv->type,
3568cade320SKevin Wolf             .node_name      = g_strdup(bdrv_get_node_name(blk_bs(exp->blk))),
3578cade320SKevin Wolf             .shutting_down  = !exp->user_owned,
3588cade320SKevin Wolf         };
3598cade320SKevin Wolf 
360c3033fd3SEric Blake         QAPI_LIST_APPEND(tail, info);
3618cade320SKevin Wolf     }
3628cade320SKevin Wolf 
3638cade320SKevin Wolf     return head;
3648cade320SKevin Wolf }
365