xref: /openbmc/qemu/migration/file.c (revision becd69449791c747100d57dfba24e19be82cff39)
12a9e2e59SSteve Sistare /*
22a9e2e59SSteve Sistare  * Copyright (c) 2021-2023 Oracle and/or its affiliates.
32a9e2e59SSteve Sistare  *
42a9e2e59SSteve Sistare  * This work is licensed under the terms of the GNU GPL, version 2 or later.
52a9e2e59SSteve Sistare  * See the COPYING file in the top-level directory.
62a9e2e59SSteve Sistare  */
72a9e2e59SSteve Sistare 
82a9e2e59SSteve Sistare #include "qemu/osdep.h"
9d117ed06SFabiano Rosas #include "exec/ramblock.h"
10385f510dSSteve Sistare #include "qemu/cutils.h"
112dd7ee7aSFabiano Rosas #include "qemu/error-report.h"
12385f510dSSteve Sistare #include "qapi/error.h"
132a9e2e59SSteve Sistare #include "channel.h"
142a9e2e59SSteve Sistare #include "file.h"
152a9e2e59SSteve Sistare #include "migration.h"
162a9e2e59SSteve Sistare #include "io/channel-file.h"
1773f6f9a1SFabiano Rosas #include "io/channel-socket.h"
182a9e2e59SSteve Sistare #include "io/channel-util.h"
192dd7ee7aSFabiano Rosas #include "options.h"
202a9e2e59SSteve Sistare #include "trace.h"
212a9e2e59SSteve Sistare 
22385f510dSSteve Sistare #define OFFSET_OPTION ",offset="
23385f510dSSteve Sistare 
/*
 * State kept for the duration of an outgoing file migration.
 *
 * @fname is a heap copy of the migration file path.  It is stored by
 * file_start_outgoing_migration(), read by file_send_channel_create() to
 * open additional channels on the same file, and released by
 * file_cleanup_outgoing_migration().
 */
struct FileOutgoingArgs {
    char *fname;
};

static struct FileOutgoingArgs outgoing_args;
27b7b03eb6SFabiano Rosas 
28385f510dSSteve Sistare /* Remove the offset option from @filespec and return it in @offsetp. */
29385f510dSSteve Sistare 
file_parse_offset(char * filespec,uint64_t * offsetp,Error ** errp)3072a8192eSHet Gala int file_parse_offset(char *filespec, uint64_t *offsetp, Error **errp)
31385f510dSSteve Sistare {
32385f510dSSteve Sistare     char *option = strstr(filespec, OFFSET_OPTION);
33385f510dSSteve Sistare     int ret;
34385f510dSSteve Sistare 
35385f510dSSteve Sistare     if (option) {
36385f510dSSteve Sistare         *option = 0;
37385f510dSSteve Sistare         option += sizeof(OFFSET_OPTION) - 1;
38385f510dSSteve Sistare         ret = qemu_strtosz(option, NULL, offsetp);
39385f510dSSteve Sistare         if (ret) {
40385f510dSSteve Sistare             error_setg_errno(errp, -ret, "file URI has bad offset %s", option);
41385f510dSSteve Sistare             return -1;
42385f510dSSteve Sistare         }
43385f510dSSteve Sistare     }
44385f510dSSteve Sistare     return 0;
45385f510dSSteve Sistare }
46385f510dSSteve Sistare 
file_cleanup_outgoing_migration(void)47b7b03eb6SFabiano Rosas void file_cleanup_outgoing_migration(void)
48b7b03eb6SFabiano Rosas {
49b7b03eb6SFabiano Rosas     g_free(outgoing_args.fname);
50b7b03eb6SFabiano Rosas     outgoing_args.fname = NULL;
51b7b03eb6SFabiano Rosas }
52b7b03eb6SFabiano Rosas 
/*
 * Add O_DIRECT to the open flags pointed to by @flags.
 *
 * When the host does not define O_DIRECT, reaching this function is
 * treated as a programming error and asserts.
 */
static void file_enable_direct_io(int *flags)
{
#ifndef O_DIRECT
    /* it should have been rejected when setting the parameter */
    g_assert_not_reached();
#else
    *flags = *flags | O_DIRECT;
#endif
}
629d70239eSFabiano Rosas 
file_send_channel_create(gpointer opaque,Error ** errp)63b7b03eb6SFabiano Rosas bool file_send_channel_create(gpointer opaque, Error **errp)
64b7b03eb6SFabiano Rosas {
65b7b03eb6SFabiano Rosas     QIOChannelFile *ioc;
66b7b03eb6SFabiano Rosas     int flags = O_WRONLY;
67bd4480b0SFabiano Rosas     bool ret = true;
68b7b03eb6SFabiano Rosas 
699d70239eSFabiano Rosas     if (migrate_direct_io()) {
709d70239eSFabiano Rosas         /*
719d70239eSFabiano Rosas          * Enable O_DIRECT for the secondary channels. These are used
729d70239eSFabiano Rosas          * for sending ram pages and writes should be guaranteed to be
739d70239eSFabiano Rosas          * aligned to at least page size.
749d70239eSFabiano Rosas          */
759d70239eSFabiano Rosas         file_enable_direct_io(&flags);
769d70239eSFabiano Rosas     }
779d70239eSFabiano Rosas 
78b7b03eb6SFabiano Rosas     ioc = qio_channel_file_new_path(outgoing_args.fname, flags, 0, errp);
79b7b03eb6SFabiano Rosas     if (!ioc) {
80bd4480b0SFabiano Rosas         ret = false;
81b7b03eb6SFabiano Rosas         goto out;
82b7b03eb6SFabiano Rosas     }
83b7b03eb6SFabiano Rosas 
84b7b03eb6SFabiano Rosas     multifd_channel_connect(opaque, QIO_CHANNEL(ioc));
85b7b03eb6SFabiano Rosas 
86b7b03eb6SFabiano Rosas out:
87b7b03eb6SFabiano Rosas     /*
88b7b03eb6SFabiano Rosas      * File channel creation is synchronous. However posting this
89b7b03eb6SFabiano Rosas      * semaphore here is simpler than adding a special case.
90b7b03eb6SFabiano Rosas      */
91b7b03eb6SFabiano Rosas     multifd_send_channel_created();
92b7b03eb6SFabiano Rosas 
93b7b03eb6SFabiano Rosas     return ret;
94b7b03eb6SFabiano Rosas }
95b7b03eb6SFabiano Rosas 
file_start_outgoing_migration(MigrationState * s,FileMigrationArgs * file_args,Error ** errp)9602afba63SFabiano Rosas void file_start_outgoing_migration(MigrationState *s,
9702afba63SFabiano Rosas                                    FileMigrationArgs *file_args, Error **errp)
982a9e2e59SSteve Sistare {
992a9e2e59SSteve Sistare     g_autoptr(QIOChannelFile) fioc = NULL;
10002afba63SFabiano Rosas     g_autofree char *filename = g_strdup(file_args->filename);
10102afba63SFabiano Rosas     uint64_t offset = file_args->offset;
1022a9e2e59SSteve Sistare     QIOChannel *ioc;
1032a9e2e59SSteve Sistare 
1042a9e2e59SSteve Sistare     trace_migration_file_outgoing(filename);
1052a9e2e59SSteve Sistare 
1066d327965SFabiano Rosas     fioc = qio_channel_file_new_path(filename, O_CREAT | O_WRONLY, 0600, errp);
1072a9e2e59SSteve Sistare     if (!fioc) {
1082a9e2e59SSteve Sistare         return;
1092a9e2e59SSteve Sistare     }
1102a9e2e59SSteve Sistare 
1116d327965SFabiano Rosas     if (ftruncate(fioc->fd, offset)) {
1126d327965SFabiano Rosas         error_setg_errno(errp, errno,
1136d327965SFabiano Rosas                          "failed to truncate migration file to offset %" PRIx64,
1146d327965SFabiano Rosas                          offset);
1156d327965SFabiano Rosas         return;
1166d327965SFabiano Rosas     }
1176d327965SFabiano Rosas 
118b7b03eb6SFabiano Rosas     outgoing_args.fname = g_strdup(filename);
119b7b03eb6SFabiano Rosas 
1202a9e2e59SSteve Sistare     ioc = QIO_CHANNEL(fioc);
121385f510dSSteve Sistare     if (offset && qio_channel_io_seek(ioc, offset, SEEK_SET, errp) < 0) {
122385f510dSSteve Sistare         return;
123385f510dSSteve Sistare     }
1242a9e2e59SSteve Sistare     qio_channel_set_name(ioc, "migration-file-outgoing");
1252a9e2e59SSteve Sistare     migration_channel_connect(s, ioc, NULL, NULL);
1262a9e2e59SSteve Sistare }
1272a9e2e59SSteve Sistare 
file_accept_incoming_migration(QIOChannel * ioc,GIOCondition condition,gpointer opaque)1282a9e2e59SSteve Sistare static gboolean file_accept_incoming_migration(QIOChannel *ioc,
1292a9e2e59SSteve Sistare                                                GIOCondition condition,
1302a9e2e59SSteve Sistare                                                gpointer opaque)
1312a9e2e59SSteve Sistare {
1322a9e2e59SSteve Sistare     migration_channel_process_incoming(ioc);
1332a9e2e59SSteve Sistare     object_unref(OBJECT(ioc));
1342a9e2e59SSteve Sistare     return G_SOURCE_REMOVE;
1352a9e2e59SSteve Sistare }
1362a9e2e59SSteve Sistare 
file_create_incoming_channels(QIOChannel * ioc,char * filename,Error ** errp)1379d70239eSFabiano Rosas static void file_create_incoming_channels(QIOChannel *ioc, char *filename,
1389d70239eSFabiano Rosas                                           Error **errp)
13974228c59SFabiano Rosas {
1409d70239eSFabiano Rosas     int i, channels = 1;
14174228c59SFabiano Rosas     g_autofree QIOChannel **iocs = NULL;
1429d70239eSFabiano Rosas     int flags = O_RDONLY;
14374228c59SFabiano Rosas 
14474228c59SFabiano Rosas     if (migrate_multifd()) {
14574228c59SFabiano Rosas         channels += migrate_multifd_channels();
1469d70239eSFabiano Rosas         if (migrate_direct_io()) {
1479d70239eSFabiano Rosas             file_enable_direct_io(&flags);
1489d70239eSFabiano Rosas         }
14974228c59SFabiano Rosas     }
15074228c59SFabiano Rosas 
15174228c59SFabiano Rosas     iocs = g_new0(QIOChannel *, channels);
15274228c59SFabiano Rosas     iocs[0] = ioc;
15374228c59SFabiano Rosas 
15474228c59SFabiano Rosas     for (i = 1; i < channels; i++) {
1559d70239eSFabiano Rosas         QIOChannelFile *fioc = qio_channel_file_new_path(filename, flags, 0, errp);
15674228c59SFabiano Rosas 
15774228c59SFabiano Rosas         if (!fioc) {
15874228c59SFabiano Rosas             while (i) {
15974228c59SFabiano Rosas                 object_unref(iocs[--i]);
16074228c59SFabiano Rosas             }
16174228c59SFabiano Rosas             return;
16274228c59SFabiano Rosas         }
16374228c59SFabiano Rosas 
16474228c59SFabiano Rosas         iocs[i] = QIO_CHANNEL(fioc);
16574228c59SFabiano Rosas     }
16674228c59SFabiano Rosas 
16774228c59SFabiano Rosas     for (i = 0; i < channels; i++) {
16874228c59SFabiano Rosas         qio_channel_set_name(iocs[i], "migration-file-incoming");
16974228c59SFabiano Rosas         qio_channel_add_watch_full(iocs[i], G_IO_IN,
17074228c59SFabiano Rosas                                    file_accept_incoming_migration,
17174228c59SFabiano Rosas                                    NULL, NULL,
17274228c59SFabiano Rosas                                    g_main_context_get_thread_default());
17374228c59SFabiano Rosas     }
17474228c59SFabiano Rosas }
17574228c59SFabiano Rosas 
file_start_incoming_migration(FileMigrationArgs * file_args,Error ** errp)17602afba63SFabiano Rosas void file_start_incoming_migration(FileMigrationArgs *file_args, Error **errp)
1772a9e2e59SSteve Sistare {
17802afba63SFabiano Rosas     g_autofree char *filename = g_strdup(file_args->filename);
1792a9e2e59SSteve Sistare     QIOChannelFile *fioc = NULL;
18002afba63SFabiano Rosas     uint64_t offset = file_args->offset;
1812a9e2e59SSteve Sistare 
1822a9e2e59SSteve Sistare     trace_migration_file_incoming(filename);
1832a9e2e59SSteve Sistare 
1842a9e2e59SSteve Sistare     fioc = qio_channel_file_new_path(filename, O_RDONLY, 0, errp);
1852a9e2e59SSteve Sistare     if (!fioc) {
1862a9e2e59SSteve Sistare         return;
1872a9e2e59SSteve Sistare     }
1882a9e2e59SSteve Sistare 
1892dd7ee7aSFabiano Rosas     if (offset &&
1902dd7ee7aSFabiano Rosas         qio_channel_io_seek(QIO_CHANNEL(fioc), offset, SEEK_SET, errp) < 0) {
19174228c59SFabiano Rosas         object_unref(OBJECT(fioc));
192385f510dSSteve Sistare         return;
193385f510dSSteve Sistare     }
1942dd7ee7aSFabiano Rosas 
1959d70239eSFabiano Rosas     file_create_incoming_channels(QIO_CHANNEL(fioc), filename, errp);
1962a9e2e59SSteve Sistare }
197f427d90bSFabiano Rosas 
file_write_ramblock_iov(QIOChannel * ioc,const struct iovec * iov,int niov,MultiFDPages_t * pages,Error ** errp)198f427d90bSFabiano Rosas int file_write_ramblock_iov(QIOChannel *ioc, const struct iovec *iov,
199*112f7d1bSFabiano Rosas                             int niov, MultiFDPages_t *pages, Error **errp)
200f427d90bSFabiano Rosas {
20144fe138eSFabiano Rosas     ssize_t ret = 0;
202f427d90bSFabiano Rosas     int i, slice_idx, slice_num;
203f427d90bSFabiano Rosas     uintptr_t base, next, offset;
204f427d90bSFabiano Rosas     size_t len;
205*112f7d1bSFabiano Rosas     RAMBlock *block = pages->block;
206f427d90bSFabiano Rosas 
207f427d90bSFabiano Rosas     slice_idx = 0;
208f427d90bSFabiano Rosas     slice_num = 1;
209f427d90bSFabiano Rosas 
210f427d90bSFabiano Rosas     /*
211f427d90bSFabiano Rosas      * If the iov array doesn't have contiguous elements, we need to
212f427d90bSFabiano Rosas      * split it in slices because we only have one file offset for the
213f427d90bSFabiano Rosas      * whole iov. Do this here so callers don't need to break the iov
214f427d90bSFabiano Rosas      * array themselves.
215f427d90bSFabiano Rosas      */
216f427d90bSFabiano Rosas     for (i = 0; i < niov; i++, slice_num++) {
217f427d90bSFabiano Rosas         base = (uintptr_t) iov[i].iov_base;
218f427d90bSFabiano Rosas 
219f427d90bSFabiano Rosas         if (i != niov - 1) {
220f427d90bSFabiano Rosas             len = iov[i].iov_len;
221f427d90bSFabiano Rosas             next = (uintptr_t) iov[i + 1].iov_base;
222f427d90bSFabiano Rosas 
223f427d90bSFabiano Rosas             if (base + len == next) {
224f427d90bSFabiano Rosas                 continue;
225f427d90bSFabiano Rosas             }
226f427d90bSFabiano Rosas         }
227f427d90bSFabiano Rosas 
228f427d90bSFabiano Rosas         /*
229f427d90bSFabiano Rosas          * Use the offset of the first element of the segment that
230f427d90bSFabiano Rosas          * we're sending.
231f427d90bSFabiano Rosas          */
232f427d90bSFabiano Rosas         offset = (uintptr_t) iov[slice_idx].iov_base - (uintptr_t) block->host;
233f427d90bSFabiano Rosas         if (offset >= block->used_length) {
234a1bb5dd1SAnthony PERARD             error_setg(errp, "offset %" PRIxPTR
235f427d90bSFabiano Rosas                        "outside of ramblock %s range", offset, block->idstr);
236f427d90bSFabiano Rosas             ret = -1;
237f427d90bSFabiano Rosas             break;
238f427d90bSFabiano Rosas         }
239f427d90bSFabiano Rosas 
240f427d90bSFabiano Rosas         ret = qio_channel_pwritev(ioc, &iov[slice_idx], slice_num,
241f427d90bSFabiano Rosas                                   block->pages_offset + offset, errp);
242f427d90bSFabiano Rosas         if (ret < 0) {
243f427d90bSFabiano Rosas             break;
244f427d90bSFabiano Rosas         }
245f427d90bSFabiano Rosas 
246f427d90bSFabiano Rosas         slice_idx += slice_num;
247f427d90bSFabiano Rosas         slice_num = 0;
248f427d90bSFabiano Rosas     }
249f427d90bSFabiano Rosas 
250f427d90bSFabiano Rosas     return (ret < 0) ? ret : 0;
251f427d90bSFabiano Rosas }
252a49d15a3SFabiano Rosas 
multifd_file_recv_data(MultiFDRecvParams * p,Error ** errp)253a49d15a3SFabiano Rosas int multifd_file_recv_data(MultiFDRecvParams *p, Error **errp)
254a49d15a3SFabiano Rosas {
255a49d15a3SFabiano Rosas     MultiFDRecvData *data = p->data;
256a49d15a3SFabiano Rosas     size_t ret;
257a49d15a3SFabiano Rosas 
258a49d15a3SFabiano Rosas     ret = qio_channel_pread(p->c, (char *) data->opaque,
259a49d15a3SFabiano Rosas                             data->size, data->file_offset, errp);
260a49d15a3SFabiano Rosas     if (ret != data->size) {
261a49d15a3SFabiano Rosas         error_prepend(errp,
262a49d15a3SFabiano Rosas                       "multifd recv (%u): read 0x%zx, expected 0x%zx",
263a49d15a3SFabiano Rosas                       p->id, ret, data->size);
264a49d15a3SFabiano Rosas         return -1;
265a49d15a3SFabiano Rosas     }
266a49d15a3SFabiano Rosas 
267a49d15a3SFabiano Rosas     return 0;
268a49d15a3SFabiano Rosas }
269