12a9e2e59SSteve Sistare /*
22a9e2e59SSteve Sistare * Copyright (c) 2021-2023 Oracle and/or its affiliates.
32a9e2e59SSteve Sistare *
42a9e2e59SSteve Sistare * This work is licensed under the terms of the GNU GPL, version 2 or later.
52a9e2e59SSteve Sistare * See the COPYING file in the top-level directory.
62a9e2e59SSteve Sistare */
72a9e2e59SSteve Sistare
82a9e2e59SSteve Sistare #include "qemu/osdep.h"
9d117ed06SFabiano Rosas #include "exec/ramblock.h"
10385f510dSSteve Sistare #include "qemu/cutils.h"
112dd7ee7aSFabiano Rosas #include "qemu/error-report.h"
12385f510dSSteve Sistare #include "qapi/error.h"
132a9e2e59SSteve Sistare #include "channel.h"
142a9e2e59SSteve Sistare #include "file.h"
152a9e2e59SSteve Sistare #include "migration.h"
162a9e2e59SSteve Sistare #include "io/channel-file.h"
1773f6f9a1SFabiano Rosas #include "io/channel-socket.h"
182a9e2e59SSteve Sistare #include "io/channel-util.h"
192dd7ee7aSFabiano Rosas #include "options.h"
202a9e2e59SSteve Sistare #include "trace.h"
212a9e2e59SSteve Sistare
/* Marker that introduces the offset option inside a file URI spec. */
#define OFFSET_OPTION ",offset="
23385f510dSSteve Sistare
/*
 * Outgoing-side state: filled in by file_start_outgoing_migration(),
 * read by file_send_channel_create() and released by
 * file_cleanup_outgoing_migration().
 */
static struct FileOutgoingArgs {
    /* g_strdup()'ed path of the migration file, or NULL when unset */
    char *fname;
} outgoing_args;
27b7b03eb6SFabiano Rosas
28385f510dSSteve Sistare /* Remove the offset option from @filespec and return it in @offsetp. */
29385f510dSSteve Sistare
file_parse_offset(char * filespec,uint64_t * offsetp,Error ** errp)3072a8192eSHet Gala int file_parse_offset(char *filespec, uint64_t *offsetp, Error **errp)
31385f510dSSteve Sistare {
32385f510dSSteve Sistare char *option = strstr(filespec, OFFSET_OPTION);
33385f510dSSteve Sistare int ret;
34385f510dSSteve Sistare
35385f510dSSteve Sistare if (option) {
36385f510dSSteve Sistare *option = 0;
37385f510dSSteve Sistare option += sizeof(OFFSET_OPTION) - 1;
38385f510dSSteve Sistare ret = qemu_strtosz(option, NULL, offsetp);
39385f510dSSteve Sistare if (ret) {
40385f510dSSteve Sistare error_setg_errno(errp, -ret, "file URI has bad offset %s", option);
41385f510dSSteve Sistare return -1;
42385f510dSSteve Sistare }
43385f510dSSteve Sistare }
44385f510dSSteve Sistare return 0;
45385f510dSSteve Sistare }
46385f510dSSteve Sistare
file_cleanup_outgoing_migration(void)47b7b03eb6SFabiano Rosas void file_cleanup_outgoing_migration(void)
48b7b03eb6SFabiano Rosas {
49b7b03eb6SFabiano Rosas g_free(outgoing_args.fname);
50b7b03eb6SFabiano Rosas outgoing_args.fname = NULL;
51b7b03eb6SFabiano Rosas }
52b7b03eb6SFabiano Rosas
/*
 * Add O_DIRECT to the open(2) flags pointed to by @flags.
 *
 * Must not be reached on hosts that do not define O_DIRECT.
 */
static void file_enable_direct_io(int *flags)
{
#ifndef O_DIRECT
    /* it should have been rejected when setting the parameter */
    g_assert_not_reached();
#else
    *flags = *flags | O_DIRECT;
#endif
}
629d70239eSFabiano Rosas
file_send_channel_create(gpointer opaque,Error ** errp)63b7b03eb6SFabiano Rosas bool file_send_channel_create(gpointer opaque, Error **errp)
64b7b03eb6SFabiano Rosas {
65b7b03eb6SFabiano Rosas QIOChannelFile *ioc;
66b7b03eb6SFabiano Rosas int flags = O_WRONLY;
67bd4480b0SFabiano Rosas bool ret = true;
68b7b03eb6SFabiano Rosas
699d70239eSFabiano Rosas if (migrate_direct_io()) {
709d70239eSFabiano Rosas /*
719d70239eSFabiano Rosas * Enable O_DIRECT for the secondary channels. These are used
729d70239eSFabiano Rosas * for sending ram pages and writes should be guaranteed to be
739d70239eSFabiano Rosas * aligned to at least page size.
749d70239eSFabiano Rosas */
759d70239eSFabiano Rosas file_enable_direct_io(&flags);
769d70239eSFabiano Rosas }
779d70239eSFabiano Rosas
78b7b03eb6SFabiano Rosas ioc = qio_channel_file_new_path(outgoing_args.fname, flags, 0, errp);
79b7b03eb6SFabiano Rosas if (!ioc) {
80bd4480b0SFabiano Rosas ret = false;
81b7b03eb6SFabiano Rosas goto out;
82b7b03eb6SFabiano Rosas }
83b7b03eb6SFabiano Rosas
84b7b03eb6SFabiano Rosas multifd_channel_connect(opaque, QIO_CHANNEL(ioc));
85b7b03eb6SFabiano Rosas
86b7b03eb6SFabiano Rosas out:
87b7b03eb6SFabiano Rosas /*
88b7b03eb6SFabiano Rosas * File channel creation is synchronous. However posting this
89b7b03eb6SFabiano Rosas * semaphore here is simpler than adding a special case.
90b7b03eb6SFabiano Rosas */
91b7b03eb6SFabiano Rosas multifd_send_channel_created();
92b7b03eb6SFabiano Rosas
93b7b03eb6SFabiano Rosas return ret;
94b7b03eb6SFabiano Rosas }
95b7b03eb6SFabiano Rosas
file_start_outgoing_migration(MigrationState * s,FileMigrationArgs * file_args,Error ** errp)9602afba63SFabiano Rosas void file_start_outgoing_migration(MigrationState *s,
9702afba63SFabiano Rosas FileMigrationArgs *file_args, Error **errp)
982a9e2e59SSteve Sistare {
992a9e2e59SSteve Sistare g_autoptr(QIOChannelFile) fioc = NULL;
10002afba63SFabiano Rosas g_autofree char *filename = g_strdup(file_args->filename);
10102afba63SFabiano Rosas uint64_t offset = file_args->offset;
1022a9e2e59SSteve Sistare QIOChannel *ioc;
1032a9e2e59SSteve Sistare
1042a9e2e59SSteve Sistare trace_migration_file_outgoing(filename);
1052a9e2e59SSteve Sistare
1066d327965SFabiano Rosas fioc = qio_channel_file_new_path(filename, O_CREAT | O_WRONLY, 0600, errp);
1072a9e2e59SSteve Sistare if (!fioc) {
1082a9e2e59SSteve Sistare return;
1092a9e2e59SSteve Sistare }
1102a9e2e59SSteve Sistare
1116d327965SFabiano Rosas if (ftruncate(fioc->fd, offset)) {
1126d327965SFabiano Rosas error_setg_errno(errp, errno,
1136d327965SFabiano Rosas "failed to truncate migration file to offset %" PRIx64,
1146d327965SFabiano Rosas offset);
1156d327965SFabiano Rosas return;
1166d327965SFabiano Rosas }
1176d327965SFabiano Rosas
118b7b03eb6SFabiano Rosas outgoing_args.fname = g_strdup(filename);
119b7b03eb6SFabiano Rosas
1202a9e2e59SSteve Sistare ioc = QIO_CHANNEL(fioc);
121385f510dSSteve Sistare if (offset && qio_channel_io_seek(ioc, offset, SEEK_SET, errp) < 0) {
122385f510dSSteve Sistare return;
123385f510dSSteve Sistare }
1242a9e2e59SSteve Sistare qio_channel_set_name(ioc, "migration-file-outgoing");
1252a9e2e59SSteve Sistare migration_channel_connect(s, ioc, NULL, NULL);
1262a9e2e59SSteve Sistare }
1272a9e2e59SSteve Sistare
file_accept_incoming_migration(QIOChannel * ioc,GIOCondition condition,gpointer opaque)1282a9e2e59SSteve Sistare static gboolean file_accept_incoming_migration(QIOChannel *ioc,
1292a9e2e59SSteve Sistare GIOCondition condition,
1302a9e2e59SSteve Sistare gpointer opaque)
1312a9e2e59SSteve Sistare {
1322a9e2e59SSteve Sistare migration_channel_process_incoming(ioc);
1332a9e2e59SSteve Sistare object_unref(OBJECT(ioc));
1342a9e2e59SSteve Sistare return G_SOURCE_REMOVE;
1352a9e2e59SSteve Sistare }
1362a9e2e59SSteve Sistare
file_create_incoming_channels(QIOChannel * ioc,char * filename,Error ** errp)1379d70239eSFabiano Rosas static void file_create_incoming_channels(QIOChannel *ioc, char *filename,
1389d70239eSFabiano Rosas Error **errp)
13974228c59SFabiano Rosas {
1409d70239eSFabiano Rosas int i, channels = 1;
14174228c59SFabiano Rosas g_autofree QIOChannel **iocs = NULL;
1429d70239eSFabiano Rosas int flags = O_RDONLY;
14374228c59SFabiano Rosas
14474228c59SFabiano Rosas if (migrate_multifd()) {
14574228c59SFabiano Rosas channels += migrate_multifd_channels();
1469d70239eSFabiano Rosas if (migrate_direct_io()) {
1479d70239eSFabiano Rosas file_enable_direct_io(&flags);
1489d70239eSFabiano Rosas }
14974228c59SFabiano Rosas }
15074228c59SFabiano Rosas
15174228c59SFabiano Rosas iocs = g_new0(QIOChannel *, channels);
15274228c59SFabiano Rosas iocs[0] = ioc;
15374228c59SFabiano Rosas
15474228c59SFabiano Rosas for (i = 1; i < channels; i++) {
1559d70239eSFabiano Rosas QIOChannelFile *fioc = qio_channel_file_new_path(filename, flags, 0, errp);
15674228c59SFabiano Rosas
15774228c59SFabiano Rosas if (!fioc) {
15874228c59SFabiano Rosas while (i) {
15974228c59SFabiano Rosas object_unref(iocs[--i]);
16074228c59SFabiano Rosas }
16174228c59SFabiano Rosas return;
16274228c59SFabiano Rosas }
16374228c59SFabiano Rosas
16474228c59SFabiano Rosas iocs[i] = QIO_CHANNEL(fioc);
16574228c59SFabiano Rosas }
16674228c59SFabiano Rosas
16774228c59SFabiano Rosas for (i = 0; i < channels; i++) {
16874228c59SFabiano Rosas qio_channel_set_name(iocs[i], "migration-file-incoming");
16974228c59SFabiano Rosas qio_channel_add_watch_full(iocs[i], G_IO_IN,
17074228c59SFabiano Rosas file_accept_incoming_migration,
17174228c59SFabiano Rosas NULL, NULL,
17274228c59SFabiano Rosas g_main_context_get_thread_default());
17374228c59SFabiano Rosas }
17474228c59SFabiano Rosas }
17574228c59SFabiano Rosas
file_start_incoming_migration(FileMigrationArgs * file_args,Error ** errp)17602afba63SFabiano Rosas void file_start_incoming_migration(FileMigrationArgs *file_args, Error **errp)
1772a9e2e59SSteve Sistare {
17802afba63SFabiano Rosas g_autofree char *filename = g_strdup(file_args->filename);
1792a9e2e59SSteve Sistare QIOChannelFile *fioc = NULL;
18002afba63SFabiano Rosas uint64_t offset = file_args->offset;
1812a9e2e59SSteve Sistare
1822a9e2e59SSteve Sistare trace_migration_file_incoming(filename);
1832a9e2e59SSteve Sistare
1842a9e2e59SSteve Sistare fioc = qio_channel_file_new_path(filename, O_RDONLY, 0, errp);
1852a9e2e59SSteve Sistare if (!fioc) {
1862a9e2e59SSteve Sistare return;
1872a9e2e59SSteve Sistare }
1882a9e2e59SSteve Sistare
1892dd7ee7aSFabiano Rosas if (offset &&
1902dd7ee7aSFabiano Rosas qio_channel_io_seek(QIO_CHANNEL(fioc), offset, SEEK_SET, errp) < 0) {
19174228c59SFabiano Rosas object_unref(OBJECT(fioc));
192385f510dSSteve Sistare return;
193385f510dSSteve Sistare }
1942dd7ee7aSFabiano Rosas
1959d70239eSFabiano Rosas file_create_incoming_channels(QIO_CHANNEL(fioc), filename, errp);
1962a9e2e59SSteve Sistare }
197f427d90bSFabiano Rosas
file_write_ramblock_iov(QIOChannel * ioc,const struct iovec * iov,int niov,MultiFDPages_t * pages,Error ** errp)198f427d90bSFabiano Rosas int file_write_ramblock_iov(QIOChannel *ioc, const struct iovec *iov,
199*112f7d1bSFabiano Rosas int niov, MultiFDPages_t *pages, Error **errp)
200f427d90bSFabiano Rosas {
20144fe138eSFabiano Rosas ssize_t ret = 0;
202f427d90bSFabiano Rosas int i, slice_idx, slice_num;
203f427d90bSFabiano Rosas uintptr_t base, next, offset;
204f427d90bSFabiano Rosas size_t len;
205*112f7d1bSFabiano Rosas RAMBlock *block = pages->block;
206f427d90bSFabiano Rosas
207f427d90bSFabiano Rosas slice_idx = 0;
208f427d90bSFabiano Rosas slice_num = 1;
209f427d90bSFabiano Rosas
210f427d90bSFabiano Rosas /*
211f427d90bSFabiano Rosas * If the iov array doesn't have contiguous elements, we need to
212f427d90bSFabiano Rosas * split it in slices because we only have one file offset for the
213f427d90bSFabiano Rosas * whole iov. Do this here so callers don't need to break the iov
214f427d90bSFabiano Rosas * array themselves.
215f427d90bSFabiano Rosas */
216f427d90bSFabiano Rosas for (i = 0; i < niov; i++, slice_num++) {
217f427d90bSFabiano Rosas base = (uintptr_t) iov[i].iov_base;
218f427d90bSFabiano Rosas
219f427d90bSFabiano Rosas if (i != niov - 1) {
220f427d90bSFabiano Rosas len = iov[i].iov_len;
221f427d90bSFabiano Rosas next = (uintptr_t) iov[i + 1].iov_base;
222f427d90bSFabiano Rosas
223f427d90bSFabiano Rosas if (base + len == next) {
224f427d90bSFabiano Rosas continue;
225f427d90bSFabiano Rosas }
226f427d90bSFabiano Rosas }
227f427d90bSFabiano Rosas
228f427d90bSFabiano Rosas /*
229f427d90bSFabiano Rosas * Use the offset of the first element of the segment that
230f427d90bSFabiano Rosas * we're sending.
231f427d90bSFabiano Rosas */
232f427d90bSFabiano Rosas offset = (uintptr_t) iov[slice_idx].iov_base - (uintptr_t) block->host;
233f427d90bSFabiano Rosas if (offset >= block->used_length) {
234a1bb5dd1SAnthony PERARD error_setg(errp, "offset %" PRIxPTR
235f427d90bSFabiano Rosas "outside of ramblock %s range", offset, block->idstr);
236f427d90bSFabiano Rosas ret = -1;
237f427d90bSFabiano Rosas break;
238f427d90bSFabiano Rosas }
239f427d90bSFabiano Rosas
240f427d90bSFabiano Rosas ret = qio_channel_pwritev(ioc, &iov[slice_idx], slice_num,
241f427d90bSFabiano Rosas block->pages_offset + offset, errp);
242f427d90bSFabiano Rosas if (ret < 0) {
243f427d90bSFabiano Rosas break;
244f427d90bSFabiano Rosas }
245f427d90bSFabiano Rosas
246f427d90bSFabiano Rosas slice_idx += slice_num;
247f427d90bSFabiano Rosas slice_num = 0;
248f427d90bSFabiano Rosas }
249f427d90bSFabiano Rosas
250f427d90bSFabiano Rosas return (ret < 0) ? ret : 0;
251f427d90bSFabiano Rosas }
252a49d15a3SFabiano Rosas
multifd_file_recv_data(MultiFDRecvParams * p,Error ** errp)253a49d15a3SFabiano Rosas int multifd_file_recv_data(MultiFDRecvParams *p, Error **errp)
254a49d15a3SFabiano Rosas {
255a49d15a3SFabiano Rosas MultiFDRecvData *data = p->data;
256a49d15a3SFabiano Rosas size_t ret;
257a49d15a3SFabiano Rosas
258a49d15a3SFabiano Rosas ret = qio_channel_pread(p->c, (char *) data->opaque,
259a49d15a3SFabiano Rosas data->size, data->file_offset, errp);
260a49d15a3SFabiano Rosas if (ret != data->size) {
261a49d15a3SFabiano Rosas error_prepend(errp,
262a49d15a3SFabiano Rosas "multifd recv (%u): read 0x%zx, expected 0x%zx",
263a49d15a3SFabiano Rosas p->id, ret, data->size);
264a49d15a3SFabiano Rosas return -1;
265a49d15a3SFabiano Rosas }
266a49d15a3SFabiano Rosas
267a49d15a3SFabiano Rosas return 0;
268a49d15a3SFabiano Rosas }
269