xref: /openbmc/linux/arch/um/drivers/virtio_uml.c (revision abdeb4fa)
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  * Virtio vhost-user driver
4  *
5  * Copyright(c) 2019 Intel Corporation
6  *
7  * This driver allows virtio devices to be used over a vhost-user socket.
8  *
9  * Guest devices can be instantiated by kernel module or command line
10  * parameters. One device will be created for each parameter. Syntax:
11  *
12  *		virtio_uml.device=<socket>:<virtio_id>[:<platform_id>]
13  * where:
14  *		<socket>	:= vhost-user socket path to connect
15  *		<virtio_id>	:= virtio device id (as in virtio_ids.h)
16  *		<platform_id>	:= (optional) platform device id
17  *
18  * example:
19  *		virtio_uml.device=/var/uml.socket:1
20  *
21  * Based on Virtio MMIO driver by Pawel Moll, copyright 2011-2014, ARM Ltd.
22  */
23 #include <linux/module.h>
24 #include <linux/of.h>
25 #include <linux/platform_device.h>
26 #include <linux/slab.h>
27 #include <linux/virtio.h>
28 #include <linux/virtio_config.h>
29 #include <linux/virtio_ring.h>
30 #include <linux/time-internal.h>
31 #include <linux/virtio-uml.h>
32 #include <shared/as-layout.h>
33 #include <irq_kern.h>
34 #include <init.h>
35 #include <os.h>
36 #include "vhost_user.h"
37 
/*
 * Ring size requested from vring_create_virtqueue() for every virtqueue set
 * up by this driver; it is also recorded as the queue's num_max.
 */
#define MAX_SUPPORTED_QUEUE_SIZE	256
39 
/* Map an embedded struct virtio_device back to its struct virtio_uml_device. */
#define to_virtio_uml_device(_vdev) \
	container_of(_vdev, struct virtio_uml_device, vdev)
42 
/* Per-device parameters plus the work item used to report a broken connection. */
struct virtio_uml_platform_data {
	/* virtio device id (as in virtio_ids.h) */
	u32 virtio_device_id;
	/* vhost-user socket path to connect */
	const char *socket_path;
	/* scheduled by vhost_user_check_reset() when a read returns -ECONNRESET */
	struct work_struct conn_broken_wk;
	struct platform_device *pdev;
};
49 
/* Driver state for one virtio device reached over a vhost-user socket. */
struct virtio_uml_device {
	/* embedded virtio device; see to_virtio_uml_device() */
	struct virtio_device vdev;
	struct platform_device *pdev;
	struct virtio_uml_platform_data *pdata;

	/* held by vhost_user_send() across the send and the optional ACK read */
	spinlock_t sock_lock;
	/*
	 * sock:   vhost-user socket used for requests and their responses
	 * req_fd: read end of the pipe on which slave requests arrive
	 * irq:    IRQ number obtained when the slave request fd is registered
	 */
	int sock, req_fd, irq;
	/* feature bits as returned by VHOST_USER_GET_FEATURES */
	u64 features;
	/* protocol features, masked with VHOST_USER_SUPPORTED_PROTOCOL_F */
	u64 protocol_features;
	/* value stored by vu_set_status() / cleared by vu_reset() */
	u8 status;
	/* cleared once a connection reset has been reported */
	u8 registered:1;
	/* while set, slave requests do not queue a time-travel IRQ event */
	u8 suspended:1;
	/* NOTE(review): not referenced in the visible part of the file */
	u8 no_vq_suspend:1;

	/* set on VHOST_USER_SLAVE_CONFIG_CHANGE_MSG, consumed in vu_req_interrupt() */
	u8 config_changed_irq:1;
	/* one bit per virtqueue index with a pending VHOST_USER_SLAVE_VRING_CALL */
	uint64_t vq_irq_vq_map;
	/* result of the last slave request read, with -EAGAIN mapped to 0 */
	int recv_rc;
};
68 
/* Per-virtqueue private data, stored in vq->priv. */
struct virtio_uml_vq_info {
	/*
	 * kick_fd: fd written by vu_notify(), or -1 when kicks are sent as
	 *          in-band messages instead
	 * call_fd: read end of the call pipe, or -1 when no call fd is used
	 */
	int kick_fd, call_fd;
	/* "<pdev name>.<pdev id>-<queue name>", also used as the IRQ name */
	char name[32];
	/* while true, vu_notify() returns success without kicking */
	bool suspended;
};
74 
/*
 * Defined outside this file; used by vhost_user_set_mem_table() to size the
 * memory regions advertised to the vhost-user device.
 */
extern unsigned long long physmem_size, highmem;
76 
/* dev_err() wrapper that logs against the platform device behind @vu_dev. */
#define vu_err(vu_dev, ...)	dev_err(&(vu_dev)->pdev->dev, ##__VA_ARGS__)
78 
79 /* Vhost-user protocol */
80 
/*
 * Send the whole buffer, retrying on short writes and -EINTR.
 *
 * @fds/@fds_num are only passed along until the first chunk has been
 * accepted; subsequent calls send the remaining bytes without descriptors.
 *
 * Returns 0 on success or the negative error of the last send attempt.
 */
static int full_sendmsg_fds(int fd, const void *buf, unsigned int len,
			    const int *fds, unsigned int fds_num)
{
	int sent;

	for (;;) {
		sent = os_sendmsg_fds(fd, buf, len, fds, fds_num);
		if (sent > 0) {
			buf += sent;
			len -= sent;
			/* descriptors must not be attached a second time */
			fds = NULL;
			fds_num = 0;
		} else if (sent < 0 && sent != -EINTR) {
			return sent;
		}

		if (!len)
			break;
	}

	return sent < 0 ? sent : 0;
}
100 
/*
 * Read exactly @len bytes from @fd into @buf.
 *
 * -EINTR is always retried. -EAGAIN is retried only when @abortable is
 * false; otherwise it is returned to the caller.
 *
 * Returns 0 on success, -ECONNRESET if the read reports end of file, or
 * another negative error from os_read_file().
 */
static int full_read(int fd, void *buf, int len, bool abortable)
{
	int n;

	if (len == 0)
		return 0;

	for (;;) {
		n = os_read_file(fd, buf, len);
		if (n > 0) {
			buf += n;
			len -= n;
			if (!len)
				return 0;
			continue;
		}

		/* a zero-length read means the peer went away */
		if (n == 0)
			return -ECONNRESET;
		if (n == -EINTR)
			continue;
		if (n == -EAGAIN && !abortable)
			continue;
		return n;
	}
}
122 
vhost_user_recv_header(int fd,struct vhost_user_msg * msg)123 static int vhost_user_recv_header(int fd, struct vhost_user_msg *msg)
124 {
125 	return full_read(fd, msg, sizeof(msg->header), true);
126 }
127 
vhost_user_recv(struct virtio_uml_device * vu_dev,int fd,struct vhost_user_msg * msg,size_t max_payload_size,bool wait)128 static int vhost_user_recv(struct virtio_uml_device *vu_dev,
129 			   int fd, struct vhost_user_msg *msg,
130 			   size_t max_payload_size, bool wait)
131 {
132 	size_t size;
133 	int rc;
134 
135 	/*
136 	 * In virtio time-travel mode, we're handling all the vhost-user
137 	 * FDs by polling them whenever appropriate. However, we may get
138 	 * into a situation where we're sending out an interrupt message
139 	 * to a device (e.g. a net device) and need to handle a simulation
140 	 * time message while doing so, e.g. one that tells us to update
141 	 * our idea of how long we can run without scheduling.
142 	 *
143 	 * Thus, we need to not just read() from the given fd, but need
144 	 * to also handle messages for the simulation time - this function
145 	 * does that for us while waiting for the given fd to be readable.
146 	 */
147 	if (wait)
148 		time_travel_wait_readable(fd);
149 
150 	rc = vhost_user_recv_header(fd, msg);
151 
152 	if (rc)
153 		return rc;
154 	size = msg->header.size;
155 	if (size > max_payload_size)
156 		return -EPROTO;
157 	return full_read(fd, &msg->payload, size, false);
158 }
159 
vhost_user_check_reset(struct virtio_uml_device * vu_dev,int rc)160 static void vhost_user_check_reset(struct virtio_uml_device *vu_dev,
161 				   int rc)
162 {
163 	struct virtio_uml_platform_data *pdata = vu_dev->pdata;
164 
165 	if (rc != -ECONNRESET)
166 		return;
167 
168 	if (!vu_dev->registered)
169 		return;
170 
171 	vu_dev->registered = 0;
172 
173 	schedule_work(&pdata->conn_broken_wk);
174 }
175 
vhost_user_recv_resp(struct virtio_uml_device * vu_dev,struct vhost_user_msg * msg,size_t max_payload_size)176 static int vhost_user_recv_resp(struct virtio_uml_device *vu_dev,
177 				struct vhost_user_msg *msg,
178 				size_t max_payload_size)
179 {
180 	int rc = vhost_user_recv(vu_dev, vu_dev->sock, msg,
181 				 max_payload_size, true);
182 
183 	if (rc) {
184 		vhost_user_check_reset(vu_dev, rc);
185 		return rc;
186 	}
187 
188 	if (msg->header.flags != (VHOST_USER_FLAG_REPLY | VHOST_USER_VERSION))
189 		return -EPROTO;
190 
191 	return 0;
192 }
193 
/*
 * Receive a response whose payload is a single 64-bit integer and store
 * it in @value. Returns -EPROTO if the payload size is anything else.
 */
static int vhost_user_recv_u64(struct virtio_uml_device *vu_dev,
			       u64 *value)
{
	struct vhost_user_msg reply;
	int rc;

	rc = vhost_user_recv_resp(vu_dev, &reply,
				  sizeof(reply.payload.integer));
	if (rc)
		return rc;

	if (reply.header.size != sizeof(reply.payload.integer))
		return -EPROTO;

	*value = reply.payload.integer;
	return 0;
}
208 
vhost_user_recv_req(struct virtio_uml_device * vu_dev,struct vhost_user_msg * msg,size_t max_payload_size)209 static int vhost_user_recv_req(struct virtio_uml_device *vu_dev,
210 			       struct vhost_user_msg *msg,
211 			       size_t max_payload_size)
212 {
213 	int rc = vhost_user_recv(vu_dev, vu_dev->req_fd, msg,
214 				 max_payload_size, false);
215 
216 	if (rc)
217 		return rc;
218 
219 	if ((msg->header.flags & ~VHOST_USER_FLAG_NEED_REPLY) !=
220 			VHOST_USER_VERSION)
221 		return -EPROTO;
222 
223 	return 0;
224 }
225 
vhost_user_send(struct virtio_uml_device * vu_dev,bool need_response,struct vhost_user_msg * msg,int * fds,size_t num_fds)226 static int vhost_user_send(struct virtio_uml_device *vu_dev,
227 			   bool need_response, struct vhost_user_msg *msg,
228 			   int *fds, size_t num_fds)
229 {
230 	size_t size = sizeof(msg->header) + msg->header.size;
231 	unsigned long flags;
232 	bool request_ack;
233 	int rc;
234 
235 	msg->header.flags |= VHOST_USER_VERSION;
236 
237 	/*
238 	 * The need_response flag indicates that we already need a response,
239 	 * e.g. to read the features. In these cases, don't request an ACK as
240 	 * it is meaningless. Also request an ACK only if supported.
241 	 */
242 	request_ack = !need_response;
243 	if (!(vu_dev->protocol_features &
244 			BIT_ULL(VHOST_USER_PROTOCOL_F_REPLY_ACK)))
245 		request_ack = false;
246 
247 	if (request_ack)
248 		msg->header.flags |= VHOST_USER_FLAG_NEED_REPLY;
249 
250 	spin_lock_irqsave(&vu_dev->sock_lock, flags);
251 	rc = full_sendmsg_fds(vu_dev->sock, msg, size, fds, num_fds);
252 	if (rc < 0)
253 		goto out;
254 
255 	if (request_ack) {
256 		uint64_t status;
257 
258 		rc = vhost_user_recv_u64(vu_dev, &status);
259 		if (rc)
260 			goto out;
261 
262 		if (status) {
263 			vu_err(vu_dev, "slave reports error: %llu\n", status);
264 			rc = -EIO;
265 			goto out;
266 		}
267 	}
268 
269 out:
270 	spin_unlock_irqrestore(&vu_dev->sock_lock, flags);
271 	return rc;
272 }
273 
/* Send a header-only message carrying @request, with no descriptors. */
static int vhost_user_send_no_payload(struct virtio_uml_device *vu_dev,
				      bool need_response, u32 request)
{
	struct vhost_user_msg msg = { 0 };

	msg.header.request = request;

	return vhost_user_send(vu_dev, need_response, &msg, NULL, 0);
}
283 
/*
 * Send a header-only message carrying @request and pass @fd along with
 * it. No response is expected by the caller.
 */
static int vhost_user_send_no_payload_fd(struct virtio_uml_device *vu_dev,
					 u32 request, int fd)
{
	struct vhost_user_msg msg = { 0 };

	msg.header.request = request;

	return vhost_user_send(vu_dev, false, &msg, &fd, 1);
}
293 
/* Send @request with a single 64-bit integer payload of @value. */
static int vhost_user_send_u64(struct virtio_uml_device *vu_dev,
			       u32 request, u64 value)
{
	struct vhost_user_msg msg = {
		.header.request = request,
		.header.size = sizeof(msg.payload.integer),
		.payload.integer = value,
	};
	int rc;

	rc = vhost_user_send(vu_dev, false, &msg, NULL, 0);
	return rc;
}
305 
vhost_user_set_owner(struct virtio_uml_device * vu_dev)306 static int vhost_user_set_owner(struct virtio_uml_device *vu_dev)
307 {
308 	return vhost_user_send_no_payload(vu_dev, false, VHOST_USER_SET_OWNER);
309 }
310 
/*
 * Send VHOST_USER_GET_FEATURES and read the 64-bit answer into @features.
 * Returns 0 on success or the error from the send or the receive.
 */
static int vhost_user_get_features(struct virtio_uml_device *vu_dev,
				   u64 *features)
{
	int rc;

	rc = vhost_user_send_no_payload(vu_dev, true,
					VHOST_USER_GET_FEATURES);
	if (!rc)
		rc = vhost_user_recv_u64(vu_dev, features);

	return rc;
}
321 
/* Send VHOST_USER_SET_FEATURES with @features as the payload. */
static int vhost_user_set_features(struct virtio_uml_device *vu_dev,
				   u64 features)
{
	const u32 request = VHOST_USER_SET_FEATURES;

	return vhost_user_send_u64(vu_dev, request, features);
}
327 
/*
 * Send VHOST_USER_GET_PROTOCOL_FEATURES and read the 64-bit answer into
 * @protocol_features. Returns 0 on success or the first error seen.
 */
static int vhost_user_get_protocol_features(struct virtio_uml_device *vu_dev,
					    u64 *protocol_features)
{
	int rc;

	rc = vhost_user_send_no_payload(vu_dev, true,
					VHOST_USER_GET_PROTOCOL_FEATURES);
	if (!rc)
		rc = vhost_user_recv_u64(vu_dev, protocol_features);

	return rc;
}
338 
/* Send VHOST_USER_SET_PROTOCOL_FEATURES with @protocol_features as payload. */
static int vhost_user_set_protocol_features(struct virtio_uml_device *vu_dev,
					    u64 protocol_features)
{
	const u32 request = VHOST_USER_SET_PROTOCOL_FEATURES;

	return vhost_user_send_u64(vu_dev, request, protocol_features);
}
345 
vhost_user_reply(struct virtio_uml_device * vu_dev,struct vhost_user_msg * msg,int response)346 static void vhost_user_reply(struct virtio_uml_device *vu_dev,
347 			     struct vhost_user_msg *msg, int response)
348 {
349 	struct vhost_user_msg reply = {
350 		.payload.integer = response,
351 	};
352 	size_t size = sizeof(reply.header) + sizeof(reply.payload.integer);
353 	int rc;
354 
355 	reply.header = msg->header;
356 	reply.header.flags &= ~VHOST_USER_FLAG_NEED_REPLY;
357 	reply.header.flags |= VHOST_USER_FLAG_REPLY;
358 	reply.header.size = sizeof(reply.payload.integer);
359 
360 	rc = full_sendmsg_fds(vu_dev->req_fd, &reply, size, NULL, 0);
361 
362 	if (rc)
363 		vu_err(vu_dev,
364 		       "sending reply to slave request failed: %d (size %zu)\n",
365 		       rc, size);
366 }
367 
vu_req_read_message(struct virtio_uml_device * vu_dev,struct time_travel_event * ev)368 static irqreturn_t vu_req_read_message(struct virtio_uml_device *vu_dev,
369 				       struct time_travel_event *ev)
370 {
371 	struct virtqueue *vq;
372 	int response = 1;
373 	struct {
374 		struct vhost_user_msg msg;
375 		u8 extra_payload[512];
376 	} msg;
377 	int rc;
378 	irqreturn_t irq_rc = IRQ_NONE;
379 
380 	while (1) {
381 		rc = vhost_user_recv_req(vu_dev, &msg.msg,
382 					 sizeof(msg.msg.payload) +
383 					 sizeof(msg.extra_payload));
384 		if (rc)
385 			break;
386 
387 		switch (msg.msg.header.request) {
388 		case VHOST_USER_SLAVE_CONFIG_CHANGE_MSG:
389 			vu_dev->config_changed_irq = true;
390 			response = 0;
391 			break;
392 		case VHOST_USER_SLAVE_VRING_CALL:
393 			virtio_device_for_each_vq((&vu_dev->vdev), vq) {
394 				if (vq->index == msg.msg.payload.vring_state.index) {
395 					response = 0;
396 					vu_dev->vq_irq_vq_map |= BIT_ULL(vq->index);
397 					break;
398 				}
399 			}
400 			break;
401 		case VHOST_USER_SLAVE_IOTLB_MSG:
402 			/* not supported - VIRTIO_F_ACCESS_PLATFORM */
403 		case VHOST_USER_SLAVE_VRING_HOST_NOTIFIER_MSG:
404 			/* not supported - VHOST_USER_PROTOCOL_F_HOST_NOTIFIER */
405 		default:
406 			vu_err(vu_dev, "unexpected slave request %d\n",
407 			       msg.msg.header.request);
408 		}
409 
410 		if (ev && !vu_dev->suspended)
411 			time_travel_add_irq_event(ev);
412 
413 		if (msg.msg.header.flags & VHOST_USER_FLAG_NEED_REPLY)
414 			vhost_user_reply(vu_dev, &msg.msg, response);
415 		irq_rc = IRQ_HANDLED;
416 	}
417 	/* mask EAGAIN as we try non-blocking read until socket is empty */
418 	vu_dev->recv_rc = (rc == -EAGAIN) ? 0 : rc;
419 	return irq_rc;
420 }
421 
vu_req_interrupt(int irq,void * data)422 static irqreturn_t vu_req_interrupt(int irq, void *data)
423 {
424 	struct virtio_uml_device *vu_dev = data;
425 	irqreturn_t ret = IRQ_HANDLED;
426 
427 	if (!um_irq_timetravel_handler_used())
428 		ret = vu_req_read_message(vu_dev, NULL);
429 
430 	if (vu_dev->recv_rc) {
431 		vhost_user_check_reset(vu_dev, vu_dev->recv_rc);
432 	} else if (vu_dev->vq_irq_vq_map) {
433 		struct virtqueue *vq;
434 
435 		virtio_device_for_each_vq((&vu_dev->vdev), vq) {
436 			if (vu_dev->vq_irq_vq_map & BIT_ULL(vq->index))
437 				vring_interrupt(0 /* ignored */, vq);
438 		}
439 		vu_dev->vq_irq_vq_map = 0;
440 	} else if (vu_dev->config_changed_irq) {
441 		virtio_config_changed(&vu_dev->vdev);
442 		vu_dev->config_changed_irq = false;
443 	}
444 
445 	return ret;
446 }
447 
/*
 * Time-travel handler registered together with the request IRQ: reads the
 * pending slave requests for the device in @data, passing @ev so that an
 * IRQ event can be queued. @irq and @fd are unused.
 */
static void vu_req_interrupt_comm_handler(int irq, int fd, void *data,
					  struct time_travel_event *ev)
{
	struct virtio_uml_device *vu_dev = data;

	vu_req_read_message(vu_dev, ev);
}
453 
vhost_user_init_slave_req(struct virtio_uml_device * vu_dev)454 static int vhost_user_init_slave_req(struct virtio_uml_device *vu_dev)
455 {
456 	int rc, req_fds[2];
457 
458 	/* Use a pipe for slave req fd, SIGIO is not supported for eventfd */
459 	rc = os_pipe(req_fds, true, true);
460 	if (rc < 0)
461 		return rc;
462 	vu_dev->req_fd = req_fds[0];
463 
464 	rc = um_request_irq_tt(UM_IRQ_ALLOC, vu_dev->req_fd, IRQ_READ,
465 			       vu_req_interrupt, IRQF_SHARED,
466 			       vu_dev->pdev->name, vu_dev,
467 			       vu_req_interrupt_comm_handler);
468 	if (rc < 0)
469 		goto err_close;
470 
471 	vu_dev->irq = rc;
472 
473 	rc = vhost_user_send_no_payload_fd(vu_dev, VHOST_USER_SET_SLAVE_REQ_FD,
474 					   req_fds[1]);
475 	if (rc)
476 		goto err_free_irq;
477 
478 	goto out;
479 
480 err_free_irq:
481 	um_free_irq(vu_dev->irq, vu_dev);
482 err_close:
483 	os_close_file(req_fds[0]);
484 out:
485 	/* Close unused write end of request fds */
486 	os_close_file(req_fds[1]);
487 	return rc;
488 }
489 
vhost_user_init(struct virtio_uml_device * vu_dev)490 static int vhost_user_init(struct virtio_uml_device *vu_dev)
491 {
492 	int rc = vhost_user_set_owner(vu_dev);
493 
494 	if (rc)
495 		return rc;
496 	rc = vhost_user_get_features(vu_dev, &vu_dev->features);
497 	if (rc)
498 		return rc;
499 
500 	if (vu_dev->features & BIT_ULL(VHOST_USER_F_PROTOCOL_FEATURES)) {
501 		rc = vhost_user_get_protocol_features(vu_dev,
502 				&vu_dev->protocol_features);
503 		if (rc)
504 			return rc;
505 		vu_dev->protocol_features &= VHOST_USER_SUPPORTED_PROTOCOL_F;
506 		rc = vhost_user_set_protocol_features(vu_dev,
507 				vu_dev->protocol_features);
508 		if (rc)
509 			return rc;
510 	}
511 
512 	if (vu_dev->protocol_features &
513 			BIT_ULL(VHOST_USER_PROTOCOL_F_SLAVE_REQ)) {
514 		rc = vhost_user_init_slave_req(vu_dev);
515 		if (rc)
516 			return rc;
517 	}
518 
519 	return 0;
520 }
521 
/*
 * Read @len bytes of device config space starting at @offset into @buf.
 *
 * The request always asks for the config from offset 0 up to
 * @offset + @len and the wanted slice is copied out of the reply.
 * Nothing is done if VHOST_USER_PROTOCOL_F_CONFIG was not negotiated.
 * On any failure @buf is left untouched; errors are only logged.
 */
static void vhost_user_get_config(struct virtio_uml_device *vu_dev,
				  u32 offset, void *buf, u32 len)
{
	u32 cfg_size = offset + len;
	struct vhost_user_msg *msg;
	size_t payload_size = sizeof(msg->payload.config) + cfg_size;
	size_t msg_size = sizeof(msg->header) + payload_size;
	int rc;

	if (!(vu_dev->protocol_features &
	      BIT_ULL(VHOST_USER_PROTOCOL_F_CONFIG)))
		return;

	msg = kzalloc(msg_size, GFP_KERNEL);
	if (!msg)
		return;
	msg->header.request = VHOST_USER_GET_CONFIG;
	msg->header.size = payload_size;
	msg->payload.config.offset = 0;
	msg->payload.config.size = cfg_size;

	rc = vhost_user_send(vu_dev, true, msg, NULL, 0);
	if (rc) {
		vu_err(vu_dev, "sending VHOST_USER_GET_CONFIG failed: %d\n",
		       rc);
		goto free;
	}

	/*
	 * The limit is the room available for the payload, not the whole
	 * allocation: the header has already been stored in front of it, so
	 * allowing msg_size bytes here would let an oversized reply write
	 * past the end of the buffer.
	 */
	rc = vhost_user_recv_resp(vu_dev, msg, payload_size);
	if (rc) {
		vu_err(vu_dev,
		       "receiving VHOST_USER_GET_CONFIG response failed: %d\n",
		       rc);
		goto free;
	}

	if (msg->header.size != payload_size ||
	    msg->payload.config.size != cfg_size) {
		rc = -EPROTO;
		vu_err(vu_dev,
		       "Invalid VHOST_USER_GET_CONFIG sizes (payload %d expected %zu, config %u expected %u)\n",
		       msg->header.size, payload_size,
		       msg->payload.config.size, cfg_size);
		goto free;
	}
	memcpy(buf, msg->payload.config.payload + offset, len);

free:
	kfree(msg);
}
572 
/*
 * Write @len bytes from @buf to the device config space at @offset using
 * VHOST_USER_SET_CONFIG. Nothing is done if VHOST_USER_PROTOCOL_F_CONFIG
 * was not negotiated or the message cannot be allocated; a send failure
 * is only logged.
 */
static void vhost_user_set_config(struct virtio_uml_device *vu_dev,
				  u32 offset, const void *buf, u32 len)
{
	struct vhost_user_msg *msg;
	size_t payload_size;
	size_t msg_size;
	int rc;

	if (!(vu_dev->protocol_features &
	      BIT_ULL(VHOST_USER_PROTOCOL_F_CONFIG)))
		return;

	payload_size = sizeof(msg->payload.config) + len;
	msg_size = sizeof(msg->header) + payload_size;

	msg = kzalloc(msg_size, GFP_KERNEL);
	if (!msg)
		return;

	msg->header.request = VHOST_USER_SET_CONFIG;
	msg->header.size = payload_size;
	msg->payload.config.offset = offset;
	msg->payload.config.size = len;
	memcpy(msg->payload.config.payload, buf, len);

	rc = vhost_user_send(vu_dev, false, msg, NULL, 0);
	if (rc) {
		vu_err(vu_dev, "sending VHOST_USER_SET_CONFIG failed: %d\n",
		       rc);
	}

	kfree(msg);
}
601 
/*
 * Describe the memory range [@addr, @addr + @size) in @region_out and
 * return the fd backing it in @fd_out.
 *
 * The fd and file offset come from phys_mapping() of the first byte. The
 * last byte is looked up too and must resolve to the same fd.
 *
 * Returns 0 on success, -EFAULT (with a warning) if either lookup fails
 * the check.
 */
static int vhost_user_init_mem_region(u64 addr, u64 size, int *fd_out,
				      struct vhost_user_mem_region *region_out)
{
	unsigned long long mem_offset;
	int fd;

	fd = phys_mapping(addr, &mem_offset);
	if (WARN(fd < 0, "phys_mapping of 0x%llx returned %d\n", addr, fd))
		return -EFAULT;

	*fd_out = fd;
	region_out->guest_addr = addr;
	region_out->user_addr = addr;
	region_out->size = size;
	region_out->mmap_offset = mem_offset;

	/* Ensure mapping is valid for the entire region */
	fd = phys_mapping(addr + size - 1, &mem_offset);
	if (WARN(fd != *fd_out, "phys_mapping of 0x%llx failed: %d != %d\n",
		 addr + size - 1, fd, *fd_out))
		return -EFAULT;

	return 0;
}
623 
vhost_user_set_mem_table(struct virtio_uml_device * vu_dev)624 static int vhost_user_set_mem_table(struct virtio_uml_device *vu_dev)
625 {
626 	struct vhost_user_msg msg = {
627 		.header.request = VHOST_USER_SET_MEM_TABLE,
628 		.header.size = sizeof(msg.payload.mem_regions),
629 		.payload.mem_regions.num = 1,
630 	};
631 	unsigned long reserved = uml_reserved - uml_physmem;
632 	int fds[2];
633 	int rc;
634 
635 	/*
636 	 * This is a bit tricky, see also the comment with setup_physmem().
637 	 *
638 	 * Essentially, setup_physmem() uses a file to mmap() our physmem,
639 	 * but the code and data we *already* have is omitted. To us, this
640 	 * is no difference, since they both become part of our address
641 	 * space and memory consumption. To somebody looking in from the
642 	 * outside, however, it is different because the part of our memory
643 	 * consumption that's already part of the binary (code/data) is not
644 	 * mapped from the file, so it's not visible to another mmap from
645 	 * the file descriptor.
646 	 *
647 	 * Thus, don't advertise this space to the vhost-user slave. This
648 	 * means that the slave will likely abort or similar when we give
649 	 * it an address from the hidden range, since it's not marked as
650 	 * a valid address, but at least that way we detect the issue and
651 	 * don't just have the slave read an all-zeroes buffer from the
652 	 * shared memory file, or write something there that we can never
653 	 * see (depending on the direction of the virtqueue traffic.)
654 	 *
655 	 * Since we usually don't want to use .text for virtio buffers,
656 	 * this effectively means that you cannot use
657 	 *  1) global variables, which are in the .bss and not in the shm
658 	 *     file-backed memory
659 	 *  2) the stack in some processes, depending on where they have
660 	 *     their stack (or maybe only no interrupt stack?)
661 	 *
662 	 * The stack is already not typically valid for DMA, so this isn't
663 	 * much of a restriction, but global variables might be encountered.
664 	 *
665 	 * It might be possible to fix it by copying around the data that's
666 	 * between bss_start and where we map the file now, but it's not
667 	 * something that you typically encounter with virtio drivers, so
668 	 * it didn't seem worthwhile.
669 	 */
670 	rc = vhost_user_init_mem_region(reserved, physmem_size - reserved,
671 					&fds[0],
672 					&msg.payload.mem_regions.regions[0]);
673 
674 	if (rc < 0)
675 		return rc;
676 	if (highmem) {
677 		msg.payload.mem_regions.num++;
678 		rc = vhost_user_init_mem_region(__pa(end_iomem), highmem,
679 				&fds[1], &msg.payload.mem_regions.regions[1]);
680 		if (rc < 0)
681 			return rc;
682 	}
683 
684 	return vhost_user_send(vu_dev, false, &msg, fds,
685 			       msg.payload.mem_regions.num);
686 }
687 
/*
 * Send @request with a vring_state payload made of the queue @index and
 * the value @num. No descriptors are passed.
 */
static int vhost_user_set_vring_state(struct virtio_uml_device *vu_dev,
				      u32 request, u32 index, u32 num)
{
	struct vhost_user_msg msg = {
		.header.request = request,
		.header.size = sizeof(msg.payload.vring_state),
		.payload.vring_state.index = index,
		.payload.vring_state.num = num,
	};
	int rc;

	rc = vhost_user_send(vu_dev, false, &msg, NULL, 0);
	return rc;
}
700 
/* Send VHOST_USER_SET_VRING_NUM for queue @index with the value @num. */
static int vhost_user_set_vring_num(struct virtio_uml_device *vu_dev,
				    u32 index, u32 num)
{
	const u32 request = VHOST_USER_SET_VRING_NUM;

	return vhost_user_set_vring_state(vu_dev, request, index, num);
}
707 
/* Send VHOST_USER_SET_VRING_BASE for queue @index with the value @offset. */
static int vhost_user_set_vring_base(struct virtio_uml_device *vu_dev,
				     u32 index, u32 offset)
{
	const u32 request = VHOST_USER_SET_VRING_BASE;

	return vhost_user_set_vring_state(vu_dev, request, index, offset);
}
714 
/*
 * Send VHOST_USER_SET_VRING_ADDR for queue @index, carrying the @desc,
 * @used, @avail and @log addresses in the payload.
 */
static int vhost_user_set_vring_addr(struct virtio_uml_device *vu_dev,
				     u32 index, u64 desc, u64 used, u64 avail,
				     u64 log)
{
	struct vhost_user_msg msg = {
		.header.request = VHOST_USER_SET_VRING_ADDR,
		.header.size = sizeof(msg.payload.vring_addr),
		.payload.vring_addr.index = index,
		.payload.vring_addr.desc = desc,
		.payload.vring_addr.used = used,
		.payload.vring_addr.avail = avail,
		.payload.vring_addr.log = log,
	};
	int rc;

	rc = vhost_user_send(vu_dev, false, &msg, NULL, 0);
	return rc;
}
731 
/*
 * Send @request for queue @index together with @fd.
 *
 * With a negative @fd no descriptor is passed; VHOST_USER_VRING_POLL_MASK
 * is set in the payload instead.
 *
 * Returns -EINVAL if @index has bits outside VHOST_USER_VRING_INDEX_MASK,
 * otherwise the result of the send.
 */
static int vhost_user_set_vring_fd(struct virtio_uml_device *vu_dev,
				   u32 request, int index, int fd)
{
	struct vhost_user_msg msg = {
		.header.request = request,
		.header.size = sizeof(msg.payload.integer),
		.payload.integer = index,
	};

	if (index & ~VHOST_USER_VRING_INDEX_MASK)
		return -EINVAL;

	if (fd >= 0)
		return vhost_user_send(vu_dev, false, &msg, &fd, 1);

	msg.payload.integer |= VHOST_USER_VRING_POLL_MASK;
	return vhost_user_send(vu_dev, false, &msg, NULL, 0);
}
749 
vhost_user_set_vring_call(struct virtio_uml_device * vu_dev,int index,int fd)750 static int vhost_user_set_vring_call(struct virtio_uml_device *vu_dev,
751 				     int index, int fd)
752 {
753 	return vhost_user_set_vring_fd(vu_dev, VHOST_USER_SET_VRING_CALL,
754 				       index, fd);
755 }
756 
vhost_user_set_vring_kick(struct virtio_uml_device * vu_dev,int index,int fd)757 static int vhost_user_set_vring_kick(struct virtio_uml_device *vu_dev,
758 				     int index, int fd)
759 {
760 	return vhost_user_set_vring_fd(vu_dev, VHOST_USER_SET_VRING_KICK,
761 				       index, fd);
762 }
763 
/*
 * Send VHOST_USER_SET_VRING_ENABLE for queue @index. This is a no-op
 * returning 0 unless the device offered VHOST_USER_F_PROTOCOL_FEATURES.
 */
static int vhost_user_set_vring_enable(struct virtio_uml_device *vu_dev,
				       u32 index, bool enable)
{
	if (vu_dev->features & BIT_ULL(VHOST_USER_F_PROTOCOL_FEATURES))
		return vhost_user_set_vring_state(vu_dev,
						  VHOST_USER_SET_VRING_ENABLE,
						  index, enable);

	return 0;
}
773 
774 
775 /* Virtio interface */
776 
vu_notify(struct virtqueue * vq)777 static bool vu_notify(struct virtqueue *vq)
778 {
779 	struct virtio_uml_vq_info *info = vq->priv;
780 	const uint64_t n = 1;
781 	int rc;
782 
783 	if (info->suspended)
784 		return true;
785 
786 	time_travel_propagate_time();
787 
788 	if (info->kick_fd < 0) {
789 		struct virtio_uml_device *vu_dev;
790 
791 		vu_dev = to_virtio_uml_device(vq->vdev);
792 
793 		return vhost_user_set_vring_state(vu_dev, VHOST_USER_VRING_KICK,
794 						  vq->index, 0) == 0;
795 	}
796 
797 	do {
798 		rc = os_write_file(info->kick_fd, &n, sizeof(n));
799 	} while (rc == -EINTR);
800 	return !WARN(rc != sizeof(n), "write returned %d\n", rc);
801 }
802 
vu_interrupt(int irq,void * opaque)803 static irqreturn_t vu_interrupt(int irq, void *opaque)
804 {
805 	struct virtqueue *vq = opaque;
806 	struct virtio_uml_vq_info *info = vq->priv;
807 	uint64_t n;
808 	int rc;
809 	irqreturn_t ret = IRQ_NONE;
810 
811 	do {
812 		rc = os_read_file(info->call_fd, &n, sizeof(n));
813 		if (rc == sizeof(n))
814 			ret |= vring_interrupt(irq, vq);
815 	} while (rc == sizeof(n) || rc == -EINTR);
816 	WARN(rc != -EAGAIN, "read returned %d\n", rc);
817 	return ret;
818 }
819 
820 
/* Read @len config bytes at @offset into @buf via the vhost-user device. */
static void vu_get(struct virtio_device *vdev, unsigned offset,
		   void *buf, unsigned len)
{
	vhost_user_get_config(to_virtio_uml_device(vdev), offset, buf, len);
}
828 
/* Write @len config bytes from @buf at @offset via the vhost-user device. */
static void vu_set(struct virtio_device *vdev, unsigned offset,
		   const void *buf, unsigned len)
{
	vhost_user_set_config(to_virtio_uml_device(vdev), offset, buf, len);
}
836 
vu_get_status(struct virtio_device * vdev)837 static u8 vu_get_status(struct virtio_device *vdev)
838 {
839 	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
840 
841 	return vu_dev->status;
842 }
843 
/* Store @status locally; nothing is sent to the device here. */
static void vu_set_status(struct virtio_device *vdev, u8 status)
{
	to_virtio_uml_device(vdev)->status = status;
}
850 
vu_reset(struct virtio_device * vdev)851 static void vu_reset(struct virtio_device *vdev)
852 {
853 	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
854 
855 	vu_dev->status = 0;
856 }
857 
vu_del_vq(struct virtqueue * vq)858 static void vu_del_vq(struct virtqueue *vq)
859 {
860 	struct virtio_uml_vq_info *info = vq->priv;
861 
862 	if (info->call_fd >= 0) {
863 		struct virtio_uml_device *vu_dev;
864 
865 		vu_dev = to_virtio_uml_device(vq->vdev);
866 
867 		um_free_irq(vu_dev->irq, vq);
868 		os_close_file(info->call_fd);
869 	}
870 
871 	if (info->kick_fd >= 0)
872 		os_close_file(info->kick_fd);
873 
874 	vring_del_virtqueue(vq);
875 	kfree(info);
876 }
877 
vu_del_vqs(struct virtio_device * vdev)878 static void vu_del_vqs(struct virtio_device *vdev)
879 {
880 	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
881 	struct virtqueue *vq, *n;
882 	u64 features;
883 
884 	/* Note: reverse order as a workaround to a decoding bug in snabb */
885 	list_for_each_entry_reverse(vq, &vdev->vqs, list)
886 		WARN_ON(vhost_user_set_vring_enable(vu_dev, vq->index, false));
887 
888 	/* Ensure previous messages have been processed */
889 	WARN_ON(vhost_user_get_features(vu_dev, &features));
890 
891 	list_for_each_entry_safe(vq, n, &vdev->vqs, list)
892 		vu_del_vq(vq);
893 }
894 
vu_setup_vq_call_fd(struct virtio_uml_device * vu_dev,struct virtqueue * vq)895 static int vu_setup_vq_call_fd(struct virtio_uml_device *vu_dev,
896 			       struct virtqueue *vq)
897 {
898 	struct virtio_uml_vq_info *info = vq->priv;
899 	int call_fds[2];
900 	int rc;
901 
902 	/* no call FD needed/desired in this case */
903 	if (vu_dev->protocol_features &
904 			BIT_ULL(VHOST_USER_PROTOCOL_F_INBAND_NOTIFICATIONS) &&
905 	    vu_dev->protocol_features &
906 			BIT_ULL(VHOST_USER_PROTOCOL_F_SLAVE_REQ)) {
907 		info->call_fd = -1;
908 		return 0;
909 	}
910 
911 	/* Use a pipe for call fd, since SIGIO is not supported for eventfd */
912 	rc = os_pipe(call_fds, true, true);
913 	if (rc < 0)
914 		return rc;
915 
916 	info->call_fd = call_fds[0];
917 	rc = um_request_irq(vu_dev->irq, info->call_fd, IRQ_READ,
918 			    vu_interrupt, IRQF_SHARED, info->name, vq);
919 	if (rc < 0)
920 		goto close_both;
921 
922 	rc = vhost_user_set_vring_call(vu_dev, vq->index, call_fds[1]);
923 	if (rc)
924 		goto release_irq;
925 
926 	goto out;
927 
928 release_irq:
929 	um_free_irq(vu_dev->irq, vq);
930 close_both:
931 	os_close_file(call_fds[0]);
932 out:
933 	/* Close (unused) write end of call fds */
934 	os_close_file(call_fds[1]);
935 
936 	return rc;
937 }
938 
/*
 * Create virtqueue @index for @vdev and announce it to the device.
 *
 * Allocates the per-queue info, creates the vring, sets up the kick fd
 * (unless in-band notifications are used) and the call path, then sends
 * the ring size, base and addresses to the device.
 *
 * Returns the new virtqueue, or an ERR_PTR() with everything set up so
 * far undone.
 */
static struct virtqueue *vu_setup_vq(struct virtio_device *vdev,
				     unsigned index, vq_callback_t *callback,
				     const char *name, bool ctx)
{
	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
	struct platform_device *pdev = vu_dev->pdev;
	struct virtio_uml_vq_info *info;
	struct virtqueue *vq;
	int ring_size = MAX_SUPPORTED_QUEUE_SIZE;
	int rc;

	info = kzalloc(sizeof(*info), GFP_KERNEL);
	if (!info)
		return ERR_PTR(-ENOMEM);

	snprintf(info->name, sizeof(info->name), "%s.%d-%s", pdev->name,
		 pdev->id, name);

	vq = vring_create_virtqueue(index, ring_size, PAGE_SIZE, vdev, true,
				    true, ctx, vu_notify, callback,
				    info->name);
	if (!vq) {
		rc = -ENOMEM;
		goto free_info;
	}
	vq->priv = info;
	vq->num_max = ring_size;
	/* from here on use the size the ring was actually created with */
	ring_size = virtqueue_get_vring_size(vq);

	if (vu_dev->protocol_features &
			BIT_ULL(VHOST_USER_PROTOCOL_F_INBAND_NOTIFICATIONS)) {
		info->kick_fd = -1;
	} else {
		rc = os_eventfd(0, 0);
		if (rc < 0)
			goto del_vring;
		info->kick_fd = rc;
	}

	rc = vu_setup_vq_call_fd(vu_dev, vq);
	if (rc)
		goto close_kick;

	rc = vhost_user_set_vring_num(vu_dev, index, ring_size);
	if (!rc)
		rc = vhost_user_set_vring_base(vu_dev, index, 0);
	if (!rc)
		rc = vhost_user_set_vring_addr(vu_dev, index,
					       virtqueue_get_desc_addr(vq),
					       virtqueue_get_used_addr(vq),
					       virtqueue_get_avail_addr(vq),
					       (u64) -1);
	if (rc)
		goto teardown_call;

	return vq;

teardown_call:
	if (info->call_fd >= 0) {
		um_free_irq(vu_dev->irq, vq);
		os_close_file(info->call_fd);
	}
close_kick:
	if (info->kick_fd >= 0)
		os_close_file(info->kick_fd);
del_vring:
	vring_del_virtqueue(vq);
free_info:
	kfree(info);
	return ERR_PTR(rc);
}
1015 
/*
 * virtio_config_ops.find_vqs: set up all requested virtqueues.
 *
 * Sends the memory table, creates one virtqueue per named entry (unnamed
 * entries yield NULL in @vqs and consume no queue index), then hands every
 * kick fd to the device and enables each ring.
 *
 * Returns 0 on success; on failure all queues are deleted again via
 * vu_del_vqs() and a negative error code is returned. @desc is unused.
 */
static int vu_find_vqs(struct virtio_device *vdev, unsigned nvqs,
		       struct virtqueue *vqs[], vq_callback_t *callbacks[],
		       const char * const names[], const bool *ctx,
		       struct irq_affinity *desc)
{
	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
	struct virtqueue *vq;
	int next_index = 0;
	int slot, err;

	/* not supported for now */
	if (WARN_ON(nvqs > 64))
		return -EINVAL;

	err = vhost_user_set_mem_table(vu_dev);
	if (err)
		return err;

	for (slot = 0; slot < nvqs; slot++) {
		const char *vq_name = names[slot];

		if (!vq_name) {
			vqs[slot] = NULL;
			continue;
		}

		vqs[slot] = vu_setup_vq(vdev, next_index++, callbacks[slot],
					vq_name, ctx && ctx[slot]);
		if (IS_ERR(vqs[slot])) {
			err = PTR_ERR(vqs[slot]);
			goto teardown;
		}
	}

	list_for_each_entry(vq, &vdev->vqs, list) {
		struct virtio_uml_vq_info *info = vq->priv;

		/* queues without a kick fd skip straight to the enable */
		err = info->kick_fd < 0 ? 0 :
			vhost_user_set_vring_kick(vu_dev, vq->index,
						  info->kick_fd);
		if (!err)
			err = vhost_user_set_vring_enable(vu_dev, vq->index,
							  true);
		if (err)
			goto teardown;
	}

	return 0;

teardown:
	vu_del_vqs(vdev);
	return err;
}
1068 
vu_get_features(struct virtio_device * vdev)1069 static u64 vu_get_features(struct virtio_device *vdev)
1070 {
1071 	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
1072 
1073 	return vu_dev->features;
1074 }
1075 
vu_finalize_features(struct virtio_device * vdev)1076 static int vu_finalize_features(struct virtio_device *vdev)
1077 {
1078 	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
1079 	u64 supported = vdev->features & VHOST_USER_SUPPORTED_F;
1080 
1081 	vring_transport_features(vdev);
1082 	vu_dev->features = vdev->features | supported;
1083 
1084 	return vhost_user_set_features(vu_dev, vu_dev->features);
1085 }
1086 
vu_bus_name(struct virtio_device * vdev)1087 static const char *vu_bus_name(struct virtio_device *vdev)
1088 {
1089 	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
1090 
1091 	return vu_dev->pdev->name;
1092 }
1093 
1094 static const struct virtio_config_ops virtio_uml_config_ops = {
1095 	.get = vu_get,
1096 	.set = vu_set,
1097 	.get_status = vu_get_status,
1098 	.set_status = vu_set_status,
1099 	.reset = vu_reset,
1100 	.find_vqs = vu_find_vqs,
1101 	.del_vqs = vu_del_vqs,
1102 	.get_features = vu_get_features,
1103 	.finalize_features = vu_finalize_features,
1104 	.bus_name = vu_bus_name,
1105 };
1106 
virtio_uml_release_dev(struct device * d)1107 static void virtio_uml_release_dev(struct device *d)
1108 {
1109 	struct virtio_device *vdev =
1110 			container_of(d, struct virtio_device, dev);
1111 	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
1112 
1113 	time_travel_propagate_time();
1114 
1115 	/* might not have been opened due to not negotiating the feature */
1116 	if (vu_dev->req_fd >= 0) {
1117 		um_free_irq(vu_dev->irq, vu_dev);
1118 		os_close_file(vu_dev->req_fd);
1119 	}
1120 
1121 	os_close_file(vu_dev->sock);
1122 	kfree(vu_dev);
1123 }
1124 
/*
 * Select whether the virtqueues of @vdev are left alone across
 * suspend/resume (@no_vq_suspend == true) or disabled/re-enabled.
 *
 * Warns and does nothing if @vdev is not driven by this transport.
 */
void virtio_uml_set_no_vq_suspend(struct virtio_device *vdev,
				  bool no_vq_suspend)
{
	struct virtio_uml_device *vu_dev;

	/* the container_of() below is only valid for our own devices */
	if (WARN_ON(vdev->config != &virtio_uml_config_ops))
		return;

	vu_dev = to_virtio_uml_device(vdev);
	vu_dev->no_vq_suspend = no_vq_suspend;

	dev_info(&vdev->dev, "%sabled VQ suspend\n",
		 no_vq_suspend ? "dis" : "en");
}
1137 
vu_of_conn_broken(struct work_struct * wk)1138 static void vu_of_conn_broken(struct work_struct *wk)
1139 {
1140 	struct virtio_uml_platform_data *pdata;
1141 	struct virtio_uml_device *vu_dev;
1142 
1143 	pdata = container_of(wk, struct virtio_uml_platform_data, conn_broken_wk);
1144 
1145 	vu_dev = platform_get_drvdata(pdata->pdev);
1146 
1147 	virtio_break_device(&vu_dev->vdev);
1148 
1149 	/*
1150 	 * We can't remove the device from the devicetree so the only thing we
1151 	 * can do is warn.
1152 	 */
1153 	WARN_ON(1);
1154 }
1155 
1156 /* Platform device */
1157 
1158 static struct virtio_uml_platform_data *
virtio_uml_create_pdata(struct platform_device * pdev)1159 virtio_uml_create_pdata(struct platform_device *pdev)
1160 {
1161 	struct device_node *np = pdev->dev.of_node;
1162 	struct virtio_uml_platform_data *pdata;
1163 	int ret;
1164 
1165 	if (!np)
1166 		return ERR_PTR(-EINVAL);
1167 
1168 	pdata = devm_kzalloc(&pdev->dev, sizeof(*pdata), GFP_KERNEL);
1169 	if (!pdata)
1170 		return ERR_PTR(-ENOMEM);
1171 
1172 	INIT_WORK(&pdata->conn_broken_wk, vu_of_conn_broken);
1173 	pdata->pdev = pdev;
1174 
1175 	ret = of_property_read_string(np, "socket-path", &pdata->socket_path);
1176 	if (ret)
1177 		return ERR_PTR(ret);
1178 
1179 	ret = of_property_read_u32(np, "virtio-device-id",
1180 				   &pdata->virtio_device_id);
1181 	if (ret)
1182 		return ERR_PTR(ret);
1183 
1184 	return pdata;
1185 }
1186 
virtio_uml_probe(struct platform_device * pdev)1187 static int virtio_uml_probe(struct platform_device *pdev)
1188 {
1189 	struct virtio_uml_platform_data *pdata = pdev->dev.platform_data;
1190 	struct virtio_uml_device *vu_dev;
1191 	int rc;
1192 
1193 	if (!pdata) {
1194 		pdata = virtio_uml_create_pdata(pdev);
1195 		if (IS_ERR(pdata))
1196 			return PTR_ERR(pdata);
1197 	}
1198 
1199 	vu_dev = kzalloc(sizeof(*vu_dev), GFP_KERNEL);
1200 	if (!vu_dev)
1201 		return -ENOMEM;
1202 
1203 	vu_dev->pdata = pdata;
1204 	vu_dev->vdev.dev.parent = &pdev->dev;
1205 	vu_dev->vdev.dev.release = virtio_uml_release_dev;
1206 	vu_dev->vdev.config = &virtio_uml_config_ops;
1207 	vu_dev->vdev.id.device = pdata->virtio_device_id;
1208 	vu_dev->vdev.id.vendor = VIRTIO_DEV_ANY_ID;
1209 	vu_dev->pdev = pdev;
1210 	vu_dev->req_fd = -1;
1211 
1212 	time_travel_propagate_time();
1213 
1214 	do {
1215 		rc = os_connect_socket(pdata->socket_path);
1216 	} while (rc == -EINTR);
1217 	if (rc < 0)
1218 		goto error_free;
1219 	vu_dev->sock = rc;
1220 
1221 	spin_lock_init(&vu_dev->sock_lock);
1222 
1223 	rc = vhost_user_init(vu_dev);
1224 	if (rc)
1225 		goto error_init;
1226 
1227 	platform_set_drvdata(pdev, vu_dev);
1228 
1229 	device_set_wakeup_capable(&vu_dev->vdev.dev, true);
1230 
1231 	rc = register_virtio_device(&vu_dev->vdev);
1232 	if (rc)
1233 		put_device(&vu_dev->vdev.dev);
1234 	vu_dev->registered = 1;
1235 	return rc;
1236 
1237 error_init:
1238 	os_close_file(vu_dev->sock);
1239 error_free:
1240 	kfree(vu_dev);
1241 	return rc;
1242 }
1243 
virtio_uml_remove(struct platform_device * pdev)1244 static int virtio_uml_remove(struct platform_device *pdev)
1245 {
1246 	struct virtio_uml_device *vu_dev = platform_get_drvdata(pdev);
1247 
1248 	unregister_virtio_device(&vu_dev->vdev);
1249 	return 0;
1250 }
1251 
1252 /* Command line device list */
1253 
/* Release callback of vu_cmdline_parent; intentionally does nothing. */
static void vu_cmdline_release_dev(struct device *d)
{
	/* vu_cmdline_parent is a static object, so there is nothing to free */
}
1257 
1258 static struct device vu_cmdline_parent = {
1259 	.init_name = "virtio-uml-cmdline",
1260 	.release = vu_cmdline_release_dev,
1261 };
1262 
1263 static bool vu_cmdline_parent_registered;
1264 static int vu_cmdline_id;
1265 
vu_unregister_cmdline_device(struct device * dev,void * data)1266 static int vu_unregister_cmdline_device(struct device *dev, void *data)
1267 {
1268 	struct platform_device *pdev = to_platform_device(dev);
1269 	struct virtio_uml_platform_data *pdata = pdev->dev.platform_data;
1270 
1271 	kfree(pdata->socket_path);
1272 	platform_device_unregister(pdev);
1273 	return 0;
1274 }
1275 
vu_conn_broken(struct work_struct * wk)1276 static void vu_conn_broken(struct work_struct *wk)
1277 {
1278 	struct virtio_uml_platform_data *pdata;
1279 	struct virtio_uml_device *vu_dev;
1280 
1281 	pdata = container_of(wk, struct virtio_uml_platform_data, conn_broken_wk);
1282 
1283 	vu_dev = platform_get_drvdata(pdata->pdev);
1284 
1285 	virtio_break_device(&vu_dev->vdev);
1286 
1287 	vu_unregister_cmdline_device(&pdata->pdev->dev, NULL);
1288 }
1289 
vu_cmdline_set(const char * device,const struct kernel_param * kp)1290 static int vu_cmdline_set(const char *device, const struct kernel_param *kp)
1291 {
1292 	const char *ids = strchr(device, ':');
1293 	unsigned int virtio_device_id;
1294 	int processed, consumed, err;
1295 	char *socket_path;
1296 	struct virtio_uml_platform_data pdata, *ppdata;
1297 	struct platform_device *pdev;
1298 
1299 	if (!ids || ids == device)
1300 		return -EINVAL;
1301 
1302 	processed = sscanf(ids, ":%u%n:%d%n",
1303 			   &virtio_device_id, &consumed,
1304 			   &vu_cmdline_id, &consumed);
1305 
1306 	if (processed < 1 || ids[consumed])
1307 		return -EINVAL;
1308 
1309 	if (!vu_cmdline_parent_registered) {
1310 		err = device_register(&vu_cmdline_parent);
1311 		if (err) {
1312 			pr_err("Failed to register parent device!\n");
1313 			put_device(&vu_cmdline_parent);
1314 			return err;
1315 		}
1316 		vu_cmdline_parent_registered = true;
1317 	}
1318 
1319 	socket_path = kmemdup_nul(device, ids - device, GFP_KERNEL);
1320 	if (!socket_path)
1321 		return -ENOMEM;
1322 
1323 	pdata.virtio_device_id = (u32) virtio_device_id;
1324 	pdata.socket_path = socket_path;
1325 
1326 	pr_info("Registering device virtio-uml.%d id=%d at %s\n",
1327 		vu_cmdline_id, virtio_device_id, socket_path);
1328 
1329 	pdev = platform_device_register_data(&vu_cmdline_parent, "virtio-uml",
1330 					     vu_cmdline_id++, &pdata,
1331 					     sizeof(pdata));
1332 	err = PTR_ERR_OR_ZERO(pdev);
1333 	if (err)
1334 		goto free;
1335 
1336 	ppdata = pdev->dev.platform_data;
1337 	ppdata->pdev = pdev;
1338 	INIT_WORK(&ppdata->conn_broken_wk, vu_conn_broken);
1339 
1340 	return 0;
1341 
1342 free:
1343 	kfree(socket_path);
1344 	return err;
1345 }
1346 
vu_cmdline_get_device(struct device * dev,void * data)1347 static int vu_cmdline_get_device(struct device *dev, void *data)
1348 {
1349 	struct platform_device *pdev = to_platform_device(dev);
1350 	struct virtio_uml_platform_data *pdata = pdev->dev.platform_data;
1351 	char *buffer = data;
1352 	unsigned int len = strlen(buffer);
1353 
1354 	snprintf(buffer + len, PAGE_SIZE - len, "%s:%d:%d\n",
1355 		 pdata->socket_path, pdata->virtio_device_id, pdev->id);
1356 	return 0;
1357 }
1358 
vu_cmdline_get(char * buffer,const struct kernel_param * kp)1359 static int vu_cmdline_get(char *buffer, const struct kernel_param *kp)
1360 {
1361 	buffer[0] = '\0';
1362 	if (vu_cmdline_parent_registered)
1363 		device_for_each_child(&vu_cmdline_parent, buffer,
1364 				      vu_cmdline_get_device);
1365 	return strlen(buffer) + 1;
1366 }
1367 
1368 static const struct kernel_param_ops vu_cmdline_param_ops = {
1369 	.set = vu_cmdline_set,
1370 	.get = vu_cmdline_get,
1371 };
1372 
1373 device_param_cb(device, &vu_cmdline_param_ops, NULL, S_IRUSR);
1374 __uml_help(vu_cmdline_param_ops,
1375 "virtio_uml.device=<socket>:<virtio_id>[:<platform_id>]\n"
1376 "    Configure a virtio device over a vhost-user socket.\n"
1377 "    See virtio_ids.h for a list of possible virtio device id values.\n"
1378 "    Optionally use a specific platform_device id.\n\n"
1379 );
1380 
1381 
vu_unregister_cmdline_devices(void)1382 static void vu_unregister_cmdline_devices(void)
1383 {
1384 	if (vu_cmdline_parent_registered) {
1385 		device_for_each_child(&vu_cmdline_parent, NULL,
1386 				      vu_unregister_cmdline_device);
1387 		device_unregister(&vu_cmdline_parent);
1388 		vu_cmdline_parent_registered = false;
1389 	}
1390 }
1391 
1392 /* Platform driver */
1393 
1394 static const struct of_device_id virtio_uml_match[] = {
1395 	{ .compatible = "virtio,uml", },
1396 	{ }
1397 };
1398 MODULE_DEVICE_TABLE(of, virtio_uml_match);
1399 
/*
 * Platform driver suspend.
 *
 * Unless VQ suspend was disabled, marks every virtqueue as suspended and asks
 * the device to disable its ring (the result of that request is ignored).
 * A device that may wake the system gets its IRQ armed as a wakeup source;
 * any other device is just flagged as suspended.
 *
 * Returns 0, or the result of irq_set_irq_wake() for wakeup-enabled devices.
 * @state is unused.
 */
static int virtio_uml_suspend(struct platform_device *pdev, pm_message_t state)
{
	struct virtio_uml_device *vu_dev = platform_get_drvdata(pdev);
	struct virtqueue *vq;

	if (!vu_dev->no_vq_suspend) {
		virtio_device_for_each_vq((&vu_dev->vdev), vq) {
			struct virtio_uml_vq_info *vq_info = vq->priv;

			vq_info->suspended = true;
			vhost_user_set_vring_enable(vu_dev, vq->index, false);
		}
	}

	if (device_may_wakeup(&vu_dev->vdev.dev))
		return irq_set_irq_wake(vu_dev->irq, 1);

	vu_dev->suspended = true;
	return 0;
}
1422 
virtio_uml_resume(struct platform_device * pdev)1423 static int virtio_uml_resume(struct platform_device *pdev)
1424 {
1425 	struct virtio_uml_device *vu_dev = platform_get_drvdata(pdev);
1426 
1427 	if (!vu_dev->no_vq_suspend) {
1428 		struct virtqueue *vq;
1429 
1430 		virtio_device_for_each_vq((&vu_dev->vdev), vq) {
1431 			struct virtio_uml_vq_info *info = vq->priv;
1432 
1433 			info->suspended = false;
1434 			vhost_user_set_vring_enable(vu_dev, vq->index, true);
1435 		}
1436 	}
1437 
1438 	vu_dev->suspended = false;
1439 
1440 	if (!device_may_wakeup(&vu_dev->vdev.dev))
1441 		return 0;
1442 
1443 	return irq_set_irq_wake(vu_dev->irq, 0);
1444 }
1445 
1446 static struct platform_driver virtio_uml_driver = {
1447 	.probe = virtio_uml_probe,
1448 	.remove = virtio_uml_remove,
1449 	.driver = {
1450 		.name = "virtio-uml",
1451 		.of_match_table = virtio_uml_match,
1452 	},
1453 	.suspend = virtio_uml_suspend,
1454 	.resume = virtio_uml_resume,
1455 };
1456 
virtio_uml_init(void)1457 static int __init virtio_uml_init(void)
1458 {
1459 	return platform_driver_register(&virtio_uml_driver);
1460 }
1461 
virtio_uml_exit(void)1462 static void __exit virtio_uml_exit(void)
1463 {
1464 	platform_driver_unregister(&virtio_uml_driver);
1465 	vu_unregister_cmdline_devices();
1466 }
1467 
1468 module_init(virtio_uml_init);
1469 module_exit(virtio_uml_exit);
1470 __uml_exitcall(virtio_uml_exit);
1471 
1472 MODULE_DESCRIPTION("UML driver for vhost-user virtio devices");
1473 MODULE_LICENSE("GPL");
1474