1 /* 2 * Xen 9p backend 3 * 4 * Copyright Aporeto 2017 5 * 6 * Authors: 7 * Stefano Stabellini <stefano@aporeto.com> 8 * 9 */ 10 11 #include "qemu/osdep.h" 12 13 #include "hw/hw.h" 14 #include "hw/9pfs/9p.h" 15 #include "hw/xen/xen_backend.h" 16 #include "hw/9pfs/xen-9pfs.h" 17 #include "qemu/config-file.h" 18 #include "fsdev/qemu-fsdev.h" 19 20 #define VERSIONS "1" 21 #define MAX_RINGS 8 22 #define MAX_RING_ORDER 8 23 24 typedef struct Xen9pfsRing { 25 struct Xen9pfsDev *priv; 26 27 int ref; 28 xenevtchn_handle *evtchndev; 29 int evtchn; 30 int local_port; 31 int ring_order; 32 struct xen_9pfs_data_intf *intf; 33 unsigned char *data; 34 struct xen_9pfs_data ring; 35 36 struct iovec *sg; 37 QEMUBH *bh; 38 39 /* local copies, so that we can read/write PDU data directly from 40 * the ring */ 41 RING_IDX out_cons, out_size, in_cons; 42 bool inprogress; 43 } Xen9pfsRing; 44 45 typedef struct Xen9pfsDev { 46 struct XenDevice xendev; /* must be first */ 47 V9fsState state; 48 char *path; 49 char *security_model; 50 char *tag; 51 char *id; 52 53 int num_rings; 54 Xen9pfsRing *rings; 55 } Xen9pfsDev; 56 57 static void xen_9pfs_in_sg(Xen9pfsRing *ring, 58 struct iovec *in_sg, 59 int *num, 60 uint32_t idx, 61 uint32_t size) 62 { 63 RING_IDX cons, prod, masked_prod, masked_cons; 64 65 cons = ring->intf->in_cons; 66 prod = ring->intf->in_prod; 67 xen_rmb(); 68 masked_prod = xen_9pfs_mask(prod, XEN_FLEX_RING_SIZE(ring->ring_order)); 69 masked_cons = xen_9pfs_mask(cons, XEN_FLEX_RING_SIZE(ring->ring_order)); 70 71 if (masked_prod < masked_cons) { 72 in_sg[0].iov_base = ring->ring.in + masked_prod; 73 in_sg[0].iov_len = masked_cons - masked_prod; 74 *num = 1; 75 } else { 76 in_sg[0].iov_base = ring->ring.in + masked_prod; 77 in_sg[0].iov_len = XEN_FLEX_RING_SIZE(ring->ring_order) - masked_prod; 78 in_sg[1].iov_base = ring->ring.in; 79 in_sg[1].iov_len = masked_cons; 80 *num = 2; 81 } 82 } 83 84 static void xen_9pfs_out_sg(Xen9pfsRing *ring, 85 struct iovec *out_sg, 86 int *num, 87 uint32_t idx) 88 { 89 RING_IDX cons, prod, masked_prod, masked_cons; 90 91 cons = ring->intf->out_cons; 92 prod = ring->intf->out_prod; 93 xen_rmb(); 94 masked_prod = xen_9pfs_mask(prod, XEN_FLEX_RING_SIZE(ring->ring_order)); 95 masked_cons = xen_9pfs_mask(cons, XEN_FLEX_RING_SIZE(ring->ring_order)); 96 97 if (masked_cons < masked_prod) { 98 out_sg[0].iov_base = ring->ring.out + masked_cons; 99 out_sg[0].iov_len = ring->out_size; 100 *num = 1; 101 } else { 102 if (ring->out_size > 103 (XEN_FLEX_RING_SIZE(ring->ring_order) - masked_cons)) { 104 out_sg[0].iov_base = ring->ring.out + masked_cons; 105 out_sg[0].iov_len = XEN_FLEX_RING_SIZE(ring->ring_order) - 106 masked_cons; 107 out_sg[1].iov_base = ring->ring.out; 108 out_sg[1].iov_len = ring->out_size - 109 (XEN_FLEX_RING_SIZE(ring->ring_order) - 110 masked_cons); 111 *num = 2; 112 } else { 113 out_sg[0].iov_base = ring->ring.out + masked_cons; 114 out_sg[0].iov_len = ring->out_size; 115 *num = 1; 116 } 117 } 118 } 119 120 static ssize_t xen_9pfs_pdu_vmarshal(V9fsPDU *pdu, 121 size_t offset, 122 const char *fmt, 123 va_list ap) 124 { 125 Xen9pfsDev *xen_9pfs = container_of(pdu->s, Xen9pfsDev, state); 126 struct iovec in_sg[2]; 127 int num; 128 129 xen_9pfs_in_sg(&xen_9pfs->rings[pdu->tag % xen_9pfs->num_rings], 130 in_sg, &num, pdu->idx, ROUND_UP(offset + 128, 512)); 131 return v9fs_iov_vmarshal(in_sg, num, offset, 0, fmt, ap); 132 } 133 134 static ssize_t xen_9pfs_pdu_vunmarshal(V9fsPDU *pdu, 135 size_t offset, 136 const char *fmt, 137 va_list ap) 138 { 139 Xen9pfsDev *xen_9pfs = container_of(pdu->s, Xen9pfsDev, state); 140 struct iovec out_sg[2]; 141 int num; 142 143 xen_9pfs_out_sg(&xen_9pfs->rings[pdu->tag % xen_9pfs->num_rings], 144 out_sg, &num, pdu->idx); 145 return v9fs_iov_vunmarshal(out_sg, num, offset, 0, fmt, ap); 146 } 147 148 static void xen_9pfs_init_out_iov_from_pdu(V9fsPDU *pdu, 149 struct iovec **piov, 150 unsigned int *pniov) 151 { 152 Xen9pfsDev *xen_9pfs = container_of(pdu->s, Xen9pfsDev, state); 153 Xen9pfsRing *ring = &xen_9pfs->rings[pdu->tag % xen_9pfs->num_rings]; 154 int num; 155 156 g_free(ring->sg); 157 158 ring->sg = g_malloc0(sizeof(*ring->sg) * 2); 159 xen_9pfs_out_sg(ring, ring->sg, &num, pdu->idx); 160 *piov = ring->sg; 161 *pniov = num; 162 } 163 164 static void xen_9pfs_init_in_iov_from_pdu(V9fsPDU *pdu, 165 struct iovec **piov, 166 unsigned int *pniov, 167 size_t size) 168 { 169 Xen9pfsDev *xen_9pfs = container_of(pdu->s, Xen9pfsDev, state); 170 Xen9pfsRing *ring = &xen_9pfs->rings[pdu->tag % xen_9pfs->num_rings]; 171 int num; 172 173 g_free(ring->sg); 174 175 ring->sg = g_malloc0(sizeof(*ring->sg) * 2); 176 xen_9pfs_in_sg(ring, ring->sg, &num, pdu->idx, size); 177 *piov = ring->sg; 178 *pniov = num; 179 } 180 181 static void xen_9pfs_push_and_notify(V9fsPDU *pdu) 182 { 183 RING_IDX prod; 184 Xen9pfsDev *priv = container_of(pdu->s, Xen9pfsDev, state); 185 Xen9pfsRing *ring = &priv->rings[pdu->tag % priv->num_rings]; 186 187 g_free(ring->sg); 188 ring->sg = NULL; 189 190 ring->intf->out_cons = ring->out_cons; 191 xen_wmb(); 192 193 prod = ring->intf->in_prod; 194 xen_rmb(); 195 ring->intf->in_prod = prod + pdu->size; 196 xen_wmb(); 197 198 ring->inprogress = false; 199 xenevtchn_notify(ring->evtchndev, ring->local_port); 200 201 qemu_bh_schedule(ring->bh); 202 } 203 204 static const struct V9fsTransport xen_9p_transport = { 205 .pdu_vmarshal = xen_9pfs_pdu_vmarshal, 206 .pdu_vunmarshal = xen_9pfs_pdu_vunmarshal, 207 .init_in_iov_from_pdu = xen_9pfs_init_in_iov_from_pdu, 208 .init_out_iov_from_pdu = xen_9pfs_init_out_iov_from_pdu, 209 .push_and_notify = xen_9pfs_push_and_notify, 210 }; 211 212 static int xen_9pfs_init(struct XenDevice *xendev) 213 { 214 return 0; 215 } 216 217 static int xen_9pfs_receive(Xen9pfsRing *ring) 218 { 219 P9MsgHeader h; 220 RING_IDX cons, prod, masked_prod, masked_cons; 221 V9fsPDU *pdu; 222 223 if (ring->inprogress) { 224 return 0; 225 } 226 227 cons = ring->intf->out_cons; 228 prod = ring->intf->out_prod; 229 xen_rmb(); 230 231 if (xen_9pfs_queued(prod, cons, XEN_FLEX_RING_SIZE(ring->ring_order)) < 232 sizeof(h)) { 233 return 0; 234 } 235 ring->inprogress = true; 236 237 masked_prod = xen_9pfs_mask(prod, XEN_FLEX_RING_SIZE(ring->ring_order)); 238 masked_cons = xen_9pfs_mask(cons, XEN_FLEX_RING_SIZE(ring->ring_order)); 239 240 xen_9pfs_read_packet((uint8_t *) &h, ring->ring.out, sizeof(h), 241 masked_prod, &masked_cons, 242 XEN_FLEX_RING_SIZE(ring->ring_order)); 243 244 /* cannot fail, because we only handle one request per ring at a time */ 245 pdu = pdu_alloc(&ring->priv->state); 246 pdu->size = le32_to_cpu(h.size_le); 247 pdu->id = h.id; 248 pdu->tag = le32_to_cpu(h.tag_le); 249 ring->out_size = le32_to_cpu(h.size_le); 250 ring->out_cons = cons + le32_to_cpu(h.size_le); 251 252 qemu_co_queue_init(&pdu->complete); 253 pdu_submit(pdu); 254 255 return 0; 256 } 257 258 static void xen_9pfs_bh(void *opaque) 259 { 260 Xen9pfsRing *ring = opaque; 261 xen_9pfs_receive(ring); 262 } 263 264 static void xen_9pfs_evtchn_event(void *opaque) 265 { 266 Xen9pfsRing *ring = opaque; 267 evtchn_port_t port; 268 269 port = xenevtchn_pending(ring->evtchndev); 270 xenevtchn_unmask(ring->evtchndev, port); 271 272 qemu_bh_schedule(ring->bh); 273 } 274 275 static int xen_9pfs_free(struct XenDevice *xendev) 276 { 277 int i; 278 Xen9pfsDev *xen_9pdev = container_of(xendev, Xen9pfsDev, xendev); 279 280 g_free(xen_9pdev->id); 281 g_free(xen_9pdev->tag); 282 g_free(xen_9pdev->path); 283 g_free(xen_9pdev->security_model); 284 285 for (i = 0; i < xen_9pdev->num_rings; i++) { 286 if (xen_9pdev->rings[i].data != NULL) { 287 xengnttab_unmap(xen_9pdev->xendev.gnttabdev, 288 xen_9pdev->rings[i].data, 289 (1 << xen_9pdev->rings[i].ring_order)); 290 } 291 if (xen_9pdev->rings[i].intf != NULL) { 292 xengnttab_unmap(xen_9pdev->xendev.gnttabdev, 293 xen_9pdev->rings[i].intf, 294 1); 295 } 296 if (xen_9pdev->rings[i].evtchndev > 0) { 297 qemu_set_fd_handler(xenevtchn_fd(xen_9pdev->rings[i].evtchndev), 298 NULL, NULL, NULL); 299 xenevtchn_unbind(xen_9pdev->rings[i].evtchndev, 300 xen_9pdev->rings[i].local_port); 301 } 302 if (xen_9pdev->rings[i].bh != NULL) { 303 qemu_bh_delete(xen_9pdev->rings[i].bh); 304 } 305 } 306 g_free(xen_9pdev->rings); 307 return 0; 308 } 309 310 static int xen_9pfs_connect(struct XenDevice *xendev) 311 { 312 int i; 313 Xen9pfsDev *xen_9pdev = container_of(xendev, Xen9pfsDev, xendev); 314 V9fsState *s = &xen_9pdev->state; 315 QemuOpts *fsdev; 316 317 if (xenstore_read_fe_int(&xen_9pdev->xendev, "num-rings", 318 &xen_9pdev->num_rings) == -1 || 319 xen_9pdev->num_rings > MAX_RINGS || xen_9pdev->num_rings < 1) { 320 return -1; 321 } 322 323 xen_9pdev->rings = g_malloc0(xen_9pdev->num_rings * sizeof(Xen9pfsRing)); 324 for (i = 0; i < xen_9pdev->num_rings; i++) { 325 char *str; 326 int ring_order; 327 328 xen_9pdev->rings[i].priv = xen_9pdev; 329 xen_9pdev->rings[i].evtchn = -1; 330 xen_9pdev->rings[i].local_port = -1; 331 332 str = g_strdup_printf("ring-ref%u", i); 333 if (xenstore_read_fe_int(&xen_9pdev->xendev, str, 334 &xen_9pdev->rings[i].ref) == -1) { 335 goto out; 336 } 337 g_free(str); 338 str = g_strdup_printf("event-channel-%u", i); 339 if (xenstore_read_fe_int(&xen_9pdev->xendev, str, 340 &xen_9pdev->rings[i].evtchn) == -1) { 341 goto out; 342 } 343 g_free(str); 344 345 xen_9pdev->rings[i].intf = xengnttab_map_grant_ref( 346 xen_9pdev->xendev.gnttabdev, 347 xen_9pdev->xendev.dom, 348 xen_9pdev->rings[i].ref, 349 PROT_READ | PROT_WRITE); 350 if (!xen_9pdev->rings[i].intf) { 351 goto out; 352 } 353 ring_order = xen_9pdev->rings[i].intf->ring_order; 354 if (ring_order > MAX_RING_ORDER) { 355 goto out; 356 } 357 xen_9pdev->rings[i].ring_order = ring_order; 358 xen_9pdev->rings[i].data = xengnttab_map_domain_grant_refs( 359 xen_9pdev->xendev.gnttabdev, 360 (1 << ring_order), 361 xen_9pdev->xendev.dom, 362 xen_9pdev->rings[i].intf->ref, 363 PROT_READ | PROT_WRITE); 364 if (!xen_9pdev->rings[i].data) { 365 goto out; 366 } 367 xen_9pdev->rings[i].ring.in = xen_9pdev->rings[i].data; 368 xen_9pdev->rings[i].ring.out = xen_9pdev->rings[i].data + 369 XEN_FLEX_RING_SIZE(ring_order); 370 371 xen_9pdev->rings[i].bh = qemu_bh_new(xen_9pfs_bh, &xen_9pdev->rings[i]); 372 xen_9pdev->rings[i].out_cons = 0; 373 xen_9pdev->rings[i].out_size = 0; 374 xen_9pdev->rings[i].inprogress = false; 375 376 377 xen_9pdev->rings[i].evtchndev = xenevtchn_open(NULL, 0); 378 if (xen_9pdev->rings[i].evtchndev == NULL) { 379 goto out; 380 } 381 fcntl(xenevtchn_fd(xen_9pdev->rings[i].evtchndev), F_SETFD, FD_CLOEXEC); 382 xen_9pdev->rings[i].local_port = xenevtchn_bind_interdomain 383 (xen_9pdev->rings[i].evtchndev, 384 xendev->dom, 385 xen_9pdev->rings[i].evtchn); 386 if (xen_9pdev->rings[i].local_port == -1) { 387 xen_pv_printf(xendev, 0, 388 "xenevtchn_bind_interdomain failed port=%d\n", 389 xen_9pdev->rings[i].evtchn); 390 goto out; 391 } 392 xen_pv_printf(xendev, 2, "bind evtchn port %d\n", xendev->local_port); 393 qemu_set_fd_handler(xenevtchn_fd(xen_9pdev->rings[i].evtchndev), 394 xen_9pfs_evtchn_event, NULL, &xen_9pdev->rings[i]); 395 } 396 397 xen_9pdev->security_model = xenstore_read_be_str(xendev, "security_model"); 398 xen_9pdev->path = xenstore_read_be_str(xendev, "path"); 399 xen_9pdev->id = s->fsconf.fsdev_id = 400 g_strdup_printf("xen9p%d", xendev->dev); 401 xen_9pdev->tag = s->fsconf.tag = xenstore_read_fe_str(xendev, "tag"); 402 v9fs_register_transport(s, &xen_9p_transport); 403 fsdev = qemu_opts_create(qemu_find_opts("fsdev"), 404 s->fsconf.tag, 405 1, NULL); 406 qemu_opt_set(fsdev, "fsdriver", "local", NULL); 407 qemu_opt_set(fsdev, "path", xen_9pdev->path, NULL); 408 qemu_opt_set(fsdev, "security_model", xen_9pdev->security_model, NULL); 409 qemu_opts_set_id(fsdev, s->fsconf.fsdev_id); 410 qemu_fsdev_add(fsdev); 411 v9fs_device_realize_common(s, NULL); 412 413 return 0; 414 415 out: 416 xen_9pfs_free(xendev); 417 return -1; 418 } 419 420 static void xen_9pfs_alloc(struct XenDevice *xendev) 421 { 422 xenstore_write_be_str(xendev, "versions", VERSIONS); 423 xenstore_write_be_int(xendev, "max-rings", MAX_RINGS); 424 xenstore_write_be_int(xendev, "max-ring-page-order", MAX_RING_ORDER); 425 } 426 427 static void xen_9pfs_disconnect(struct XenDevice *xendev) 428 { 429 /* Dynamic hotplug of PV filesystems at runtime is not supported. */ 430 } 431 432 struct XenDevOps xen_9pfs_ops = { 433 .size = sizeof(Xen9pfsDev), 434 .flags = DEVOPS_FLAG_NEED_GNTDEV, 435 .alloc = xen_9pfs_alloc, 436 .init = xen_9pfs_init, 437 .initialise = xen_9pfs_connect, 438 .disconnect = xen_9pfs_disconnect, 439 .free = xen_9pfs_free, 440 }; 441