xref: /openbmc/qemu/net/dgram.c (revision d30b5bc95a9406b4125a35defba3a953358215cb)
1 /*
2  * QEMU System Emulator
3  *
4  * Copyright (c) 2003-2008 Fabrice Bellard
5  * Copyright (c) 2022 Red Hat, Inc.
6  *
7  * Permission is hereby granted, free of charge, to any person obtaining a copy
8  * of this software and associated documentation files (the "Software"), to deal
9  * in the Software without restriction, including without limitation the rights
10  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11  * copies of the Software, and to permit persons to whom the Software is
12  * furnished to do so, subject to the following conditions:
13  *
14  * The above copyright notice and this permission notice shall be included in
15  * all copies or substantial portions of the Software.
16  *
17  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23  * THE SOFTWARE.
24  */
25 
26 #include "qemu/osdep.h"
27 
28 #include "net/net.h"
29 #include "clients.h"
30 #include "monitor/monitor.h"
31 #include "qapi/error.h"
32 #include "qemu/error-report.h"
33 #include "qemu/option.h"
34 #include "qemu/sockets.h"
35 #include "qemu/iov.h"
36 #include "qemu/main-loop.h"
37 #include "qemu/cutils.h"
38 
39 typedef struct NetDgramState {
40     NetClientState nc;
41     int fd;
42     SocketReadState rs;
43     bool read_poll;               /* waiting to receive data? */
44     bool write_poll;              /* waiting to transmit data? */
45     /* contains destination iff connectionless */
46     struct sockaddr *dest_addr;
47     socklen_t dest_len;
48 } NetDgramState;
49 
50 static void net_dgram_send(void *opaque);
51 static void net_dgram_writable(void *opaque);
52 
53 static void net_dgram_update_fd_handler(NetDgramState *s)
54 {
55     qemu_set_fd_handler(s->fd,
56                         s->read_poll ? net_dgram_send : NULL,
57                         s->write_poll ? net_dgram_writable : NULL,
58                         s);
59 }
60 
61 static void net_dgram_read_poll(NetDgramState *s, bool enable)
62 {
63     s->read_poll = enable;
64     net_dgram_update_fd_handler(s);
65 }
66 
67 static void net_dgram_write_poll(NetDgramState *s, bool enable)
68 {
69     s->write_poll = enable;
70     net_dgram_update_fd_handler(s);
71 }
72 
73 static void net_dgram_writable(void *opaque)
74 {
75     NetDgramState *s = opaque;
76 
77     net_dgram_write_poll(s, false);
78 
79     qemu_flush_queued_packets(&s->nc);
80 }
81 
82 static ssize_t net_dgram_receive(NetClientState *nc,
83                                  const uint8_t *buf, size_t size)
84 {
85     NetDgramState *s = DO_UPCAST(NetDgramState, nc, nc);
86     ssize_t ret;
87 
88     do {
89         if (s->dest_addr) {
90             ret = sendto(s->fd, buf, size, 0, s->dest_addr, s->dest_len);
91         } else {
92             ret = send(s->fd, buf, size, 0);
93         }
94     } while (ret == -1 && errno == EINTR);
95 
96     if (ret == -1 && errno == EAGAIN) {
97         net_dgram_write_poll(s, true);
98         return 0;
99     }
100     return ret;
101 }
102 
103 static void net_dgram_send_completed(NetClientState *nc, ssize_t len)
104 {
105     NetDgramState *s = DO_UPCAST(NetDgramState, nc, nc);
106 
107     if (!s->read_poll) {
108         net_dgram_read_poll(s, true);
109     }
110 }
111 
112 static void net_dgram_rs_finalize(SocketReadState *rs)
113 {
114     NetDgramState *s = container_of(rs, NetDgramState, rs);
115 
116     if (qemu_send_packet_async(&s->nc, rs->buf,
117                                rs->packet_len,
118                                net_dgram_send_completed) == 0) {
119         net_dgram_read_poll(s, false);
120     }
121 }
122 
123 static void net_dgram_send(void *opaque)
124 {
125     NetDgramState *s = opaque;
126     int size;
127 
128     size = recv(s->fd, s->rs.buf, sizeof(s->rs.buf), 0);
129     if (size < 0) {
130         return;
131     }
132     if (size == 0) {
133         /* end of connection */
134         net_dgram_read_poll(s, false);
135         net_dgram_write_poll(s, false);
136         return;
137     }
138     if (qemu_send_packet_async(&s->nc, s->rs.buf, size,
139                                net_dgram_send_completed) == 0) {
140         net_dgram_read_poll(s, false);
141     }
142 }
143 
144 static int net_dgram_mcast_create(struct sockaddr_in *mcastaddr,
145                                   struct in_addr *localaddr,
146                                   Error **errp)
147 {
148     struct ip_mreq imr;
149     int fd;
150     int val, ret;
151 #ifdef __OpenBSD__
152     unsigned char loop;
153 #else
154     int loop;
155 #endif
156 
157     if (!IN_MULTICAST(ntohl(mcastaddr->sin_addr.s_addr))) {
158         error_setg(errp, "specified mcastaddr %s (0x%08x) "
159                    "does not contain a multicast address",
160                    inet_ntoa(mcastaddr->sin_addr),
161                    (int)ntohl(mcastaddr->sin_addr.s_addr));
162         return -1;
163     }
164 
165     fd = qemu_socket(PF_INET, SOCK_DGRAM, 0);
166     if (fd < 0) {
167         error_setg_errno(errp, errno, "can't create datagram socket");
168         return -1;
169     }
170 
171     /*
172      * Allow multiple sockets to bind the same multicast ip and port by setting
173      * SO_REUSEADDR. This is the only situation where SO_REUSEADDR should be set
174      * on windows. Use socket_set_fast_reuse otherwise as it sets SO_REUSEADDR
175      * only on posix systems.
176      */
177     val = 1;
178     ret = setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &val, sizeof(val));
179     if (ret < 0) {
180         error_setg_errno(errp, errno, "can't set socket option SO_REUSEADDR");
181         goto fail;
182     }
183 
184     ret = bind(fd, (struct sockaddr *)mcastaddr, sizeof(*mcastaddr));
185     if (ret < 0) {
186         error_setg_errno(errp, errno, "can't bind ip=%s to socket",
187                          inet_ntoa(mcastaddr->sin_addr));
188         goto fail;
189     }
190 
191     /* Add host to multicast group */
192     imr.imr_multiaddr = mcastaddr->sin_addr;
193     if (localaddr) {
194         imr.imr_interface = *localaddr;
195     } else {
196         imr.imr_interface.s_addr = htonl(INADDR_ANY);
197     }
198 
199     ret = setsockopt(fd, IPPROTO_IP, IP_ADD_MEMBERSHIP,
200                      &imr, sizeof(struct ip_mreq));
201     if (ret < 0) {
202         error_setg_errno(errp, errno,
203                          "can't add socket to multicast group %s",
204                          inet_ntoa(imr.imr_multiaddr));
205         goto fail;
206     }
207 
208     /* Force mcast msgs to loopback (eg. several QEMUs in same host */
209     loop = 1;
210     ret = setsockopt(fd, IPPROTO_IP, IP_MULTICAST_LOOP,
211                      &loop, sizeof(loop));
212     if (ret < 0) {
213         error_setg_errno(errp, errno,
214                          "can't force multicast message to loopback");
215         goto fail;
216     }
217 
218     /* If a bind address is given, only send packets from that address */
219     if (localaddr != NULL) {
220         ret = setsockopt(fd, IPPROTO_IP, IP_MULTICAST_IF,
221                          localaddr, sizeof(*localaddr));
222         if (ret < 0) {
223             error_setg_errno(errp, errno,
224                              "can't set the default network send interface");
225             goto fail;
226         }
227     }
228 
229     qemu_socket_set_nonblock(fd);
230     return fd;
231 fail:
232     if (fd >= 0) {
233         close(fd);
234     }
235     return -1;
236 }
237 
238 static void net_dgram_cleanup(NetClientState *nc)
239 {
240     NetDgramState *s = DO_UPCAST(NetDgramState, nc, nc);
241     if (s->fd != -1) {
242         net_dgram_read_poll(s, false);
243         net_dgram_write_poll(s, false);
244         close(s->fd);
245         s->fd = -1;
246     }
247     g_free(s->dest_addr);
248     s->dest_addr = NULL;
249     s->dest_len = 0;
250 }
251 
252 static NetClientInfo net_dgram_socket_info = {
253     .type = NET_CLIENT_DRIVER_DGRAM,
254     .size = sizeof(NetDgramState),
255     .receive = net_dgram_receive,
256     .cleanup = net_dgram_cleanup,
257 };
258 
259 static NetDgramState *net_dgram_fd_init(NetClientState *peer,
260                                         const char *model,
261                                         const char *name,
262                                         int fd,
263                                         Error **errp)
264 {
265     NetClientState *nc;
266     NetDgramState *s;
267 
268     nc = qemu_new_net_client(&net_dgram_socket_info, peer, model, name);
269 
270     s = DO_UPCAST(NetDgramState, nc, nc);
271 
272     s->fd = fd;
273     net_socket_rs_init(&s->rs, net_dgram_rs_finalize, false);
274     net_dgram_read_poll(s, true);
275 
276     return s;
277 }
278 
279 static int net_dgram_mcast_init(NetClientState *peer,
280                                 const char *model,
281                                 const char *name,
282                                 SocketAddress *remote,
283                                 SocketAddress *local,
284                                 Error **errp)
285 {
286     NetDgramState *s;
287     int fd, ret;
288     struct sockaddr_in *saddr;
289 
290     if (remote->type != SOCKET_ADDRESS_TYPE_INET) {
291         error_setg(errp, "multicast only support inet type");
292         return -1;
293     }
294 
295     saddr = g_new(struct sockaddr_in, 1);
296     if (convert_host_port(saddr, remote->u.inet.host, remote->u.inet.port,
297                           errp) < 0) {
298         g_free(saddr);
299         return -1;
300     }
301 
302     if (!local) {
303         fd = net_dgram_mcast_create(saddr, NULL, errp);
304         if (fd < 0) {
305             g_free(saddr);
306             return -1;
307         }
308     } else {
309         switch (local->type) {
310         case SOCKET_ADDRESS_TYPE_INET: {
311             struct in_addr localaddr;
312 
313             if (inet_aton(local->u.inet.host, &localaddr) == 0) {
314                 g_free(saddr);
315                 error_setg(errp, "localaddr '%s' is not a valid IPv4 address",
316                            local->u.inet.host);
317                 return -1;
318             }
319 
320             fd = net_dgram_mcast_create(saddr, &localaddr, errp);
321             if (fd < 0) {
322                 g_free(saddr);
323                 return -1;
324             }
325             break;
326         }
327         case SOCKET_ADDRESS_TYPE_FD: {
328             int newfd;
329 
330             fd = monitor_fd_param(monitor_cur(), local->u.fd.str, errp);
331             if (fd == -1) {
332                 g_free(saddr);
333                 return -1;
334             }
335             ret = qemu_socket_try_set_nonblock(fd);
336             if (ret < 0) {
337                 g_free(saddr);
338                 error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
339                                  name, fd);
340                 return -1;
341             }
342 
343             /*
344              * fd passed: multicast: "learn" dest_addr address from bound
345              * address and save it. Because this may be "shared" socket from a
346              * "master" process, datagrams would be recv() by ONLY ONE process:
347              * we must "clone" this dgram socket --jjo
348              */
349 
350             saddr = g_new(struct sockaddr_in, 1);
351 
352             if (convert_host_port(saddr, local->u.inet.host, local->u.inet.port,
353                                   errp) < 0) {
354                 g_free(saddr);
355                 close(fd);
356                 return -1;
357             }
358 
359             /* must be bound */
360             if (saddr->sin_addr.s_addr == 0) {
361                 error_setg(errp, "can't setup multicast destination address");
362                 g_free(saddr);
363                 close(fd);
364                 return -1;
365             }
366             /* clone dgram socket */
367             newfd = net_dgram_mcast_create(saddr, NULL, errp);
368             if (newfd < 0) {
369                 g_free(saddr);
370                 close(fd);
371                 return -1;
372             }
373             /* clone newfd to fd, close newfd */
374             dup2(newfd, fd);
375             close(newfd);
376             break;
377         }
378         default:
379             g_free(saddr);
380             error_setg(errp, "only support inet or fd type for local");
381             return -1;
382         }
383     }
384 
385     s = net_dgram_fd_init(peer, model, name, fd, errp);
386     if (!s) {
387         g_free(saddr);
388         return -1;
389     }
390 
391     g_assert(s->dest_addr == NULL);
392     s->dest_addr = (struct sockaddr *)saddr;
393     s->dest_len = sizeof(*saddr);
394 
395     if (!local) {
396         qemu_set_info_str(&s->nc, "mcast=%s:%d",
397                           inet_ntoa(saddr->sin_addr),
398                           ntohs(saddr->sin_port));
399     } else {
400         switch (local->type) {
401         case SOCKET_ADDRESS_TYPE_INET:
402             qemu_set_info_str(&s->nc, "mcast=%s:%d",
403                               inet_ntoa(saddr->sin_addr),
404                               ntohs(saddr->sin_port));
405             break;
406         case SOCKET_ADDRESS_TYPE_FD:
407             qemu_set_info_str(&s->nc, "fd=%d (cloned mcast=%s:%d)",
408                               fd, inet_ntoa(saddr->sin_addr),
409                               ntohs(saddr->sin_port));
410             break;
411         default:
412             g_assert_not_reached();
413         }
414     }
415 
416     return 0;
417 
418 }
419 
420 
421 int net_init_dgram(const Netdev *netdev, const char *name,
422                    NetClientState *peer, Error **errp)
423 {
424     NetDgramState *s;
425     int fd, ret;
426     SocketAddress *remote, *local;
427     struct sockaddr *dest_addr;
428     struct sockaddr_in laddr_in, raddr_in;
429     struct sockaddr_un laddr_un, raddr_un;
430     socklen_t dest_len;
431 
432     assert(netdev->type == NET_CLIENT_DRIVER_DGRAM);
433 
434     remote = netdev->u.dgram.remote;
435     local = netdev->u.dgram.local;
436 
437     /* detect multicast address */
438     if (remote && remote->type == SOCKET_ADDRESS_TYPE_INET) {
439         struct sockaddr_in mcastaddr;
440 
441         if (convert_host_port(&mcastaddr, remote->u.inet.host,
442                               remote->u.inet.port, errp) < 0) {
443             return -1;
444         }
445 
446         if (IN_MULTICAST(ntohl(mcastaddr.sin_addr.s_addr))) {
447             return net_dgram_mcast_init(peer, "dram", name, remote, local,
448                                            errp);
449         }
450     }
451 
452     /* unicast address */
453     if (!local) {
454         error_setg(errp, "dgram requires local= parameter");
455         return -1;
456     }
457 
458     if (remote) {
459         if (local->type == SOCKET_ADDRESS_TYPE_FD) {
460             error_setg(errp, "don't set remote with local.fd");
461             return -1;
462         }
463         if (remote->type != local->type) {
464             error_setg(errp, "remote and local types must be the same");
465             return -1;
466         }
467     } else {
468         if (local->type != SOCKET_ADDRESS_TYPE_FD) {
469             error_setg(errp,
470                        "type=inet or type=unix requires remote parameter");
471             return -1;
472         }
473     }
474 
475     switch (local->type) {
476     case SOCKET_ADDRESS_TYPE_INET:
477         if (convert_host_port(&laddr_in, local->u.inet.host, local->u.inet.port,
478                               errp) < 0) {
479             return -1;
480         }
481 
482         if (convert_host_port(&raddr_in, remote->u.inet.host,
483                               remote->u.inet.port, errp) < 0) {
484             return -1;
485         }
486 
487         fd = qemu_socket(PF_INET, SOCK_DGRAM, 0);
488         if (fd < 0) {
489             error_setg_errno(errp, errno, "can't create datagram socket");
490             return -1;
491         }
492 
493         ret = socket_set_fast_reuse(fd);
494         if (ret < 0) {
495             error_setg_errno(errp, errno,
496                              "can't set socket option SO_REUSEADDR");
497             close(fd);
498             return -1;
499         }
500         ret = bind(fd, (struct sockaddr *)&laddr_in, sizeof(laddr_in));
501         if (ret < 0) {
502             error_setg_errno(errp, errno, "can't bind ip=%s to socket",
503                              inet_ntoa(laddr_in.sin_addr));
504             close(fd);
505             return -1;
506         }
507         qemu_socket_set_nonblock(fd);
508 
509         dest_len = sizeof(raddr_in);
510         dest_addr = g_malloc(dest_len);
511         memcpy(dest_addr, &raddr_in, dest_len);
512         break;
513     case SOCKET_ADDRESS_TYPE_UNIX:
514         ret = unlink(local->u.q_unix.path);
515         if (ret < 0 && errno != ENOENT) {
516             error_setg_errno(errp, errno, "failed to unlink socket %s",
517                              local->u.q_unix.path);
518             return -1;
519         }
520 
521         laddr_un.sun_family = PF_UNIX;
522         ret = snprintf(laddr_un.sun_path, sizeof(laddr_un.sun_path), "%s",
523                        local->u.q_unix.path);
524         if (ret < 0 || ret >= sizeof(laddr_un.sun_path)) {
525             error_setg(errp, "UNIX socket path '%s' is too long",
526                        local->u.q_unix.path);
527             error_append_hint(errp, "Path must be less than %zu bytes\n",
528                               sizeof(laddr_un.sun_path));
529         }
530 
531         raddr_un.sun_family = PF_UNIX;
532         ret = snprintf(raddr_un.sun_path, sizeof(raddr_un.sun_path), "%s",
533                        remote->u.q_unix.path);
534         if (ret < 0 || ret >= sizeof(raddr_un.sun_path)) {
535             error_setg(errp, "UNIX socket path '%s' is too long",
536                        remote->u.q_unix.path);
537             error_append_hint(errp, "Path must be less than %zu bytes\n",
538                               sizeof(raddr_un.sun_path));
539         }
540 
541         fd = qemu_socket(PF_UNIX, SOCK_DGRAM, 0);
542         if (fd < 0) {
543             error_setg_errno(errp, errno, "can't create datagram socket");
544             return -1;
545         }
546 
547         ret = bind(fd, (struct sockaddr *)&laddr_un, sizeof(laddr_un));
548         if (ret < 0) {
549             error_setg_errno(errp, errno, "can't bind unix=%s to socket",
550                              laddr_un.sun_path);
551             close(fd);
552             return -1;
553         }
554         qemu_socket_set_nonblock(fd);
555 
556         dest_len = sizeof(raddr_un);
557         dest_addr = g_malloc(dest_len);
558         memcpy(dest_addr, &raddr_un, dest_len);
559         break;
560     case SOCKET_ADDRESS_TYPE_FD:
561         fd = monitor_fd_param(monitor_cur(), local->u.fd.str, errp);
562         if (fd == -1) {
563             return -1;
564         }
565         ret = qemu_socket_try_set_nonblock(fd);
566         if (ret < 0) {
567             error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
568                              name, fd);
569             return -1;
570         }
571         dest_addr = NULL;
572         dest_len = 0;
573         break;
574     default:
575         error_setg(errp, "only support inet or fd type for local");
576         return -1;
577     }
578 
579     s = net_dgram_fd_init(peer, "dgram", name, fd, errp);
580     if (!s) {
581         return -1;
582     }
583 
584     if (remote) {
585         g_assert(s->dest_addr == NULL);
586         s->dest_addr = dest_addr;
587         s->dest_len = dest_len;
588     }
589 
590     switch (local->type) {
591     case SOCKET_ADDRESS_TYPE_INET:
592         qemu_set_info_str(&s->nc, "udp=%s:%d/%s:%d",
593                           inet_ntoa(laddr_in.sin_addr),
594                           ntohs(laddr_in.sin_port),
595                           inet_ntoa(raddr_in.sin_addr),
596                           ntohs(raddr_in.sin_port));
597         break;
598     case SOCKET_ADDRESS_TYPE_UNIX:
599         qemu_set_info_str(&s->nc, "udp=%s:%s",
600                           laddr_un.sun_path, raddr_un.sun_path);
601         break;
602     case SOCKET_ADDRESS_TYPE_FD: {
603         SocketAddress *sa;
604         SocketAddressType sa_type;
605 
606         sa = socket_local_address(fd, errp);
607         if (sa) {
608             sa_type = sa->type;
609             qapi_free_SocketAddress(sa);
610 
611             qemu_set_info_str(&s->nc, "fd=%d %s", fd,
612                               SocketAddressType_str(sa_type));
613         } else {
614             qemu_set_info_str(&s->nc, "fd=%d", fd);
615         }
616         break;
617     }
618     default:
619         g_assert_not_reached();
620     }
621 
622     return 0;
623 }
624