]> git.proxmox.com Git - mirror_qemu.git/blob - net/dgram.c
vdpa: rename vhost_vdpa_net_load to vhost_vdpa_net_cvq_load
[mirror_qemu.git] / net / dgram.c
1 /*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 * Copyright (c) 2022 Red Hat, Inc.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a copy
8 * of this software and associated documentation files (the "Software"), to deal
9 * in the Software without restriction, including without limitation the rights
10 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11 * copies of the Software, and to permit persons to whom the Software is
12 * furnished to do so, subject to the following conditions:
13 *
14 * The above copyright notice and this permission notice shall be included in
15 * all copies or substantial portions of the Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23 * THE SOFTWARE.
24 */
25
26 #include "qemu/osdep.h"
27
28 #include "net/net.h"
29 #include "clients.h"
30 #include "monitor/monitor.h"
31 #include "qapi/error.h"
32 #include "qemu/error-report.h"
33 #include "qemu/option.h"
34 #include "qemu/sockets.h"
35 #include "qemu/iov.h"
36 #include "qemu/main-loop.h"
37 #include "qemu/cutils.h"
38
39 typedef struct NetDgramState {
40 NetClientState nc;
41 int fd;
42 SocketReadState rs;
43 bool read_poll; /* waiting to receive data? */
44 bool write_poll; /* waiting to transmit data? */
45 /* contains destination iff connectionless */
46 struct sockaddr *dest_addr;
47 socklen_t dest_len;
48 } NetDgramState;
49
/* fd callbacks, referenced by net_dgram_update_fd_handler() before they are defined */
static void net_dgram_writable(void *opaque);
static void net_dgram_send(void *opaque);
52
53 static void net_dgram_update_fd_handler(NetDgramState *s)
54 {
55 qemu_set_fd_handler(s->fd,
56 s->read_poll ? net_dgram_send : NULL,
57 s->write_poll ? net_dgram_writable : NULL,
58 s);
59 }
60
61 static void net_dgram_read_poll(NetDgramState *s, bool enable)
62 {
63 s->read_poll = enable;
64 net_dgram_update_fd_handler(s);
65 }
66
67 static void net_dgram_write_poll(NetDgramState *s, bool enable)
68 {
69 s->write_poll = enable;
70 net_dgram_update_fd_handler(s);
71 }
72
73 static void net_dgram_writable(void *opaque)
74 {
75 NetDgramState *s = opaque;
76
77 net_dgram_write_poll(s, false);
78
79 qemu_flush_queued_packets(&s->nc);
80 }
81
82 static ssize_t net_dgram_receive(NetClientState *nc,
83 const uint8_t *buf, size_t size)
84 {
85 NetDgramState *s = DO_UPCAST(NetDgramState, nc, nc);
86 ssize_t ret;
87
88 do {
89 if (s->dest_addr) {
90 ret = sendto(s->fd, buf, size, 0, s->dest_addr, s->dest_len);
91 } else {
92 ret = send(s->fd, buf, size, 0);
93 }
94 } while (ret == -1 && errno == EINTR);
95
96 if (ret == -1 && errno == EAGAIN) {
97 net_dgram_write_poll(s, true);
98 return 0;
99 }
100 return ret;
101 }
102
103 static void net_dgram_send_completed(NetClientState *nc, ssize_t len)
104 {
105 NetDgramState *s = DO_UPCAST(NetDgramState, nc, nc);
106
107 if (!s->read_poll) {
108 net_dgram_read_poll(s, true);
109 }
110 }
111
112 static void net_dgram_rs_finalize(SocketReadState *rs)
113 {
114 NetDgramState *s = container_of(rs, NetDgramState, rs);
115
116 if (qemu_send_packet_async(&s->nc, rs->buf,
117 rs->packet_len,
118 net_dgram_send_completed) == 0) {
119 net_dgram_read_poll(s, false);
120 }
121 }
122
123 static void net_dgram_send(void *opaque)
124 {
125 NetDgramState *s = opaque;
126 int size;
127
128 size = recv(s->fd, s->rs.buf, sizeof(s->rs.buf), 0);
129 if (size < 0) {
130 return;
131 }
132 if (size == 0) {
133 /* end of connection */
134 net_dgram_read_poll(s, false);
135 net_dgram_write_poll(s, false);
136 return;
137 }
138 if (qemu_send_packet_async(&s->nc, s->rs.buf, size,
139 net_dgram_send_completed) == 0) {
140 net_dgram_read_poll(s, false);
141 }
142 }
143
144 static int net_dgram_mcast_create(struct sockaddr_in *mcastaddr,
145 struct in_addr *localaddr,
146 Error **errp)
147 {
148 struct ip_mreq imr;
149 int fd;
150 int val, ret;
151 #ifdef __OpenBSD__
152 unsigned char loop;
153 #else
154 int loop;
155 #endif
156
157 if (!IN_MULTICAST(ntohl(mcastaddr->sin_addr.s_addr))) {
158 error_setg(errp, "specified mcastaddr %s (0x%08x) "
159 "does not contain a multicast address",
160 inet_ntoa(mcastaddr->sin_addr),
161 (int)ntohl(mcastaddr->sin_addr.s_addr));
162 return -1;
163 }
164
165 fd = qemu_socket(PF_INET, SOCK_DGRAM, 0);
166 if (fd < 0) {
167 error_setg_errno(errp, errno, "can't create datagram socket");
168 return -1;
169 }
170
171 /*
172 * Allow multiple sockets to bind the same multicast ip and port by setting
173 * SO_REUSEADDR. This is the only situation where SO_REUSEADDR should be set
174 * on windows. Use socket_set_fast_reuse otherwise as it sets SO_REUSEADDR
175 * only on posix systems.
176 */
177 val = 1;
178 ret = setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &val, sizeof(val));
179 if (ret < 0) {
180 error_setg_errno(errp, errno, "can't set socket option SO_REUSEADDR");
181 goto fail;
182 }
183
184 ret = bind(fd, (struct sockaddr *)mcastaddr, sizeof(*mcastaddr));
185 if (ret < 0) {
186 error_setg_errno(errp, errno, "can't bind ip=%s to socket",
187 inet_ntoa(mcastaddr->sin_addr));
188 goto fail;
189 }
190
191 /* Add host to multicast group */
192 imr.imr_multiaddr = mcastaddr->sin_addr;
193 if (localaddr) {
194 imr.imr_interface = *localaddr;
195 } else {
196 imr.imr_interface.s_addr = htonl(INADDR_ANY);
197 }
198
199 ret = setsockopt(fd, IPPROTO_IP, IP_ADD_MEMBERSHIP,
200 &imr, sizeof(struct ip_mreq));
201 if (ret < 0) {
202 error_setg_errno(errp, errno,
203 "can't add socket to multicast group %s",
204 inet_ntoa(imr.imr_multiaddr));
205 goto fail;
206 }
207
208 /* Force mcast msgs to loopback (eg. several QEMUs in same host */
209 loop = 1;
210 ret = setsockopt(fd, IPPROTO_IP, IP_MULTICAST_LOOP,
211 &loop, sizeof(loop));
212 if (ret < 0) {
213 error_setg_errno(errp, errno,
214 "can't force multicast message to loopback");
215 goto fail;
216 }
217
218 /* If a bind address is given, only send packets from that address */
219 if (localaddr != NULL) {
220 ret = setsockopt(fd, IPPROTO_IP, IP_MULTICAST_IF,
221 localaddr, sizeof(*localaddr));
222 if (ret < 0) {
223 error_setg_errno(errp, errno,
224 "can't set the default network send interface");
225 goto fail;
226 }
227 }
228
229 qemu_socket_set_nonblock(fd);
230 return fd;
231 fail:
232 if (fd >= 0) {
233 close(fd);
234 }
235 return -1;
236 }
237
238 static void net_dgram_cleanup(NetClientState *nc)
239 {
240 NetDgramState *s = DO_UPCAST(NetDgramState, nc, nc);
241 if (s->fd != -1) {
242 net_dgram_read_poll(s, false);
243 net_dgram_write_poll(s, false);
244 close(s->fd);
245 s->fd = -1;
246 }
247 g_free(s->dest_addr);
248 s->dest_addr = NULL;
249 s->dest_len = 0;
250 }
251
252 static NetClientInfo net_dgram_socket_info = {
253 .type = NET_CLIENT_DRIVER_DGRAM,
254 .size = sizeof(NetDgramState),
255 .receive = net_dgram_receive,
256 .cleanup = net_dgram_cleanup,
257 };
258
259 static NetDgramState *net_dgram_fd_init(NetClientState *peer,
260 const char *model,
261 const char *name,
262 int fd,
263 Error **errp)
264 {
265 NetClientState *nc;
266 NetDgramState *s;
267
268 nc = qemu_new_net_client(&net_dgram_socket_info, peer, model, name);
269
270 s = DO_UPCAST(NetDgramState, nc, nc);
271
272 s->fd = fd;
273 net_socket_rs_init(&s->rs, net_dgram_rs_finalize, false);
274 net_dgram_read_poll(s, true);
275
276 return s;
277 }
278
279 static int net_dgram_mcast_init(NetClientState *peer,
280 const char *model,
281 const char *name,
282 SocketAddress *remote,
283 SocketAddress *local,
284 Error **errp)
285 {
286 NetDgramState *s;
287 int fd, ret;
288 struct sockaddr_in *saddr;
289
290 if (remote->type != SOCKET_ADDRESS_TYPE_INET) {
291 error_setg(errp, "multicast only support inet type");
292 return -1;
293 }
294
295 saddr = g_new(struct sockaddr_in, 1);
296 if (convert_host_port(saddr, remote->u.inet.host, remote->u.inet.port,
297 errp) < 0) {
298 g_free(saddr);
299 return -1;
300 }
301
302 if (!local) {
303 fd = net_dgram_mcast_create(saddr, NULL, errp);
304 if (fd < 0) {
305 g_free(saddr);
306 return -1;
307 }
308 } else {
309 switch (local->type) {
310 case SOCKET_ADDRESS_TYPE_INET: {
311 struct in_addr localaddr;
312
313 if (inet_aton(local->u.inet.host, &localaddr) == 0) {
314 g_free(saddr);
315 error_setg(errp, "localaddr '%s' is not a valid IPv4 address",
316 local->u.inet.host);
317 return -1;
318 }
319
320 fd = net_dgram_mcast_create(saddr, &localaddr, errp);
321 if (fd < 0) {
322 g_free(saddr);
323 return -1;
324 }
325 break;
326 }
327 case SOCKET_ADDRESS_TYPE_FD: {
328 int newfd;
329
330 fd = monitor_fd_param(monitor_cur(), local->u.fd.str, errp);
331 if (fd == -1) {
332 g_free(saddr);
333 return -1;
334 }
335 ret = qemu_socket_try_set_nonblock(fd);
336 if (ret < 0) {
337 g_free(saddr);
338 error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
339 name, fd);
340 return -1;
341 }
342
343 /*
344 * fd passed: multicast: "learn" dest_addr address from bound
345 * address and save it. Because this may be "shared" socket from a
346 * "master" process, datagrams would be recv() by ONLY ONE process:
347 * we must "clone" this dgram socket --jjo
348 */
349
350 saddr = g_new(struct sockaddr_in, 1);
351
352 if (convert_host_port(saddr, local->u.inet.host, local->u.inet.port,
353 errp) < 0) {
354 g_free(saddr);
355 close(fd);
356 return -1;
357 }
358
359 /* must be bound */
360 if (saddr->sin_addr.s_addr == 0) {
361 error_setg(errp, "can't setup multicast destination address");
362 g_free(saddr);
363 close(fd);
364 return -1;
365 }
366 /* clone dgram socket */
367 newfd = net_dgram_mcast_create(saddr, NULL, errp);
368 if (newfd < 0) {
369 g_free(saddr);
370 close(fd);
371 return -1;
372 }
373 /* clone newfd to fd, close newfd */
374 dup2(newfd, fd);
375 close(newfd);
376 break;
377 }
378 default:
379 g_free(saddr);
380 error_setg(errp, "only support inet or fd type for local");
381 return -1;
382 }
383 }
384
385 s = net_dgram_fd_init(peer, model, name, fd, errp);
386 if (!s) {
387 g_free(saddr);
388 return -1;
389 }
390
391 g_assert(s->dest_addr == NULL);
392 s->dest_addr = (struct sockaddr *)saddr;
393 s->dest_len = sizeof(*saddr);
394
395 if (!local) {
396 qemu_set_info_str(&s->nc, "mcast=%s:%d",
397 inet_ntoa(saddr->sin_addr),
398 ntohs(saddr->sin_port));
399 } else {
400 switch (local->type) {
401 case SOCKET_ADDRESS_TYPE_INET:
402 qemu_set_info_str(&s->nc, "mcast=%s:%d",
403 inet_ntoa(saddr->sin_addr),
404 ntohs(saddr->sin_port));
405 break;
406 case SOCKET_ADDRESS_TYPE_FD:
407 qemu_set_info_str(&s->nc, "fd=%d (cloned mcast=%s:%d)",
408 fd, inet_ntoa(saddr->sin_addr),
409 ntohs(saddr->sin_port));
410 break;
411 default:
412 g_assert_not_reached();
413 }
414 }
415
416 return 0;
417
418 }
419
420
421 int net_init_dgram(const Netdev *netdev, const char *name,
422 NetClientState *peer, Error **errp)
423 {
424 NetDgramState *s;
425 int fd, ret;
426 SocketAddress *remote, *local;
427 struct sockaddr *dest_addr;
428 struct sockaddr_in laddr_in, raddr_in;
429 struct sockaddr_un laddr_un, raddr_un;
430 socklen_t dest_len;
431
432 assert(netdev->type == NET_CLIENT_DRIVER_DGRAM);
433
434 remote = netdev->u.dgram.remote;
435 local = netdev->u.dgram.local;
436
437 /* detect multicast address */
438 if (remote && remote->type == SOCKET_ADDRESS_TYPE_INET) {
439 struct sockaddr_in mcastaddr;
440
441 if (convert_host_port(&mcastaddr, remote->u.inet.host,
442 remote->u.inet.port, errp) < 0) {
443 return -1;
444 }
445
446 if (IN_MULTICAST(ntohl(mcastaddr.sin_addr.s_addr))) {
447 return net_dgram_mcast_init(peer, "dram", name, remote, local,
448 errp);
449 }
450 }
451
452 /* unicast address */
453 if (!local) {
454 error_setg(errp, "dgram requires local= parameter");
455 return -1;
456 }
457
458 if (remote) {
459 if (local->type == SOCKET_ADDRESS_TYPE_FD) {
460 error_setg(errp, "don't set remote with local.fd");
461 return -1;
462 }
463 if (remote->type != local->type) {
464 error_setg(errp, "remote and local types must be the same");
465 return -1;
466 }
467 } else {
468 if (local->type != SOCKET_ADDRESS_TYPE_FD) {
469 error_setg(errp,
470 "type=inet or type=unix requires remote parameter");
471 return -1;
472 }
473 }
474
475 switch (local->type) {
476 case SOCKET_ADDRESS_TYPE_INET:
477 if (convert_host_port(&laddr_in, local->u.inet.host, local->u.inet.port,
478 errp) < 0) {
479 return -1;
480 }
481
482 if (convert_host_port(&raddr_in, remote->u.inet.host,
483 remote->u.inet.port, errp) < 0) {
484 return -1;
485 }
486
487 fd = qemu_socket(PF_INET, SOCK_DGRAM, 0);
488 if (fd < 0) {
489 error_setg_errno(errp, errno, "can't create datagram socket");
490 return -1;
491 }
492
493 ret = socket_set_fast_reuse(fd);
494 if (ret < 0) {
495 error_setg_errno(errp, errno,
496 "can't set socket option SO_REUSEADDR");
497 close(fd);
498 return -1;
499 }
500 ret = bind(fd, (struct sockaddr *)&laddr_in, sizeof(laddr_in));
501 if (ret < 0) {
502 error_setg_errno(errp, errno, "can't bind ip=%s to socket",
503 inet_ntoa(laddr_in.sin_addr));
504 close(fd);
505 return -1;
506 }
507 qemu_socket_set_nonblock(fd);
508
509 dest_len = sizeof(raddr_in);
510 dest_addr = g_malloc(dest_len);
511 memcpy(dest_addr, &raddr_in, dest_len);
512 break;
513 case SOCKET_ADDRESS_TYPE_UNIX:
514 ret = unlink(local->u.q_unix.path);
515 if (ret < 0 && errno != ENOENT) {
516 error_setg_errno(errp, errno, "failed to unlink socket %s",
517 local->u.q_unix.path);
518 return -1;
519 }
520
521 laddr_un.sun_family = PF_UNIX;
522 ret = snprintf(laddr_un.sun_path, sizeof(laddr_un.sun_path), "%s",
523 local->u.q_unix.path);
524 if (ret < 0 || ret >= sizeof(laddr_un.sun_path)) {
525 error_setg(errp, "UNIX socket path '%s' is too long",
526 local->u.q_unix.path);
527 error_append_hint(errp, "Path must be less than %zu bytes\n",
528 sizeof(laddr_un.sun_path));
529 }
530
531 raddr_un.sun_family = PF_UNIX;
532 ret = snprintf(raddr_un.sun_path, sizeof(raddr_un.sun_path), "%s",
533 remote->u.q_unix.path);
534 if (ret < 0 || ret >= sizeof(raddr_un.sun_path)) {
535 error_setg(errp, "UNIX socket path '%s' is too long",
536 remote->u.q_unix.path);
537 error_append_hint(errp, "Path must be less than %zu bytes\n",
538 sizeof(raddr_un.sun_path));
539 }
540
541 fd = qemu_socket(PF_UNIX, SOCK_DGRAM, 0);
542 if (fd < 0) {
543 error_setg_errno(errp, errno, "can't create datagram socket");
544 return -1;
545 }
546
547 ret = bind(fd, (struct sockaddr *)&laddr_un, sizeof(laddr_un));
548 if (ret < 0) {
549 error_setg_errno(errp, errno, "can't bind unix=%s to socket",
550 laddr_un.sun_path);
551 close(fd);
552 return -1;
553 }
554 qemu_socket_set_nonblock(fd);
555
556 dest_len = sizeof(raddr_un);
557 dest_addr = g_malloc(dest_len);
558 memcpy(dest_addr, &raddr_un, dest_len);
559 break;
560 case SOCKET_ADDRESS_TYPE_FD:
561 fd = monitor_fd_param(monitor_cur(), local->u.fd.str, errp);
562 if (fd == -1) {
563 return -1;
564 }
565 ret = qemu_socket_try_set_nonblock(fd);
566 if (ret < 0) {
567 error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
568 name, fd);
569 return -1;
570 }
571 dest_addr = NULL;
572 dest_len = 0;
573 break;
574 default:
575 error_setg(errp, "only support inet or fd type for local");
576 return -1;
577 }
578
579 s = net_dgram_fd_init(peer, "dgram", name, fd, errp);
580 if (!s) {
581 return -1;
582 }
583
584 if (remote) {
585 g_assert(s->dest_addr == NULL);
586 s->dest_addr = dest_addr;
587 s->dest_len = dest_len;
588 }
589
590 switch (local->type) {
591 case SOCKET_ADDRESS_TYPE_INET:
592 qemu_set_info_str(&s->nc, "udp=%s:%d/%s:%d",
593 inet_ntoa(laddr_in.sin_addr),
594 ntohs(laddr_in.sin_port),
595 inet_ntoa(raddr_in.sin_addr),
596 ntohs(raddr_in.sin_port));
597 break;
598 case SOCKET_ADDRESS_TYPE_UNIX:
599 qemu_set_info_str(&s->nc, "udp=%s:%s",
600 laddr_un.sun_path, raddr_un.sun_path);
601 break;
602 case SOCKET_ADDRESS_TYPE_FD: {
603 SocketAddress *sa;
604 SocketAddressType sa_type;
605
606 sa = socket_local_address(fd, errp);
607 if (sa) {
608 sa_type = sa->type;
609 qapi_free_SocketAddress(sa);
610
611 qemu_set_info_str(&s->nc, "fd=%d %s", fd,
612 SocketAddressType_str(sa_type));
613 } else {
614 qemu_set_info_str(&s->nc, "fd=%d", fd);
615 }
616 break;
617 }
618 default:
619 g_assert_not_reached();
620 }
621
622 return 0;
623 }