784e7a2531
Signed-off-by: Laurent Vivier <lvivier@redhat.com> Reviewed-by: Stefano Brivio <sbrivio@redhat.com> Reviewed-by: David Gibson <david@gibson.dropbear.id.au> Acked-by: Michael S. Tsirkin <mst@redhat.com> Acked-by: Markus Armbruster <armbru@redhat.com> (QAPI schema) Signed-off-by: Jason Wang <jasowang@redhat.com>
624 lines
19 KiB
C
624 lines
19 KiB
C
/*
|
|
* QEMU System Emulator
|
|
*
|
|
* Copyright (c) 2003-2008 Fabrice Bellard
|
|
* Copyright (c) 2022 Red Hat, Inc.
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
* in the Software without restriction, including without limitation the rights
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
* furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
* THE SOFTWARE.
|
|
*/
|
|
|
|
#include "qemu/osdep.h"
|
|
|
|
#include "net/net.h"
|
|
#include "clients.h"
|
|
#include "monitor/monitor.h"
|
|
#include "qapi/error.h"
|
|
#include "qemu/error-report.h"
|
|
#include "qemu/option.h"
|
|
#include "qemu/sockets.h"
|
|
#include "qemu/iov.h"
|
|
#include "qemu/main-loop.h"
|
|
#include "qemu/cutils.h"
|
|
|
|
typedef struct NetDgramState {
|
|
NetClientState nc;
|
|
int fd;
|
|
SocketReadState rs;
|
|
bool read_poll; /* waiting to receive data? */
|
|
bool write_poll; /* waiting to transmit data? */
|
|
/* contains destination iff connectionless */
|
|
struct sockaddr *dest_addr;
|
|
socklen_t dest_len;
|
|
} NetDgramState;
|
|
|
|
/*
 * Forward declarations: both fd callbacks are referenced by
 * net_dgram_update_fd_handler() before they are defined.
 */
static void net_dgram_writable(void *opaque);
static void net_dgram_send(void *opaque);
|
|
|
|
/*
 * Re-register the fd handlers of @s so that they mirror its current
 * read_poll / write_poll flags: a callback is installed for a direction
 * only while the matching flag is set, otherwise NULL is passed.
 */
static void net_dgram_update_fd_handler(NetDgramState *s)
{
    void (*on_readable)(void *) = NULL;
    void (*on_writable)(void *) = NULL;

    if (s->read_poll) {
        on_readable = net_dgram_send;
    }
    if (s->write_poll) {
        on_writable = net_dgram_writable;
    }

    qemu_set_fd_handler(s->fd, on_readable, on_writable, s);
}
|
|
|
|
/*
 * Turn polling for incoming data on @s on or off.
 *
 * Records @enable in s->read_poll and then refreshes the registered
 * fd handlers so that they match the new state.
 */
static void net_dgram_read_poll(NetDgramState *s, bool enable)
{
    s->read_poll = enable;

    /* Apply the new flag to the registered handlers. */
    net_dgram_update_fd_handler(s);
}
|
|
|
|
/*
 * Turn polling for writability of @s on or off.
 *
 * Records @enable in s->write_poll and then refreshes the registered
 * fd handlers so that they match the new state.
 */
static void net_dgram_write_poll(NetDgramState *s, bool enable)
{
    s->write_poll = enable;

    /* Apply the new flag to the registered handlers. */
    net_dgram_update_fd_handler(s);
}
|
|
|
|
static void net_dgram_writable(void *opaque)
|
|
{
|
|
NetDgramState *s = opaque;
|
|
|
|
net_dgram_write_poll(s, false);
|
|
|
|
qemu_flush_queued_packets(&s->nc);
|
|
}
|
|
|
|
/*
 * .receive callback: transmit one packet on the datagram socket.
 *
 * @nc:   net client embedded in the NetDgramState
 * @buf:  packet data
 * @size: number of bytes in @buf
 *
 * The packet is sent with sendto() when a destination address has been
 * recorded, with send() otherwise; the call is retried for as long as it
 * fails with EINTR.
 *
 * Returns the value returned by sendto()/send(), except that a failure
 * with EAGAIN enables write polling and returns 0.
 */
static ssize_t net_dgram_receive(NetClientState *nc,
                                 const uint8_t *buf, size_t size)
{
    NetDgramState *s = DO_UPCAST(NetDgramState, nc, nc);
    ssize_t sent;

    for (;;) {
        sent = s->dest_addr
             ? sendto(s->fd, buf, size, 0, s->dest_addr, s->dest_len)
             : send(s->fd, buf, size, 0);

        /* Only an interrupted call is worth repeating. */
        if (sent != -1 || errno != EINTR) {
            break;
        }
    }

    if (sent != -1) {
        return sent;
    }

    if (errno == EAGAIN) {
        /* Let net_dgram_writable() flush the queue once we can write. */
        net_dgram_write_poll(s, true);
        return 0;
    }

    return sent;
}
|
|
|
|
/*
 * Completion callback handed to qemu_send_packet_async().
 *
 * Re-enables read polling on the socket if it is currently disabled.
 * @len is not used.
 */
static void net_dgram_send_completed(NetClientState *nc, ssize_t len)
{
    NetDgramState *s = DO_UPCAST(NetDgramState, nc, nc);

    if (s->read_poll) {
        /* Already polling for input: nothing to do. */
        return;
    }

    net_dgram_read_poll(s, true);
}
|
|
|
|
/*
 * Finalize callback registered with net_socket_rs_init().
 *
 * Hands the packet held in @rs (rs->buf, rs->packet_len) to the net layer.
 * When qemu_send_packet_async() returns 0, read polling is switched off;
 * net_dgram_send_completed() is passed as the callback that switches it
 * back on.
 */
static void net_dgram_rs_finalize(SocketReadState *rs)
{
    NetDgramState *s = container_of(rs, NetDgramState, rs);
    ssize_t delivered;

    delivered = qemu_send_packet_async(&s->nc, rs->buf, rs->packet_len,
                                       net_dgram_send_completed);
    if (delivered == 0) {
        net_dgram_read_poll(s, false);
    }
}
|
|
|
|
static void net_dgram_send(void *opaque)
|
|
{
|
|
NetDgramState *s = opaque;
|
|
int size;
|
|
|
|
size = recv(s->fd, s->rs.buf, sizeof(s->rs.buf), 0);
|
|
if (size < 0) {
|
|
return;
|
|
}
|
|
if (size == 0) {
|
|
/* end of connection */
|
|
net_dgram_read_poll(s, false);
|
|
net_dgram_write_poll(s, false);
|
|
return;
|
|
}
|
|
if (qemu_send_packet_async(&s->nc, s->rs.buf, size,
|
|
net_dgram_send_completed) == 0) {
|
|
net_dgram_read_poll(s, false);
|
|
}
|
|
}
|
|
|
|
static int net_dgram_mcast_create(struct sockaddr_in *mcastaddr,
|
|
struct in_addr *localaddr,
|
|
Error **errp)
|
|
{
|
|
struct ip_mreq imr;
|
|
int fd;
|
|
int val, ret;
|
|
#ifdef __OpenBSD__
|
|
unsigned char loop;
|
|
#else
|
|
int loop;
|
|
#endif
|
|
|
|
if (!IN_MULTICAST(ntohl(mcastaddr->sin_addr.s_addr))) {
|
|
error_setg(errp, "specified mcastaddr %s (0x%08x) "
|
|
"does not contain a multicast address",
|
|
inet_ntoa(mcastaddr->sin_addr),
|
|
(int)ntohl(mcastaddr->sin_addr.s_addr));
|
|
return -1;
|
|
}
|
|
|
|
fd = qemu_socket(PF_INET, SOCK_DGRAM, 0);
|
|
if (fd < 0) {
|
|
error_setg_errno(errp, errno, "can't create datagram socket");
|
|
return -1;
|
|
}
|
|
|
|
/*
|
|
* Allow multiple sockets to bind the same multicast ip and port by setting
|
|
* SO_REUSEADDR. This is the only situation where SO_REUSEADDR should be set
|
|
* on windows. Use socket_set_fast_reuse otherwise as it sets SO_REUSEADDR
|
|
* only on posix systems.
|
|
*/
|
|
val = 1;
|
|
ret = setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &val, sizeof(val));
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, errno, "can't set socket option SO_REUSEADDR");
|
|
goto fail;
|
|
}
|
|
|
|
ret = bind(fd, (struct sockaddr *)mcastaddr, sizeof(*mcastaddr));
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, errno, "can't bind ip=%s to socket",
|
|
inet_ntoa(mcastaddr->sin_addr));
|
|
goto fail;
|
|
}
|
|
|
|
/* Add host to multicast group */
|
|
imr.imr_multiaddr = mcastaddr->sin_addr;
|
|
if (localaddr) {
|
|
imr.imr_interface = *localaddr;
|
|
} else {
|
|
imr.imr_interface.s_addr = htonl(INADDR_ANY);
|
|
}
|
|
|
|
ret = setsockopt(fd, IPPROTO_IP, IP_ADD_MEMBERSHIP,
|
|
&imr, sizeof(struct ip_mreq));
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, errno,
|
|
"can't add socket to multicast group %s",
|
|
inet_ntoa(imr.imr_multiaddr));
|
|
goto fail;
|
|
}
|
|
|
|
/* Force mcast msgs to loopback (eg. several QEMUs in same host */
|
|
loop = 1;
|
|
ret = setsockopt(fd, IPPROTO_IP, IP_MULTICAST_LOOP,
|
|
&loop, sizeof(loop));
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, errno,
|
|
"can't force multicast message to loopback");
|
|
goto fail;
|
|
}
|
|
|
|
/* If a bind address is given, only send packets from that address */
|
|
if (localaddr != NULL) {
|
|
ret = setsockopt(fd, IPPROTO_IP, IP_MULTICAST_IF,
|
|
localaddr, sizeof(*localaddr));
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, errno,
|
|
"can't set the default network send interface");
|
|
goto fail;
|
|
}
|
|
}
|
|
|
|
qemu_socket_set_nonblock(fd);
|
|
return fd;
|
|
fail:
|
|
if (fd >= 0) {
|
|
closesocket(fd);
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
/*
 * .cleanup callback: release what the backend owns.
 *
 * If the socket is still open, both fd handlers are removed before it is
 * closed and s->fd is reset to -1. The stored destination address is
 * freed and its pointer and length are cleared.
 */
static void net_dgram_cleanup(NetClientState *nc)
{
    NetDgramState *dgram = DO_UPCAST(NetDgramState, nc, nc);

    if (dgram->fd != -1) {
        /* Unregister the handlers before the descriptor goes away. */
        net_dgram_read_poll(dgram, false);
        net_dgram_write_poll(dgram, false);
        close(dgram->fd);
        dgram->fd = -1;
    }

    g_free(dgram->dest_addr);
    dgram->dest_addr = NULL;
    dgram->dest_len = 0;
}
|
|
|
|
static NetClientInfo net_dgram_socket_info = {
|
|
.type = NET_CLIENT_DRIVER_DGRAM,
|
|
.size = sizeof(NetDgramState),
|
|
.receive = net_dgram_receive,
|
|
.cleanup = net_dgram_cleanup,
|
|
};
|
|
|
|
static NetDgramState *net_dgram_fd_init(NetClientState *peer,
|
|
const char *model,
|
|
const char *name,
|
|
int fd,
|
|
Error **errp)
|
|
{
|
|
NetClientState *nc;
|
|
NetDgramState *s;
|
|
|
|
nc = qemu_new_net_client(&net_dgram_socket_info, peer, model, name);
|
|
|
|
s = DO_UPCAST(NetDgramState, nc, nc);
|
|
|
|
s->fd = fd;
|
|
net_socket_rs_init(&s->rs, net_dgram_rs_finalize, false);
|
|
net_dgram_read_poll(s, true);
|
|
|
|
return s;
|
|
}
|
|
|
|
static int net_dgram_mcast_init(NetClientState *peer,
|
|
const char *model,
|
|
const char *name,
|
|
SocketAddress *remote,
|
|
SocketAddress *local,
|
|
Error **errp)
|
|
{
|
|
NetDgramState *s;
|
|
int fd, ret;
|
|
struct sockaddr_in *saddr;
|
|
|
|
if (remote->type != SOCKET_ADDRESS_TYPE_INET) {
|
|
error_setg(errp, "multicast only support inet type");
|
|
return -1;
|
|
}
|
|
|
|
saddr = g_new(struct sockaddr_in, 1);
|
|
if (convert_host_port(saddr, remote->u.inet.host, remote->u.inet.port,
|
|
errp) < 0) {
|
|
g_free(saddr);
|
|
return -1;
|
|
}
|
|
|
|
if (!local) {
|
|
fd = net_dgram_mcast_create(saddr, NULL, errp);
|
|
if (fd < 0) {
|
|
g_free(saddr);
|
|
return -1;
|
|
}
|
|
} else {
|
|
switch (local->type) {
|
|
case SOCKET_ADDRESS_TYPE_INET: {
|
|
struct in_addr localaddr;
|
|
|
|
if (inet_aton(local->u.inet.host, &localaddr) == 0) {
|
|
g_free(saddr);
|
|
error_setg(errp, "localaddr '%s' is not a valid IPv4 address",
|
|
local->u.inet.host);
|
|
return -1;
|
|
}
|
|
|
|
fd = net_dgram_mcast_create(saddr, &localaddr, errp);
|
|
if (fd < 0) {
|
|
g_free(saddr);
|
|
return -1;
|
|
}
|
|
break;
|
|
}
|
|
case SOCKET_ADDRESS_TYPE_FD: {
|
|
int newfd;
|
|
|
|
fd = monitor_fd_param(monitor_cur(), local->u.fd.str, errp);
|
|
if (fd == -1) {
|
|
g_free(saddr);
|
|
return -1;
|
|
}
|
|
ret = qemu_socket_try_set_nonblock(fd);
|
|
if (ret < 0) {
|
|
g_free(saddr);
|
|
error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
|
|
name, fd);
|
|
return -1;
|
|
}
|
|
|
|
/*
|
|
* fd passed: multicast: "learn" dest_addr address from bound
|
|
* address and save it. Because this may be "shared" socket from a
|
|
* "master" process, datagrams would be recv() by ONLY ONE process:
|
|
* we must "clone" this dgram socket --jjo
|
|
*/
|
|
|
|
saddr = g_new(struct sockaddr_in, 1);
|
|
|
|
if (convert_host_port(saddr, local->u.inet.host, local->u.inet.port,
|
|
errp) < 0) {
|
|
g_free(saddr);
|
|
closesocket(fd);
|
|
return -1;
|
|
}
|
|
|
|
/* must be bound */
|
|
if (saddr->sin_addr.s_addr == 0) {
|
|
error_setg(errp, "can't setup multicast destination address");
|
|
g_free(saddr);
|
|
closesocket(fd);
|
|
return -1;
|
|
}
|
|
/* clone dgram socket */
|
|
newfd = net_dgram_mcast_create(saddr, NULL, errp);
|
|
if (newfd < 0) {
|
|
g_free(saddr);
|
|
closesocket(fd);
|
|
return -1;
|
|
}
|
|
/* clone newfd to fd, close newfd */
|
|
dup2(newfd, fd);
|
|
close(newfd);
|
|
break;
|
|
}
|
|
default:
|
|
g_free(saddr);
|
|
error_setg(errp, "only support inet or fd type for local");
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
s = net_dgram_fd_init(peer, model, name, fd, errp);
|
|
if (!s) {
|
|
g_free(saddr);
|
|
return -1;
|
|
}
|
|
|
|
g_assert(s->dest_addr == NULL);
|
|
s->dest_addr = (struct sockaddr *)saddr;
|
|
s->dest_len = sizeof(*saddr);
|
|
|
|
if (!local) {
|
|
qemu_set_info_str(&s->nc, "mcast=%s:%d",
|
|
inet_ntoa(saddr->sin_addr),
|
|
ntohs(saddr->sin_port));
|
|
} else {
|
|
switch (local->type) {
|
|
case SOCKET_ADDRESS_TYPE_INET:
|
|
qemu_set_info_str(&s->nc, "mcast=%s:%d",
|
|
inet_ntoa(saddr->sin_addr),
|
|
ntohs(saddr->sin_port));
|
|
break;
|
|
case SOCKET_ADDRESS_TYPE_FD:
|
|
qemu_set_info_str(&s->nc, "fd=%d (cloned mcast=%s:%d)",
|
|
fd, inet_ntoa(saddr->sin_addr),
|
|
ntohs(saddr->sin_port));
|
|
break;
|
|
default:
|
|
g_assert_not_reached();
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
int net_init_dgram(const Netdev *netdev, const char *name,
|
|
NetClientState *peer, Error **errp)
|
|
{
|
|
NetDgramState *s;
|
|
int fd, ret;
|
|
SocketAddress *remote, *local;
|
|
struct sockaddr *dest_addr;
|
|
struct sockaddr_in laddr_in, raddr_in;
|
|
struct sockaddr_un laddr_un, raddr_un;
|
|
socklen_t dest_len;
|
|
|
|
assert(netdev->type == NET_CLIENT_DRIVER_DGRAM);
|
|
|
|
remote = netdev->u.dgram.remote;
|
|
local = netdev->u.dgram.local;
|
|
|
|
/* detect multicast address */
|
|
if (remote && remote->type == SOCKET_ADDRESS_TYPE_INET) {
|
|
struct sockaddr_in mcastaddr;
|
|
|
|
if (convert_host_port(&mcastaddr, remote->u.inet.host,
|
|
remote->u.inet.port, errp) < 0) {
|
|
return -1;
|
|
}
|
|
|
|
if (IN_MULTICAST(ntohl(mcastaddr.sin_addr.s_addr))) {
|
|
return net_dgram_mcast_init(peer, "dram", name, remote, local,
|
|
errp);
|
|
}
|
|
}
|
|
|
|
/* unicast address */
|
|
if (!local) {
|
|
error_setg(errp, "dgram requires local= parameter");
|
|
return -1;
|
|
}
|
|
|
|
if (remote) {
|
|
if (local->type == SOCKET_ADDRESS_TYPE_FD) {
|
|
error_setg(errp, "don't set remote with local.fd");
|
|
return -1;
|
|
}
|
|
if (remote->type != local->type) {
|
|
error_setg(errp, "remote and local types must be the same");
|
|
return -1;
|
|
}
|
|
} else {
|
|
if (local->type != SOCKET_ADDRESS_TYPE_FD) {
|
|
error_setg(errp,
|
|
"type=inet or type=unix requires remote parameter");
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
switch (local->type) {
|
|
case SOCKET_ADDRESS_TYPE_INET:
|
|
if (convert_host_port(&laddr_in, local->u.inet.host, local->u.inet.port,
|
|
errp) < 0) {
|
|
return -1;
|
|
}
|
|
|
|
if (convert_host_port(&raddr_in, remote->u.inet.host,
|
|
remote->u.inet.port, errp) < 0) {
|
|
return -1;
|
|
}
|
|
|
|
fd = qemu_socket(PF_INET, SOCK_DGRAM, 0);
|
|
if (fd < 0) {
|
|
error_setg_errno(errp, errno, "can't create datagram socket");
|
|
return -1;
|
|
}
|
|
|
|
ret = socket_set_fast_reuse(fd);
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, errno,
|
|
"can't set socket option SO_REUSEADDR");
|
|
closesocket(fd);
|
|
return -1;
|
|
}
|
|
ret = bind(fd, (struct sockaddr *)&laddr_in, sizeof(laddr_in));
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, errno, "can't bind ip=%s to socket",
|
|
inet_ntoa(laddr_in.sin_addr));
|
|
closesocket(fd);
|
|
return -1;
|
|
}
|
|
qemu_socket_set_nonblock(fd);
|
|
|
|
dest_len = sizeof(raddr_in);
|
|
dest_addr = g_malloc(dest_len);
|
|
memcpy(dest_addr, &raddr_in, dest_len);
|
|
break;
|
|
case SOCKET_ADDRESS_TYPE_UNIX:
|
|
ret = unlink(local->u.q_unix.path);
|
|
if (ret < 0 && errno != ENOENT) {
|
|
error_setg_errno(errp, errno, "failed to unlink socket %s",
|
|
local->u.q_unix.path);
|
|
return -1;
|
|
}
|
|
|
|
laddr_un.sun_family = PF_UNIX;
|
|
ret = snprintf(laddr_un.sun_path, sizeof(laddr_un.sun_path), "%s",
|
|
local->u.q_unix.path);
|
|
if (ret < 0 || ret >= sizeof(laddr_un.sun_path)) {
|
|
error_setg(errp, "UNIX socket path '%s' is too long",
|
|
local->u.q_unix.path);
|
|
error_append_hint(errp, "Path must be less than %zu bytes\n",
|
|
sizeof(laddr_un.sun_path));
|
|
}
|
|
|
|
raddr_un.sun_family = PF_UNIX;
|
|
ret = snprintf(raddr_un.sun_path, sizeof(raddr_un.sun_path), "%s",
|
|
remote->u.q_unix.path);
|
|
if (ret < 0 || ret >= sizeof(raddr_un.sun_path)) {
|
|
error_setg(errp, "UNIX socket path '%s' is too long",
|
|
remote->u.q_unix.path);
|
|
error_append_hint(errp, "Path must be less than %zu bytes\n",
|
|
sizeof(raddr_un.sun_path));
|
|
}
|
|
|
|
fd = qemu_socket(PF_UNIX, SOCK_DGRAM, 0);
|
|
if (fd < 0) {
|
|
error_setg_errno(errp, errno, "can't create datagram socket");
|
|
return -1;
|
|
}
|
|
|
|
ret = bind(fd, (struct sockaddr *)&laddr_un, sizeof(laddr_un));
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, errno, "can't bind unix=%s to socket",
|
|
laddr_un.sun_path);
|
|
closesocket(fd);
|
|
return -1;
|
|
}
|
|
qemu_socket_set_nonblock(fd);
|
|
|
|
dest_len = sizeof(raddr_un);
|
|
dest_addr = g_malloc(dest_len);
|
|
memcpy(dest_addr, &raddr_un, dest_len);
|
|
break;
|
|
case SOCKET_ADDRESS_TYPE_FD:
|
|
fd = monitor_fd_param(monitor_cur(), local->u.fd.str, errp);
|
|
if (fd == -1) {
|
|
return -1;
|
|
}
|
|
ret = qemu_socket_try_set_nonblock(fd);
|
|
if (ret < 0) {
|
|
error_setg_errno(errp, -ret, "%s: Can't use file descriptor %d",
|
|
name, fd);
|
|
return -1;
|
|
}
|
|
dest_addr = NULL;
|
|
dest_len = 0;
|
|
break;
|
|
default:
|
|
error_setg(errp, "only support inet or fd type for local");
|
|
return -1;
|
|
}
|
|
|
|
s = net_dgram_fd_init(peer, "dgram", name, fd, errp);
|
|
if (!s) {
|
|
return -1;
|
|
}
|
|
|
|
if (remote) {
|
|
g_assert(s->dest_addr == NULL);
|
|
s->dest_addr = dest_addr;
|
|
s->dest_len = dest_len;
|
|
}
|
|
|
|
switch (local->type) {
|
|
case SOCKET_ADDRESS_TYPE_INET:
|
|
qemu_set_info_str(&s->nc, "udp=%s:%d/%s:%d",
|
|
inet_ntoa(laddr_in.sin_addr),
|
|
ntohs(laddr_in.sin_port),
|
|
inet_ntoa(raddr_in.sin_addr),
|
|
ntohs(raddr_in.sin_port));
|
|
break;
|
|
case SOCKET_ADDRESS_TYPE_UNIX:
|
|
qemu_set_info_str(&s->nc, "udp=%s:%s",
|
|
laddr_un.sun_path, raddr_un.sun_path);
|
|
break;
|
|
case SOCKET_ADDRESS_TYPE_FD: {
|
|
SocketAddress *sa;
|
|
SocketAddressType sa_type;
|
|
|
|
sa = socket_local_address(fd, errp);
|
|
if (sa) {
|
|
sa_type = sa->type;
|
|
qapi_free_SocketAddress(sa);
|
|
|
|
qemu_set_info_str(&s->nc, "fd=%d %s", fd,
|
|
SocketAddressType_str(sa_type));
|
|
} else {
|
|
qemu_set_info_str(&s->nc, "fd=%d", fd);
|
|
}
|
|
break;
|
|
}
|
|
default:
|
|
g_assert_not_reached();
|
|
}
|
|
|
|
return 0;
|
|
}
|