2009-10-22 18:49:07 +02:00
|
|
|
/*
|
|
|
|
* QEMU System Emulator
|
|
|
|
*
|
|
|
|
* Copyright (c) 2003-2008 Fabrice Bellard
|
|
|
|
* Copyright (c) 2009 Red Hat, Inc.
|
|
|
|
*
|
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
|
|
* in the Software without restriction, including without limitation the rights
|
|
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
|
|
* furnished to do so, subject to the following conditions:
|
|
|
|
*
|
|
|
|
* The above copyright notice and this permission notice shall be included in
|
|
|
|
* all copies or substantial portions of the Software.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
* THE SOFTWARE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "net/tap.h"
|
|
|
|
|
|
|
|
#include "config-host.h"
|
|
|
|
|
|
|
|
#include <sys/ioctl.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <sys/wait.h>
|
2009-10-30 22:27:00 +01:00
|
|
|
#include <sys/socket.h>
|
2009-10-22 18:49:07 +02:00
|
|
|
#include <net/if.h>
|
|
|
|
|
|
|
|
#include "net.h"
|
|
|
|
#include "sysemu.h"
|
|
|
|
#include "qemu-char.h"
|
|
|
|
#include "qemu-common.h"
|
2010-02-18 16:24:31 +01:00
|
|
|
#include "qemu-error.h"
|
2009-10-22 18:49:07 +02:00
|
|
|
|
|
|
|
#include "net/tap-linux.h"
|
|
|
|
|
2010-03-17 12:08:24 +01:00
|
|
|
#include "hw/vhost_net.h"
|
|
|
|
|
2009-10-22 18:49:07 +02:00
|
|
|
/* Maximum GSO packet size (64k) plus plenty of room for
|
|
|
|
* the ethernet and virtio_net headers
|
|
|
|
*/
|
|
|
|
#define TAP_BUFSIZE (4096 + 65536)
|
|
|
|
|
|
|
|
typedef struct TAPState {
|
2009-11-25 19:49:04 +01:00
|
|
|
VLANClientState nc;
|
2009-10-22 18:49:07 +02:00
|
|
|
int fd;
|
|
|
|
char down_script[1024];
|
|
|
|
char down_script_arg[128];
|
|
|
|
uint8_t buf[TAP_BUFSIZE];
|
|
|
|
unsigned int read_poll : 1;
|
|
|
|
unsigned int write_poll : 1;
|
|
|
|
unsigned int using_vnet_hdr : 1;
|
|
|
|
unsigned int has_ufo: 1;
|
2010-03-17 12:08:24 +01:00
|
|
|
VHostNetState *vhost_net;
|
2010-07-13 16:55:31 +02:00
|
|
|
unsigned host_vnet_hdr_len;
|
2009-10-22 18:49:07 +02:00
|
|
|
} TAPState;
|
|
|
|
|
|
|
|
static int launch_script(const char *setup_script, const char *ifname, int fd);
|
|
|
|
|
|
|
|
static int tap_can_send(void *opaque);
|
|
|
|
static void tap_send(void *opaque);
|
|
|
|
static void tap_writable(void *opaque);
|
|
|
|
|
|
|
|
static void tap_update_fd_handler(TAPState *s)
|
|
|
|
{
|
|
|
|
qemu_set_fd_handler2(s->fd,
|
|
|
|
s->read_poll ? tap_can_send : NULL,
|
|
|
|
s->read_poll ? tap_send : NULL,
|
|
|
|
s->write_poll ? tap_writable : NULL,
|
|
|
|
s);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void tap_read_poll(TAPState *s, int enable)
|
|
|
|
{
|
|
|
|
s->read_poll = !!enable;
|
|
|
|
tap_update_fd_handler(s);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void tap_write_poll(TAPState *s, int enable)
|
|
|
|
{
|
|
|
|
s->write_poll = !!enable;
|
|
|
|
tap_update_fd_handler(s);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void tap_writable(void *opaque)
|
|
|
|
{
|
|
|
|
TAPState *s = opaque;
|
|
|
|
|
|
|
|
tap_write_poll(s, 0);
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
qemu_flush_queued_packets(&s->nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t tap_write_packet(TAPState *s, const struct iovec *iov, int iovcnt)
|
|
|
|
{
|
|
|
|
ssize_t len;
|
|
|
|
|
|
|
|
do {
|
|
|
|
len = writev(s->fd, iov, iovcnt);
|
|
|
|
} while (len == -1 && errno == EINTR);
|
|
|
|
|
|
|
|
if (len == -1 && errno == EAGAIN) {
|
|
|
|
tap_write_poll(s, 1);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
return len;
|
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
static ssize_t tap_receive_iov(VLANClientState *nc, const struct iovec *iov,
|
2009-10-22 18:49:07 +02:00
|
|
|
int iovcnt)
|
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
const struct iovec *iovp = iov;
|
|
|
|
struct iovec iov_copy[iovcnt + 1];
|
2010-07-13 16:55:31 +02:00
|
|
|
struct virtio_net_hdr_mrg_rxbuf hdr = { };
|
2009-10-22 18:49:07 +02:00
|
|
|
|
2010-07-13 16:55:31 +02:00
|
|
|
if (s->host_vnet_hdr_len && !s->using_vnet_hdr) {
|
2009-10-22 18:49:07 +02:00
|
|
|
iov_copy[0].iov_base = &hdr;
|
2010-07-13 16:55:31 +02:00
|
|
|
iov_copy[0].iov_len = s->host_vnet_hdr_len;
|
2009-10-22 18:49:07 +02:00
|
|
|
memcpy(&iov_copy[1], iov, iovcnt * sizeof(*iov));
|
|
|
|
iovp = iov_copy;
|
|
|
|
iovcnt++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return tap_write_packet(s, iovp, iovcnt);
|
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
static ssize_t tap_receive_raw(VLANClientState *nc, const uint8_t *buf, size_t size)
|
2009-10-22 18:49:07 +02:00
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
struct iovec iov[2];
|
|
|
|
int iovcnt = 0;
|
2010-07-13 16:55:31 +02:00
|
|
|
struct virtio_net_hdr_mrg_rxbuf hdr = { };
|
2009-10-22 18:49:07 +02:00
|
|
|
|
2010-07-13 16:55:31 +02:00
|
|
|
if (s->host_vnet_hdr_len) {
|
2009-10-22 18:49:07 +02:00
|
|
|
iov[iovcnt].iov_base = &hdr;
|
2010-07-13 16:55:31 +02:00
|
|
|
iov[iovcnt].iov_len = s->host_vnet_hdr_len;
|
2009-10-22 18:49:07 +02:00
|
|
|
iovcnt++;
|
|
|
|
}
|
|
|
|
|
|
|
|
iov[iovcnt].iov_base = (char *)buf;
|
|
|
|
iov[iovcnt].iov_len = size;
|
|
|
|
iovcnt++;
|
|
|
|
|
|
|
|
return tap_write_packet(s, iov, iovcnt);
|
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
static ssize_t tap_receive(VLANClientState *nc, const uint8_t *buf, size_t size)
|
2009-10-22 18:49:07 +02:00
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
struct iovec iov[1];
|
|
|
|
|
2010-07-13 16:55:31 +02:00
|
|
|
if (s->host_vnet_hdr_len && !s->using_vnet_hdr) {
|
2009-11-25 19:49:04 +01:00
|
|
|
return tap_receive_raw(nc, buf, size);
|
2009-10-22 18:49:07 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
iov[0].iov_base = (char *)buf;
|
|
|
|
iov[0].iov_len = size;
|
|
|
|
|
|
|
|
return tap_write_packet(s, iov, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int tap_can_send(void *opaque)
|
|
|
|
{
|
|
|
|
TAPState *s = opaque;
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
return qemu_can_send_packet(&s->nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
}
|
|
|
|
|
2009-10-22 18:49:09 +02:00
|
|
|
#ifndef __sun__
|
|
|
|
ssize_t tap_read_packet(int tapfd, uint8_t *buf, int maxlen)
|
2009-10-22 18:49:07 +02:00
|
|
|
{
|
|
|
|
return read(tapfd, buf, maxlen);
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
static void tap_send_completed(VLANClientState *nc, ssize_t len)
|
2009-10-22 18:49:07 +02:00
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
tap_read_poll(s, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void tap_send(void *opaque)
|
|
|
|
{
|
|
|
|
TAPState *s = opaque;
|
|
|
|
int size;
|
|
|
|
|
2009-10-27 19:16:39 +01:00
|
|
|
do {
|
|
|
|
uint8_t *buf = s->buf;
|
|
|
|
|
|
|
|
size = tap_read_packet(s->fd, s->buf, sizeof(s->buf));
|
|
|
|
if (size <= 0) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2010-07-13 16:55:31 +02:00
|
|
|
if (s->host_vnet_hdr_len && !s->using_vnet_hdr) {
|
|
|
|
buf += s->host_vnet_hdr_len;
|
|
|
|
size -= s->host_vnet_hdr_len;
|
2009-10-27 19:16:39 +01:00
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
size = qemu_send_packet_async(&s->nc, buf, size, tap_send_completed);
|
2009-10-27 19:16:39 +01:00
|
|
|
if (size == 0) {
|
|
|
|
tap_read_poll(s, 0);
|
|
|
|
}
|
2009-11-25 19:49:04 +01:00
|
|
|
} while (size > 0 && qemu_can_send_packet(&s->nc));
|
2009-10-22 18:49:07 +02:00
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
int tap_has_ufo(VLANClientState *nc)
|
2009-10-22 18:49:07 +02:00
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
|
2009-11-25 19:49:30 +01:00
|
|
|
assert(nc->info->type == NET_CLIENT_TYPE_TAP);
|
2009-10-22 18:49:07 +02:00
|
|
|
|
|
|
|
return s->has_ufo;
|
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
int tap_has_vnet_hdr(VLANClientState *nc)
|
2009-10-22 18:49:07 +02:00
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
|
2009-11-25 19:49:30 +01:00
|
|
|
assert(nc->info->type == NET_CLIENT_TYPE_TAP);
|
2009-10-22 18:49:07 +02:00
|
|
|
|
2010-07-13 16:55:31 +02:00
|
|
|
return !!s->host_vnet_hdr_len;
|
2009-10-22 18:49:07 +02:00
|
|
|
}
|
|
|
|
|
2010-07-16 10:16:06 +02:00
|
|
|
int tap_has_vnet_hdr_len(VLANClientState *nc, int len)
|
|
|
|
{
|
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
|
|
|
|
|
|
|
assert(nc->info->type == NET_CLIENT_TYPE_TAP);
|
|
|
|
|
|
|
|
return tap_probe_vnet_hdr_len(s->fd, len);
|
|
|
|
}
|
|
|
|
|
|
|
|
void tap_set_vnet_hdr_len(VLANClientState *nc, int len)
|
|
|
|
{
|
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
|
|
|
|
|
|
|
assert(nc->info->type == NET_CLIENT_TYPE_TAP);
|
|
|
|
assert(len == sizeof(struct virtio_net_hdr_mrg_rxbuf) ||
|
|
|
|
len == sizeof(struct virtio_net_hdr));
|
|
|
|
|
|
|
|
tap_fd_set_vnet_hdr_len(s->fd, len);
|
|
|
|
s->host_vnet_hdr_len = len;
|
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
void tap_using_vnet_hdr(VLANClientState *nc, int using_vnet_hdr)
|
2009-10-22 18:49:07 +02:00
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
|
|
|
|
using_vnet_hdr = using_vnet_hdr != 0;
|
|
|
|
|
2009-11-25 19:49:30 +01:00
|
|
|
assert(nc->info->type == NET_CLIENT_TYPE_TAP);
|
2010-07-13 16:55:31 +02:00
|
|
|
assert(!!s->host_vnet_hdr_len == using_vnet_hdr);
|
2009-10-22 18:49:07 +02:00
|
|
|
|
|
|
|
s->using_vnet_hdr = using_vnet_hdr;
|
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
void tap_set_offload(VLANClientState *nc, int csum, int tso4,
|
2009-10-22 18:49:07 +02:00
|
|
|
int tso6, int ecn, int ufo)
|
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2010-10-31 18:06:47 +01:00
|
|
|
if (s->fd < 0) {
|
|
|
|
return;
|
|
|
|
}
|
2009-10-22 18:49:07 +02:00
|
|
|
|
2010-10-31 18:06:47 +01:00
|
|
|
tap_fd_set_offload(s->fd, csum, tso4, tso6, ecn, ufo);
|
2009-10-22 18:49:07 +02:00
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
static void tap_cleanup(VLANClientState *nc)
|
2009-10-22 18:49:07 +02:00
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
|
2010-03-17 12:08:24 +01:00
|
|
|
if (s->vhost_net) {
|
|
|
|
vhost_net_cleanup(s->vhost_net);
|
2010-10-27 20:03:43 +02:00
|
|
|
s->vhost_net = NULL;
|
2010-03-17 12:08:24 +01:00
|
|
|
}
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
qemu_purge_queued_packets(nc);
|
2009-10-22 18:49:07 +02:00
|
|
|
|
|
|
|
if (s->down_script[0])
|
|
|
|
launch_script(s->down_script, s->down_script_arg, s->fd);
|
|
|
|
|
|
|
|
tap_read_poll(s, 0);
|
|
|
|
tap_write_poll(s, 0);
|
|
|
|
close(s->fd);
|
2010-10-31 18:06:47 +01:00
|
|
|
s->fd = -1;
|
2009-10-22 18:49:07 +02:00
|
|
|
}
|
|
|
|
|
2009-12-24 13:46:29 +01:00
|
|
|
static void tap_poll(VLANClientState *nc, bool enable)
|
|
|
|
{
|
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
|
|
|
tap_read_poll(s, enable);
|
|
|
|
tap_write_poll(s, enable);
|
|
|
|
}
|
|
|
|
|
2010-03-17 12:07:50 +01:00
|
|
|
int tap_get_fd(VLANClientState *nc)
|
|
|
|
{
|
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
|
|
|
assert(nc->info->type == NET_CLIENT_TYPE_TAP);
|
|
|
|
return s->fd;
|
|
|
|
}
|
|
|
|
|
2009-10-22 18:49:07 +02:00
|
|
|
/* fd support */
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
static NetClientInfo net_tap_info = {
|
|
|
|
.type = NET_CLIENT_TYPE_TAP,
|
|
|
|
.size = sizeof(TAPState),
|
|
|
|
.receive = tap_receive,
|
|
|
|
.receive_raw = tap_receive_raw,
|
|
|
|
.receive_iov = tap_receive_iov,
|
2009-12-24 13:46:29 +01:00
|
|
|
.poll = tap_poll,
|
2009-11-25 19:49:04 +01:00
|
|
|
.cleanup = tap_cleanup,
|
|
|
|
};
|
|
|
|
|
2009-10-22 18:49:07 +02:00
|
|
|
static TAPState *net_tap_fd_init(VLANState *vlan,
|
|
|
|
const char *model,
|
|
|
|
const char *name,
|
|
|
|
int fd,
|
|
|
|
int vnet_hdr)
|
|
|
|
{
|
2009-11-25 19:49:04 +01:00
|
|
|
VLANClientState *nc;
|
2009-10-22 18:49:07 +02:00
|
|
|
TAPState *s;
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
nc = qemu_new_net_client(&net_tap_info, vlan, NULL, model, name);
|
|
|
|
|
|
|
|
s = DO_UPCAST(TAPState, nc, nc);
|
|
|
|
|
2009-10-22 18:49:07 +02:00
|
|
|
s->fd = fd;
|
2010-07-13 16:55:31 +02:00
|
|
|
s->host_vnet_hdr_len = vnet_hdr ? sizeof(struct virtio_net_hdr) : 0;
|
2009-10-22 18:49:07 +02:00
|
|
|
s->using_vnet_hdr = 0;
|
2009-10-22 18:49:16 +02:00
|
|
|
s->has_ufo = tap_probe_has_ufo(s->fd);
|
2009-11-25 19:49:04 +01:00
|
|
|
tap_set_offload(&s->nc, 0, 0, 0, 0, 0);
|
2009-10-22 18:49:07 +02:00
|
|
|
tap_read_poll(s, 1);
|
2010-03-17 12:08:24 +01:00
|
|
|
s->vhost_net = NULL;
|
2009-10-22 18:49:07 +02:00
|
|
|
return s;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int launch_script(const char *setup_script, const char *ifname, int fd)
|
|
|
|
{
|
|
|
|
int pid, status;
|
|
|
|
char *args[3];
|
|
|
|
char **parg;
|
|
|
|
|
|
|
|
/* try to launch network script */
|
|
|
|
pid = fork();
|
|
|
|
if (pid == 0) {
|
|
|
|
int open_max = sysconf(_SC_OPEN_MAX), i;
|
|
|
|
|
|
|
|
for (i = 0; i < open_max; i++) {
|
|
|
|
if (i != STDIN_FILENO &&
|
|
|
|
i != STDOUT_FILENO &&
|
|
|
|
i != STDERR_FILENO &&
|
|
|
|
i != fd) {
|
|
|
|
close(i);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
parg = args;
|
|
|
|
*parg++ = (char *)setup_script;
|
|
|
|
*parg++ = (char *)ifname;
|
2010-04-25 20:35:52 +02:00
|
|
|
*parg = NULL;
|
2009-10-22 18:49:07 +02:00
|
|
|
execv(setup_script, args);
|
|
|
|
_exit(1);
|
|
|
|
} else if (pid > 0) {
|
|
|
|
while (waitpid(pid, &status, 0) != pid) {
|
|
|
|
/* loop */
|
|
|
|
}
|
|
|
|
|
|
|
|
if (WIFEXITED(status) && WEXITSTATUS(status) == 0) {
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
fprintf(stderr, "%s: could not launch network script\n", setup_script);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
Add support for net bridge
The most common use of -net tap is to connect a tap device to a bridge. This
requires the use of a script and running qemu as root in order to allocate a
tap device to pass to the script.
This model is great for portability and flexibility but it's incredibly
difficult to eliminate the need to run qemu as root. The only really viable
mechanism is to use tunctl to create a tap device, attach it to a bridge as
root, and then hand that tap device to qemu. The problem with this mechanism
is that it requires administrator intervention whenever a user wants to create
a guest.
By essentially writing a helper that implements the most common qemu-ifup
script that can be safely given cap_net_admin, we can dramatically simplify
things for non-privileged users. We still support existing -net tap options
as a mechanism for advanced users and backwards compatibility.
Currently, this is very Linux centric but there's really no reason why it
couldn't be extended for other Unixes.
A typical invocation would be similar to one of the following:
qemu linux.img -net bridge -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper"
-net nic,model=virtio
qemu linux.img -netdev bridge,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
The default bridge that we attach to is br0. The thinking is that a distro
could preconfigure such an interface to allow out-of-the-box bridged networking.
Alternatively, if a user wants to use a different bridge, a typical invocation
would be simliar to one of the following:
qemu linux.img -net bridge,br=qemubr0 -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0"
-net nic,model=virtio
qemu linux.img -netdev bridge,br=qemubr0,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
Signed-off-by: Richa Marwaha <rmarwah@linux.vnet.ibm.com>
Signed-off-by: Corey Bryant <coreyb@linux.vnet.ibm.com>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2012-01-26 15:42:27 +01:00
|
|
|
static int recv_fd(int c)
|
|
|
|
{
|
|
|
|
int fd;
|
|
|
|
uint8_t msgbuf[CMSG_SPACE(sizeof(fd))];
|
|
|
|
struct msghdr msg = {
|
|
|
|
.msg_control = msgbuf,
|
|
|
|
.msg_controllen = sizeof(msgbuf),
|
|
|
|
};
|
|
|
|
struct cmsghdr *cmsg;
|
|
|
|
struct iovec iov;
|
|
|
|
uint8_t req[1];
|
|
|
|
ssize_t len;
|
|
|
|
|
|
|
|
cmsg = CMSG_FIRSTHDR(&msg);
|
|
|
|
cmsg->cmsg_level = SOL_SOCKET;
|
|
|
|
cmsg->cmsg_type = SCM_RIGHTS;
|
|
|
|
cmsg->cmsg_len = CMSG_LEN(sizeof(fd));
|
|
|
|
msg.msg_controllen = cmsg->cmsg_len;
|
|
|
|
|
|
|
|
iov.iov_base = req;
|
|
|
|
iov.iov_len = sizeof(req);
|
|
|
|
|
|
|
|
msg.msg_iov = &iov;
|
|
|
|
msg.msg_iovlen = 1;
|
|
|
|
|
|
|
|
len = recvmsg(c, &msg, 0);
|
|
|
|
if (len > 0) {
|
|
|
|
memcpy(&fd, CMSG_DATA(cmsg), sizeof(fd));
|
|
|
|
return fd;
|
|
|
|
}
|
|
|
|
|
|
|
|
return len;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int net_bridge_run_helper(const char *helper, const char *bridge)
|
|
|
|
{
|
|
|
|
sigset_t oldmask, mask;
|
|
|
|
int pid, status;
|
|
|
|
char *args[5];
|
|
|
|
char **parg;
|
|
|
|
int sv[2];
|
|
|
|
|
|
|
|
sigemptyset(&mask);
|
|
|
|
sigaddset(&mask, SIGCHLD);
|
|
|
|
sigprocmask(SIG_BLOCK, &mask, &oldmask);
|
|
|
|
|
|
|
|
if (socketpair(PF_UNIX, SOCK_STREAM, 0, sv) == -1) {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* try to launch bridge helper */
|
|
|
|
pid = fork();
|
|
|
|
if (pid == 0) {
|
|
|
|
int open_max = sysconf(_SC_OPEN_MAX), i;
|
|
|
|
char fd_buf[6+10];
|
|
|
|
char br_buf[6+IFNAMSIZ] = {0};
|
|
|
|
char helper_cmd[PATH_MAX + sizeof(fd_buf) + sizeof(br_buf) + 15];
|
|
|
|
|
|
|
|
for (i = 0; i < open_max; i++) {
|
|
|
|
if (i != STDIN_FILENO &&
|
|
|
|
i != STDOUT_FILENO &&
|
|
|
|
i != STDERR_FILENO &&
|
|
|
|
i != sv[1]) {
|
|
|
|
close(i);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
snprintf(fd_buf, sizeof(fd_buf), "%s%d", "--fd=", sv[1]);
|
|
|
|
|
|
|
|
if (strrchr(helper, ' ') || strrchr(helper, '\t')) {
|
|
|
|
/* assume helper is a command */
|
|
|
|
|
|
|
|
if (strstr(helper, "--br=") == NULL) {
|
|
|
|
snprintf(br_buf, sizeof(br_buf), "%s%s", "--br=", bridge);
|
|
|
|
}
|
|
|
|
|
|
|
|
snprintf(helper_cmd, sizeof(helper_cmd), "%s %s %s %s",
|
|
|
|
helper, "--use-vnet", fd_buf, br_buf);
|
|
|
|
|
|
|
|
parg = args;
|
|
|
|
*parg++ = (char *)"sh";
|
|
|
|
*parg++ = (char *)"-c";
|
|
|
|
*parg++ = helper_cmd;
|
|
|
|
*parg++ = NULL;
|
|
|
|
|
|
|
|
execv("/bin/sh", args);
|
|
|
|
} else {
|
|
|
|
/* assume helper is just the executable path name */
|
|
|
|
|
|
|
|
snprintf(br_buf, sizeof(br_buf), "%s%s", "--br=", bridge);
|
|
|
|
|
|
|
|
parg = args;
|
|
|
|
*parg++ = (char *)helper;
|
|
|
|
*parg++ = (char *)"--use-vnet";
|
|
|
|
*parg++ = fd_buf;
|
|
|
|
*parg++ = br_buf;
|
|
|
|
*parg++ = NULL;
|
|
|
|
|
|
|
|
execv(helper, args);
|
|
|
|
}
|
|
|
|
_exit(1);
|
|
|
|
|
|
|
|
} else if (pid > 0) {
|
|
|
|
int fd;
|
|
|
|
|
|
|
|
close(sv[1]);
|
|
|
|
|
|
|
|
do {
|
|
|
|
fd = recv_fd(sv[0]);
|
|
|
|
} while (fd == -1 && errno == EINTR);
|
|
|
|
|
|
|
|
close(sv[0]);
|
|
|
|
|
|
|
|
while (waitpid(pid, &status, 0) != pid) {
|
|
|
|
/* loop */
|
|
|
|
}
|
|
|
|
sigprocmask(SIG_SETMASK, &oldmask, NULL);
|
|
|
|
if (fd < 0) {
|
|
|
|
fprintf(stderr, "failed to recv file descriptor\n");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (WIFEXITED(status) && WEXITSTATUS(status) == 0) {
|
|
|
|
return fd;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
fprintf(stderr, "failed to launch bridge helper\n");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
int net_init_bridge(QemuOpts *opts, Monitor *mon, const char *name,
|
|
|
|
VLANState *vlan)
|
|
|
|
{
|
|
|
|
TAPState *s;
|
|
|
|
int fd, vnet_hdr;
|
|
|
|
|
|
|
|
if (!qemu_opt_get(opts, "br")) {
|
|
|
|
qemu_opt_set(opts, "br", DEFAULT_BRIDGE_INTERFACE);
|
|
|
|
}
|
|
|
|
if (!qemu_opt_get(opts, "helper")) {
|
|
|
|
qemu_opt_set(opts, "helper", DEFAULT_BRIDGE_HELPER);
|
|
|
|
}
|
|
|
|
|
|
|
|
fd = net_bridge_run_helper(qemu_opt_get(opts, "helper"),
|
|
|
|
qemu_opt_get(opts, "br"));
|
|
|
|
if (fd == -1) {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
fcntl(fd, F_SETFL, O_NONBLOCK);
|
|
|
|
|
|
|
|
vnet_hdr = tap_probe_vnet_hdr(fd);
|
|
|
|
|
|
|
|
s = net_tap_fd_init(vlan, "bridge", name, fd, vnet_hdr);
|
|
|
|
if (!s) {
|
|
|
|
close(fd);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
snprintf(s->nc.info_str, sizeof(s->nc.info_str), "helper=%s,br=%s",
|
|
|
|
qemu_opt_get(opts, "helper"), qemu_opt_get(opts, "br"));
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2009-10-22 18:49:07 +02:00
|
|
|
static int net_tap_init(QemuOpts *opts, int *vnet_hdr)
|
|
|
|
{
|
|
|
|
int fd, vnet_hdr_required;
|
|
|
|
char ifname[128] = {0,};
|
|
|
|
const char *setup_script;
|
|
|
|
|
|
|
|
if (qemu_opt_get(opts, "ifname")) {
|
|
|
|
pstrcpy(ifname, sizeof(ifname), qemu_opt_get(opts, "ifname"));
|
|
|
|
}
|
|
|
|
|
|
|
|
*vnet_hdr = qemu_opt_get_bool(opts, "vnet_hdr", 1);
|
|
|
|
if (qemu_opt_get(opts, "vnet_hdr")) {
|
|
|
|
vnet_hdr_required = *vnet_hdr;
|
|
|
|
} else {
|
|
|
|
vnet_hdr_required = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
TFR(fd = tap_open(ifname, sizeof(ifname), vnet_hdr, vnet_hdr_required));
|
|
|
|
if (fd < 0) {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
setup_script = qemu_opt_get(opts, "script");
|
|
|
|
if (setup_script &&
|
|
|
|
setup_script[0] != '\0' &&
|
|
|
|
strcmp(setup_script, "no") != 0 &&
|
|
|
|
launch_script(setup_script, ifname, fd)) {
|
|
|
|
close(fd);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
qemu_opt_set(opts, "ifname", ifname);
|
|
|
|
|
|
|
|
return fd;
|
|
|
|
}
|
|
|
|
|
|
|
|
int net_init_tap(QemuOpts *opts, Monitor *mon, const char *name, VLANState *vlan)
|
|
|
|
{
|
|
|
|
TAPState *s;
|
2009-11-25 19:49:36 +01:00
|
|
|
int fd, vnet_hdr = 0;
|
Add support for net bridge
The most common use of -net tap is to connect a tap device to a bridge. This
requires the use of a script and running qemu as root in order to allocate a
tap device to pass to the script.
This model is great for portability and flexibility but it's incredibly
difficult to eliminate the need to run qemu as root. The only really viable
mechanism is to use tunctl to create a tap device, attach it to a bridge as
root, and then hand that tap device to qemu. The problem with this mechanism
is that it requires administrator intervention whenever a user wants to create
a guest.
By essentially writing a helper that implements the most common qemu-ifup
script that can be safely given cap_net_admin, we can dramatically simplify
things for non-privileged users. We still support existing -net tap options
as a mechanism for advanced users and backwards compatibility.
Currently, this is very Linux centric but there's really no reason why it
couldn't be extended for other Unixes.
A typical invocation would be similar to one of the following:
qemu linux.img -net bridge -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper"
-net nic,model=virtio
qemu linux.img -netdev bridge,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
The default bridge that we attach to is br0. The thinking is that a distro
could preconfigure such an interface to allow out-of-the-box bridged networking.
Alternatively, if a user wants to use a different bridge, a typical invocation
would be simliar to one of the following:
qemu linux.img -net bridge,br=qemubr0 -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0"
-net nic,model=virtio
qemu linux.img -netdev bridge,br=qemubr0,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
Signed-off-by: Richa Marwaha <rmarwah@linux.vnet.ibm.com>
Signed-off-by: Corey Bryant <coreyb@linux.vnet.ibm.com>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2012-01-26 15:42:27 +01:00
|
|
|
const char *model;
|
2009-10-22 18:49:07 +02:00
|
|
|
|
|
|
|
if (qemu_opt_get(opts, "fd")) {
|
|
|
|
if (qemu_opt_get(opts, "ifname") ||
|
|
|
|
qemu_opt_get(opts, "script") ||
|
|
|
|
qemu_opt_get(opts, "downscript") ||
|
Add support for net bridge
The most common use of -net tap is to connect a tap device to a bridge. This
requires the use of a script and running qemu as root in order to allocate a
tap device to pass to the script.
This model is great for portability and flexibility but it's incredibly
difficult to eliminate the need to run qemu as root. The only really viable
mechanism is to use tunctl to create a tap device, attach it to a bridge as
root, and then hand that tap device to qemu. The problem with this mechanism
is that it requires administrator intervention whenever a user wants to create
a guest.
By essentially writing a helper that implements the most common qemu-ifup
script that can be safely given cap_net_admin, we can dramatically simplify
things for non-privileged users. We still support existing -net tap options
as a mechanism for advanced users and backwards compatibility.
Currently, this is very Linux centric but there's really no reason why it
couldn't be extended for other Unixes.
A typical invocation would be similar to one of the following:
qemu linux.img -net bridge -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper"
-net nic,model=virtio
qemu linux.img -netdev bridge,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
The default bridge that we attach to is br0. The thinking is that a distro
could preconfigure such an interface to allow out-of-the-box bridged networking.
Alternatively, if a user wants to use a different bridge, a typical invocation
would be simliar to one of the following:
qemu linux.img -net bridge,br=qemubr0 -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0"
-net nic,model=virtio
qemu linux.img -netdev bridge,br=qemubr0,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
Signed-off-by: Richa Marwaha <rmarwah@linux.vnet.ibm.com>
Signed-off-by: Corey Bryant <coreyb@linux.vnet.ibm.com>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2012-01-26 15:42:27 +01:00
|
|
|
qemu_opt_get(opts, "vnet_hdr") ||
|
|
|
|
qemu_opt_get(opts, "helper")) {
|
|
|
|
error_report("ifname=, script=, downscript=, vnet_hdr=, "
|
|
|
|
"and helper= are invalid with fd=");
|
2009-10-22 18:49:07 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
fd = net_handle_fd_param(mon, qemu_opt_get(opts, "fd"));
|
|
|
|
if (fd == -1) {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
fcntl(fd, F_SETFL, O_NONBLOCK);
|
|
|
|
|
|
|
|
vnet_hdr = tap_probe_vnet_hdr(fd);
|
Add support for net bridge
The most common use of -net tap is to connect a tap device to a bridge. This
requires the use of a script and running qemu as root in order to allocate a
tap device to pass to the script.
This model is great for portability and flexibility but it's incredibly
difficult to eliminate the need to run qemu as root. The only really viable
mechanism is to use tunctl to create a tap device, attach it to a bridge as
root, and then hand that tap device to qemu. The problem with this mechanism
is that it requires administrator intervention whenever a user wants to create
a guest.
By essentially writing a helper that implements the most common qemu-ifup
script that can be safely given cap_net_admin, we can dramatically simplify
things for non-privileged users. We still support existing -net tap options
as a mechanism for advanced users and backwards compatibility.
Currently, this is very Linux centric but there's really no reason why it
couldn't be extended for other Unixes.
A typical invocation would be similar to one of the following:
qemu linux.img -net bridge -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper"
-net nic,model=virtio
qemu linux.img -netdev bridge,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
The default bridge that we attach to is br0. The thinking is that a distro
could preconfigure such an interface to allow out-of-the-box bridged networking.
Alternatively, if a user wants to use a different bridge, a typical invocation
would be simliar to one of the following:
qemu linux.img -net bridge,br=qemubr0 -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0"
-net nic,model=virtio
qemu linux.img -netdev bridge,br=qemubr0,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
Signed-off-by: Richa Marwaha <rmarwah@linux.vnet.ibm.com>
Signed-off-by: Corey Bryant <coreyb@linux.vnet.ibm.com>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2012-01-26 15:42:27 +01:00
|
|
|
|
|
|
|
model = "tap";
|
|
|
|
|
|
|
|
} else if (qemu_opt_get(opts, "helper")) {
|
|
|
|
if (qemu_opt_get(opts, "ifname") ||
|
|
|
|
qemu_opt_get(opts, "script") ||
|
|
|
|
qemu_opt_get(opts, "downscript") ||
|
|
|
|
qemu_opt_get(opts, "vnet_hdr")) {
|
|
|
|
error_report("ifname=, script=, downscript=, and vnet_hdr= "
|
|
|
|
"are invalid with helper=");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
fd = net_bridge_run_helper(qemu_opt_get(opts, "helper"),
|
|
|
|
DEFAULT_BRIDGE_INTERFACE);
|
|
|
|
if (fd == -1) {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
fcntl(fd, F_SETFL, O_NONBLOCK);
|
|
|
|
|
|
|
|
vnet_hdr = tap_probe_vnet_hdr(fd);
|
|
|
|
|
|
|
|
model = "bridge";
|
|
|
|
|
2009-10-22 18:49:07 +02:00
|
|
|
} else {
|
|
|
|
if (!qemu_opt_get(opts, "script")) {
|
|
|
|
qemu_opt_set(opts, "script", DEFAULT_NETWORK_SCRIPT);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!qemu_opt_get(opts, "downscript")) {
|
|
|
|
qemu_opt_set(opts, "downscript", DEFAULT_NETWORK_DOWN_SCRIPT);
|
|
|
|
}
|
|
|
|
|
|
|
|
fd = net_tap_init(opts, &vnet_hdr);
|
2009-11-20 23:23:03 +01:00
|
|
|
if (fd == -1) {
|
|
|
|
return -1;
|
|
|
|
}
|
Add support for net bridge
The most common use of -net tap is to connect a tap device to a bridge. This
requires the use of a script and running qemu as root in order to allocate a
tap device to pass to the script.
This model is great for portability and flexibility but it's incredibly
difficult to eliminate the need to run qemu as root. The only really viable
mechanism is to use tunctl to create a tap device, attach it to a bridge as
root, and then hand that tap device to qemu. The problem with this mechanism
is that it requires administrator intervention whenever a user wants to create
a guest.
By essentially writing a helper that implements the most common qemu-ifup
script that can be safely given cap_net_admin, we can dramatically simplify
things for non-privileged users. We still support existing -net tap options
as a mechanism for advanced users and backwards compatibility.
Currently, this is very Linux centric but there's really no reason why it
couldn't be extended for other Unixes.
A typical invocation would be similar to one of the following:
qemu linux.img -net bridge -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper"
-net nic,model=virtio
qemu linux.img -netdev bridge,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
The default bridge that we attach to is br0. The thinking is that a distro
could preconfigure such an interface to allow out-of-the-box bridged networking.
Alternatively, if a user wants to use a different bridge, a typical invocation
would be simliar to one of the following:
qemu linux.img -net bridge,br=qemubr0 -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0"
-net nic,model=virtio
qemu linux.img -netdev bridge,br=qemubr0,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
Signed-off-by: Richa Marwaha <rmarwah@linux.vnet.ibm.com>
Signed-off-by: Corey Bryant <coreyb@linux.vnet.ibm.com>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2012-01-26 15:42:27 +01:00
|
|
|
|
|
|
|
model = "tap";
|
2009-10-22 18:49:07 +02:00
|
|
|
}
|
|
|
|
|
Add support for net bridge
The most common use of -net tap is to connect a tap device to a bridge. This
requires the use of a script and running qemu as root in order to allocate a
tap device to pass to the script.
This model is great for portability and flexibility but it's incredibly
difficult to eliminate the need to run qemu as root. The only really viable
mechanism is to use tunctl to create a tap device, attach it to a bridge as
root, and then hand that tap device to qemu. The problem with this mechanism
is that it requires administrator intervention whenever a user wants to create
a guest.
By essentially writing a helper that implements the most common qemu-ifup
script that can be safely given cap_net_admin, we can dramatically simplify
things for non-privileged users. We still support existing -net tap options
as a mechanism for advanced users and backwards compatibility.
Currently, this is very Linux centric but there's really no reason why it
couldn't be extended for other Unixes.
A typical invocation would be similar to one of the following:
qemu linux.img -net bridge -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper"
-net nic,model=virtio
qemu linux.img -netdev bridge,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
The default bridge that we attach to is br0. The thinking is that a distro
could preconfigure such an interface to allow out-of-the-box bridged networking.
Alternatively, if a user wants to use a different bridge, a typical invocation
would be simliar to one of the following:
qemu linux.img -net bridge,br=qemubr0 -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0"
-net nic,model=virtio
qemu linux.img -netdev bridge,br=qemubr0,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
Signed-off-by: Richa Marwaha <rmarwah@linux.vnet.ibm.com>
Signed-off-by: Corey Bryant <coreyb@linux.vnet.ibm.com>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2012-01-26 15:42:27 +01:00
|
|
|
s = net_tap_fd_init(vlan, model, name, fd, vnet_hdr);
|
2009-10-22 18:49:07 +02:00
|
|
|
if (!s) {
|
|
|
|
close(fd);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2009-10-22 18:49:13 +02:00
|
|
|
if (tap_set_sndbuf(s->fd, opts) < 0) {
|
2009-10-22 18:49:07 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (qemu_opt_get(opts, "fd")) {
|
2009-11-25 19:49:04 +01:00
|
|
|
snprintf(s->nc.info_str, sizeof(s->nc.info_str), "fd=%d", fd);
|
Add support for net bridge
The most common use of -net tap is to connect a tap device to a bridge. This
requires the use of a script and running qemu as root in order to allocate a
tap device to pass to the script.
This model is great for portability and flexibility but it's incredibly
difficult to eliminate the need to run qemu as root. The only really viable
mechanism is to use tunctl to create a tap device, attach it to a bridge as
root, and then hand that tap device to qemu. The problem with this mechanism
is that it requires administrator intervention whenever a user wants to create
a guest.
By essentially writing a helper that implements the most common qemu-ifup
script that can be safely given cap_net_admin, we can dramatically simplify
things for non-privileged users. We still support existing -net tap options
as a mechanism for advanced users and backwards compatibility.
Currently, this is very Linux centric but there's really no reason why it
couldn't be extended for other Unixes.
A typical invocation would be similar to one of the following:
qemu linux.img -net bridge -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper"
-net nic,model=virtio
qemu linux.img -netdev bridge,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
The default bridge that we attach to is br0. The thinking is that a distro
could preconfigure such an interface to allow out-of-the-box bridged networking.
Alternatively, if a user wants to use a different bridge, a typical invocation
would be simliar to one of the following:
qemu linux.img -net bridge,br=qemubr0 -net nic,model=virtio
qemu linux.img -net tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0"
-net nic,model=virtio
qemu linux.img -netdev bridge,br=qemubr0,id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
qemu linux.img -netdev tap,helper="/usr/local/libexec/qemu-bridge-helper --br=qemubr0",id=hn0
-device virtio-net-pci,netdev=hn0,id=nic1
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
Signed-off-by: Richa Marwaha <rmarwah@linux.vnet.ibm.com>
Signed-off-by: Corey Bryant <coreyb@linux.vnet.ibm.com>
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2012-01-26 15:42:27 +01:00
|
|
|
} else if (qemu_opt_get(opts, "helper")) {
|
|
|
|
snprintf(s->nc.info_str, sizeof(s->nc.info_str),
|
|
|
|
"helper=%s", qemu_opt_get(opts, "helper"));
|
2009-10-22 18:49:07 +02:00
|
|
|
} else {
|
|
|
|
const char *ifname, *script, *downscript;
|
|
|
|
|
|
|
|
ifname = qemu_opt_get(opts, "ifname");
|
|
|
|
script = qemu_opt_get(opts, "script");
|
|
|
|
downscript = qemu_opt_get(opts, "downscript");
|
|
|
|
|
2009-11-25 19:49:04 +01:00
|
|
|
snprintf(s->nc.info_str, sizeof(s->nc.info_str),
|
2009-10-22 18:49:07 +02:00
|
|
|
"ifname=%s,script=%s,downscript=%s",
|
|
|
|
ifname, script, downscript);
|
|
|
|
|
|
|
|
if (strcmp(downscript, "no") != 0) {
|
|
|
|
snprintf(s->down_script, sizeof(s->down_script), "%s", downscript);
|
|
|
|
snprintf(s->down_script_arg, sizeof(s->down_script_arg), "%s", ifname);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-02-01 21:13:42 +01:00
|
|
|
if (qemu_opt_get_bool(opts, "vhost", !!qemu_opt_get(opts, "vhostfd") ||
|
|
|
|
qemu_opt_get_bool(opts, "vhostforce", false))) {
|
2010-03-17 12:08:24 +01:00
|
|
|
int vhostfd, r;
|
2011-02-01 21:13:42 +01:00
|
|
|
bool force = qemu_opt_get_bool(opts, "vhostforce", false);
|
2010-03-17 12:08:24 +01:00
|
|
|
if (qemu_opt_get(opts, "vhostfd")) {
|
|
|
|
r = net_handle_fd_param(mon, qemu_opt_get(opts, "vhostfd"));
|
|
|
|
if (r == -1) {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
vhostfd = r;
|
|
|
|
} else {
|
|
|
|
vhostfd = -1;
|
|
|
|
}
|
2011-02-01 21:13:42 +01:00
|
|
|
s->vhost_net = vhost_net_init(&s->nc, vhostfd, force);
|
2010-03-17 12:08:24 +01:00
|
|
|
if (!s->vhost_net) {
|
|
|
|
error_report("vhost-net requested but could not be initialized");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
} else if (qemu_opt_get(opts, "vhostfd")) {
|
|
|
|
error_report("vhostfd= is not valid without vhost");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2009-10-22 18:49:07 +02:00
|
|
|
return 0;
|
|
|
|
}
|
2010-03-17 12:08:38 +01:00
|
|
|
|
|
|
|
VHostNetState *tap_get_vhost_net(VLANClientState *nc)
|
|
|
|
{
|
|
|
|
TAPState *s = DO_UPCAST(TAPState, nc, nc);
|
|
|
|
assert(nc->info->type == NET_CLIENT_TYPE_TAP);
|
|
|
|
return s->vhost_net;
|
|
|
|
}
|