84f85eb95f
In net_cleanup() we only need to delete the netdevs, as those may have state which outlives Qemu when it exits, and thus may actually need to be cleaned up on exit. The nics, on the other hand, are owned by the device which created them. Most devices don't bother to clean up on exit because they don't have any state which will outlive Qemu... but XenBus devices do need to clean up their nodes in XenStore, and do have an exit handler to delete them. When the XenBus exit handler destroys the xen-net-device, it attempts to delete its nic after net_cleanup() had already done so. And crashes. Fix this by only deleting netdevs as we walk the list. As the comment notes, we can't use QTAILQ_FOREACH_SAFE() as each deletion may remove *multiple* entries, including the "safely" saved 'next' pointer. But we can store the *previous* entry, since nics are safe. Signed-off-by: David Woodhouse <dwmw@amazon.co.uk> Reviewed-by: Paul Durrant <paul@xen.org> Signed-off-by: Jason Wang <jasowang@redhat.com>
1947 lines
51 KiB
C
1947 lines
51 KiB
C
/*
|
|
* QEMU System Emulator
|
|
*
|
|
* Copyright (c) 2003-2008 Fabrice Bellard
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
* in the Software without restriction, including without limitation the rights
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
* furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
* THE SOFTWARE.
|
|
*/
|
|
|
|
#include "qemu/osdep.h"
|
|
|
|
#include "net/net.h"
|
|
#include "clients.h"
|
|
#include "hub.h"
|
|
#include "hw/qdev-properties.h"
|
|
#include "net/slirp.h"
|
|
#include "net/eth.h"
|
|
#include "util.h"
|
|
|
|
#include "monitor/monitor.h"
|
|
#include "qemu/help_option.h"
|
|
#include "qapi/qapi-commands-net.h"
|
|
#include "qapi/qapi-visit-net.h"
|
|
#include "qapi/qmp/qdict.h"
|
|
#include "qapi/qmp/qerror.h"
|
|
#include "qemu/error-report.h"
|
|
#include "qemu/sockets.h"
|
|
#include "qemu/cutils.h"
|
|
#include "qemu/config-file.h"
|
|
#include "qemu/ctype.h"
|
|
#include "qemu/id.h"
|
|
#include "qemu/iov.h"
|
|
#include "qemu/qemu-print.h"
|
|
#include "qemu/main-loop.h"
|
|
#include "qemu/option.h"
|
|
#include "qemu/keyval.h"
|
|
#include "qapi/error.h"
|
|
#include "qapi/opts-visitor.h"
|
|
#include "sysemu/runstate.h"
|
|
#include "net/colo-compare.h"
|
|
#include "net/filter.h"
|
|
#include "qapi/string-output-visitor.h"
|
|
#include "qapi/qobject-input-visitor.h"
|
|
|
|
/* Net bridge is currently not supported for W32. */
|
|
#if !defined(_WIN32)
|
|
# define CONFIG_NET_BRIDGE
|
|
#endif
|
|
|
|
static VMChangeStateEntry *net_change_state_entry;
|
|
NetClientStateList net_clients;
|
|
|
|
typedef struct NetdevQueueEntry {
|
|
Netdev *nd;
|
|
Location loc;
|
|
QSIMPLEQ_ENTRY(NetdevQueueEntry) entry;
|
|
} NetdevQueueEntry;
|
|
|
|
typedef QSIMPLEQ_HEAD(, NetdevQueueEntry) NetdevQueue;
|
|
|
|
static NetdevQueue nd_queue = QSIMPLEQ_HEAD_INITIALIZER(nd_queue);
|
|
|
|
/***********************************************************/
|
|
/* network device redirectors */
|
|
|
|
int convert_host_port(struct sockaddr_in *saddr, const char *host,
|
|
const char *port, Error **errp)
|
|
{
|
|
struct hostent *he;
|
|
const char *r;
|
|
long p;
|
|
|
|
memset(saddr, 0, sizeof(*saddr));
|
|
|
|
saddr->sin_family = AF_INET;
|
|
if (host[0] == '\0') {
|
|
saddr->sin_addr.s_addr = 0;
|
|
} else {
|
|
if (qemu_isdigit(host[0])) {
|
|
if (!inet_aton(host, &saddr->sin_addr)) {
|
|
error_setg(errp, "host address '%s' is not a valid "
|
|
"IPv4 address", host);
|
|
return -1;
|
|
}
|
|
} else {
|
|
he = gethostbyname(host);
|
|
if (he == NULL) {
|
|
error_setg(errp, "can't resolve host address '%s'", host);
|
|
return -1;
|
|
}
|
|
saddr->sin_addr = *(struct in_addr *)he->h_addr;
|
|
}
|
|
}
|
|
if (qemu_strtol(port, &r, 0, &p) != 0) {
|
|
error_setg(errp, "port number '%s' is invalid", port);
|
|
return -1;
|
|
}
|
|
saddr->sin_port = htons(p);
|
|
return 0;
|
|
}
|
|
|
|
int parse_host_port(struct sockaddr_in *saddr, const char *str,
|
|
Error **errp)
|
|
{
|
|
gchar **substrings;
|
|
int ret;
|
|
|
|
substrings = g_strsplit(str, ":", 2);
|
|
if (!substrings || !substrings[0] || !substrings[1]) {
|
|
error_setg(errp, "host address '%s' doesn't contain ':' "
|
|
"separating host from port", str);
|
|
ret = -1;
|
|
goto out;
|
|
}
|
|
|
|
ret = convert_host_port(saddr, substrings[0], substrings[1], errp);
|
|
|
|
out:
|
|
g_strfreev(substrings);
|
|
return ret;
|
|
}
|
|
|
|
char *qemu_mac_strdup_printf(const uint8_t *macaddr)
|
|
{
|
|
return g_strdup_printf("%.2x:%.2x:%.2x:%.2x:%.2x:%.2x",
|
|
macaddr[0], macaddr[1], macaddr[2],
|
|
macaddr[3], macaddr[4], macaddr[5]);
|
|
}
|
|
|
|
void qemu_set_info_str(NetClientState *nc, const char *fmt, ...)
|
|
{
|
|
va_list ap;
|
|
|
|
va_start(ap, fmt);
|
|
vsnprintf(nc->info_str, sizeof(nc->info_str), fmt, ap);
|
|
va_end(ap);
|
|
}
|
|
|
|
void qemu_format_nic_info_str(NetClientState *nc, uint8_t macaddr[6])
|
|
{
|
|
qemu_set_info_str(nc, "model=%s,macaddr=%02x:%02x:%02x:%02x:%02x:%02x",
|
|
nc->model, macaddr[0], macaddr[1], macaddr[2],
|
|
macaddr[3], macaddr[4], macaddr[5]);
|
|
}
|
|
|
|
static int mac_table[256] = {0};
|
|
|
|
static void qemu_macaddr_set_used(MACAddr *macaddr)
|
|
{
|
|
int index;
|
|
|
|
for (index = 0x56; index < 0xFF; index++) {
|
|
if (macaddr->a[5] == index) {
|
|
mac_table[index]++;
|
|
}
|
|
}
|
|
}
|
|
|
|
static void qemu_macaddr_set_free(MACAddr *macaddr)
|
|
{
|
|
int index;
|
|
static const MACAddr base = { .a = { 0x52, 0x54, 0x00, 0x12, 0x34, 0 } };
|
|
|
|
if (memcmp(macaddr->a, &base.a, (sizeof(base.a) - 1)) != 0) {
|
|
return;
|
|
}
|
|
for (index = 0x56; index < 0xFF; index++) {
|
|
if (macaddr->a[5] == index) {
|
|
mac_table[index]--;
|
|
}
|
|
}
|
|
}
|
|
|
|
static int qemu_macaddr_get_free(void)
|
|
{
|
|
int index;
|
|
|
|
for (index = 0x56; index < 0xFF; index++) {
|
|
if (mac_table[index] == 0) {
|
|
return index;
|
|
}
|
|
}
|
|
|
|
return -1;
|
|
}
|
|
|
|
void qemu_macaddr_default_if_unset(MACAddr *macaddr)
|
|
{
|
|
static const MACAddr zero = { .a = { 0,0,0,0,0,0 } };
|
|
static const MACAddr base = { .a = { 0x52, 0x54, 0x00, 0x12, 0x34, 0 } };
|
|
|
|
if (memcmp(macaddr, &zero, sizeof(zero)) != 0) {
|
|
if (memcmp(macaddr->a, &base.a, (sizeof(base.a) - 1)) != 0) {
|
|
return;
|
|
} else {
|
|
qemu_macaddr_set_used(macaddr);
|
|
return;
|
|
}
|
|
}
|
|
|
|
macaddr->a[0] = 0x52;
|
|
macaddr->a[1] = 0x54;
|
|
macaddr->a[2] = 0x00;
|
|
macaddr->a[3] = 0x12;
|
|
macaddr->a[4] = 0x34;
|
|
macaddr->a[5] = qemu_macaddr_get_free();
|
|
qemu_macaddr_set_used(macaddr);
|
|
}
|
|
|
|
/**
|
|
* Generate a name for net client
|
|
*
|
|
* Only net clients created with the legacy -net option and NICs need this.
|
|
*/
|
|
static char *assign_name(NetClientState *nc1, const char *model)
|
|
{
|
|
NetClientState *nc;
|
|
int id = 0;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (nc == nc1) {
|
|
continue;
|
|
}
|
|
if (strcmp(nc->model, model) == 0) {
|
|
id++;
|
|
}
|
|
}
|
|
|
|
return g_strdup_printf("%s.%d", model, id);
|
|
}
|
|
|
|
static void qemu_net_client_destructor(NetClientState *nc)
|
|
{
|
|
g_free(nc);
|
|
}
|
|
static ssize_t qemu_deliver_packet_iov(NetClientState *sender,
|
|
unsigned flags,
|
|
const struct iovec *iov,
|
|
int iovcnt,
|
|
void *opaque);
|
|
|
|
static void qemu_net_client_setup(NetClientState *nc,
|
|
NetClientInfo *info,
|
|
NetClientState *peer,
|
|
const char *model,
|
|
const char *name,
|
|
NetClientDestructor *destructor,
|
|
bool is_datapath)
|
|
{
|
|
nc->info = info;
|
|
nc->model = g_strdup(model);
|
|
if (name) {
|
|
nc->name = g_strdup(name);
|
|
} else {
|
|
nc->name = assign_name(nc, model);
|
|
}
|
|
|
|
if (peer) {
|
|
assert(!peer->peer);
|
|
nc->peer = peer;
|
|
peer->peer = nc;
|
|
}
|
|
QTAILQ_INSERT_TAIL(&net_clients, nc, next);
|
|
|
|
nc->incoming_queue = qemu_new_net_queue(qemu_deliver_packet_iov, nc);
|
|
nc->destructor = destructor;
|
|
nc->is_datapath = is_datapath;
|
|
QTAILQ_INIT(&nc->filters);
|
|
}
|
|
|
|
NetClientState *qemu_new_net_client(NetClientInfo *info,
|
|
NetClientState *peer,
|
|
const char *model,
|
|
const char *name)
|
|
{
|
|
NetClientState *nc;
|
|
|
|
assert(info->size >= sizeof(NetClientState));
|
|
|
|
nc = g_malloc0(info->size);
|
|
qemu_net_client_setup(nc, info, peer, model, name,
|
|
qemu_net_client_destructor, true);
|
|
|
|
return nc;
|
|
}
|
|
|
|
NetClientState *qemu_new_net_control_client(NetClientInfo *info,
|
|
NetClientState *peer,
|
|
const char *model,
|
|
const char *name)
|
|
{
|
|
NetClientState *nc;
|
|
|
|
assert(info->size >= sizeof(NetClientState));
|
|
|
|
nc = g_malloc0(info->size);
|
|
qemu_net_client_setup(nc, info, peer, model, name,
|
|
qemu_net_client_destructor, false);
|
|
|
|
return nc;
|
|
}
|
|
|
|
NICState *qemu_new_nic(NetClientInfo *info,
|
|
NICConf *conf,
|
|
const char *model,
|
|
const char *name,
|
|
MemReentrancyGuard *reentrancy_guard,
|
|
void *opaque)
|
|
{
|
|
NetClientState **peers = conf->peers.ncs;
|
|
NICState *nic;
|
|
int i, queues = MAX(1, conf->peers.queues);
|
|
|
|
assert(info->type == NET_CLIENT_DRIVER_NIC);
|
|
assert(info->size >= sizeof(NICState));
|
|
|
|
nic = g_malloc0(info->size + sizeof(NetClientState) * queues);
|
|
nic->ncs = (void *)nic + info->size;
|
|
nic->conf = conf;
|
|
nic->reentrancy_guard = reentrancy_guard,
|
|
nic->opaque = opaque;
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
qemu_net_client_setup(&nic->ncs[i], info, peers[i], model, name,
|
|
NULL, true);
|
|
nic->ncs[i].queue_index = i;
|
|
}
|
|
|
|
return nic;
|
|
}
|
|
|
|
NetClientState *qemu_get_subqueue(NICState *nic, int queue_index)
|
|
{
|
|
return nic->ncs + queue_index;
|
|
}
|
|
|
|
NetClientState *qemu_get_queue(NICState *nic)
|
|
{
|
|
return qemu_get_subqueue(nic, 0);
|
|
}
|
|
|
|
NICState *qemu_get_nic(NetClientState *nc)
|
|
{
|
|
NetClientState *nc0 = nc - nc->queue_index;
|
|
|
|
return (NICState *)((void *)nc0 - nc->info->size);
|
|
}
|
|
|
|
void *qemu_get_nic_opaque(NetClientState *nc)
|
|
{
|
|
NICState *nic = qemu_get_nic(nc);
|
|
|
|
return nic->opaque;
|
|
}
|
|
|
|
NetClientState *qemu_get_peer(NetClientState *nc, int queue_index)
|
|
{
|
|
assert(nc != NULL);
|
|
NetClientState *ncs = nc + queue_index;
|
|
return ncs->peer;
|
|
}
|
|
|
|
static void qemu_cleanup_net_client(NetClientState *nc)
|
|
{
|
|
QTAILQ_REMOVE(&net_clients, nc, next);
|
|
|
|
if (nc->info->cleanup) {
|
|
nc->info->cleanup(nc);
|
|
}
|
|
}
|
|
|
|
static void qemu_free_net_client(NetClientState *nc)
|
|
{
|
|
if (nc->incoming_queue) {
|
|
qemu_del_net_queue(nc->incoming_queue);
|
|
}
|
|
if (nc->peer) {
|
|
nc->peer->peer = NULL;
|
|
}
|
|
g_free(nc->name);
|
|
g_free(nc->model);
|
|
if (nc->destructor) {
|
|
nc->destructor(nc);
|
|
}
|
|
}
|
|
|
|
void qemu_del_net_client(NetClientState *nc)
|
|
{
|
|
NetClientState *ncs[MAX_QUEUE_NUM];
|
|
int queues, i;
|
|
NetFilterState *nf, *next;
|
|
|
|
assert(nc->info->type != NET_CLIENT_DRIVER_NIC);
|
|
|
|
/* If the NetClientState belongs to a multiqueue backend, we will change all
|
|
* other NetClientStates also.
|
|
*/
|
|
queues = qemu_find_net_clients_except(nc->name, ncs,
|
|
NET_CLIENT_DRIVER_NIC,
|
|
MAX_QUEUE_NUM);
|
|
assert(queues != 0);
|
|
|
|
QTAILQ_FOREACH_SAFE(nf, &nc->filters, next, next) {
|
|
object_unparent(OBJECT(nf));
|
|
}
|
|
|
|
/* If there is a peer NIC, delete and cleanup client, but do not free. */
|
|
if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_NIC) {
|
|
NICState *nic = qemu_get_nic(nc->peer);
|
|
if (nic->peer_deleted) {
|
|
return;
|
|
}
|
|
nic->peer_deleted = true;
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
ncs[i]->peer->link_down = true;
|
|
}
|
|
|
|
if (nc->peer->info->link_status_changed) {
|
|
nc->peer->info->link_status_changed(nc->peer);
|
|
}
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
qemu_cleanup_net_client(ncs[i]);
|
|
}
|
|
|
|
return;
|
|
}
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
qemu_cleanup_net_client(ncs[i]);
|
|
qemu_free_net_client(ncs[i]);
|
|
}
|
|
}
|
|
|
|
void qemu_del_nic(NICState *nic)
|
|
{
|
|
int i, queues = MAX(nic->conf->peers.queues, 1);
|
|
|
|
qemu_macaddr_set_free(&nic->conf->macaddr);
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
NetClientState *nc = qemu_get_subqueue(nic, i);
|
|
/* If this is a peer NIC and peer has already been deleted, free it now. */
|
|
if (nic->peer_deleted) {
|
|
qemu_free_net_client(nc->peer);
|
|
} else if (nc->peer) {
|
|
/* if there are RX packets pending, complete them */
|
|
qemu_purge_queued_packets(nc->peer);
|
|
}
|
|
}
|
|
|
|
for (i = queues - 1; i >= 0; i--) {
|
|
NetClientState *nc = qemu_get_subqueue(nic, i);
|
|
|
|
qemu_cleanup_net_client(nc);
|
|
qemu_free_net_client(nc);
|
|
}
|
|
|
|
g_free(nic);
|
|
}
|
|
|
|
void qemu_foreach_nic(qemu_nic_foreach func, void *opaque)
|
|
{
|
|
NetClientState *nc;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (nc->info->type == NET_CLIENT_DRIVER_NIC) {
|
|
if (nc->queue_index == 0) {
|
|
func(qemu_get_nic(nc), opaque);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
bool qemu_has_ufo(NetClientState *nc)
|
|
{
|
|
if (!nc || !nc->info->has_ufo) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->has_ufo(nc);
|
|
}
|
|
|
|
bool qemu_has_uso(NetClientState *nc)
|
|
{
|
|
if (!nc || !nc->info->has_uso) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->has_uso(nc);
|
|
}
|
|
|
|
bool qemu_has_vnet_hdr(NetClientState *nc)
|
|
{
|
|
if (!nc || !nc->info->has_vnet_hdr) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->has_vnet_hdr(nc);
|
|
}
|
|
|
|
bool qemu_has_vnet_hdr_len(NetClientState *nc, int len)
|
|
{
|
|
if (!nc || !nc->info->has_vnet_hdr_len) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->has_vnet_hdr_len(nc, len);
|
|
}
|
|
|
|
bool qemu_get_using_vnet_hdr(NetClientState *nc)
|
|
{
|
|
if (!nc || !nc->info->get_using_vnet_hdr) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->get_using_vnet_hdr(nc);
|
|
}
|
|
|
|
void qemu_using_vnet_hdr(NetClientState *nc, bool enable)
|
|
{
|
|
if (!nc || !nc->info->using_vnet_hdr) {
|
|
return;
|
|
}
|
|
|
|
nc->info->using_vnet_hdr(nc, enable);
|
|
}
|
|
|
|
void qemu_set_offload(NetClientState *nc, int csum, int tso4, int tso6,
|
|
int ecn, int ufo, int uso4, int uso6)
|
|
{
|
|
if (!nc || !nc->info->set_offload) {
|
|
return;
|
|
}
|
|
|
|
nc->info->set_offload(nc, csum, tso4, tso6, ecn, ufo, uso4, uso6);
|
|
}
|
|
|
|
int qemu_get_vnet_hdr_len(NetClientState *nc)
|
|
{
|
|
if (!nc || !nc->info->get_vnet_hdr_len) {
|
|
return 0;
|
|
}
|
|
|
|
return nc->info->get_vnet_hdr_len(nc);
|
|
}
|
|
|
|
void qemu_set_vnet_hdr_len(NetClientState *nc, int len)
|
|
{
|
|
if (!nc || !nc->info->set_vnet_hdr_len) {
|
|
return;
|
|
}
|
|
|
|
nc->vnet_hdr_len = len;
|
|
nc->info->set_vnet_hdr_len(nc, len);
|
|
}
|
|
|
|
int qemu_set_vnet_le(NetClientState *nc, bool is_le)
|
|
{
|
|
#if HOST_BIG_ENDIAN
|
|
if (!nc || !nc->info->set_vnet_le) {
|
|
return -ENOSYS;
|
|
}
|
|
|
|
return nc->info->set_vnet_le(nc, is_le);
|
|
#else
|
|
return 0;
|
|
#endif
|
|
}
|
|
|
|
int qemu_set_vnet_be(NetClientState *nc, bool is_be)
|
|
{
|
|
#if HOST_BIG_ENDIAN
|
|
return 0;
|
|
#else
|
|
if (!nc || !nc->info->set_vnet_be) {
|
|
return -ENOSYS;
|
|
}
|
|
|
|
return nc->info->set_vnet_be(nc, is_be);
|
|
#endif
|
|
}
|
|
|
|
int qemu_can_receive_packet(NetClientState *nc)
|
|
{
|
|
if (nc->receive_disabled) {
|
|
return 0;
|
|
} else if (nc->info->can_receive &&
|
|
!nc->info->can_receive(nc)) {
|
|
return 0;
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
int qemu_can_send_packet(NetClientState *sender)
|
|
{
|
|
int vm_running = runstate_is_running();
|
|
|
|
if (!vm_running) {
|
|
return 0;
|
|
}
|
|
|
|
if (!sender->peer) {
|
|
return 1;
|
|
}
|
|
|
|
return qemu_can_receive_packet(sender->peer);
|
|
}
|
|
|
|
static ssize_t filter_receive_iov(NetClientState *nc,
|
|
NetFilterDirection direction,
|
|
NetClientState *sender,
|
|
unsigned flags,
|
|
const struct iovec *iov,
|
|
int iovcnt,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
ssize_t ret = 0;
|
|
NetFilterState *nf = NULL;
|
|
|
|
if (direction == NET_FILTER_DIRECTION_TX) {
|
|
QTAILQ_FOREACH(nf, &nc->filters, next) {
|
|
ret = qemu_netfilter_receive(nf, direction, sender, flags, iov,
|
|
iovcnt, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
}
|
|
} else {
|
|
QTAILQ_FOREACH_REVERSE(nf, &nc->filters, next) {
|
|
ret = qemu_netfilter_receive(nf, direction, sender, flags, iov,
|
|
iovcnt, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
static ssize_t filter_receive(NetClientState *nc,
|
|
NetFilterDirection direction,
|
|
NetClientState *sender,
|
|
unsigned flags,
|
|
const uint8_t *data,
|
|
size_t size,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
struct iovec iov = {
|
|
.iov_base = (void *)data,
|
|
.iov_len = size
|
|
};
|
|
|
|
return filter_receive_iov(nc, direction, sender, flags, &iov, 1, sent_cb);
|
|
}
|
|
|
|
void qemu_purge_queued_packets(NetClientState *nc)
|
|
{
|
|
if (!nc->peer) {
|
|
return;
|
|
}
|
|
|
|
qemu_net_queue_purge(nc->peer->incoming_queue, nc);
|
|
}
|
|
|
|
void qemu_flush_or_purge_queued_packets(NetClientState *nc, bool purge)
|
|
{
|
|
nc->receive_disabled = 0;
|
|
|
|
if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_HUBPORT) {
|
|
if (net_hub_flush(nc->peer)) {
|
|
qemu_notify_event();
|
|
}
|
|
}
|
|
if (qemu_net_queue_flush(nc->incoming_queue)) {
|
|
/* We emptied the queue successfully, signal to the IO thread to repoll
|
|
* the file descriptor (for tap, for example).
|
|
*/
|
|
qemu_notify_event();
|
|
} else if (purge) {
|
|
/* Unable to empty the queue, purge remaining packets */
|
|
qemu_net_queue_purge(nc->incoming_queue, nc->peer);
|
|
}
|
|
}
|
|
|
|
void qemu_flush_queued_packets(NetClientState *nc)
|
|
{
|
|
qemu_flush_or_purge_queued_packets(nc, false);
|
|
}
|
|
|
|
static ssize_t qemu_send_packet_async_with_flags(NetClientState *sender,
|
|
unsigned flags,
|
|
const uint8_t *buf, int size,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
NetQueue *queue;
|
|
int ret;
|
|
|
|
#ifdef DEBUG_NET
|
|
printf("qemu_send_packet_async:\n");
|
|
qemu_hexdump(stdout, "net", buf, size);
|
|
#endif
|
|
|
|
if (sender->link_down || !sender->peer) {
|
|
return size;
|
|
}
|
|
|
|
/* Let filters handle the packet first */
|
|
ret = filter_receive(sender, NET_FILTER_DIRECTION_TX,
|
|
sender, flags, buf, size, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
|
|
ret = filter_receive(sender->peer, NET_FILTER_DIRECTION_RX,
|
|
sender, flags, buf, size, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
|
|
queue = sender->peer->incoming_queue;
|
|
|
|
return qemu_net_queue_send(queue, sender, flags, buf, size, sent_cb);
|
|
}
|
|
|
|
ssize_t qemu_send_packet_async(NetClientState *sender,
|
|
const uint8_t *buf, int size,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
return qemu_send_packet_async_with_flags(sender, QEMU_NET_PACKET_FLAG_NONE,
|
|
buf, size, sent_cb);
|
|
}
|
|
|
|
ssize_t qemu_send_packet(NetClientState *nc, const uint8_t *buf, int size)
|
|
{
|
|
return qemu_send_packet_async(nc, buf, size, NULL);
|
|
}
|
|
|
|
ssize_t qemu_receive_packet(NetClientState *nc, const uint8_t *buf, int size)
|
|
{
|
|
if (!qemu_can_receive_packet(nc)) {
|
|
return 0;
|
|
}
|
|
|
|
return qemu_net_queue_receive(nc->incoming_queue, buf, size);
|
|
}
|
|
|
|
ssize_t qemu_receive_packet_iov(NetClientState *nc, const struct iovec *iov,
|
|
int iovcnt)
|
|
{
|
|
if (!qemu_can_receive_packet(nc)) {
|
|
return 0;
|
|
}
|
|
|
|
return qemu_net_queue_receive_iov(nc->incoming_queue, iov, iovcnt);
|
|
}
|
|
|
|
ssize_t qemu_send_packet_raw(NetClientState *nc, const uint8_t *buf, int size)
|
|
{
|
|
return qemu_send_packet_async_with_flags(nc, QEMU_NET_PACKET_FLAG_RAW,
|
|
buf, size, NULL);
|
|
}
|
|
|
|
static ssize_t nc_sendv_compat(NetClientState *nc, const struct iovec *iov,
|
|
int iovcnt, unsigned flags)
|
|
{
|
|
uint8_t *buf = NULL;
|
|
uint8_t *buffer;
|
|
size_t offset;
|
|
ssize_t ret;
|
|
|
|
if (iovcnt == 1) {
|
|
buffer = iov[0].iov_base;
|
|
offset = iov[0].iov_len;
|
|
} else {
|
|
offset = iov_size(iov, iovcnt);
|
|
if (offset > NET_BUFSIZE) {
|
|
return -1;
|
|
}
|
|
buf = g_malloc(offset);
|
|
buffer = buf;
|
|
offset = iov_to_buf(iov, iovcnt, 0, buf, offset);
|
|
}
|
|
|
|
if (flags & QEMU_NET_PACKET_FLAG_RAW && nc->info->receive_raw) {
|
|
ret = nc->info->receive_raw(nc, buffer, offset);
|
|
} else {
|
|
ret = nc->info->receive(nc, buffer, offset);
|
|
}
|
|
|
|
g_free(buf);
|
|
return ret;
|
|
}
|
|
|
|
static ssize_t qemu_deliver_packet_iov(NetClientState *sender,
|
|
unsigned flags,
|
|
const struct iovec *iov,
|
|
int iovcnt,
|
|
void *opaque)
|
|
{
|
|
MemReentrancyGuard *owned_reentrancy_guard;
|
|
NetClientState *nc = opaque;
|
|
int ret;
|
|
|
|
|
|
if (nc->link_down) {
|
|
return iov_size(iov, iovcnt);
|
|
}
|
|
|
|
if (nc->receive_disabled) {
|
|
return 0;
|
|
}
|
|
|
|
if (nc->info->type != NET_CLIENT_DRIVER_NIC ||
|
|
qemu_get_nic(nc)->reentrancy_guard->engaged_in_io) {
|
|
owned_reentrancy_guard = NULL;
|
|
} else {
|
|
owned_reentrancy_guard = qemu_get_nic(nc)->reentrancy_guard;
|
|
owned_reentrancy_guard->engaged_in_io = true;
|
|
}
|
|
|
|
if (nc->info->receive_iov && !(flags & QEMU_NET_PACKET_FLAG_RAW)) {
|
|
ret = nc->info->receive_iov(nc, iov, iovcnt);
|
|
} else {
|
|
ret = nc_sendv_compat(nc, iov, iovcnt, flags);
|
|
}
|
|
|
|
if (owned_reentrancy_guard) {
|
|
owned_reentrancy_guard->engaged_in_io = false;
|
|
}
|
|
|
|
if (ret == 0) {
|
|
nc->receive_disabled = 1;
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
ssize_t qemu_sendv_packet_async(NetClientState *sender,
|
|
const struct iovec *iov, int iovcnt,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
NetQueue *queue;
|
|
size_t size = iov_size(iov, iovcnt);
|
|
int ret;
|
|
|
|
if (size > NET_BUFSIZE) {
|
|
return size;
|
|
}
|
|
|
|
if (sender->link_down || !sender->peer) {
|
|
return size;
|
|
}
|
|
|
|
/* Let filters handle the packet first */
|
|
ret = filter_receive_iov(sender, NET_FILTER_DIRECTION_TX, sender,
|
|
QEMU_NET_PACKET_FLAG_NONE, iov, iovcnt, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
|
|
ret = filter_receive_iov(sender->peer, NET_FILTER_DIRECTION_RX, sender,
|
|
QEMU_NET_PACKET_FLAG_NONE, iov, iovcnt, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
|
|
queue = sender->peer->incoming_queue;
|
|
|
|
return qemu_net_queue_send_iov(queue, sender,
|
|
QEMU_NET_PACKET_FLAG_NONE,
|
|
iov, iovcnt, sent_cb);
|
|
}
|
|
|
|
ssize_t
|
|
qemu_sendv_packet(NetClientState *nc, const struct iovec *iov, int iovcnt)
|
|
{
|
|
return qemu_sendv_packet_async(nc, iov, iovcnt, NULL);
|
|
}
|
|
|
|
NetClientState *qemu_find_netdev(const char *id)
|
|
{
|
|
NetClientState *nc;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (nc->info->type == NET_CLIENT_DRIVER_NIC)
|
|
continue;
|
|
if (!strcmp(nc->name, id)) {
|
|
return nc;
|
|
}
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
int qemu_find_net_clients_except(const char *id, NetClientState **ncs,
|
|
NetClientDriver type, int max)
|
|
{
|
|
NetClientState *nc;
|
|
int ret = 0;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (nc->info->type == type) {
|
|
continue;
|
|
}
|
|
if (!id || !strcmp(nc->name, id)) {
|
|
if (ret < max) {
|
|
ncs[ret] = nc;
|
|
}
|
|
ret++;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int nic_get_free_idx(void)
|
|
{
|
|
int index;
|
|
|
|
for (index = 0; index < MAX_NICS; index++)
|
|
if (!nd_table[index].used)
|
|
return index;
|
|
return -1;
|
|
}
|
|
|
|
GPtrArray *qemu_get_nic_models(const char *device_type)
|
|
{
|
|
GPtrArray *nic_models = g_ptr_array_new();
|
|
GSList *list = object_class_get_list_sorted(device_type, false);
|
|
|
|
while (list) {
|
|
DeviceClass *dc = OBJECT_CLASS_CHECK(DeviceClass, list->data,
|
|
TYPE_DEVICE);
|
|
GSList *next;
|
|
if (test_bit(DEVICE_CATEGORY_NETWORK, dc->categories) &&
|
|
dc->user_creatable) {
|
|
const char *name = object_class_get_name(list->data);
|
|
/*
|
|
* A network device might also be something else than a NIC, see
|
|
* e.g. the "rocker" device. Thus we have to look for the "netdev"
|
|
* property, too. Unfortunately, some devices like virtio-net only
|
|
* create this property during instance_init, so we have to create
|
|
* a temporary instance here to be able to check it.
|
|
*/
|
|
Object *obj = object_new_with_class(OBJECT_CLASS(dc));
|
|
if (object_property_find(obj, "netdev")) {
|
|
g_ptr_array_add(nic_models, (gpointer)name);
|
|
}
|
|
object_unref(obj);
|
|
}
|
|
next = list->next;
|
|
g_slist_free_1(list);
|
|
list = next;
|
|
}
|
|
g_ptr_array_add(nic_models, NULL);
|
|
|
|
return nic_models;
|
|
}
|
|
|
|
int qemu_show_nic_models(const char *arg, const char *const *models)
|
|
{
|
|
int i;
|
|
|
|
if (!arg || !is_help_option(arg)) {
|
|
return 0;
|
|
}
|
|
|
|
printf("Available NIC models:\n");
|
|
for (i = 0 ; models[i]; i++) {
|
|
printf("%s\n", models[i]);
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
void qemu_check_nic_model(NICInfo *nd, const char *model)
|
|
{
|
|
const char *models[2];
|
|
|
|
models[0] = model;
|
|
models[1] = NULL;
|
|
|
|
if (qemu_show_nic_models(nd->model, models))
|
|
exit(0);
|
|
if (qemu_find_nic_model(nd, models, model) < 0)
|
|
exit(1);
|
|
}
|
|
|
|
int qemu_find_nic_model(NICInfo *nd, const char * const *models,
|
|
const char *default_model)
|
|
{
|
|
int i;
|
|
|
|
if (!nd->model)
|
|
nd->model = g_strdup(default_model);
|
|
|
|
for (i = 0 ; models[i]; i++) {
|
|
if (strcmp(nd->model, models[i]) == 0)
|
|
return i;
|
|
}
|
|
|
|
error_report("Unsupported NIC model: %s", nd->model);
|
|
return -1;
|
|
}
|
|
|
|
static int net_init_nic(const Netdev *netdev, const char *name,
|
|
NetClientState *peer, Error **errp)
|
|
{
|
|
int idx;
|
|
NICInfo *nd;
|
|
const NetLegacyNicOptions *nic;
|
|
|
|
assert(netdev->type == NET_CLIENT_DRIVER_NIC);
|
|
nic = &netdev->u.nic;
|
|
|
|
idx = nic_get_free_idx();
|
|
if (idx == -1 || nb_nics >= MAX_NICS) {
|
|
error_setg(errp, "too many NICs");
|
|
return -1;
|
|
}
|
|
|
|
nd = &nd_table[idx];
|
|
|
|
memset(nd, 0, sizeof(*nd));
|
|
|
|
if (nic->netdev) {
|
|
nd->netdev = qemu_find_netdev(nic->netdev);
|
|
if (!nd->netdev) {
|
|
error_setg(errp, "netdev '%s' not found", nic->netdev);
|
|
return -1;
|
|
}
|
|
} else {
|
|
assert(peer);
|
|
nd->netdev = peer;
|
|
}
|
|
nd->name = g_strdup(name);
|
|
if (nic->model) {
|
|
nd->model = g_strdup(nic->model);
|
|
}
|
|
if (nic->addr) {
|
|
nd->devaddr = g_strdup(nic->addr);
|
|
}
|
|
|
|
if (nic->macaddr &&
|
|
net_parse_macaddr(nd->macaddr.a, nic->macaddr) < 0) {
|
|
error_setg(errp, "invalid syntax for ethernet address");
|
|
return -1;
|
|
}
|
|
if (nic->macaddr &&
|
|
is_multicast_ether_addr(nd->macaddr.a)) {
|
|
error_setg(errp,
|
|
"NIC cannot have multicast MAC address (odd 1st byte)");
|
|
return -1;
|
|
}
|
|
qemu_macaddr_default_if_unset(&nd->macaddr);
|
|
|
|
if (nic->has_vectors) {
|
|
if (nic->vectors > 0x7ffffff) {
|
|
error_setg(errp, "invalid # of vectors: %"PRIu32, nic->vectors);
|
|
return -1;
|
|
}
|
|
nd->nvectors = nic->vectors;
|
|
} else {
|
|
nd->nvectors = DEV_NVECTORS_UNSPECIFIED;
|
|
}
|
|
|
|
nd->used = 1;
|
|
nb_nics++;
|
|
|
|
return idx;
|
|
}
|
|
|
|
|
|
static int (* const net_client_init_fun[NET_CLIENT_DRIVER__MAX])(
|
|
const Netdev *netdev,
|
|
const char *name,
|
|
NetClientState *peer, Error **errp) = {
|
|
[NET_CLIENT_DRIVER_NIC] = net_init_nic,
|
|
#ifdef CONFIG_SLIRP
|
|
[NET_CLIENT_DRIVER_USER] = net_init_slirp,
|
|
#endif
|
|
[NET_CLIENT_DRIVER_TAP] = net_init_tap,
|
|
[NET_CLIENT_DRIVER_SOCKET] = net_init_socket,
|
|
[NET_CLIENT_DRIVER_STREAM] = net_init_stream,
|
|
[NET_CLIENT_DRIVER_DGRAM] = net_init_dgram,
|
|
#ifdef CONFIG_VDE
|
|
[NET_CLIENT_DRIVER_VDE] = net_init_vde,
|
|
#endif
|
|
#ifdef CONFIG_NETMAP
|
|
[NET_CLIENT_DRIVER_NETMAP] = net_init_netmap,
|
|
#endif
|
|
#ifdef CONFIG_AF_XDP
|
|
[NET_CLIENT_DRIVER_AF_XDP] = net_init_af_xdp,
|
|
#endif
|
|
#ifdef CONFIG_NET_BRIDGE
|
|
[NET_CLIENT_DRIVER_BRIDGE] = net_init_bridge,
|
|
#endif
|
|
[NET_CLIENT_DRIVER_HUBPORT] = net_init_hubport,
|
|
#ifdef CONFIG_VHOST_NET_USER
|
|
[NET_CLIENT_DRIVER_VHOST_USER] = net_init_vhost_user,
|
|
#endif
|
|
#ifdef CONFIG_VHOST_NET_VDPA
|
|
[NET_CLIENT_DRIVER_VHOST_VDPA] = net_init_vhost_vdpa,
|
|
#endif
|
|
#ifdef CONFIG_L2TPV3
|
|
[NET_CLIENT_DRIVER_L2TPV3] = net_init_l2tpv3,
|
|
#endif
|
|
#ifdef CONFIG_VMNET
|
|
[NET_CLIENT_DRIVER_VMNET_HOST] = net_init_vmnet_host,
|
|
[NET_CLIENT_DRIVER_VMNET_SHARED] = net_init_vmnet_shared,
|
|
[NET_CLIENT_DRIVER_VMNET_BRIDGED] = net_init_vmnet_bridged,
|
|
#endif /* CONFIG_VMNET */
|
|
};
|
|
|
|
|
|
static int net_client_init1(const Netdev *netdev, bool is_netdev, Error **errp)
|
|
{
|
|
NetClientState *peer = NULL;
|
|
NetClientState *nc;
|
|
|
|
if (is_netdev) {
|
|
if (netdev->type == NET_CLIENT_DRIVER_NIC ||
|
|
!net_client_init_fun[netdev->type]) {
|
|
error_setg(errp, "network backend '%s' is not compiled into this binary",
|
|
NetClientDriver_str(netdev->type));
|
|
return -1;
|
|
}
|
|
} else {
|
|
if (netdev->type == NET_CLIENT_DRIVER_NONE) {
|
|
return 0; /* nothing to do */
|
|
}
|
|
if (netdev->type == NET_CLIENT_DRIVER_HUBPORT) {
|
|
error_setg(errp, "network backend '%s' is only supported with -netdev/-nic",
|
|
NetClientDriver_str(netdev->type));
|
|
return -1;
|
|
}
|
|
|
|
if (!net_client_init_fun[netdev->type]) {
|
|
error_setg(errp, "network backend '%s' is not compiled into this binary",
|
|
NetClientDriver_str(netdev->type));
|
|
return -1;
|
|
}
|
|
|
|
/* Do not add to a hub if it's a nic with a netdev= parameter. */
|
|
if (netdev->type != NET_CLIENT_DRIVER_NIC ||
|
|
!netdev->u.nic.netdev) {
|
|
peer = net_hub_add_port(0, NULL, NULL);
|
|
}
|
|
}
|
|
|
|
nc = qemu_find_netdev(netdev->id);
|
|
if (nc) {
|
|
error_setg(errp, "Duplicate ID '%s'", netdev->id);
|
|
return -1;
|
|
}
|
|
|
|
if (net_client_init_fun[netdev->type](netdev, netdev->id, peer, errp) < 0) {
|
|
/* FIXME drop when all init functions store an Error */
|
|
if (errp && !*errp) {
|
|
error_setg(errp, "Device '%s' could not be initialized",
|
|
NetClientDriver_str(netdev->type));
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
if (is_netdev) {
|
|
nc = qemu_find_netdev(netdev->id);
|
|
assert(nc);
|
|
nc->is_netdev = true;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
void show_netdevs(void)
|
|
{
|
|
int idx;
|
|
const char *available_netdevs[] = {
|
|
"socket",
|
|
"stream",
|
|
"dgram",
|
|
"hubport",
|
|
"tap",
|
|
#ifdef CONFIG_SLIRP
|
|
"user",
|
|
#endif
|
|
#ifdef CONFIG_L2TPV3
|
|
"l2tpv3",
|
|
#endif
|
|
#ifdef CONFIG_VDE
|
|
"vde",
|
|
#endif
|
|
#ifdef CONFIG_NET_BRIDGE
|
|
"bridge",
|
|
#endif
|
|
#ifdef CONFIG_NETMAP
|
|
"netmap",
|
|
#endif
|
|
#ifdef CONFIG_AF_XDP
|
|
"af-xdp",
|
|
#endif
|
|
#ifdef CONFIG_POSIX
|
|
"vhost-user",
|
|
#endif
|
|
#ifdef CONFIG_VHOST_VDPA
|
|
"vhost-vdpa",
|
|
#endif
|
|
#ifdef CONFIG_VMNET
|
|
"vmnet-host",
|
|
"vmnet-shared",
|
|
"vmnet-bridged",
|
|
#endif
|
|
};
|
|
|
|
qemu_printf("Available netdev backend types:\n");
|
|
for (idx = 0; idx < ARRAY_SIZE(available_netdevs); idx++) {
|
|
qemu_printf("%s\n", available_netdevs[idx]);
|
|
}
|
|
}
|
|
|
|
static int net_client_init(QemuOpts *opts, bool is_netdev, Error **errp)
|
|
{
|
|
gchar **substrings = NULL;
|
|
Netdev *object = NULL;
|
|
int ret = -1;
|
|
Visitor *v = opts_visitor_new(opts);
|
|
|
|
/* Parse convenience option format ipv6-net=fec0::0[/64] */
|
|
const char *ip6_net = qemu_opt_get(opts, "ipv6-net");
|
|
|
|
if (ip6_net) {
|
|
char *prefix_addr;
|
|
unsigned long prefix_len = 64; /* Default 64bit prefix length. */
|
|
|
|
substrings = g_strsplit(ip6_net, "/", 2);
|
|
if (!substrings || !substrings[0]) {
|
|
error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "ipv6-net",
|
|
"a valid IPv6 prefix");
|
|
goto out;
|
|
}
|
|
|
|
prefix_addr = substrings[0];
|
|
|
|
/* Handle user-specified prefix length. */
|
|
if (substrings[1] &&
|
|
qemu_strtoul(substrings[1], NULL, 10, &prefix_len))
|
|
{
|
|
error_setg(errp,
|
|
"parameter 'ipv6-net' expects a number after '/'");
|
|
goto out;
|
|
}
|
|
|
|
qemu_opt_set(opts, "ipv6-prefix", prefix_addr, &error_abort);
|
|
qemu_opt_set_number(opts, "ipv6-prefixlen", prefix_len,
|
|
&error_abort);
|
|
qemu_opt_unset(opts, "ipv6-net");
|
|
}
|
|
|
|
/* Create an ID for -net if the user did not specify one */
|
|
if (!is_netdev && !qemu_opts_id(opts)) {
|
|
qemu_opts_set_id(opts, id_generate(ID_NET));
|
|
}
|
|
|
|
if (visit_type_Netdev(v, NULL, &object, errp)) {
|
|
ret = net_client_init1(object, is_netdev, errp);
|
|
}
|
|
|
|
qapi_free_Netdev(object);
|
|
|
|
out:
|
|
g_strfreev(substrings);
|
|
visit_free(v);
|
|
return ret;
|
|
}
|
|
|
|
void netdev_add(QemuOpts *opts, Error **errp)
|
|
{
|
|
net_client_init(opts, true, errp);
|
|
}
|
|
|
|
void qmp_netdev_add(Netdev *netdev, Error **errp)
|
|
{
|
|
if (!id_wellformed(netdev->id)) {
|
|
error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "id", "an identifier");
|
|
return;
|
|
}
|
|
|
|
net_client_init1(netdev, true, errp);
|
|
}
|
|
|
|
void qmp_netdev_del(const char *id, Error **errp)
|
|
{
|
|
NetClientState *nc;
|
|
QemuOpts *opts;
|
|
|
|
nc = qemu_find_netdev(id);
|
|
if (!nc) {
|
|
error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
|
|
"Device '%s' not found", id);
|
|
return;
|
|
}
|
|
|
|
if (!nc->is_netdev) {
|
|
error_setg(errp, "Device '%s' is not a netdev", id);
|
|
return;
|
|
}
|
|
|
|
qemu_del_net_client(nc);
|
|
|
|
/*
|
|
* Wart: we need to delete the QemuOpts associated with netdevs
|
|
* created via CLI or HMP, to avoid bogus "Duplicate ID" errors in
|
|
* HMP netdev_add.
|
|
*/
|
|
opts = qemu_opts_find(qemu_find_opts("netdev"), id);
|
|
if (opts) {
|
|
qemu_opts_del(opts);
|
|
}
|
|
}
|
|
|
|
static void netfilter_print_info(Monitor *mon, NetFilterState *nf)
|
|
{
|
|
char *str;
|
|
ObjectProperty *prop;
|
|
ObjectPropertyIterator iter;
|
|
Visitor *v;
|
|
|
|
/* generate info str */
|
|
object_property_iter_init(&iter, OBJECT(nf));
|
|
while ((prop = object_property_iter_next(&iter))) {
|
|
if (!strcmp(prop->name, "type")) {
|
|
continue;
|
|
}
|
|
v = string_output_visitor_new(false, &str);
|
|
object_property_get(OBJECT(nf), prop->name, v, NULL);
|
|
visit_complete(v, &str);
|
|
visit_free(v);
|
|
monitor_printf(mon, ",%s=%s", prop->name, str);
|
|
g_free(str);
|
|
}
|
|
monitor_printf(mon, "\n");
|
|
}
|
|
|
|
void print_net_client(Monitor *mon, NetClientState *nc)
|
|
{
|
|
NetFilterState *nf;
|
|
|
|
monitor_printf(mon, "%s: index=%d,type=%s,%s\n", nc->name,
|
|
nc->queue_index,
|
|
NetClientDriver_str(nc->info->type),
|
|
nc->info_str);
|
|
if (!QTAILQ_EMPTY(&nc->filters)) {
|
|
monitor_printf(mon, "filters:\n");
|
|
}
|
|
QTAILQ_FOREACH(nf, &nc->filters, next) {
|
|
monitor_printf(mon, " - %s: type=%s",
|
|
object_get_canonical_path_component(OBJECT(nf)),
|
|
object_get_typename(OBJECT(nf)));
|
|
netfilter_print_info(mon, nf);
|
|
}
|
|
}
|
|
|
|
RxFilterInfoList *qmp_query_rx_filter(const char *name, Error **errp)
|
|
{
|
|
NetClientState *nc;
|
|
RxFilterInfoList *filter_list = NULL, **tail = &filter_list;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
RxFilterInfo *info;
|
|
|
|
if (name && strcmp(nc->name, name) != 0) {
|
|
continue;
|
|
}
|
|
|
|
/* only query rx-filter information of NIC */
|
|
if (nc->info->type != NET_CLIENT_DRIVER_NIC) {
|
|
if (name) {
|
|
error_setg(errp, "net client(%s) isn't a NIC", name);
|
|
assert(!filter_list);
|
|
return NULL;
|
|
}
|
|
continue;
|
|
}
|
|
|
|
/* only query information on queue 0 since the info is per nic,
|
|
* not per queue
|
|
*/
|
|
if (nc->queue_index != 0)
|
|
continue;
|
|
|
|
if (nc->info->query_rx_filter) {
|
|
info = nc->info->query_rx_filter(nc);
|
|
QAPI_LIST_APPEND(tail, info);
|
|
} else if (name) {
|
|
error_setg(errp, "net client(%s) doesn't support"
|
|
" rx-filter querying", name);
|
|
assert(!filter_list);
|
|
return NULL;
|
|
}
|
|
|
|
if (name) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (filter_list == NULL && name) {
|
|
error_setg(errp, "invalid net client name: %s", name);
|
|
}
|
|
|
|
return filter_list;
|
|
}
|
|
|
|
void colo_notify_filters_event(int event, Error **errp)
|
|
{
|
|
NetClientState *nc;
|
|
NetFilterState *nf;
|
|
NetFilterClass *nfc = NULL;
|
|
Error *local_err = NULL;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
QTAILQ_FOREACH(nf, &nc->filters, next) {
|
|
nfc = NETFILTER_GET_CLASS(OBJECT(nf));
|
|
nfc->handle_event(nf, event, &local_err);
|
|
if (local_err) {
|
|
error_propagate(errp, local_err);
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void qmp_set_link(const char *name, bool up, Error **errp)
|
|
{
|
|
NetClientState *ncs[MAX_QUEUE_NUM];
|
|
NetClientState *nc;
|
|
int queues, i;
|
|
|
|
queues = qemu_find_net_clients_except(name, ncs,
|
|
NET_CLIENT_DRIVER__MAX,
|
|
MAX_QUEUE_NUM);
|
|
|
|
if (queues == 0) {
|
|
error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
|
|
"Device '%s' not found", name);
|
|
return;
|
|
}
|
|
nc = ncs[0];
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
ncs[i]->link_down = !up;
|
|
}
|
|
|
|
if (nc->info->link_status_changed) {
|
|
nc->info->link_status_changed(nc);
|
|
}
|
|
|
|
if (nc->peer) {
|
|
/* Change peer link only if the peer is NIC and then notify peer.
|
|
* If the peer is a HUBPORT or a backend, we do not change the
|
|
* link status.
|
|
*
|
|
* This behavior is compatible with qemu hubs where there could be
|
|
* multiple clients that can still communicate with each other in
|
|
* disconnected mode. For now maintain this compatibility.
|
|
*/
|
|
if (nc->peer->info->type == NET_CLIENT_DRIVER_NIC) {
|
|
for (i = 0; i < queues; i++) {
|
|
ncs[i]->peer->link_down = !up;
|
|
}
|
|
}
|
|
if (nc->peer->info->link_status_changed) {
|
|
nc->peer->info->link_status_changed(nc->peer);
|
|
}
|
|
}
|
|
}
|
|
|
|
static void net_vm_change_state_handler(void *opaque, bool running,
|
|
RunState state)
|
|
{
|
|
NetClientState *nc;
|
|
NetClientState *tmp;
|
|
|
|
QTAILQ_FOREACH_SAFE(nc, &net_clients, next, tmp) {
|
|
if (running) {
|
|
/* Flush queued packets and wake up backends. */
|
|
if (nc->peer && qemu_can_send_packet(nc)) {
|
|
qemu_flush_queued_packets(nc->peer);
|
|
}
|
|
} else {
|
|
/* Complete all queued packets, to guarantee we don't modify
|
|
* state later when VM is not running.
|
|
*/
|
|
qemu_flush_or_purge_queued_packets(nc, true);
|
|
}
|
|
}
|
|
}
|
|
|
|
void net_cleanup(void)
|
|
{
|
|
NetClientState *nc, **p = &QTAILQ_FIRST(&net_clients);
|
|
|
|
/*cleanup colo compare module for COLO*/
|
|
colo_compare_cleanup();
|
|
|
|
/*
|
|
* Walk the net_clients list and remove the netdevs but *not* any
|
|
* NET_CLIENT_DRIVER_NIC entries. The latter are owned by the device
|
|
* model which created them, and in some cases (e.g. xen-net-device)
|
|
* the device itself may do cleanup at exit and will be upset if we
|
|
* just delete its NIC from underneath it.
|
|
*
|
|
* Since qemu_del_net_client() may delete multiple entries, using
|
|
* QTAILQ_FOREACH_SAFE() is not safe here. The only safe pointer
|
|
* to keep as a bookmark is a NET_CLIENT_DRIVER_NIC entry, so keep
|
|
* 'p' pointing to either the head of the list, or the 'next' field
|
|
* of the latest NET_CLIENT_DRIVER_NIC, and operate on *p as we walk
|
|
* the list.
|
|
*
|
|
* The 'nc' variable isn't part of the list traversal; it's purely
|
|
* for convenience as too much '(*p)->' has a tendency to make the
|
|
* readers' eyes bleed.
|
|
*/
|
|
while (*p) {
|
|
nc = *p;
|
|
if (nc->info->type == NET_CLIENT_DRIVER_NIC) {
|
|
/* Skip NET_CLIENT_DRIVER_NIC entries */
|
|
p = &QTAILQ_NEXT(nc, next);
|
|
} else {
|
|
qemu_del_net_client(nc);
|
|
}
|
|
}
|
|
|
|
qemu_del_vm_change_state_handler(net_change_state_entry);
|
|
}
|
|
|
|
void net_check_clients(void)
|
|
{
|
|
NetClientState *nc;
|
|
int i;
|
|
|
|
net_hub_check_clients();
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (!nc->peer) {
|
|
warn_report("%s %s has no peer",
|
|
nc->info->type == NET_CLIENT_DRIVER_NIC
|
|
? "nic" : "netdev",
|
|
nc->name);
|
|
}
|
|
}
|
|
|
|
/* Check that all NICs requested via -net nic actually got created.
|
|
* NICs created via -device don't need to be checked here because
|
|
* they are always instantiated.
|
|
*/
|
|
for (i = 0; i < MAX_NICS; i++) {
|
|
NICInfo *nd = &nd_table[i];
|
|
if (nd->used && !nd->instantiated) {
|
|
warn_report("requested NIC (%s, model %s) "
|
|
"was not created (not supported by this machine?)",
|
|
nd->name ? nd->name : "anonymous",
|
|
nd->model ? nd->model : "unspecified");
|
|
}
|
|
}
|
|
}
|
|
|
|
static int net_init_client(void *dummy, QemuOpts *opts, Error **errp)
|
|
{
|
|
return net_client_init(opts, false, errp);
|
|
}
|
|
|
|
static int net_init_netdev(void *dummy, QemuOpts *opts, Error **errp)
|
|
{
|
|
const char *type = qemu_opt_get(opts, "type");
|
|
|
|
if (type && is_help_option(type)) {
|
|
show_netdevs();
|
|
exit(0);
|
|
}
|
|
return net_client_init(opts, true, errp);
|
|
}
|
|
|
|
/* For the convenience "--nic" parameter */
|
|
static int net_param_nic(void *dummy, QemuOpts *opts, Error **errp)
|
|
{
|
|
char *mac, *nd_id;
|
|
int idx, ret;
|
|
NICInfo *ni;
|
|
const char *type;
|
|
|
|
type = qemu_opt_get(opts, "type");
|
|
if (type) {
|
|
if (g_str_equal(type, "none")) {
|
|
return 0; /* Nothing to do, default_net is cleared in vl.c */
|
|
}
|
|
if (is_help_option(type)) {
|
|
GPtrArray *nic_models = qemu_get_nic_models(TYPE_DEVICE);
|
|
show_netdevs();
|
|
printf("\n");
|
|
qemu_show_nic_models(type, (const char **)nic_models->pdata);
|
|
g_ptr_array_free(nic_models, true);
|
|
exit(0);
|
|
}
|
|
}
|
|
|
|
idx = nic_get_free_idx();
|
|
if (idx == -1 || nb_nics >= MAX_NICS) {
|
|
error_setg(errp, "no more on-board/default NIC slots available");
|
|
return -1;
|
|
}
|
|
|
|
if (!type) {
|
|
qemu_opt_set(opts, "type", "user", &error_abort);
|
|
}
|
|
|
|
ni = &nd_table[idx];
|
|
memset(ni, 0, sizeof(*ni));
|
|
ni->model = qemu_opt_get_del(opts, "model");
|
|
|
|
/* Create an ID if the user did not specify one */
|
|
nd_id = g_strdup(qemu_opts_id(opts));
|
|
if (!nd_id) {
|
|
nd_id = id_generate(ID_NET);
|
|
qemu_opts_set_id(opts, nd_id);
|
|
}
|
|
|
|
/* Handle MAC address */
|
|
mac = qemu_opt_get_del(opts, "mac");
|
|
if (mac) {
|
|
ret = net_parse_macaddr(ni->macaddr.a, mac);
|
|
g_free(mac);
|
|
if (ret) {
|
|
error_setg(errp, "invalid syntax for ethernet address");
|
|
goto out;
|
|
}
|
|
if (is_multicast_ether_addr(ni->macaddr.a)) {
|
|
error_setg(errp, "NIC cannot have multicast MAC address");
|
|
ret = -1;
|
|
goto out;
|
|
}
|
|
}
|
|
qemu_macaddr_default_if_unset(&ni->macaddr);
|
|
|
|
ret = net_client_init(opts, true, errp);
|
|
if (ret == 0) {
|
|
ni->netdev = qemu_find_netdev(nd_id);
|
|
ni->used = true;
|
|
nb_nics++;
|
|
}
|
|
|
|
out:
|
|
g_free(nd_id);
|
|
return ret;
|
|
}
|
|
|
|
static void netdev_init_modern(void)
|
|
{
|
|
while (!QSIMPLEQ_EMPTY(&nd_queue)) {
|
|
NetdevQueueEntry *nd = QSIMPLEQ_FIRST(&nd_queue);
|
|
|
|
QSIMPLEQ_REMOVE_HEAD(&nd_queue, entry);
|
|
loc_push_restore(&nd->loc);
|
|
net_client_init1(nd->nd, true, &error_fatal);
|
|
loc_pop(&nd->loc);
|
|
qapi_free_Netdev(nd->nd);
|
|
g_free(nd);
|
|
}
|
|
}
|
|
|
|
void net_init_clients(void)
|
|
{
|
|
net_change_state_entry =
|
|
qemu_add_vm_change_state_handler(net_vm_change_state_handler, NULL);
|
|
|
|
QTAILQ_INIT(&net_clients);
|
|
|
|
netdev_init_modern();
|
|
|
|
qemu_opts_foreach(qemu_find_opts("netdev"), net_init_netdev, NULL,
|
|
&error_fatal);
|
|
|
|
qemu_opts_foreach(qemu_find_opts("nic"), net_param_nic, NULL,
|
|
&error_fatal);
|
|
|
|
qemu_opts_foreach(qemu_find_opts("net"), net_init_client, NULL,
|
|
&error_fatal);
|
|
}
|
|
|
|
/*
|
|
* Does this -netdev argument use modern rather than traditional syntax?
|
|
* Modern syntax is to be parsed with netdev_parse_modern().
|
|
* Traditional syntax is to be parsed with net_client_parse().
|
|
*/
|
|
bool netdev_is_modern(const char *optstr)
|
|
{
|
|
QemuOpts *opts;
|
|
bool is_modern;
|
|
const char *type;
|
|
static QemuOptsList dummy_opts = {
|
|
.name = "netdev",
|
|
.implied_opt_name = "type",
|
|
.head = QTAILQ_HEAD_INITIALIZER(dummy_opts.head),
|
|
.desc = { { } },
|
|
};
|
|
|
|
if (optstr[0] == '{') {
|
|
/* This is JSON, which means it's modern syntax */
|
|
return true;
|
|
}
|
|
|
|
opts = qemu_opts_create(&dummy_opts, NULL, false, &error_abort);
|
|
qemu_opts_do_parse(opts, optstr, dummy_opts.implied_opt_name,
|
|
&error_abort);
|
|
type = qemu_opt_get(opts, "type");
|
|
is_modern = !g_strcmp0(type, "stream") || !g_strcmp0(type, "dgram");
|
|
|
|
qemu_opts_reset(&dummy_opts);
|
|
|
|
return is_modern;
|
|
}
|
|
|
|
/*
|
|
* netdev_parse_modern() uses modern, more expressive syntax than
|
|
* net_client_parse(), but supports only the -netdev option.
|
|
* netdev_parse_modern() appends to @nd_queue, whereas net_client_parse()
|
|
* appends to @qemu_netdev_opts.
|
|
*/
|
|
void netdev_parse_modern(const char *optstr)
|
|
{
|
|
Visitor *v;
|
|
NetdevQueueEntry *nd;
|
|
|
|
v = qobject_input_visitor_new_str(optstr, "type", &error_fatal);
|
|
nd = g_new(NetdevQueueEntry, 1);
|
|
visit_type_Netdev(v, NULL, &nd->nd, &error_fatal);
|
|
visit_free(v);
|
|
loc_save(&nd->loc);
|
|
|
|
QSIMPLEQ_INSERT_TAIL(&nd_queue, nd, entry);
|
|
}
|
|
|
|
void net_client_parse(QemuOptsList *opts_list, const char *optstr)
|
|
{
|
|
if (!qemu_opts_parse_noisily(opts_list, optstr, true)) {
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
/* From FreeBSD */
|
|
/* XXX: optimize */
|
|
uint32_t net_crc32(const uint8_t *p, int len)
|
|
{
|
|
uint32_t crc;
|
|
int carry, i, j;
|
|
uint8_t b;
|
|
|
|
crc = 0xffffffff;
|
|
for (i = 0; i < len; i++) {
|
|
b = *p++;
|
|
for (j = 0; j < 8; j++) {
|
|
carry = ((crc & 0x80000000L) ? 1 : 0) ^ (b & 0x01);
|
|
crc <<= 1;
|
|
b >>= 1;
|
|
if (carry) {
|
|
crc = ((crc ^ POLYNOMIAL_BE) | carry);
|
|
}
|
|
}
|
|
}
|
|
|
|
return crc;
|
|
}
|
|
|
|
uint32_t net_crc32_le(const uint8_t *p, int len)
|
|
{
|
|
uint32_t crc;
|
|
int carry, i, j;
|
|
uint8_t b;
|
|
|
|
crc = 0xffffffff;
|
|
for (i = 0; i < len; i++) {
|
|
b = *p++;
|
|
for (j = 0; j < 8; j++) {
|
|
carry = (crc & 0x1) ^ (b & 0x01);
|
|
crc >>= 1;
|
|
b >>= 1;
|
|
if (carry) {
|
|
crc ^= POLYNOMIAL_LE;
|
|
}
|
|
}
|
|
}
|
|
|
|
return crc;
|
|
}
|
|
|
|
QemuOptsList qemu_netdev_opts = {
|
|
.name = "netdev",
|
|
.implied_opt_name = "type",
|
|
.head = QTAILQ_HEAD_INITIALIZER(qemu_netdev_opts.head),
|
|
.desc = {
|
|
/*
|
|
* no elements => accept any params
|
|
* validation will happen later
|
|
*/
|
|
{ /* end of list */ }
|
|
},
|
|
};
|
|
|
|
QemuOptsList qemu_nic_opts = {
|
|
.name = "nic",
|
|
.implied_opt_name = "type",
|
|
.head = QTAILQ_HEAD_INITIALIZER(qemu_nic_opts.head),
|
|
.desc = {
|
|
/*
|
|
* no elements => accept any params
|
|
* validation will happen later
|
|
*/
|
|
{ /* end of list */ }
|
|
},
|
|
};
|
|
|
|
QemuOptsList qemu_net_opts = {
|
|
.name = "net",
|
|
.implied_opt_name = "type",
|
|
.head = QTAILQ_HEAD_INITIALIZER(qemu_net_opts.head),
|
|
.desc = {
|
|
/*
|
|
* no elements => accept any params
|
|
* validation will happen later
|
|
*/
|
|
{ /* end of list */ }
|
|
},
|
|
};
|
|
|
|
void net_socket_rs_init(SocketReadState *rs,
|
|
SocketReadStateFinalize *finalize,
|
|
bool vnet_hdr)
|
|
{
|
|
rs->state = 0;
|
|
rs->vnet_hdr = vnet_hdr;
|
|
rs->index = 0;
|
|
rs->packet_len = 0;
|
|
rs->vnet_hdr_len = 0;
|
|
memset(rs->buf, 0, sizeof(rs->buf));
|
|
rs->finalize = finalize;
|
|
}
|
|
|
|
/*
|
|
* Returns
|
|
* 0: success
|
|
* -1: error occurs
|
|
*/
|
|
int net_fill_rstate(SocketReadState *rs, const uint8_t *buf, int size)
|
|
{
|
|
unsigned int l;
|
|
|
|
while (size > 0) {
|
|
/* Reassemble a packet from the network.
|
|
* 0 = getting length.
|
|
* 1 = getting vnet header length.
|
|
* 2 = getting data.
|
|
*/
|
|
switch (rs->state) {
|
|
case 0:
|
|
l = 4 - rs->index;
|
|
if (l > size) {
|
|
l = size;
|
|
}
|
|
memcpy(rs->buf + rs->index, buf, l);
|
|
buf += l;
|
|
size -= l;
|
|
rs->index += l;
|
|
if (rs->index == 4) {
|
|
/* got length */
|
|
rs->packet_len = ntohl(*(uint32_t *)rs->buf);
|
|
rs->index = 0;
|
|
if (rs->vnet_hdr) {
|
|
rs->state = 1;
|
|
} else {
|
|
rs->state = 2;
|
|
rs->vnet_hdr_len = 0;
|
|
}
|
|
}
|
|
break;
|
|
case 1:
|
|
l = 4 - rs->index;
|
|
if (l > size) {
|
|
l = size;
|
|
}
|
|
memcpy(rs->buf + rs->index, buf, l);
|
|
buf += l;
|
|
size -= l;
|
|
rs->index += l;
|
|
if (rs->index == 4) {
|
|
/* got vnet header length */
|
|
rs->vnet_hdr_len = ntohl(*(uint32_t *)rs->buf);
|
|
rs->index = 0;
|
|
rs->state = 2;
|
|
}
|
|
break;
|
|
case 2:
|
|
l = rs->packet_len - rs->index;
|
|
if (l > size) {
|
|
l = size;
|
|
}
|
|
if (rs->index + l <= sizeof(rs->buf)) {
|
|
memcpy(rs->buf + rs->index, buf, l);
|
|
} else {
|
|
fprintf(stderr, "serious error: oversized packet received,"
|
|
"connection terminated.\n");
|
|
rs->index = rs->state = 0;
|
|
return -1;
|
|
}
|
|
|
|
rs->index += l;
|
|
buf += l;
|
|
size -= l;
|
|
if (rs->index >= rs->packet_len) {
|
|
rs->index = 0;
|
|
rs->state = 0;
|
|
assert(rs->finalize);
|
|
rs->finalize(rs);
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
assert(size == 0);
|
|
return 0;
|
|
}
|