b9ad513e18
While netmap implements virtio-net header, it does not implement
receive_raw(). Instead of implementing receive_raw for netmap, add
virtio-net headers in the common code and use receive_iov()/receive()
instead. This also fixes the buffer size for the virtio-net header.
Fixes: fbbdbddec0
("tap: allow extended virtio header with hash info")
Signed-off-by: Akihiko Odaki <akihiko.odaki@daynix.com>
Signed-off-by: Jason Wang <jasowang@redhat.com>
2097 lines
56 KiB
C
2097 lines
56 KiB
C
/*
|
|
* QEMU System Emulator
|
|
*
|
|
* Copyright (c) 2003-2008 Fabrice Bellard
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
* in the Software without restriction, including without limitation the rights
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
* furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
* THE SOFTWARE.
|
|
*/
|
|
|
|
#include "qemu/osdep.h"
|
|
|
|
#include "net/net.h"
|
|
#include "clients.h"
|
|
#include "hub.h"
|
|
#include "hw/qdev-properties.h"
|
|
#include "net/slirp.h"
|
|
#include "net/eth.h"
|
|
#include "util.h"
|
|
|
|
#include "monitor/monitor.h"
|
|
#include "qemu/help_option.h"
|
|
#include "qapi/qapi-commands-net.h"
|
|
#include "qapi/qapi-visit-net.h"
|
|
#include "qapi/qmp/qdict.h"
|
|
#include "qapi/qmp/qerror.h"
|
|
#include "qemu/error-report.h"
|
|
#include "qemu/sockets.h"
|
|
#include "qemu/cutils.h"
|
|
#include "qemu/config-file.h"
|
|
#include "qemu/ctype.h"
|
|
#include "qemu/id.h"
|
|
#include "qemu/iov.h"
|
|
#include "qemu/qemu-print.h"
|
|
#include "qemu/main-loop.h"
|
|
#include "qemu/option.h"
|
|
#include "qemu/keyval.h"
|
|
#include "qapi/error.h"
|
|
#include "qapi/opts-visitor.h"
|
|
#include "sysemu/runstate.h"
|
|
#include "net/colo-compare.h"
|
|
#include "net/filter.h"
|
|
#include "qapi/string-output-visitor.h"
|
|
#include "qapi/qobject-input-visitor.h"
|
|
#include "standard-headers/linux/virtio_net.h"
|
|
|
|
/* Net bridge is currently not supported for W32. */
|
|
#if !defined(_WIN32)
|
|
# define CONFIG_NET_BRIDGE
|
|
#endif
|
|
|
|
static VMChangeStateEntry *net_change_state_entry;
|
|
NetClientStateList net_clients;
|
|
|
|
typedef struct NetdevQueueEntry {
|
|
Netdev *nd;
|
|
Location loc;
|
|
QSIMPLEQ_ENTRY(NetdevQueueEntry) entry;
|
|
} NetdevQueueEntry;
|
|
|
|
typedef QSIMPLEQ_HEAD(, NetdevQueueEntry) NetdevQueue;
|
|
|
|
static NetdevQueue nd_queue = QSIMPLEQ_HEAD_INITIALIZER(nd_queue);
|
|
|
|
static GHashTable *nic_model_help;
|
|
|
|
static int nb_nics;
|
|
static NICInfo nd_table[MAX_NICS];
|
|
|
|
/***********************************************************/
|
|
/* network device redirectors */
|
|
|
|
int convert_host_port(struct sockaddr_in *saddr, const char *host,
|
|
const char *port, Error **errp)
|
|
{
|
|
struct hostent *he;
|
|
const char *r;
|
|
long p;
|
|
|
|
memset(saddr, 0, sizeof(*saddr));
|
|
|
|
saddr->sin_family = AF_INET;
|
|
if (host[0] == '\0') {
|
|
saddr->sin_addr.s_addr = 0;
|
|
} else {
|
|
if (qemu_isdigit(host[0])) {
|
|
if (!inet_aton(host, &saddr->sin_addr)) {
|
|
error_setg(errp, "host address '%s' is not a valid "
|
|
"IPv4 address", host);
|
|
return -1;
|
|
}
|
|
} else {
|
|
he = gethostbyname(host);
|
|
if (he == NULL) {
|
|
error_setg(errp, "can't resolve host address '%s'", host);
|
|
return -1;
|
|
}
|
|
saddr->sin_addr = *(struct in_addr *)he->h_addr;
|
|
}
|
|
}
|
|
if (qemu_strtol(port, &r, 0, &p) != 0) {
|
|
error_setg(errp, "port number '%s' is invalid", port);
|
|
return -1;
|
|
}
|
|
saddr->sin_port = htons(p);
|
|
return 0;
|
|
}
|
|
|
|
int parse_host_port(struct sockaddr_in *saddr, const char *str,
|
|
Error **errp)
|
|
{
|
|
gchar **substrings;
|
|
int ret;
|
|
|
|
substrings = g_strsplit(str, ":", 2);
|
|
if (!substrings || !substrings[0] || !substrings[1]) {
|
|
error_setg(errp, "host address '%s' doesn't contain ':' "
|
|
"separating host from port", str);
|
|
ret = -1;
|
|
goto out;
|
|
}
|
|
|
|
ret = convert_host_port(saddr, substrings[0], substrings[1], errp);
|
|
|
|
out:
|
|
g_strfreev(substrings);
|
|
return ret;
|
|
}
|
|
|
|
char *qemu_mac_strdup_printf(const uint8_t *macaddr)
|
|
{
|
|
return g_strdup_printf("%.2x:%.2x:%.2x:%.2x:%.2x:%.2x",
|
|
macaddr[0], macaddr[1], macaddr[2],
|
|
macaddr[3], macaddr[4], macaddr[5]);
|
|
}
|
|
|
|
void qemu_set_info_str(NetClientState *nc, const char *fmt, ...)
|
|
{
|
|
va_list ap;
|
|
|
|
va_start(ap, fmt);
|
|
vsnprintf(nc->info_str, sizeof(nc->info_str), fmt, ap);
|
|
va_end(ap);
|
|
}
|
|
|
|
void qemu_format_nic_info_str(NetClientState *nc, uint8_t macaddr[6])
|
|
{
|
|
qemu_set_info_str(nc, "model=%s,macaddr=%02x:%02x:%02x:%02x:%02x:%02x",
|
|
nc->model, macaddr[0], macaddr[1], macaddr[2],
|
|
macaddr[3], macaddr[4], macaddr[5]);
|
|
}
|
|
|
|
static int mac_table[256] = {0};
|
|
|
|
static void qemu_macaddr_set_used(MACAddr *macaddr)
|
|
{
|
|
int index;
|
|
|
|
for (index = 0x56; index < 0xFF; index++) {
|
|
if (macaddr->a[5] == index) {
|
|
mac_table[index]++;
|
|
}
|
|
}
|
|
}
|
|
|
|
static void qemu_macaddr_set_free(MACAddr *macaddr)
|
|
{
|
|
int index;
|
|
static const MACAddr base = { .a = { 0x52, 0x54, 0x00, 0x12, 0x34, 0 } };
|
|
|
|
if (memcmp(macaddr->a, &base.a, (sizeof(base.a) - 1)) != 0) {
|
|
return;
|
|
}
|
|
for (index = 0x56; index < 0xFF; index++) {
|
|
if (macaddr->a[5] == index) {
|
|
mac_table[index]--;
|
|
}
|
|
}
|
|
}
|
|
|
|
static int qemu_macaddr_get_free(void)
|
|
{
|
|
int index;
|
|
|
|
for (index = 0x56; index < 0xFF; index++) {
|
|
if (mac_table[index] == 0) {
|
|
return index;
|
|
}
|
|
}
|
|
|
|
return -1;
|
|
}
|
|
|
|
void qemu_macaddr_default_if_unset(MACAddr *macaddr)
|
|
{
|
|
static const MACAddr zero = { .a = { 0,0,0,0,0,0 } };
|
|
static const MACAddr base = { .a = { 0x52, 0x54, 0x00, 0x12, 0x34, 0 } };
|
|
|
|
if (memcmp(macaddr, &zero, sizeof(zero)) != 0) {
|
|
if (memcmp(macaddr->a, &base.a, (sizeof(base.a) - 1)) != 0) {
|
|
return;
|
|
} else {
|
|
qemu_macaddr_set_used(macaddr);
|
|
return;
|
|
}
|
|
}
|
|
|
|
macaddr->a[0] = 0x52;
|
|
macaddr->a[1] = 0x54;
|
|
macaddr->a[2] = 0x00;
|
|
macaddr->a[3] = 0x12;
|
|
macaddr->a[4] = 0x34;
|
|
macaddr->a[5] = qemu_macaddr_get_free();
|
|
qemu_macaddr_set_used(macaddr);
|
|
}
|
|
|
|
/**
|
|
* Generate a name for net client
|
|
*
|
|
* Only net clients created with the legacy -net option and NICs need this.
|
|
*/
|
|
static char *assign_name(NetClientState *nc1, const char *model)
|
|
{
|
|
NetClientState *nc;
|
|
int id = 0;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (nc == nc1) {
|
|
continue;
|
|
}
|
|
if (strcmp(nc->model, model) == 0) {
|
|
id++;
|
|
}
|
|
}
|
|
|
|
return g_strdup_printf("%s.%d", model, id);
|
|
}
|
|
|
|
static void qemu_net_client_destructor(NetClientState *nc)
|
|
{
|
|
g_free(nc);
|
|
}
|
|
static ssize_t qemu_deliver_packet_iov(NetClientState *sender,
|
|
unsigned flags,
|
|
const struct iovec *iov,
|
|
int iovcnt,
|
|
void *opaque);
|
|
|
|
static void qemu_net_client_setup(NetClientState *nc,
|
|
NetClientInfo *info,
|
|
NetClientState *peer,
|
|
const char *model,
|
|
const char *name,
|
|
NetClientDestructor *destructor,
|
|
bool is_datapath)
|
|
{
|
|
nc->info = info;
|
|
nc->model = g_strdup(model);
|
|
if (name) {
|
|
nc->name = g_strdup(name);
|
|
} else {
|
|
nc->name = assign_name(nc, model);
|
|
}
|
|
|
|
if (peer) {
|
|
assert(!peer->peer);
|
|
nc->peer = peer;
|
|
peer->peer = nc;
|
|
}
|
|
QTAILQ_INSERT_TAIL(&net_clients, nc, next);
|
|
|
|
nc->incoming_queue = qemu_new_net_queue(qemu_deliver_packet_iov, nc);
|
|
nc->destructor = destructor;
|
|
nc->is_datapath = is_datapath;
|
|
QTAILQ_INIT(&nc->filters);
|
|
}
|
|
|
|
NetClientState *qemu_new_net_client(NetClientInfo *info,
|
|
NetClientState *peer,
|
|
const char *model,
|
|
const char *name)
|
|
{
|
|
NetClientState *nc;
|
|
|
|
assert(info->size >= sizeof(NetClientState));
|
|
|
|
nc = g_malloc0(info->size);
|
|
qemu_net_client_setup(nc, info, peer, model, name,
|
|
qemu_net_client_destructor, true);
|
|
|
|
return nc;
|
|
}
|
|
|
|
NetClientState *qemu_new_net_control_client(NetClientInfo *info,
|
|
NetClientState *peer,
|
|
const char *model,
|
|
const char *name)
|
|
{
|
|
NetClientState *nc;
|
|
|
|
assert(info->size >= sizeof(NetClientState));
|
|
|
|
nc = g_malloc0(info->size);
|
|
qemu_net_client_setup(nc, info, peer, model, name,
|
|
qemu_net_client_destructor, false);
|
|
|
|
return nc;
|
|
}
|
|
|
|
NICState *qemu_new_nic(NetClientInfo *info,
|
|
NICConf *conf,
|
|
const char *model,
|
|
const char *name,
|
|
MemReentrancyGuard *reentrancy_guard,
|
|
void *opaque)
|
|
{
|
|
NetClientState **peers = conf->peers.ncs;
|
|
NICState *nic;
|
|
int i, queues = MAX(1, conf->peers.queues);
|
|
|
|
assert(info->type == NET_CLIENT_DRIVER_NIC);
|
|
assert(info->size >= sizeof(NICState));
|
|
|
|
nic = g_malloc0(info->size + sizeof(NetClientState) * queues);
|
|
nic->ncs = (void *)nic + info->size;
|
|
nic->conf = conf;
|
|
nic->reentrancy_guard = reentrancy_guard,
|
|
nic->opaque = opaque;
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
qemu_net_client_setup(&nic->ncs[i], info, peers[i], model, name,
|
|
NULL, true);
|
|
nic->ncs[i].queue_index = i;
|
|
}
|
|
|
|
return nic;
|
|
}
|
|
|
|
NetClientState *qemu_get_subqueue(NICState *nic, int queue_index)
|
|
{
|
|
return nic->ncs + queue_index;
|
|
}
|
|
|
|
NetClientState *qemu_get_queue(NICState *nic)
|
|
{
|
|
return qemu_get_subqueue(nic, 0);
|
|
}
|
|
|
|
NICState *qemu_get_nic(NetClientState *nc)
|
|
{
|
|
NetClientState *nc0 = nc - nc->queue_index;
|
|
|
|
return (NICState *)((void *)nc0 - nc->info->size);
|
|
}
|
|
|
|
void *qemu_get_nic_opaque(NetClientState *nc)
|
|
{
|
|
NICState *nic = qemu_get_nic(nc);
|
|
|
|
return nic->opaque;
|
|
}
|
|
|
|
NetClientState *qemu_get_peer(NetClientState *nc, int queue_index)
|
|
{
|
|
assert(nc != NULL);
|
|
NetClientState *ncs = nc + queue_index;
|
|
return ncs->peer;
|
|
}
|
|
|
|
static void qemu_cleanup_net_client(NetClientState *nc)
|
|
{
|
|
QTAILQ_REMOVE(&net_clients, nc, next);
|
|
|
|
if (nc->info->cleanup) {
|
|
nc->info->cleanup(nc);
|
|
}
|
|
}
|
|
|
|
static void qemu_free_net_client(NetClientState *nc)
|
|
{
|
|
if (nc->incoming_queue) {
|
|
qemu_del_net_queue(nc->incoming_queue);
|
|
}
|
|
if (nc->peer) {
|
|
nc->peer->peer = NULL;
|
|
}
|
|
g_free(nc->name);
|
|
g_free(nc->model);
|
|
if (nc->destructor) {
|
|
nc->destructor(nc);
|
|
}
|
|
}
|
|
|
|
void qemu_del_net_client(NetClientState *nc)
|
|
{
|
|
NetClientState *ncs[MAX_QUEUE_NUM];
|
|
int queues, i;
|
|
NetFilterState *nf, *next;
|
|
|
|
assert(nc->info->type != NET_CLIENT_DRIVER_NIC);
|
|
|
|
/* If the NetClientState belongs to a multiqueue backend, we will change all
|
|
* other NetClientStates also.
|
|
*/
|
|
queues = qemu_find_net_clients_except(nc->name, ncs,
|
|
NET_CLIENT_DRIVER_NIC,
|
|
MAX_QUEUE_NUM);
|
|
assert(queues != 0);
|
|
|
|
QTAILQ_FOREACH_SAFE(nf, &nc->filters, next, next) {
|
|
object_unparent(OBJECT(nf));
|
|
}
|
|
|
|
/* If there is a peer NIC, delete and cleanup client, but do not free. */
|
|
if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_NIC) {
|
|
NICState *nic = qemu_get_nic(nc->peer);
|
|
if (nic->peer_deleted) {
|
|
return;
|
|
}
|
|
nic->peer_deleted = true;
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
ncs[i]->peer->link_down = true;
|
|
}
|
|
|
|
if (nc->peer->info->link_status_changed) {
|
|
nc->peer->info->link_status_changed(nc->peer);
|
|
}
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
qemu_cleanup_net_client(ncs[i]);
|
|
}
|
|
|
|
return;
|
|
}
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
qemu_cleanup_net_client(ncs[i]);
|
|
qemu_free_net_client(ncs[i]);
|
|
}
|
|
}
|
|
|
|
void qemu_del_nic(NICState *nic)
|
|
{
|
|
int i, queues = MAX(nic->conf->peers.queues, 1);
|
|
|
|
qemu_macaddr_set_free(&nic->conf->macaddr);
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
NetClientState *nc = qemu_get_subqueue(nic, i);
|
|
/* If this is a peer NIC and peer has already been deleted, free it now. */
|
|
if (nic->peer_deleted) {
|
|
qemu_free_net_client(nc->peer);
|
|
} else if (nc->peer) {
|
|
/* if there are RX packets pending, complete them */
|
|
qemu_purge_queued_packets(nc->peer);
|
|
}
|
|
}
|
|
|
|
for (i = queues - 1; i >= 0; i--) {
|
|
NetClientState *nc = qemu_get_subqueue(nic, i);
|
|
|
|
qemu_cleanup_net_client(nc);
|
|
qemu_free_net_client(nc);
|
|
}
|
|
|
|
g_free(nic);
|
|
}
|
|
|
|
void qemu_foreach_nic(qemu_nic_foreach func, void *opaque)
|
|
{
|
|
NetClientState *nc;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (nc->info->type == NET_CLIENT_DRIVER_NIC) {
|
|
if (nc->queue_index == 0) {
|
|
func(qemu_get_nic(nc), opaque);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
bool qemu_has_ufo(NetClientState *nc)
|
|
{
|
|
if (!nc || !nc->info->has_ufo) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->has_ufo(nc);
|
|
}
|
|
|
|
bool qemu_has_uso(NetClientState *nc)
|
|
{
|
|
if (!nc || !nc->info->has_uso) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->has_uso(nc);
|
|
}
|
|
|
|
bool qemu_has_vnet_hdr(NetClientState *nc)
|
|
{
|
|
if (!nc || !nc->info->has_vnet_hdr) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->has_vnet_hdr(nc);
|
|
}
|
|
|
|
bool qemu_has_vnet_hdr_len(NetClientState *nc, int len)
|
|
{
|
|
if (!nc || !nc->info->has_vnet_hdr_len) {
|
|
return false;
|
|
}
|
|
|
|
return nc->info->has_vnet_hdr_len(nc, len);
|
|
}
|
|
|
|
void qemu_set_offload(NetClientState *nc, int csum, int tso4, int tso6,
|
|
int ecn, int ufo, int uso4, int uso6)
|
|
{
|
|
if (!nc || !nc->info->set_offload) {
|
|
return;
|
|
}
|
|
|
|
nc->info->set_offload(nc, csum, tso4, tso6, ecn, ufo, uso4, uso6);
|
|
}
|
|
|
|
int qemu_get_vnet_hdr_len(NetClientState *nc)
|
|
{
|
|
return nc->vnet_hdr_len;
|
|
}
|
|
|
|
void qemu_set_vnet_hdr_len(NetClientState *nc, int len)
|
|
{
|
|
if (!nc || !nc->info->set_vnet_hdr_len) {
|
|
return;
|
|
}
|
|
|
|
assert(len == sizeof(struct virtio_net_hdr_mrg_rxbuf) ||
|
|
len == sizeof(struct virtio_net_hdr) ||
|
|
len == sizeof(struct virtio_net_hdr_v1_hash));
|
|
|
|
nc->vnet_hdr_len = len;
|
|
nc->info->set_vnet_hdr_len(nc, len);
|
|
}
|
|
|
|
int qemu_set_vnet_le(NetClientState *nc, bool is_le)
|
|
{
|
|
#if HOST_BIG_ENDIAN
|
|
if (!nc || !nc->info->set_vnet_le) {
|
|
return -ENOSYS;
|
|
}
|
|
|
|
return nc->info->set_vnet_le(nc, is_le);
|
|
#else
|
|
return 0;
|
|
#endif
|
|
}
|
|
|
|
int qemu_set_vnet_be(NetClientState *nc, bool is_be)
|
|
{
|
|
#if HOST_BIG_ENDIAN
|
|
return 0;
|
|
#else
|
|
if (!nc || !nc->info->set_vnet_be) {
|
|
return -ENOSYS;
|
|
}
|
|
|
|
return nc->info->set_vnet_be(nc, is_be);
|
|
#endif
|
|
}
|
|
|
|
int qemu_can_receive_packet(NetClientState *nc)
|
|
{
|
|
if (nc->receive_disabled) {
|
|
return 0;
|
|
} else if (nc->info->can_receive &&
|
|
!nc->info->can_receive(nc)) {
|
|
return 0;
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
int qemu_can_send_packet(NetClientState *sender)
|
|
{
|
|
int vm_running = runstate_is_running();
|
|
|
|
if (!vm_running) {
|
|
return 0;
|
|
}
|
|
|
|
if (!sender->peer) {
|
|
return 1;
|
|
}
|
|
|
|
return qemu_can_receive_packet(sender->peer);
|
|
}
|
|
|
|
static ssize_t filter_receive_iov(NetClientState *nc,
|
|
NetFilterDirection direction,
|
|
NetClientState *sender,
|
|
unsigned flags,
|
|
const struct iovec *iov,
|
|
int iovcnt,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
ssize_t ret = 0;
|
|
NetFilterState *nf = NULL;
|
|
|
|
if (direction == NET_FILTER_DIRECTION_TX) {
|
|
QTAILQ_FOREACH(nf, &nc->filters, next) {
|
|
ret = qemu_netfilter_receive(nf, direction, sender, flags, iov,
|
|
iovcnt, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
}
|
|
} else {
|
|
QTAILQ_FOREACH_REVERSE(nf, &nc->filters, next) {
|
|
ret = qemu_netfilter_receive(nf, direction, sender, flags, iov,
|
|
iovcnt, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
static ssize_t filter_receive(NetClientState *nc,
|
|
NetFilterDirection direction,
|
|
NetClientState *sender,
|
|
unsigned flags,
|
|
const uint8_t *data,
|
|
size_t size,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
struct iovec iov = {
|
|
.iov_base = (void *)data,
|
|
.iov_len = size
|
|
};
|
|
|
|
return filter_receive_iov(nc, direction, sender, flags, &iov, 1, sent_cb);
|
|
}
|
|
|
|
void qemu_purge_queued_packets(NetClientState *nc)
|
|
{
|
|
if (!nc->peer) {
|
|
return;
|
|
}
|
|
|
|
qemu_net_queue_purge(nc->peer->incoming_queue, nc);
|
|
}
|
|
|
|
void qemu_flush_or_purge_queued_packets(NetClientState *nc, bool purge)
|
|
{
|
|
nc->receive_disabled = 0;
|
|
|
|
if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_HUBPORT) {
|
|
if (net_hub_flush(nc->peer)) {
|
|
qemu_notify_event();
|
|
}
|
|
}
|
|
if (qemu_net_queue_flush(nc->incoming_queue)) {
|
|
/* We emptied the queue successfully, signal to the IO thread to repoll
|
|
* the file descriptor (for tap, for example).
|
|
*/
|
|
qemu_notify_event();
|
|
} else if (purge) {
|
|
/* Unable to empty the queue, purge remaining packets */
|
|
qemu_net_queue_purge(nc->incoming_queue, nc->peer);
|
|
}
|
|
}
|
|
|
|
void qemu_flush_queued_packets(NetClientState *nc)
|
|
{
|
|
qemu_flush_or_purge_queued_packets(nc, false);
|
|
}
|
|
|
|
static ssize_t qemu_send_packet_async_with_flags(NetClientState *sender,
|
|
unsigned flags,
|
|
const uint8_t *buf, int size,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
NetQueue *queue;
|
|
int ret;
|
|
|
|
#ifdef DEBUG_NET
|
|
printf("qemu_send_packet_async:\n");
|
|
qemu_hexdump(stdout, "net", buf, size);
|
|
#endif
|
|
|
|
if (sender->link_down || !sender->peer) {
|
|
return size;
|
|
}
|
|
|
|
/* Let filters handle the packet first */
|
|
ret = filter_receive(sender, NET_FILTER_DIRECTION_TX,
|
|
sender, flags, buf, size, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
|
|
ret = filter_receive(sender->peer, NET_FILTER_DIRECTION_RX,
|
|
sender, flags, buf, size, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
|
|
queue = sender->peer->incoming_queue;
|
|
|
|
return qemu_net_queue_send(queue, sender, flags, buf, size, sent_cb);
|
|
}
|
|
|
|
ssize_t qemu_send_packet_async(NetClientState *sender,
|
|
const uint8_t *buf, int size,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
return qemu_send_packet_async_with_flags(sender, QEMU_NET_PACKET_FLAG_NONE,
|
|
buf, size, sent_cb);
|
|
}
|
|
|
|
ssize_t qemu_send_packet(NetClientState *nc, const uint8_t *buf, int size)
|
|
{
|
|
return qemu_send_packet_async(nc, buf, size, NULL);
|
|
}
|
|
|
|
ssize_t qemu_receive_packet(NetClientState *nc, const uint8_t *buf, int size)
|
|
{
|
|
if (!qemu_can_receive_packet(nc)) {
|
|
return 0;
|
|
}
|
|
|
|
return qemu_net_queue_receive(nc->incoming_queue, buf, size);
|
|
}
|
|
|
|
ssize_t qemu_receive_packet_iov(NetClientState *nc, const struct iovec *iov,
|
|
int iovcnt)
|
|
{
|
|
if (!qemu_can_receive_packet(nc)) {
|
|
return 0;
|
|
}
|
|
|
|
return qemu_net_queue_receive_iov(nc->incoming_queue, iov, iovcnt);
|
|
}
|
|
|
|
ssize_t qemu_send_packet_raw(NetClientState *nc, const uint8_t *buf, int size)
|
|
{
|
|
return qemu_send_packet_async_with_flags(nc, QEMU_NET_PACKET_FLAG_RAW,
|
|
buf, size, NULL);
|
|
}
|
|
|
|
static ssize_t nc_sendv_compat(NetClientState *nc, const struct iovec *iov,
|
|
int iovcnt, unsigned flags)
|
|
{
|
|
uint8_t *buf = NULL;
|
|
uint8_t *buffer;
|
|
size_t offset;
|
|
ssize_t ret;
|
|
|
|
if (iovcnt == 1) {
|
|
buffer = iov[0].iov_base;
|
|
offset = iov[0].iov_len;
|
|
} else {
|
|
offset = iov_size(iov, iovcnt);
|
|
if (offset > NET_BUFSIZE) {
|
|
return -1;
|
|
}
|
|
buf = g_malloc(offset);
|
|
buffer = buf;
|
|
offset = iov_to_buf(iov, iovcnt, 0, buf, offset);
|
|
}
|
|
|
|
ret = nc->info->receive(nc, buffer, offset);
|
|
|
|
g_free(buf);
|
|
return ret;
|
|
}
|
|
|
|
static ssize_t qemu_deliver_packet_iov(NetClientState *sender,
|
|
unsigned flags,
|
|
const struct iovec *iov,
|
|
int iovcnt,
|
|
void *opaque)
|
|
{
|
|
MemReentrancyGuard *owned_reentrancy_guard;
|
|
NetClientState *nc = opaque;
|
|
int ret;
|
|
struct virtio_net_hdr_v1_hash vnet_hdr = { };
|
|
g_autofree struct iovec *iov_copy = NULL;
|
|
|
|
|
|
if (nc->link_down) {
|
|
return iov_size(iov, iovcnt);
|
|
}
|
|
|
|
if (nc->receive_disabled) {
|
|
return 0;
|
|
}
|
|
|
|
if (nc->info->type != NET_CLIENT_DRIVER_NIC ||
|
|
qemu_get_nic(nc)->reentrancy_guard->engaged_in_io) {
|
|
owned_reentrancy_guard = NULL;
|
|
} else {
|
|
owned_reentrancy_guard = qemu_get_nic(nc)->reentrancy_guard;
|
|
owned_reentrancy_guard->engaged_in_io = true;
|
|
}
|
|
|
|
if ((flags & QEMU_NET_PACKET_FLAG_RAW) && nc->vnet_hdr_len) {
|
|
iov_copy = g_new(struct iovec, iovcnt + 1);
|
|
iov_copy[0].iov_base = &vnet_hdr;
|
|
iov_copy[0].iov_len = nc->vnet_hdr_len;
|
|
memcpy(&iov_copy[1], iov, iovcnt * sizeof(*iov));
|
|
iov = iov_copy;
|
|
}
|
|
|
|
if (nc->info->receive_iov) {
|
|
ret = nc->info->receive_iov(nc, iov, iovcnt);
|
|
} else {
|
|
ret = nc_sendv_compat(nc, iov, iovcnt, flags);
|
|
}
|
|
|
|
if (owned_reentrancy_guard) {
|
|
owned_reentrancy_guard->engaged_in_io = false;
|
|
}
|
|
|
|
if (ret == 0) {
|
|
nc->receive_disabled = 1;
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
ssize_t qemu_sendv_packet_async(NetClientState *sender,
|
|
const struct iovec *iov, int iovcnt,
|
|
NetPacketSent *sent_cb)
|
|
{
|
|
NetQueue *queue;
|
|
size_t size = iov_size(iov, iovcnt);
|
|
int ret;
|
|
|
|
if (size > NET_BUFSIZE) {
|
|
return size;
|
|
}
|
|
|
|
if (sender->link_down || !sender->peer) {
|
|
return size;
|
|
}
|
|
|
|
/* Let filters handle the packet first */
|
|
ret = filter_receive_iov(sender, NET_FILTER_DIRECTION_TX, sender,
|
|
QEMU_NET_PACKET_FLAG_NONE, iov, iovcnt, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
|
|
ret = filter_receive_iov(sender->peer, NET_FILTER_DIRECTION_RX, sender,
|
|
QEMU_NET_PACKET_FLAG_NONE, iov, iovcnt, sent_cb);
|
|
if (ret) {
|
|
return ret;
|
|
}
|
|
|
|
queue = sender->peer->incoming_queue;
|
|
|
|
return qemu_net_queue_send_iov(queue, sender,
|
|
QEMU_NET_PACKET_FLAG_NONE,
|
|
iov, iovcnt, sent_cb);
|
|
}
|
|
|
|
ssize_t
|
|
qemu_sendv_packet(NetClientState *nc, const struct iovec *iov, int iovcnt)
|
|
{
|
|
return qemu_sendv_packet_async(nc, iov, iovcnt, NULL);
|
|
}
|
|
|
|
NetClientState *qemu_find_netdev(const char *id)
|
|
{
|
|
NetClientState *nc;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (nc->info->type == NET_CLIENT_DRIVER_NIC)
|
|
continue;
|
|
if (!strcmp(nc->name, id)) {
|
|
return nc;
|
|
}
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
int qemu_find_net_clients_except(const char *id, NetClientState **ncs,
|
|
NetClientDriver type, int max)
|
|
{
|
|
NetClientState *nc;
|
|
int ret = 0;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (nc->info->type == type) {
|
|
continue;
|
|
}
|
|
if (!id || !strcmp(nc->name, id)) {
|
|
if (ret < max) {
|
|
ncs[ret] = nc;
|
|
}
|
|
ret++;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int nic_get_free_idx(void)
|
|
{
|
|
int index;
|
|
|
|
for (index = 0; index < MAX_NICS; index++)
|
|
if (!nd_table[index].used)
|
|
return index;
|
|
return -1;
|
|
}
|
|
|
|
GPtrArray *qemu_get_nic_models(const char *device_type)
|
|
{
|
|
GPtrArray *nic_models = g_ptr_array_new();
|
|
GSList *list = object_class_get_list_sorted(device_type, false);
|
|
|
|
while (list) {
|
|
DeviceClass *dc = OBJECT_CLASS_CHECK(DeviceClass, list->data,
|
|
TYPE_DEVICE);
|
|
GSList *next;
|
|
if (test_bit(DEVICE_CATEGORY_NETWORK, dc->categories) &&
|
|
dc->user_creatable) {
|
|
const char *name = object_class_get_name(list->data);
|
|
/*
|
|
* A network device might also be something else than a NIC, see
|
|
* e.g. the "rocker" device. Thus we have to look for the "netdev"
|
|
* property, too. Unfortunately, some devices like virtio-net only
|
|
* create this property during instance_init, so we have to create
|
|
* a temporary instance here to be able to check it.
|
|
*/
|
|
Object *obj = object_new_with_class(OBJECT_CLASS(dc));
|
|
if (object_property_find(obj, "netdev")) {
|
|
g_ptr_array_add(nic_models, (gpointer)name);
|
|
}
|
|
object_unref(obj);
|
|
}
|
|
next = list->next;
|
|
g_slist_free_1(list);
|
|
list = next;
|
|
}
|
|
g_ptr_array_add(nic_models, NULL);
|
|
|
|
return nic_models;
|
|
}
|
|
|
|
static int net_init_nic(const Netdev *netdev, const char *name,
|
|
NetClientState *peer, Error **errp)
|
|
{
|
|
int idx;
|
|
NICInfo *nd;
|
|
const NetLegacyNicOptions *nic;
|
|
|
|
assert(netdev->type == NET_CLIENT_DRIVER_NIC);
|
|
nic = &netdev->u.nic;
|
|
|
|
idx = nic_get_free_idx();
|
|
if (idx == -1 || nb_nics >= MAX_NICS) {
|
|
error_setg(errp, "too many NICs");
|
|
return -1;
|
|
}
|
|
|
|
nd = &nd_table[idx];
|
|
|
|
memset(nd, 0, sizeof(*nd));
|
|
|
|
if (nic->netdev) {
|
|
nd->netdev = qemu_find_netdev(nic->netdev);
|
|
if (!nd->netdev) {
|
|
error_setg(errp, "netdev '%s' not found", nic->netdev);
|
|
return -1;
|
|
}
|
|
} else {
|
|
assert(peer);
|
|
nd->netdev = peer;
|
|
}
|
|
nd->name = g_strdup(name);
|
|
if (nic->model) {
|
|
nd->model = g_strdup(nic->model);
|
|
}
|
|
if (nic->addr) {
|
|
nd->devaddr = g_strdup(nic->addr);
|
|
}
|
|
|
|
if (nic->macaddr &&
|
|
net_parse_macaddr(nd->macaddr.a, nic->macaddr) < 0) {
|
|
error_setg(errp, "invalid syntax for ethernet address");
|
|
return -1;
|
|
}
|
|
if (nic->macaddr &&
|
|
is_multicast_ether_addr(nd->macaddr.a)) {
|
|
error_setg(errp,
|
|
"NIC cannot have multicast MAC address (odd 1st byte)");
|
|
return -1;
|
|
}
|
|
qemu_macaddr_default_if_unset(&nd->macaddr);
|
|
|
|
if (nic->has_vectors) {
|
|
if (nic->vectors > 0x7ffffff) {
|
|
error_setg(errp, "invalid # of vectors: %"PRIu32, nic->vectors);
|
|
return -1;
|
|
}
|
|
nd->nvectors = nic->vectors;
|
|
} else {
|
|
nd->nvectors = DEV_NVECTORS_UNSPECIFIED;
|
|
}
|
|
|
|
nd->used = 1;
|
|
nb_nics++;
|
|
|
|
return idx;
|
|
}
|
|
|
|
static gboolean add_nic_result(gpointer key, gpointer value, gpointer user_data)
|
|
{
|
|
GPtrArray *results = user_data;
|
|
GPtrArray *alias_list = value;
|
|
const char *model = key;
|
|
char *result;
|
|
|
|
if (!alias_list) {
|
|
result = g_strdup(model);
|
|
} else {
|
|
GString *result_str = g_string_new(model);
|
|
int i;
|
|
|
|
g_string_append(result_str, " (aka ");
|
|
for (i = 0; i < alias_list->len; i++) {
|
|
if (i) {
|
|
g_string_append(result_str, ", ");
|
|
}
|
|
g_string_append(result_str, alias_list->pdata[i]);
|
|
}
|
|
g_string_append(result_str, ")");
|
|
result = result_str->str;
|
|
g_string_free(result_str, false);
|
|
g_ptr_array_unref(alias_list);
|
|
}
|
|
g_ptr_array_add(results, result);
|
|
return true;
|
|
}
|
|
|
|
static int model_cmp(char **a, char **b)
|
|
{
|
|
return strcmp(*a, *b);
|
|
}
|
|
|
|
static void show_nic_models(void)
|
|
{
|
|
GPtrArray *results = g_ptr_array_new();
|
|
int i;
|
|
|
|
g_hash_table_foreach_remove(nic_model_help, add_nic_result, results);
|
|
g_ptr_array_sort(results, (GCompareFunc)model_cmp);
|
|
|
|
printf("Available NIC models for this configuration:\n");
|
|
for (i = 0 ; i < results->len; i++) {
|
|
printf("%s\n", (char *)results->pdata[i]);
|
|
}
|
|
g_hash_table_unref(nic_model_help);
|
|
nic_model_help = NULL;
|
|
}
|
|
|
|
static void add_nic_model_help(const char *model, const char *alias)
|
|
{
|
|
GPtrArray *alias_list = NULL;
|
|
|
|
if (g_hash_table_lookup_extended(nic_model_help, model, NULL,
|
|
(gpointer *)&alias_list)) {
|
|
/* Already exists, no alias to add: return */
|
|
if (!alias) {
|
|
return;
|
|
}
|
|
if (alias_list) {
|
|
/* Check if this alias is already in the list. Add if not. */
|
|
if (!g_ptr_array_find_with_equal_func(alias_list, alias,
|
|
g_str_equal, NULL)) {
|
|
g_ptr_array_add(alias_list, g_strdup(alias));
|
|
}
|
|
return;
|
|
}
|
|
}
|
|
/* Either this model wasn't in the list already, or a first alias added */
|
|
if (alias) {
|
|
alias_list = g_ptr_array_new();
|
|
g_ptr_array_set_free_func(alias_list, g_free);
|
|
g_ptr_array_add(alias_list, g_strdup(alias));
|
|
}
|
|
g_hash_table_replace(nic_model_help, g_strdup(model), alias_list);
|
|
}
|
|
|
|
NICInfo *qemu_find_nic_info(const char *typename, bool match_default,
|
|
const char *alias)
|
|
{
|
|
NICInfo *nd;
|
|
int i;
|
|
|
|
if (nic_model_help) {
|
|
add_nic_model_help(typename, alias);
|
|
}
|
|
|
|
for (i = 0; i < nb_nics; i++) {
|
|
nd = &nd_table[i];
|
|
|
|
if (!nd->used || nd->instantiated) {
|
|
continue;
|
|
}
|
|
|
|
if ((match_default && !nd->model) || !g_strcmp0(nd->model, typename)
|
|
|| (alias && !g_strcmp0(nd->model, alias))) {
|
|
return nd;
|
|
}
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
|
|
/* "I have created a device. Please configure it if you can" */
|
|
bool qemu_configure_nic_device(DeviceState *dev, bool match_default,
|
|
const char *alias)
|
|
{
|
|
NICInfo *nd = qemu_find_nic_info(object_get_typename(OBJECT(dev)),
|
|
match_default, alias);
|
|
|
|
if (nd) {
|
|
qdev_set_nic_properties(dev, nd);
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
/* "Please create a device, if you have a configuration for it" */
|
|
DeviceState *qemu_create_nic_device(const char *typename, bool match_default,
|
|
const char *alias)
|
|
{
|
|
NICInfo *nd = qemu_find_nic_info(typename, match_default, alias);
|
|
DeviceState *dev;
|
|
|
|
if (!nd) {
|
|
return NULL;
|
|
}
|
|
|
|
dev = qdev_new(typename);
|
|
qdev_set_nic_properties(dev, nd);
|
|
return dev;
|
|
}
|
|
|
|
void qemu_create_nic_bus_devices(BusState *bus, const char *parent_type,
|
|
const char *default_model,
|
|
const char *alias, const char *alias_target)
|
|
{
|
|
GPtrArray *nic_models = qemu_get_nic_models(parent_type);
|
|
const char *model;
|
|
DeviceState *dev;
|
|
NICInfo *nd;
|
|
int i;
|
|
|
|
if (nic_model_help) {
|
|
if (alias_target) {
|
|
add_nic_model_help(alias_target, alias);
|
|
}
|
|
for (i = 0; i < nic_models->len - 1; i++) {
|
|
add_nic_model_help(nic_models->pdata[i], NULL);
|
|
}
|
|
}
|
|
|
|
/* Drop the NULL terminator which would make g_str_equal() unhappy */
|
|
nic_models->len--;
|
|
|
|
for (i = 0; i < nb_nics; i++) {
|
|
nd = &nd_table[i];
|
|
|
|
if (!nd->used || nd->instantiated) {
|
|
continue;
|
|
}
|
|
|
|
model = nd->model ? nd->model : default_model;
|
|
if (!model) {
|
|
continue;
|
|
}
|
|
|
|
/* Each bus type is allowed *one* substitution */
|
|
if (g_str_equal(model, alias)) {
|
|
model = alias_target;
|
|
}
|
|
|
|
if (!g_ptr_array_find_with_equal_func(nic_models, model,
|
|
g_str_equal, NULL)) {
|
|
/* This NIC does not live on this bus. */
|
|
continue;
|
|
}
|
|
|
|
dev = qdev_new(model);
|
|
qdev_set_nic_properties(dev, nd);
|
|
qdev_realize_and_unref(dev, bus, &error_fatal);
|
|
}
|
|
|
|
g_ptr_array_free(nic_models, true);
|
|
}
|
|
|
|
static int (* const net_client_init_fun[NET_CLIENT_DRIVER__MAX])(
|
|
const Netdev *netdev,
|
|
const char *name,
|
|
NetClientState *peer, Error **errp) = {
|
|
[NET_CLIENT_DRIVER_NIC] = net_init_nic,
|
|
#ifdef CONFIG_SLIRP
|
|
[NET_CLIENT_DRIVER_USER] = net_init_slirp,
|
|
#endif
|
|
[NET_CLIENT_DRIVER_TAP] = net_init_tap,
|
|
[NET_CLIENT_DRIVER_SOCKET] = net_init_socket,
|
|
[NET_CLIENT_DRIVER_STREAM] = net_init_stream,
|
|
[NET_CLIENT_DRIVER_DGRAM] = net_init_dgram,
|
|
#ifdef CONFIG_VDE
|
|
[NET_CLIENT_DRIVER_VDE] = net_init_vde,
|
|
#endif
|
|
#ifdef CONFIG_NETMAP
|
|
[NET_CLIENT_DRIVER_NETMAP] = net_init_netmap,
|
|
#endif
|
|
#ifdef CONFIG_AF_XDP
|
|
[NET_CLIENT_DRIVER_AF_XDP] = net_init_af_xdp,
|
|
#endif
|
|
#ifdef CONFIG_NET_BRIDGE
|
|
[NET_CLIENT_DRIVER_BRIDGE] = net_init_bridge,
|
|
#endif
|
|
[NET_CLIENT_DRIVER_HUBPORT] = net_init_hubport,
|
|
#ifdef CONFIG_VHOST_NET_USER
|
|
[NET_CLIENT_DRIVER_VHOST_USER] = net_init_vhost_user,
|
|
#endif
|
|
#ifdef CONFIG_VHOST_NET_VDPA
|
|
[NET_CLIENT_DRIVER_VHOST_VDPA] = net_init_vhost_vdpa,
|
|
#endif
|
|
#ifdef CONFIG_L2TPV3
|
|
[NET_CLIENT_DRIVER_L2TPV3] = net_init_l2tpv3,
|
|
#endif
|
|
#ifdef CONFIG_VMNET
|
|
[NET_CLIENT_DRIVER_VMNET_HOST] = net_init_vmnet_host,
|
|
[NET_CLIENT_DRIVER_VMNET_SHARED] = net_init_vmnet_shared,
|
|
[NET_CLIENT_DRIVER_VMNET_BRIDGED] = net_init_vmnet_bridged,
|
|
#endif /* CONFIG_VMNET */
|
|
};
|
|
|
|
|
|
static int net_client_init1(const Netdev *netdev, bool is_netdev, Error **errp)
|
|
{
|
|
NetClientState *peer = NULL;
|
|
NetClientState *nc;
|
|
|
|
if (is_netdev) {
|
|
if (netdev->type == NET_CLIENT_DRIVER_NIC ||
|
|
!net_client_init_fun[netdev->type]) {
|
|
error_setg(errp, "network backend '%s' is not compiled into this binary",
|
|
NetClientDriver_str(netdev->type));
|
|
return -1;
|
|
}
|
|
} else {
|
|
if (netdev->type == NET_CLIENT_DRIVER_NONE) {
|
|
return 0; /* nothing to do */
|
|
}
|
|
if (netdev->type == NET_CLIENT_DRIVER_HUBPORT) {
|
|
error_setg(errp, "network backend '%s' is only supported with -netdev/-nic",
|
|
NetClientDriver_str(netdev->type));
|
|
return -1;
|
|
}
|
|
|
|
if (!net_client_init_fun[netdev->type]) {
|
|
error_setg(errp, "network backend '%s' is not compiled into this binary",
|
|
NetClientDriver_str(netdev->type));
|
|
return -1;
|
|
}
|
|
|
|
/* Do not add to a hub if it's a nic with a netdev= parameter. */
|
|
if (netdev->type != NET_CLIENT_DRIVER_NIC ||
|
|
!netdev->u.nic.netdev) {
|
|
peer = net_hub_add_port(0, NULL, NULL);
|
|
}
|
|
}
|
|
|
|
nc = qemu_find_netdev(netdev->id);
|
|
if (nc) {
|
|
error_setg(errp, "Duplicate ID '%s'", netdev->id);
|
|
return -1;
|
|
}
|
|
|
|
if (net_client_init_fun[netdev->type](netdev, netdev->id, peer, errp) < 0) {
|
|
/* FIXME drop when all init functions store an Error */
|
|
if (errp && !*errp) {
|
|
error_setg(errp, "Device '%s' could not be initialized",
|
|
NetClientDriver_str(netdev->type));
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
if (is_netdev) {
|
|
nc = qemu_find_netdev(netdev->id);
|
|
assert(nc);
|
|
nc->is_netdev = true;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
void show_netdevs(void)
|
|
{
|
|
int idx;
|
|
const char *available_netdevs[] = {
|
|
"socket",
|
|
"stream",
|
|
"dgram",
|
|
"hubport",
|
|
"tap",
|
|
#ifdef CONFIG_SLIRP
|
|
"user",
|
|
#endif
|
|
#ifdef CONFIG_L2TPV3
|
|
"l2tpv3",
|
|
#endif
|
|
#ifdef CONFIG_VDE
|
|
"vde",
|
|
#endif
|
|
#ifdef CONFIG_NET_BRIDGE
|
|
"bridge",
|
|
#endif
|
|
#ifdef CONFIG_NETMAP
|
|
"netmap",
|
|
#endif
|
|
#ifdef CONFIG_AF_XDP
|
|
"af-xdp",
|
|
#endif
|
|
#ifdef CONFIG_POSIX
|
|
"vhost-user",
|
|
#endif
|
|
#ifdef CONFIG_VHOST_VDPA
|
|
"vhost-vdpa",
|
|
#endif
|
|
#ifdef CONFIG_VMNET
|
|
"vmnet-host",
|
|
"vmnet-shared",
|
|
"vmnet-bridged",
|
|
#endif
|
|
};
|
|
|
|
qemu_printf("Available netdev backend types:\n");
|
|
for (idx = 0; idx < ARRAY_SIZE(available_netdevs); idx++) {
|
|
qemu_printf("%s\n", available_netdevs[idx]);
|
|
}
|
|
}
|
|
|
|
static int net_client_init(QemuOpts *opts, bool is_netdev, Error **errp)
|
|
{
|
|
gchar **substrings = NULL;
|
|
Netdev *object = NULL;
|
|
int ret = -1;
|
|
Visitor *v = opts_visitor_new(opts);
|
|
|
|
/* Parse convenience option format ipv6-net=fec0::0[/64] */
|
|
const char *ip6_net = qemu_opt_get(opts, "ipv6-net");
|
|
|
|
if (ip6_net) {
|
|
char *prefix_addr;
|
|
unsigned long prefix_len = 64; /* Default 64bit prefix length. */
|
|
|
|
substrings = g_strsplit(ip6_net, "/", 2);
|
|
if (!substrings || !substrings[0]) {
|
|
error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "ipv6-net",
|
|
"a valid IPv6 prefix");
|
|
goto out;
|
|
}
|
|
|
|
prefix_addr = substrings[0];
|
|
|
|
/* Handle user-specified prefix length. */
|
|
if (substrings[1] &&
|
|
qemu_strtoul(substrings[1], NULL, 10, &prefix_len))
|
|
{
|
|
error_setg(errp,
|
|
"parameter 'ipv6-net' expects a number after '/'");
|
|
goto out;
|
|
}
|
|
|
|
qemu_opt_set(opts, "ipv6-prefix", prefix_addr, &error_abort);
|
|
qemu_opt_set_number(opts, "ipv6-prefixlen", prefix_len,
|
|
&error_abort);
|
|
qemu_opt_unset(opts, "ipv6-net");
|
|
}
|
|
|
|
/* Create an ID for -net if the user did not specify one */
|
|
if (!is_netdev && !qemu_opts_id(opts)) {
|
|
qemu_opts_set_id(opts, id_generate(ID_NET));
|
|
}
|
|
|
|
if (visit_type_Netdev(v, NULL, &object, errp)) {
|
|
ret = net_client_init1(object, is_netdev, errp);
|
|
}
|
|
|
|
qapi_free_Netdev(object);
|
|
|
|
out:
|
|
g_strfreev(substrings);
|
|
visit_free(v);
|
|
return ret;
|
|
}
|
|
|
|
void netdev_add(QemuOpts *opts, Error **errp)
|
|
{
|
|
net_client_init(opts, true, errp);
|
|
}
|
|
|
|
void qmp_netdev_add(Netdev *netdev, Error **errp)
|
|
{
|
|
if (!id_wellformed(netdev->id)) {
|
|
error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "id", "an identifier");
|
|
return;
|
|
}
|
|
|
|
net_client_init1(netdev, true, errp);
|
|
}
|
|
|
|
void qmp_netdev_del(const char *id, Error **errp)
|
|
{
|
|
NetClientState *nc;
|
|
QemuOpts *opts;
|
|
|
|
nc = qemu_find_netdev(id);
|
|
if (!nc) {
|
|
error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
|
|
"Device '%s' not found", id);
|
|
return;
|
|
}
|
|
|
|
if (!nc->is_netdev) {
|
|
error_setg(errp, "Device '%s' is not a netdev", id);
|
|
return;
|
|
}
|
|
|
|
qemu_del_net_client(nc);
|
|
|
|
/*
|
|
* Wart: we need to delete the QemuOpts associated with netdevs
|
|
* created via CLI or HMP, to avoid bogus "Duplicate ID" errors in
|
|
* HMP netdev_add.
|
|
*/
|
|
opts = qemu_opts_find(qemu_find_opts("netdev"), id);
|
|
if (opts) {
|
|
qemu_opts_del(opts);
|
|
}
|
|
}
|
|
|
|
static void netfilter_print_info(Monitor *mon, NetFilterState *nf)
|
|
{
|
|
char *str;
|
|
ObjectProperty *prop;
|
|
ObjectPropertyIterator iter;
|
|
Visitor *v;
|
|
|
|
/* generate info str */
|
|
object_property_iter_init(&iter, OBJECT(nf));
|
|
while ((prop = object_property_iter_next(&iter))) {
|
|
if (!strcmp(prop->name, "type")) {
|
|
continue;
|
|
}
|
|
v = string_output_visitor_new(false, &str);
|
|
object_property_get(OBJECT(nf), prop->name, v, NULL);
|
|
visit_complete(v, &str);
|
|
visit_free(v);
|
|
monitor_printf(mon, ",%s=%s", prop->name, str);
|
|
g_free(str);
|
|
}
|
|
monitor_printf(mon, "\n");
|
|
}
|
|
|
|
void print_net_client(Monitor *mon, NetClientState *nc)
|
|
{
|
|
NetFilterState *nf;
|
|
|
|
monitor_printf(mon, "%s: index=%d,type=%s,%s\n", nc->name,
|
|
nc->queue_index,
|
|
NetClientDriver_str(nc->info->type),
|
|
nc->info_str);
|
|
if (!QTAILQ_EMPTY(&nc->filters)) {
|
|
monitor_printf(mon, "filters:\n");
|
|
}
|
|
QTAILQ_FOREACH(nf, &nc->filters, next) {
|
|
monitor_printf(mon, " - %s: type=%s",
|
|
object_get_canonical_path_component(OBJECT(nf)),
|
|
object_get_typename(OBJECT(nf)));
|
|
netfilter_print_info(mon, nf);
|
|
}
|
|
}
|
|
|
|
RxFilterInfoList *qmp_query_rx_filter(const char *name, Error **errp)
|
|
{
|
|
NetClientState *nc;
|
|
RxFilterInfoList *filter_list = NULL, **tail = &filter_list;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
RxFilterInfo *info;
|
|
|
|
if (name && strcmp(nc->name, name) != 0) {
|
|
continue;
|
|
}
|
|
|
|
/* only query rx-filter information of NIC */
|
|
if (nc->info->type != NET_CLIENT_DRIVER_NIC) {
|
|
if (name) {
|
|
error_setg(errp, "net client(%s) isn't a NIC", name);
|
|
assert(!filter_list);
|
|
return NULL;
|
|
}
|
|
continue;
|
|
}
|
|
|
|
/* only query information on queue 0 since the info is per nic,
|
|
* not per queue
|
|
*/
|
|
if (nc->queue_index != 0)
|
|
continue;
|
|
|
|
if (nc->info->query_rx_filter) {
|
|
info = nc->info->query_rx_filter(nc);
|
|
QAPI_LIST_APPEND(tail, info);
|
|
} else if (name) {
|
|
error_setg(errp, "net client(%s) doesn't support"
|
|
" rx-filter querying", name);
|
|
assert(!filter_list);
|
|
return NULL;
|
|
}
|
|
|
|
if (name) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (filter_list == NULL && name) {
|
|
error_setg(errp, "invalid net client name: %s", name);
|
|
}
|
|
|
|
return filter_list;
|
|
}
|
|
|
|
void colo_notify_filters_event(int event, Error **errp)
|
|
{
|
|
NetClientState *nc;
|
|
NetFilterState *nf;
|
|
NetFilterClass *nfc = NULL;
|
|
Error *local_err = NULL;
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
QTAILQ_FOREACH(nf, &nc->filters, next) {
|
|
nfc = NETFILTER_GET_CLASS(OBJECT(nf));
|
|
nfc->handle_event(nf, event, &local_err);
|
|
if (local_err) {
|
|
error_propagate(errp, local_err);
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void qmp_set_link(const char *name, bool up, Error **errp)
|
|
{
|
|
NetClientState *ncs[MAX_QUEUE_NUM];
|
|
NetClientState *nc;
|
|
int queues, i;
|
|
|
|
queues = qemu_find_net_clients_except(name, ncs,
|
|
NET_CLIENT_DRIVER__MAX,
|
|
MAX_QUEUE_NUM);
|
|
|
|
if (queues == 0) {
|
|
error_set(errp, ERROR_CLASS_DEVICE_NOT_FOUND,
|
|
"Device '%s' not found", name);
|
|
return;
|
|
}
|
|
nc = ncs[0];
|
|
|
|
for (i = 0; i < queues; i++) {
|
|
ncs[i]->link_down = !up;
|
|
}
|
|
|
|
if (nc->info->link_status_changed) {
|
|
nc->info->link_status_changed(nc);
|
|
}
|
|
|
|
if (nc->peer) {
|
|
/* Change peer link only if the peer is NIC and then notify peer.
|
|
* If the peer is a HUBPORT or a backend, we do not change the
|
|
* link status.
|
|
*
|
|
* This behavior is compatible with qemu hubs where there could be
|
|
* multiple clients that can still communicate with each other in
|
|
* disconnected mode. For now maintain this compatibility.
|
|
*/
|
|
if (nc->peer->info->type == NET_CLIENT_DRIVER_NIC) {
|
|
for (i = 0; i < queues; i++) {
|
|
ncs[i]->peer->link_down = !up;
|
|
}
|
|
}
|
|
if (nc->peer->info->link_status_changed) {
|
|
nc->peer->info->link_status_changed(nc->peer);
|
|
}
|
|
}
|
|
}
|
|
|
|
static void net_vm_change_state_handler(void *opaque, bool running,
|
|
RunState state)
|
|
{
|
|
NetClientState *nc;
|
|
NetClientState *tmp;
|
|
|
|
QTAILQ_FOREACH_SAFE(nc, &net_clients, next, tmp) {
|
|
if (running) {
|
|
/* Flush queued packets and wake up backends. */
|
|
if (nc->peer && qemu_can_send_packet(nc)) {
|
|
qemu_flush_queued_packets(nc->peer);
|
|
}
|
|
} else {
|
|
/* Complete all queued packets, to guarantee we don't modify
|
|
* state later when VM is not running.
|
|
*/
|
|
qemu_flush_or_purge_queued_packets(nc, true);
|
|
}
|
|
}
|
|
}
|
|
|
|
void net_cleanup(void)
|
|
{
|
|
NetClientState *nc, **p = &QTAILQ_FIRST(&net_clients);
|
|
|
|
/*cleanup colo compare module for COLO*/
|
|
colo_compare_cleanup();
|
|
|
|
/*
|
|
* Walk the net_clients list and remove the netdevs but *not* any
|
|
* NET_CLIENT_DRIVER_NIC entries. The latter are owned by the device
|
|
* model which created them, and in some cases (e.g. xen-net-device)
|
|
* the device itself may do cleanup at exit and will be upset if we
|
|
* just delete its NIC from underneath it.
|
|
*
|
|
* Since qemu_del_net_client() may delete multiple entries, using
|
|
* QTAILQ_FOREACH_SAFE() is not safe here. The only safe pointer
|
|
* to keep as a bookmark is a NET_CLIENT_DRIVER_NIC entry, so keep
|
|
* 'p' pointing to either the head of the list, or the 'next' field
|
|
* of the latest NET_CLIENT_DRIVER_NIC, and operate on *p as we walk
|
|
* the list.
|
|
*
|
|
* The 'nc' variable isn't part of the list traversal; it's purely
|
|
* for convenience as too much '(*p)->' has a tendency to make the
|
|
* readers' eyes bleed.
|
|
*/
|
|
while (*p) {
|
|
nc = *p;
|
|
if (nc->info->type == NET_CLIENT_DRIVER_NIC) {
|
|
/* Skip NET_CLIENT_DRIVER_NIC entries */
|
|
p = &QTAILQ_NEXT(nc, next);
|
|
} else {
|
|
qemu_del_net_client(nc);
|
|
}
|
|
}
|
|
|
|
qemu_del_vm_change_state_handler(net_change_state_entry);
|
|
}
|
|
|
|
void net_check_clients(void)
|
|
{
|
|
NetClientState *nc;
|
|
int i;
|
|
|
|
if (nic_model_help) {
|
|
show_nic_models();
|
|
exit(0);
|
|
}
|
|
net_hub_check_clients();
|
|
|
|
QTAILQ_FOREACH(nc, &net_clients, next) {
|
|
if (!nc->peer) {
|
|
warn_report("%s %s has no peer",
|
|
nc->info->type == NET_CLIENT_DRIVER_NIC
|
|
? "nic" : "netdev",
|
|
nc->name);
|
|
}
|
|
}
|
|
|
|
/* Check that all NICs requested via -net nic actually got created.
|
|
* NICs created via -device don't need to be checked here because
|
|
* they are always instantiated.
|
|
*/
|
|
for (i = 0; i < MAX_NICS; i++) {
|
|
NICInfo *nd = &nd_table[i];
|
|
if (nd->used && !nd->instantiated) {
|
|
warn_report("requested NIC (%s, model %s) "
|
|
"was not created (not supported by this machine?)",
|
|
nd->name ? nd->name : "anonymous",
|
|
nd->model ? nd->model : "unspecified");
|
|
}
|
|
}
|
|
}
|
|
|
|
static int net_init_client(void *dummy, QemuOpts *opts, Error **errp)
|
|
{
|
|
return net_client_init(opts, false, errp);
|
|
}
|
|
|
|
static int net_init_netdev(void *dummy, QemuOpts *opts, Error **errp)
|
|
{
|
|
const char *type = qemu_opt_get(opts, "type");
|
|
|
|
if (type && is_help_option(type)) {
|
|
show_netdevs();
|
|
exit(0);
|
|
}
|
|
return net_client_init(opts, true, errp);
|
|
}
|
|
|
|
/* For the convenience "--nic" parameter */
|
|
static int net_param_nic(void *dummy, QemuOpts *opts, Error **errp)
|
|
{
|
|
char *mac, *nd_id;
|
|
int idx, ret;
|
|
NICInfo *ni;
|
|
const char *type;
|
|
|
|
type = qemu_opt_get(opts, "type");
|
|
if (type) {
|
|
if (g_str_equal(type, "none")) {
|
|
return 0; /* Nothing to do, default_net is cleared in vl.c */
|
|
}
|
|
if (is_help_option(type)) {
|
|
GPtrArray *nic_models = qemu_get_nic_models(TYPE_DEVICE);
|
|
int i;
|
|
show_netdevs();
|
|
printf("\n");
|
|
printf("Available NIC models "
|
|
"(use -nic model=help for a filtered list):\n");
|
|
for (i = 0 ; nic_models->pdata[i]; i++) {
|
|
printf("%s\n", (char *)nic_models->pdata[i]);
|
|
}
|
|
g_ptr_array_free(nic_models, true);
|
|
exit(0);
|
|
}
|
|
}
|
|
|
|
idx = nic_get_free_idx();
|
|
if (idx == -1 || nb_nics >= MAX_NICS) {
|
|
error_setg(errp, "no more on-board/default NIC slots available");
|
|
return -1;
|
|
}
|
|
|
|
if (!type) {
|
|
qemu_opt_set(opts, "type", "user", &error_abort);
|
|
}
|
|
|
|
ni = &nd_table[idx];
|
|
memset(ni, 0, sizeof(*ni));
|
|
ni->model = qemu_opt_get_del(opts, "model");
|
|
|
|
if (!nic_model_help && !g_strcmp0(ni->model, "help")) {
|
|
nic_model_help = g_hash_table_new_full(g_str_hash, g_str_equal,
|
|
g_free, NULL);
|
|
return 0;
|
|
}
|
|
|
|
/* Create an ID if the user did not specify one */
|
|
nd_id = g_strdup(qemu_opts_id(opts));
|
|
if (!nd_id) {
|
|
nd_id = id_generate(ID_NET);
|
|
qemu_opts_set_id(opts, nd_id);
|
|
}
|
|
|
|
/* Handle MAC address */
|
|
mac = qemu_opt_get_del(opts, "mac");
|
|
if (mac) {
|
|
ret = net_parse_macaddr(ni->macaddr.a, mac);
|
|
g_free(mac);
|
|
if (ret) {
|
|
error_setg(errp, "invalid syntax for ethernet address");
|
|
goto out;
|
|
}
|
|
if (is_multicast_ether_addr(ni->macaddr.a)) {
|
|
error_setg(errp, "NIC cannot have multicast MAC address");
|
|
ret = -1;
|
|
goto out;
|
|
}
|
|
}
|
|
qemu_macaddr_default_if_unset(&ni->macaddr);
|
|
|
|
ret = net_client_init(opts, true, errp);
|
|
if (ret == 0) {
|
|
ni->netdev = qemu_find_netdev(nd_id);
|
|
ni->used = true;
|
|
nb_nics++;
|
|
}
|
|
|
|
out:
|
|
g_free(nd_id);
|
|
return ret;
|
|
}
|
|
|
|
static void netdev_init_modern(void)
|
|
{
|
|
while (!QSIMPLEQ_EMPTY(&nd_queue)) {
|
|
NetdevQueueEntry *nd = QSIMPLEQ_FIRST(&nd_queue);
|
|
|
|
QSIMPLEQ_REMOVE_HEAD(&nd_queue, entry);
|
|
loc_push_restore(&nd->loc);
|
|
net_client_init1(nd->nd, true, &error_fatal);
|
|
loc_pop(&nd->loc);
|
|
qapi_free_Netdev(nd->nd);
|
|
g_free(nd);
|
|
}
|
|
}
|
|
|
|
void net_init_clients(void)
|
|
{
|
|
net_change_state_entry =
|
|
qemu_add_vm_change_state_handler(net_vm_change_state_handler, NULL);
|
|
|
|
QTAILQ_INIT(&net_clients);
|
|
|
|
netdev_init_modern();
|
|
|
|
qemu_opts_foreach(qemu_find_opts("netdev"), net_init_netdev, NULL,
|
|
&error_fatal);
|
|
|
|
qemu_opts_foreach(qemu_find_opts("nic"), net_param_nic, NULL,
|
|
&error_fatal);
|
|
|
|
qemu_opts_foreach(qemu_find_opts("net"), net_init_client, NULL,
|
|
&error_fatal);
|
|
}
|
|
|
|
/*
|
|
* Does this -netdev argument use modern rather than traditional syntax?
|
|
* Modern syntax is to be parsed with netdev_parse_modern().
|
|
* Traditional syntax is to be parsed with net_client_parse().
|
|
*/
|
|
bool netdev_is_modern(const char *optstr)
|
|
{
|
|
QemuOpts *opts;
|
|
bool is_modern;
|
|
const char *type;
|
|
static QemuOptsList dummy_opts = {
|
|
.name = "netdev",
|
|
.implied_opt_name = "type",
|
|
.head = QTAILQ_HEAD_INITIALIZER(dummy_opts.head),
|
|
.desc = { { } },
|
|
};
|
|
|
|
if (optstr[0] == '{') {
|
|
/* This is JSON, which means it's modern syntax */
|
|
return true;
|
|
}
|
|
|
|
opts = qemu_opts_create(&dummy_opts, NULL, false, &error_abort);
|
|
qemu_opts_do_parse(opts, optstr, dummy_opts.implied_opt_name,
|
|
&error_abort);
|
|
type = qemu_opt_get(opts, "type");
|
|
is_modern = !g_strcmp0(type, "stream") || !g_strcmp0(type, "dgram");
|
|
|
|
qemu_opts_reset(&dummy_opts);
|
|
|
|
return is_modern;
|
|
}
|
|
|
|
/*
|
|
* netdev_parse_modern() uses modern, more expressive syntax than
|
|
* net_client_parse(), but supports only the -netdev option.
|
|
* netdev_parse_modern() appends to @nd_queue, whereas net_client_parse()
|
|
* appends to @qemu_netdev_opts.
|
|
*/
|
|
void netdev_parse_modern(const char *optstr)
|
|
{
|
|
Visitor *v;
|
|
NetdevQueueEntry *nd;
|
|
|
|
v = qobject_input_visitor_new_str(optstr, "type", &error_fatal);
|
|
nd = g_new(NetdevQueueEntry, 1);
|
|
visit_type_Netdev(v, NULL, &nd->nd, &error_fatal);
|
|
visit_free(v);
|
|
loc_save(&nd->loc);
|
|
|
|
QSIMPLEQ_INSERT_TAIL(&nd_queue, nd, entry);
|
|
}
|
|
|
|
void net_client_parse(QemuOptsList *opts_list, const char *optstr)
|
|
{
|
|
if (!qemu_opts_parse_noisily(opts_list, optstr, true)) {
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
/* From FreeBSD */
|
|
/* XXX: optimize */
|
|
uint32_t net_crc32(const uint8_t *p, int len)
|
|
{
|
|
uint32_t crc;
|
|
int carry, i, j;
|
|
uint8_t b;
|
|
|
|
crc = 0xffffffff;
|
|
for (i = 0; i < len; i++) {
|
|
b = *p++;
|
|
for (j = 0; j < 8; j++) {
|
|
carry = ((crc & 0x80000000L) ? 1 : 0) ^ (b & 0x01);
|
|
crc <<= 1;
|
|
b >>= 1;
|
|
if (carry) {
|
|
crc = ((crc ^ POLYNOMIAL_BE) | carry);
|
|
}
|
|
}
|
|
}
|
|
|
|
return crc;
|
|
}
|
|
|
|
uint32_t net_crc32_le(const uint8_t *p, int len)
|
|
{
|
|
uint32_t crc;
|
|
int carry, i, j;
|
|
uint8_t b;
|
|
|
|
crc = 0xffffffff;
|
|
for (i = 0; i < len; i++) {
|
|
b = *p++;
|
|
for (j = 0; j < 8; j++) {
|
|
carry = (crc & 0x1) ^ (b & 0x01);
|
|
crc >>= 1;
|
|
b >>= 1;
|
|
if (carry) {
|
|
crc ^= POLYNOMIAL_LE;
|
|
}
|
|
}
|
|
}
|
|
|
|
return crc;
|
|
}
|
|
|
|
QemuOptsList qemu_netdev_opts = {
|
|
.name = "netdev",
|
|
.implied_opt_name = "type",
|
|
.head = QTAILQ_HEAD_INITIALIZER(qemu_netdev_opts.head),
|
|
.desc = {
|
|
/*
|
|
* no elements => accept any params
|
|
* validation will happen later
|
|
*/
|
|
{ /* end of list */ }
|
|
},
|
|
};
|
|
|
|
QemuOptsList qemu_nic_opts = {
|
|
.name = "nic",
|
|
.implied_opt_name = "type",
|
|
.head = QTAILQ_HEAD_INITIALIZER(qemu_nic_opts.head),
|
|
.desc = {
|
|
/*
|
|
* no elements => accept any params
|
|
* validation will happen later
|
|
*/
|
|
{ /* end of list */ }
|
|
},
|
|
};
|
|
|
|
QemuOptsList qemu_net_opts = {
|
|
.name = "net",
|
|
.implied_opt_name = "type",
|
|
.head = QTAILQ_HEAD_INITIALIZER(qemu_net_opts.head),
|
|
.desc = {
|
|
/*
|
|
* no elements => accept any params
|
|
* validation will happen later
|
|
*/
|
|
{ /* end of list */ }
|
|
},
|
|
};
|
|
|
|
void net_socket_rs_init(SocketReadState *rs,
|
|
SocketReadStateFinalize *finalize,
|
|
bool vnet_hdr)
|
|
{
|
|
rs->state = 0;
|
|
rs->vnet_hdr = vnet_hdr;
|
|
rs->index = 0;
|
|
rs->packet_len = 0;
|
|
rs->vnet_hdr_len = 0;
|
|
memset(rs->buf, 0, sizeof(rs->buf));
|
|
rs->finalize = finalize;
|
|
}
|
|
|
|
/*
|
|
* Returns
|
|
* 0: success
|
|
* -1: error occurs
|
|
*/
|
|
int net_fill_rstate(SocketReadState *rs, const uint8_t *buf, int size)
|
|
{
|
|
unsigned int l;
|
|
|
|
while (size > 0) {
|
|
/* Reassemble a packet from the network.
|
|
* 0 = getting length.
|
|
* 1 = getting vnet header length.
|
|
* 2 = getting data.
|
|
*/
|
|
switch (rs->state) {
|
|
case 0:
|
|
l = 4 - rs->index;
|
|
if (l > size) {
|
|
l = size;
|
|
}
|
|
memcpy(rs->buf + rs->index, buf, l);
|
|
buf += l;
|
|
size -= l;
|
|
rs->index += l;
|
|
if (rs->index == 4) {
|
|
/* got length */
|
|
rs->packet_len = ntohl(*(uint32_t *)rs->buf);
|
|
rs->index = 0;
|
|
if (rs->vnet_hdr) {
|
|
rs->state = 1;
|
|
} else {
|
|
rs->state = 2;
|
|
rs->vnet_hdr_len = 0;
|
|
}
|
|
}
|
|
break;
|
|
case 1:
|
|
l = 4 - rs->index;
|
|
if (l > size) {
|
|
l = size;
|
|
}
|
|
memcpy(rs->buf + rs->index, buf, l);
|
|
buf += l;
|
|
size -= l;
|
|
rs->index += l;
|
|
if (rs->index == 4) {
|
|
/* got vnet header length */
|
|
rs->vnet_hdr_len = ntohl(*(uint32_t *)rs->buf);
|
|
rs->index = 0;
|
|
rs->state = 2;
|
|
}
|
|
break;
|
|
case 2:
|
|
l = rs->packet_len - rs->index;
|
|
if (l > size) {
|
|
l = size;
|
|
}
|
|
if (rs->index + l <= sizeof(rs->buf)) {
|
|
memcpy(rs->buf + rs->index, buf, l);
|
|
} else {
|
|
fprintf(stderr, "serious error: oversized packet received,"
|
|
"connection terminated.\n");
|
|
rs->index = rs->state = 0;
|
|
return -1;
|
|
}
|
|
|
|
rs->index += l;
|
|
buf += l;
|
|
size -= l;
|
|
if (rs->index >= rs->packet_len) {
|
|
rs->index = 0;
|
|
rs->state = 0;
|
|
assert(rs->finalize);
|
|
rs->finalize(rs);
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
assert(size == 0);
|
|
return 0;
|
|
}
|