NetBSD/sys/net/if_tokensubr.c
ozaki-r 9c4cd06355 Introduce softint-based if_input
This change intends to run the whole network stack in softint context
(or normal LWP), not hardware interrupt context. Note that the work is
still incomplete by this change; to that end, we also have to softint-ify
if_link_state_change (and bpf) which can still run in hardware interrupt.

This change softint-ifies at ifp->if_input that is called from
each device driver (and ieee80211_input) to ensure Layer 2 runs
in softint (e.g., ether_input and bridge_input). To this end,
we provide a framework (called percpuq) that utlizes softint(9)
and percpu ifqueues. With this patch, rxintr of most drivers just
queues received packets and schedules a softint, and the softint
dequeues packets and does rest packet processing.

To minimize changes to each driver, percpuq is allocated in struct
ifnet for now and that is initialized by default (in if_attach).
We probably have to move percpuq to softc of each driver, but it's
future work. At this point, only wm(4) has percpuq in its softc
as a reference implementation.

Additional information including performance numbers can be found
in the thread at tech-kern@ and tech-net@:
http://mail-index.netbsd.org/tech-kern/2016/01/14/msg019997.html

Acknowledgment: riastradh@ greatly helped this work.
Thank you very much!
2016-02-09 08:32:07 +00:00

521 lines
15 KiB
C

/* $NetBSD: if_tokensubr.c,v 1.73 2016/02/09 08:32:12 ozaki-r Exp $ */
/*
* Copyright (c) 1982, 1989, 1993
* The Regents of the University of California. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. Neither the name of the University nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* from: NetBSD: if_fddisubr.c,v 1.2 1995/08/19 04:35:29 cgd Exp
*/
/*
* Copyright (c) 1997-1999 The NetBSD Foundation, Inc.
* All rights reserved.
*
* This code is derived from software contributed to The NetBSD Foundation
* by Onno van der Linden.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
/*
* Copyright (c) 1995
* Matt Thomas. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. The names of its contributors may not be used to endorse or promote
* products derived from this software without specific prior written
* permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* from: NetBSD: if_fddisubr.c,v 1.2 1995/08/19 04:35:29 cgd Exp
*/
#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: if_tokensubr.c,v 1.73 2016/02/09 08:32:12 ozaki-r Exp $");
#ifdef _KERNEL_OPT
#include "opt_inet.h"
#include "opt_atalk.h"
#include "opt_gateway.h"
#endif
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/kernel.h>
#include <sys/malloc.h>
#include <sys/mbuf.h>
#include <sys/protosw.h>
#include <sys/socket.h>
#include <sys/ioctl.h>
#include <sys/errno.h>
#include <sys/syslog.h>
#include <sys/cpu.h>
#include <net/if.h>
#include <net/if_dl.h>
#include <net/if_llatbl.h>
#include <net/if_llc.h>
#include <net/if_types.h>
#include <net/netisr.h>
#include <net/route.h>
#include <net/bpf.h>
#include <net/if_ether.h>
#include <net/if_token.h>
#ifdef INET
#include <netinet/in.h>
#include <netinet/in_var.h>
#include <netinet/if_inarp.h>
#endif
#include "carp.h"
#if NCARP > 0
#include <netinet/ip_carp.h>
#endif
#define senderr(e) { error = (e); goto bad;}
#define RCF_ALLROUTES (2 << 8) | TOKEN_RCF_FRAME2 | TOKEN_RCF_BROADCAST_ALL
#define RCF_SINGLEROUTE (2 << 8) | TOKEN_RCF_FRAME2 | TOKEN_RCF_BROADCAST_SINGLE
static int token_output(struct ifnet *, struct mbuf *,
const struct sockaddr *, struct rtentry *);
static void token_input(struct ifnet *, struct mbuf *);
/*
* Token Ring output routine.
* Encapsulate a packet of type family for the local net.
* Assumes that ifp is actually pointer to arphdr structure.
* XXX route info has to go into the same mbuf as the header
*/
static int
token_output(struct ifnet *ifp0, struct mbuf *m0, const struct sockaddr *dst,
struct rtentry *rt)
{
uint16_t etype;
int error = 0;
u_char edst[ISO88025_ADDR_LEN];
struct mbuf *m = m0;
struct mbuf *mcopy = NULL;
struct token_header *trh;
#ifdef INET
struct arphdr *ah = (struct arphdr *)ifp0;
#endif /* INET */
struct token_rif *rif = NULL;
struct token_rif bcastrif;
struct ifnet *ifp = ifp0;
size_t riflen = 0;
ALTQ_DECL(struct altq_pktattr pktattr;)
#if NCARP > 0
if (ifp->if_type == IFT_CARP) {
struct ifaddr *ifa;
/* loop back if this is going to the carp interface */
if (dst != NULL && ifp0->if_link_state == LINK_STATE_UP &&
(ifa = ifa_ifwithaddr(dst)) != NULL &&
ifa->ifa_ifp == ifp0)
return (looutput(ifp0, m, dst, rt));
ifp = ifp->if_carpdev;
ah = (struct arphdr *)ifp;
if ((ifp0->if_flags & (IFF_UP|IFF_RUNNING)) !=
(IFF_UP|IFF_RUNNING))
senderr(ENETDOWN);
}
#endif /* NCARP > 0 */
if ((ifp->if_flags & (IFF_UP|IFF_RUNNING)) != (IFF_UP|IFF_RUNNING))
senderr(ENETDOWN);
/*
* If the queueing discipline needs packet classification,
* do it before prepending link headers.
*/
IFQ_CLASSIFY(&ifp->if_snd, m, dst->sa_family, &pktattr);
switch (dst->sa_family) {
#ifdef INET
case AF_INET:
if (m->m_flags & M_BCAST) {
if (ifp->if_flags & IFF_LINK0) {
if (ifp->if_flags & IFF_LINK1)
bcastrif.tr_rcf = htons(RCF_ALLROUTES);
else
bcastrif.tr_rcf = htons(RCF_SINGLEROUTE);
rif = &bcastrif;
riflen = sizeof(rif->tr_rcf);
}
memcpy(edst, tokenbroadcastaddr, sizeof(edst));
}
/*
* XXX m->m_flags & M_MCAST IEEE802_MAP_IP_MULTICAST ??
*/
else {
struct llentry *la;
if (!arpresolve(ifp, rt, m, dst, edst))
return (0); /* if not yet resolved */
la = rt->rt_llinfo;
KASSERT(la != NULL);
TOKEN_RIF_LLE_ASSERT(la);
rif = TOKEN_RIF_LLE(la);
riflen = (ntohs(rif->tr_rcf) & TOKEN_RCF_LEN_MASK) >> 8;
}
/* If broadcasting on a simplex interface, loopback a copy. */
if ((m->m_flags & M_BCAST) && (ifp->if_flags & IFF_SIMPLEX))
mcopy = m_copy(m, 0, (int)M_COPYALL);
etype = htons(ETHERTYPE_IP);
break;
case AF_ARP:
/*
* XXX source routing, assume m->m_data contains the useful stuff
*/
ah = mtod(m, struct arphdr *);
ah->ar_hrd = htons(ARPHRD_IEEE802);
switch (ntohs(ah->ar_op)) {
case ARPOP_REVREQUEST:
case ARPOP_REVREPLY:
etype = htons(ETHERTYPE_REVARP);
break;
case ARPOP_REQUEST:
case ARPOP_REPLY:
default:
etype = htons(ETHERTYPE_ARP);
}
if (m->m_flags & M_BCAST) {
if (ifp->if_flags & IFF_LINK0) {
if (ifp->if_flags & IFF_LINK1)
bcastrif.tr_rcf = htons(RCF_ALLROUTES);
else
bcastrif.tr_rcf = htons(RCF_SINGLEROUTE);
rif = &bcastrif;
riflen = sizeof(rif->tr_rcf);
}
memcpy(edst, tokenbroadcastaddr, sizeof(edst));
}
else {
void *tha = ar_tha(ah);
if (tha == NULL)
return 0;
memcpy(edst, tha, sizeof(edst));
trh = (struct token_header *)M_TRHSTART(m);
trh->token_ac = TOKEN_AC;
trh->token_fc = TOKEN_FC;
if (trh->token_shost[0] & TOKEN_RI_PRESENT) {
struct token_rif *trrif;
trrif = TOKEN_RIF(trh);
riflen = (ntohs(trrif->tr_rcf) & TOKEN_RCF_LEN_MASK) >> 8;
}
memcpy((void *)trh->token_dhost, (void *)edst,
sizeof (edst));
memcpy((void *)trh->token_shost, CLLADDR(ifp->if_sadl),
sizeof(trh->token_shost));
if (riflen != 0)
trh->token_shost[0] |= TOKEN_RI_PRESENT;
/*
* compare (m->m_data - m->m_pktdat) with (sizeof(struct token_header) + riflen + ...
*/
m->m_len += (sizeof(*trh) + riflen + LLC_SNAPFRAMELEN);
m->m_data -= (sizeof(*trh) + riflen + LLC_SNAPFRAMELEN);
m->m_pkthdr.len += (sizeof(*trh) + riflen + LLC_SNAPFRAMELEN);
goto send;
}
break;
#endif
case AF_UNSPEC:
{
const struct ether_header *eh;
eh = (const struct ether_header *)dst->sa_data;
memcpy(edst, eh->ether_dhost, sizeof(edst));
if (*edst & 1)
m->m_flags |= (M_BCAST|M_MCAST);
etype = eh->ether_type;
if (m->m_flags & M_BCAST) {
if (ifp->if_flags & IFF_LINK0) {
if (ifp->if_flags & IFF_LINK1)
bcastrif.tr_rcf = htons(RCF_ALLROUTES);
else
bcastrif.tr_rcf = htons(RCF_SINGLEROUTE);
rif = &bcastrif;
riflen = sizeof(bcastrif.tr_rcf);
}
}
break;
}
default:
printf("%s: can't handle af%d\n", ifp->if_xname,
dst->sa_family);
senderr(EAFNOSUPPORT);
}
if (mcopy)
(void) looutput(ifp, mcopy, dst, rt);
if (etype != 0) {
struct llc *l;
M_PREPEND(m, LLC_SNAPFRAMELEN, M_DONTWAIT);
if (m == 0)
senderr(ENOBUFS);
l = mtod(m, struct llc *);
l->llc_control = LLC_UI;
l->llc_dsap = l->llc_ssap = LLC_SNAP_LSAP;
l->llc_snap.org_code[0] = l->llc_snap.org_code[1] =
l->llc_snap.org_code[2] = 0;
memcpy((void *) &l->llc_snap.ether_type, (void *) &etype,
sizeof(uint16_t));
}
/*
* Add local net header. If no space in first mbuf,
* allocate another.
*/
M_PREPEND(m, (riflen + sizeof (*trh)), M_DONTWAIT);
if (m == 0)
senderr(ENOBUFS);
trh = mtod(m, struct token_header *);
trh->token_ac = TOKEN_AC;
trh->token_fc = TOKEN_FC;
memcpy((void *)trh->token_dhost, (void *)edst, sizeof (edst));
memcpy((void *)trh->token_shost, CLLADDR(ifp->if_sadl),
sizeof(trh->token_shost));
if (riflen != 0) {
struct token_rif *trrif;
trh->token_shost[0] |= TOKEN_RI_PRESENT;
trrif = TOKEN_RIF(trh);
memcpy(trrif, rif, riflen);
}
#ifdef INET
send:
#endif
#if NCARP > 0
if (ifp0 != ifp && ifp0->if_type == IFT_CARP) {
memcpy((void *)trh->token_shost, CLLADDR(ifp0->if_sadl),
sizeof(trh->token_shost));
}
#endif /* NCARP > 0 */
return ifq_enqueue(ifp, m ALTQ_COMMA ALTQ_DECL(&pktattr));
bad:
if (m)
m_freem(m);
return (error);
}
/*
* Process a received token ring packet;
* the packet is in the mbuf chain m with
* the token ring header.
*/
static void
token_input(struct ifnet *ifp, struct mbuf *m)
{
pktqueue_t *pktq = NULL;
struct ifqueue *inq = NULL;
struct llc *l;
struct token_header *trh;
int s, lan_hdr_len;
int isr = 0;
if ((ifp->if_flags & IFF_UP) == 0) {
m_freem(m);
return;
}
trh = mtod(m, struct token_header *);
ifp->if_ibytes += m->m_pkthdr.len;
if (memcmp(tokenbroadcastaddr, trh->token_dhost,
sizeof(tokenbroadcastaddr)) == 0)
m->m_flags |= M_BCAST;
else if (trh->token_dhost[0] & 1)
m->m_flags |= M_MCAST;
if (m->m_flags & (M_BCAST|M_MCAST))
ifp->if_imcasts++;
/* Skip past the Token Ring header and RIF. */
lan_hdr_len = sizeof(struct token_header);
if (trh->token_shost[0] & TOKEN_RI_PRESENT) {
struct token_rif *trrif;
trrif = TOKEN_RIF(trh);
lan_hdr_len += (ntohs(trrif->tr_rcf) & TOKEN_RCF_LEN_MASK) >> 8;
}
l = (struct llc *)(mtod(m, uint8_t *) + lan_hdr_len);
switch (l->llc_dsap) {
#if defined(INET)
case LLC_SNAP_LSAP:
{
uint16_t etype;
if (l->llc_control != LLC_UI || l->llc_ssap != LLC_SNAP_LSAP)
goto dropanyway;
if (l->llc_snap.org_code[0] != 0 ||
l->llc_snap.org_code[1] != 0 ||
l->llc_snap.org_code[2] != 0)
goto dropanyway;
etype = ntohs(l->llc_snap.ether_type);
m_adj(m, lan_hdr_len + LLC_SNAPFRAMELEN);
#if NCARP > 0
if (ifp->if_carp && ifp->if_type != IFT_CARP &&
(carp_input(m, (uint8_t *)&trh->token_shost,
(uint8_t *)&trh->token_dhost, l->llc_snap.ether_type) == 0))
return;
#endif /* NCARP > 0 */
switch (etype) {
#ifdef INET
case ETHERTYPE_IP:
pktq = ip_pktq;
break;
case ETHERTYPE_ARP:
isr = NETISR_ARP;
inq = &arpintrq;
break;
#endif
default:
/*
printf("token_input: unknown protocol 0x%x\n", etype);
*/
ifp->if_noproto++;
goto dropanyway;
}
break;
}
#endif /* INET */
default:
/* printf("token_input: unknown dsap 0x%x\n", l->llc_dsap); */
ifp->if_noproto++;
#if defined(INET)
dropanyway:
#endif
m_freem(m);
return;
}
if (__predict_true(pktq)) {
if (__predict_false(!pktq_enqueue(pktq, m, 0))) {
m_freem(m);
}
return;
}
s = splnet();
if (IF_QFULL(inq)) {
IF_DROP(inq);
m_freem(m);
} else {
IF_ENQUEUE(inq, m);
schednetisr(isr);
}
splx(s);
}
/*
* Perform common duties while attaching to interface list
*/
void
token_ifattach(struct ifnet *ifp, void *lla)
{
ifp->if_type = IFT_ISO88025;
ifp->if_hdrlen = 14;
ifp->if_dlt = DLT_IEEE802;
ifp->if_mtu = ISO88025_MTU;
ifp->if_output = token_output;
ifp->_if_input = token_input;
ifp->if_broadcastaddr = tokenbroadcastaddr;
#ifdef IFF_NOTRAILERS
ifp->if_flags |= IFF_NOTRAILERS;
#endif
if_set_sadl(ifp, lla, ISO88025_ADDR_LEN, true);
bpf_attach(ifp, DLT_IEEE802, sizeof(struct token_header));
}
void
token_ifdetach(struct ifnet *ifp)
{
bpf_detach(ifp);
}