///////////////////////////////////////////////////////////////////////// // $Id: eth_tap.cc,v 1.36 2009-04-19 17:25:40 vruppert Exp $ ///////////////////////////////////////////////////////////////////////// // // Copyright (C) 2001 MandrakeSoft S.A. // // MandrakeSoft S.A. // 43, rue d'Aboukir // 75002 Paris - France // http://www.linux-mandrake.com/ // http://www.mandrakesoft.com/ // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU // Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this library; if not, write to the Free Software // Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA // ///////////////////////////////////////////////////////////////////////// // eth_tap.cc - TAP interface by Bryce Denney // // Here's how to get this working. On the host machine: // $ su root // # /sbin/insmod ethertap // Using /lib/modules/2.2.14-5.0/net/ethertap.o // # mknod /dev/tap0 c 36 16 # if not already there // # /sbin/ifconfig tap0 10.0.0.1 // # /sbin/route add -host 10.0.0.2 gw 10.0.0.1 // // Now you have a tap0 device which you can on the ifconfig output. The // tap0 interface has the IP address of 10.0.0.1. The bochs machine will have // the IP address 10.0.0.2. // // Compile a bochs version from March 8, 2002 or later with --enable-ne2000. // Add this ne2k line to your .bochsrc to activate the tap device. // ne2k: ioaddr=0x280, irq=9, mac=fe:fd:00:00:00:01, ethmod=tap, ethdev=tap0 // Don't change the mac or ethmod! // // Boot up DLX Linux in Bochs. Log in as root and then type the following // commands to set up networking: // # ifconfig eth0 10.0.0.2 // # route add -net 10.0.0.0 // # route add default gw 10.0.0.1 // Now you should be able to ping from guest OS to your host machine, if // you give its IP number. I'm still having trouble with pings from the // host machine to the guest, so something is still not right. Symptoms: I // ping from the host to the guest's IP address 10.0.0.2. With tcpdump I can // see the ping going to Bochs, and then the ping reply coming from Bochs. // But the ping program itself does not see the responses....well every // once in a while it does, like 1 in 60 pings. // // host$ ping 10.0.0.2 // PING 10.0.0.2 (10.0.0.2) from 10.0.0.1 : 56(84) bytes of data. // // Netstat output: // 20:29:59.018776 fe:fd:0:0:0:0 fe:fd:0:0:0:1 0800 98: 10.0.0.1 > 10.0.0.2: icmp: echo request // 4500 0054 2800 0000 4001 3ea7 0a00 0001 // 0a00 0002 0800 09d3 a53e 0400 9765 893c // 3949 0000 0809 0a0b 0c0d 0e0f 1011 1213 // 1415 1617 1819 // 20:29:59.023017 fe:fd:0:0:0:1 fe:fd:0:0:0:0 0800 98: 10.0.0.2 > 10.0.0.1: icmp: echo reply // 4500 0054 004a 0000 4001 665d 0a00 0002 // 0a00 0001 0000 11d3 a53e 0400 9765 893c // 3949 0000 0809 0a0b 0c0d 0e0f 1011 1213 // 1415 1617 1819 // // I suspect it may be related to the fact that ping 10.0.0.1 from the // host also doesn't work. Why wouldn't the host respond to its own IP // address on the tap0 device? // // Theoretically, if you set up packet forwarding (with masquerading) on the // host, you should be able to get Bochs talking to anyone on the internet. // // Pavel Dufek (PD), CZ, 2008 - quick & dirty hack for Solaris 10 sparc tap // ala Qemu. // Define BX_PLUGGABLE in files that can be compiled into plugins. For // platforms that require a special tag on exported symbols, BX_PLUGGABLE // is used to know when we are exporting symbols and when we are importing. #define BX_PLUGGABLE #define NO_DEVICE_INCLUDES #include "iodev.h" #if BX_NETWORKING && defined(HAVE_ETHERTAP) #include "eth.h" #define LOG_THIS netdev-> #include #include #include #ifndef __APPLE__ #include #endif #include #include #include #include #include #if defined(__linux__) #include #include #include #elif BX_HAVE_NET_IF_H #include #endif #include #include #include #if defined(__sun__) // Sun/Solaris specific defines/includes #define TUNNEWPPA (('T'<<16) | 0x0001) #include #endif #define BX_ETH_TAP_LOGGING 0 // // Define the class. This is private to this module // class bx_tap_pktmover_c : public eth_pktmover_c { public: bx_tap_pktmover_c(const char *netif, const char *macaddr, eth_rx_handler_t rxh, bx_devmodel_c *dev, const char *script); void sendpkt(void *buf, unsigned io_len); private: int fd; int rx_timer_index; static void rx_timer_handler(void *); void rx_timer (); Bit8u guest_macaddr[6]; #if BX_ETH_TAP_LOGGING FILE *txlog, *txlog_txt, *rxlog, *rxlog_txt; #endif }; // // Define the static class that registers the derived pktmover class, // and allocates one on request. // class bx_tap_locator_c : public eth_locator_c { public: bx_tap_locator_c(void) : eth_locator_c("tap") {} protected: eth_pktmover_c *allocate(const char *netif, const char *macaddr, eth_rx_handler_t rxh, bx_devmodel_c *dev, const char *script) { return (new bx_tap_pktmover_c(netif, macaddr, rxh, dev, script)); } } bx_tap_match; // // Define the methods for the bx_tap_pktmover derived class // // the constructor bx_tap_pktmover_c::bx_tap_pktmover_c(const char *netif, const char *macaddr, eth_rx_handler_t rxh, bx_devmodel_c *dev, const char *script) { int flags; char filename[BX_PATHNAME_LEN]; this->netdev = dev; if (strncmp (netif, "tap", 3) != 0) { BX_PANIC(("eth_tap: interface name (%s) must be tap0..tap15", netif)); } #if defined(__sun__) strcpy(filename,"/dev/tap"); /* PD - device on Solaris is always the same */ #else sprintf(filename, "/dev/%s", netif); #endif #if defined(__linux__) // check if the TAP devices is running, and turn on ARP. This is based // on code from the Mac-On-Linux project. http://http://www.maconlinux.org/ int sock = socket(AF_INET, SOCK_DGRAM, 0); if (sock < 0) { BX_PANIC(("socket creation: %s", strerror(errno))); return; } struct ifreq ifr; memset(&ifr, 0, sizeof(ifr)); strncpy(ifr.ifr_name, netif, sizeof(ifr.ifr_name)); if(ioctl(sock, SIOCGIFFLAGS, &ifr) < 0) { BX_PANIC(("SIOCGIFFLAGS on %s: %s", netif, strerror(errno))); close(sock); return; } if (!(ifr.ifr_flags & IFF_RUNNING)) { BX_PANIC(("%s device is not running", netif)); close(sock); return; } if ((ifr.ifr_flags & IFF_NOARP)){ BX_INFO(("turn on ARP for %s device", netif)); ifr.ifr_flags &= ~IFF_NOARP; if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0) { BX_PANIC(("SIOCSIFFLAGS: %s", strerror(errno))); close(sock); return; } } close(sock); #endif fd = open (filename, O_RDWR); if (fd < 0) { BX_PANIC(("open failed on TAP %s: %s", netif, strerror(errno))); return; } #if defined(__sun__) char *ptr; /* PD - ppa allocation ala qemu */ char my_dev[10]; /* enough ... */ int ppa=-1; struct strioctl strioc_ppa; my_dev[10-1]=0; strncpy(my_dev,netif,10); /* following ptr= does not work with const char* */ if( *my_dev ) { /* find the ppa number X from string tapX */ ptr = my_dev; while( *ptr && !isdigit((int)*ptr) ) ptr++; ppa = atoi(ptr); } /* Assign a new PPA and get its unit number. */ strioc_ppa.ic_cmd = TUNNEWPPA; strioc_ppa.ic_timout = 0; strioc_ppa.ic_len = sizeof(ppa); strioc_ppa.ic_dp = (char *)&ppa; if ((ppa = ioctl (fd, I_STR, &strioc_ppa)) < 0) BX_PANIC(("Can't assign new interface tap%d !",ppa)); #endif /* set O_ASYNC flag so that we can poll with read() */ if ((flags = fcntl(fd, F_GETFL)) < 0) { BX_PANIC(("getflags on tap device: %s", strerror(errno))); } flags |= O_NONBLOCK; if (fcntl(fd, F_SETFL, flags) < 0) { BX_PANIC(("set tap device flags: %s", strerror(errno))); } BX_INFO(("tap network drive: opened %s device", netif)); /* Execute the configuration script */ char intname[IFNAMSIZ]; strcpy(intname,netif); if((script != NULL) && (strcmp(script, "") != 0) && (strcmp(script, "none") != 0)) { if (execute_script(this->netdev, script, intname) < 0) BX_ERROR(("execute script '%s' on %s failed", script, intname)); } // Start the rx poll this->rx_timer_index = bx_pc_system.register_timer(this, this->rx_timer_handler, 1000, 1, 1, "eth_tap"); // continuous, active this->rxh = rxh; memcpy(&guest_macaddr[0], macaddr, 6); #if BX_ETH_TAP_LOGGING // eventually Bryce wants txlog to dump in pcap format so that // tcpdump -r FILE can read it and interpret packets. txlog = fopen("ne2k-tx.log", "wb"); if (!txlog) BX_PANIC(("open ne2k-tx.log failed")); txlog_txt = fopen("ne2k-txdump.txt", "wb"); if (!txlog_txt) BX_PANIC(("open ne2k-txdump.txt failed")); fprintf(txlog_txt, "tap packetmover readable log file\n"); fprintf(txlog_txt, "net IF = %s\n", netif); fprintf(txlog_txt, "MAC address = "); for (int i=0; i<6; i++) fprintf(txlog_txt, "%02x%s", 0xff & macaddr[i], i<5?":" : ""); fprintf(txlog_txt, "\n--\n"); fflush(txlog_txt); rxlog = fopen("ne2k-rx.log", "wb"); if (!rxlog) BX_PANIC(("open ne2k-rx.log failed")); rxlog_txt = fopen("ne2k-rxdump.txt", "wb"); if (!rxlog_txt) BX_PANIC(("open ne2k-rxdump.txt failed")); fprintf(rxlog_txt, "tap packetmover readable log file\n"); fprintf(rxlog_txt, "net IF = %s\n", netif); fprintf(rxlog_txt, "MAC address = "); for (int i=0; i<6; i++) fprintf(rxlog_txt, "%02x%s", 0xff & macaddr[i], i<5?":" : ""); fprintf(rxlog_txt, "\n--\n"); fflush(rxlog_txt); #endif } void bx_tap_pktmover_c::sendpkt(void *buf, unsigned io_len) { Bit8u txbuf[BX_PACKET_BUFSIZE]; txbuf[0] = 0; txbuf[1] = 0; unsigned int size; #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__) || \ defined(__APPLE__) || defined(__OpenBSD__) || defined(__sun__) // Should be fixed for other *BSD memcpy(txbuf, buf, io_len); /* PD - for Sun variant the retry cycle from qemu - mainly to be sure packet is really out */ #if defined(__sun__) int ret; for(;;) { ret=write(fd, txbuf, io_len); if (ret < 0 && (errno == EINTR || errno == EAGAIN)) { } else { size=ret; break; } } #else /* not defined __sun__ */ size = write(fd, txbuf, io_len); #endif /* whole condition about defined __sun__ */ if (size != io_len) { #else /* not bsd/apple/sun style */ memcpy(txbuf+2, buf, io_len); size = write(fd, txbuf, io_len+2); if (size != io_len+2) { #endif BX_PANIC(("write on tap device: %s", strerror(errno))); } else { BX_DEBUG(("wrote %d bytes + ev. 2 byte pad on tap", io_len)); } #if BX_ETH_TAP_LOGGING BX_DEBUG(("sendpkt length %u", io_len)); // dump raw bytes to a file, eventually dump in pcap format so that // tcpdump -r FILE can interpret them for us. int n = fwrite(buf, io_len, 1, txlog); if (n != 1) BX_ERROR(("fwrite to txlog failed, io_len = %u", io_len)); // dump packet in hex into an ascii log file write_pktlog_txt(txlog_txt, (const Bit8u *)buf, io_len, 0); // flush log so that we see the packets as they arrive w/o buffering fflush(txlog); #endif } void bx_tap_pktmover_c::rx_timer_handler(void *this_ptr) { bx_tap_pktmover_c *class_ptr = (bx_tap_pktmover_c *) this_ptr; class_ptr->rx_timer(); } void bx_tap_pktmover_c::rx_timer() { int nbytes; Bit8u buf[BX_PACKET_BUFSIZE]; Bit8u *rxbuf; if (fd<0) return; #if defined(__sun__) struct strbuf sbuf; int f = 0; sbuf.maxlen = sizeof(buf); sbuf.buf = (char *)buf; nbytes = getmsg(fd, NULL, &sbuf, &f) >=0 ? sbuf.len : -1; #else nbytes = read (fd, buf, sizeof(buf)); #endif // hack: discard first two bytes #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__) || defined(__APPLE__) || defined(__sun__) // Should be fixed for other *BSD rxbuf = buf; #else rxbuf = buf+2; nbytes-=2; #endif #if defined(__linux__) // hack: TAP device likes to create an ethernet header which has // the same source and destination address FE:FD:00:00:00:00. // Change the dest address to FE:FD:00:00:00:01. if (!memcmp(&rxbuf[0], &rxbuf[6], 6)) { rxbuf[5] = guest_macaddr[5]; } #endif if (nbytes>0) BX_DEBUG(("tap read returned %d bytes", nbytes)); if (nbytes<0) { if (errno != EAGAIN) BX_ERROR(("tap read error: %s", strerror(errno))); return; } #if BX_ETH_TAP_LOGGING if (nbytes > 0) { BX_DEBUG(("receive packet length %u", nbytes)); // dump raw bytes to a file, eventually dump in pcap format so that // tcpdump -r FILE can interpret them for us. int n = fwrite(rxbuf, nbytes, 1, rxlog); if (n != 1) BX_ERROR(("fwrite to rxlog failed, nbytes = %d", nbytes)); // dump packet in hex into an ascii log file write_pktlog_txt(rxlog_txt, rxbuf, nbytes, 1); // flush log so that we see the packets as they arrive w/o buffering fflush(rxlog); } #endif BX_DEBUG(("eth_tap: got packet: %d bytes, dst=%x:%x:%x:%x:%x:%x, src=%x:%x:%x:%x:%x:%x\n", nbytes, rxbuf[0], rxbuf[1], rxbuf[2], rxbuf[3], rxbuf[4], rxbuf[5], rxbuf[6], rxbuf[7], rxbuf[8], rxbuf[9], rxbuf[10], rxbuf[11])); if (nbytes < 60) { BX_INFO(("packet too short (%d), padding to 60", nbytes)); nbytes = 60; } (*rxh)(netdev, rxbuf, nbytes); } #endif /* if BX_NETWORKING && defined HAVE_ETHERTAP */