15281d757SMark McLoughlin /* 25281d757SMark McLoughlin * QEMU System Emulator 35281d757SMark McLoughlin * 45281d757SMark McLoughlin * Copyright (c) 2003-2008 Fabrice Bellard 55281d757SMark McLoughlin * Copyright (c) 2009 Red Hat, Inc. 65281d757SMark McLoughlin * 75281d757SMark McLoughlin * Permission is hereby granted, free of charge, to any person obtaining a copy 85281d757SMark McLoughlin * of this software and associated documentation files (the "Software"), to deal 95281d757SMark McLoughlin * in the Software without restriction, including without limitation the rights 105281d757SMark McLoughlin * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 115281d757SMark McLoughlin * copies of the Software, and to permit persons to whom the Software is 125281d757SMark McLoughlin * furnished to do so, subject to the following conditions: 135281d757SMark McLoughlin * 145281d757SMark McLoughlin * The above copyright notice and this permission notice shall be included in 155281d757SMark McLoughlin * all copies or substantial portions of the Software. 165281d757SMark McLoughlin * 175281d757SMark McLoughlin * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 185281d757SMark McLoughlin * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 195281d757SMark McLoughlin * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 205281d757SMark McLoughlin * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 215281d757SMark McLoughlin * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 225281d757SMark McLoughlin * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 235281d757SMark McLoughlin * THE SOFTWARE. 245281d757SMark McLoughlin */ 255281d757SMark McLoughlin 265281d757SMark McLoughlin #include "net/tap.h" 275281d757SMark McLoughlin 285281d757SMark McLoughlin #include "config-host.h" 295281d757SMark McLoughlin 305281d757SMark McLoughlin #include <signal.h> 315281d757SMark McLoughlin #include <sys/ioctl.h> 325281d757SMark McLoughlin #include <sys/stat.h> 335281d757SMark McLoughlin #include <sys/wait.h> 345281d757SMark McLoughlin #include <net/if.h> 355281d757SMark McLoughlin 365281d757SMark McLoughlin #include "net.h" 375281d757SMark McLoughlin #include "sysemu.h" 385281d757SMark McLoughlin #include "qemu-char.h" 395281d757SMark McLoughlin #include "qemu-common.h" 405281d757SMark McLoughlin 415281d757SMark McLoughlin #ifdef __linux__ 425281d757SMark McLoughlin #include "net/tap-linux.h" 435281d757SMark McLoughlin #endif 445281d757SMark McLoughlin 455281d757SMark McLoughlin #if !defined(_AIX) 465281d757SMark McLoughlin 475281d757SMark McLoughlin /* Maximum GSO packet size (64k) plus plenty of room for 485281d757SMark McLoughlin * the ethernet and virtio_net headers 495281d757SMark McLoughlin */ 505281d757SMark McLoughlin #define TAP_BUFSIZE (4096 + 65536) 515281d757SMark McLoughlin 525281d757SMark McLoughlin typedef struct TAPState { 535281d757SMark McLoughlin VLANClientState *vc; 545281d757SMark McLoughlin int fd; 555281d757SMark McLoughlin char down_script[1024]; 565281d757SMark McLoughlin char down_script_arg[128]; 575281d757SMark McLoughlin uint8_t buf[TAP_BUFSIZE]; 585281d757SMark McLoughlin unsigned int read_poll : 1; 595281d757SMark McLoughlin unsigned int write_poll : 1; 605281d757SMark McLoughlin unsigned int has_vnet_hdr : 1; 615281d757SMark McLoughlin unsigned int using_vnet_hdr : 1; 625281d757SMark McLoughlin unsigned int has_ufo: 1; 635281d757SMark McLoughlin } TAPState; 645281d757SMark McLoughlin 655281d757SMark McLoughlin static int launch_script(const char *setup_script, const char *ifname, int fd); 665281d757SMark McLoughlin 675281d757SMark McLoughlin static int tap_can_send(void *opaque); 685281d757SMark McLoughlin static void tap_send(void *opaque); 695281d757SMark McLoughlin static void tap_writable(void *opaque); 705281d757SMark McLoughlin 715281d757SMark McLoughlin static void tap_update_fd_handler(TAPState *s) 725281d757SMark McLoughlin { 735281d757SMark McLoughlin qemu_set_fd_handler2(s->fd, 745281d757SMark McLoughlin s->read_poll ? tap_can_send : NULL, 755281d757SMark McLoughlin s->read_poll ? tap_send : NULL, 765281d757SMark McLoughlin s->write_poll ? tap_writable : NULL, 775281d757SMark McLoughlin s); 785281d757SMark McLoughlin } 795281d757SMark McLoughlin 805281d757SMark McLoughlin static void tap_read_poll(TAPState *s, int enable) 815281d757SMark McLoughlin { 825281d757SMark McLoughlin s->read_poll = !!enable; 835281d757SMark McLoughlin tap_update_fd_handler(s); 845281d757SMark McLoughlin } 855281d757SMark McLoughlin 865281d757SMark McLoughlin static void tap_write_poll(TAPState *s, int enable) 875281d757SMark McLoughlin { 885281d757SMark McLoughlin s->write_poll = !!enable; 895281d757SMark McLoughlin tap_update_fd_handler(s); 905281d757SMark McLoughlin } 915281d757SMark McLoughlin 925281d757SMark McLoughlin static void tap_writable(void *opaque) 935281d757SMark McLoughlin { 945281d757SMark McLoughlin TAPState *s = opaque; 955281d757SMark McLoughlin 965281d757SMark McLoughlin tap_write_poll(s, 0); 975281d757SMark McLoughlin 985281d757SMark McLoughlin qemu_flush_queued_packets(s->vc); 995281d757SMark McLoughlin } 1005281d757SMark McLoughlin 1015281d757SMark McLoughlin static ssize_t tap_write_packet(TAPState *s, const struct iovec *iov, int iovcnt) 1025281d757SMark McLoughlin { 1035281d757SMark McLoughlin ssize_t len; 1045281d757SMark McLoughlin 1055281d757SMark McLoughlin do { 1065281d757SMark McLoughlin len = writev(s->fd, iov, iovcnt); 1075281d757SMark McLoughlin } while (len == -1 && errno == EINTR); 1085281d757SMark McLoughlin 1095281d757SMark McLoughlin if (len == -1 && errno == EAGAIN) { 1105281d757SMark McLoughlin tap_write_poll(s, 1); 1115281d757SMark McLoughlin return 0; 1125281d757SMark McLoughlin } 1135281d757SMark McLoughlin 1145281d757SMark McLoughlin return len; 1155281d757SMark McLoughlin } 1165281d757SMark McLoughlin 1175281d757SMark McLoughlin static ssize_t tap_receive_iov(VLANClientState *vc, const struct iovec *iov, 1185281d757SMark McLoughlin int iovcnt) 1195281d757SMark McLoughlin { 1205281d757SMark McLoughlin TAPState *s = vc->opaque; 1215281d757SMark McLoughlin const struct iovec *iovp = iov; 1225281d757SMark McLoughlin struct iovec iov_copy[iovcnt + 1]; 1235281d757SMark McLoughlin struct virtio_net_hdr hdr = { 0, }; 1245281d757SMark McLoughlin 1255281d757SMark McLoughlin if (s->has_vnet_hdr && !s->using_vnet_hdr) { 1265281d757SMark McLoughlin iov_copy[0].iov_base = &hdr; 1275281d757SMark McLoughlin iov_copy[0].iov_len = sizeof(hdr); 1285281d757SMark McLoughlin memcpy(&iov_copy[1], iov, iovcnt * sizeof(*iov)); 1295281d757SMark McLoughlin iovp = iov_copy; 1305281d757SMark McLoughlin iovcnt++; 1315281d757SMark McLoughlin } 1325281d757SMark McLoughlin 1335281d757SMark McLoughlin return tap_write_packet(s, iovp, iovcnt); 1345281d757SMark McLoughlin } 1355281d757SMark McLoughlin 1365281d757SMark McLoughlin static ssize_t tap_receive_raw(VLANClientState *vc, const uint8_t *buf, size_t size) 1375281d757SMark McLoughlin { 1385281d757SMark McLoughlin TAPState *s = vc->opaque; 1395281d757SMark McLoughlin struct iovec iov[2]; 1405281d757SMark McLoughlin int iovcnt = 0; 1415281d757SMark McLoughlin struct virtio_net_hdr hdr = { 0, }; 1425281d757SMark McLoughlin 1435281d757SMark McLoughlin if (s->has_vnet_hdr) { 1445281d757SMark McLoughlin iov[iovcnt].iov_base = &hdr; 1455281d757SMark McLoughlin iov[iovcnt].iov_len = sizeof(hdr); 1465281d757SMark McLoughlin iovcnt++; 1475281d757SMark McLoughlin } 1485281d757SMark McLoughlin 1495281d757SMark McLoughlin iov[iovcnt].iov_base = (char *)buf; 1505281d757SMark McLoughlin iov[iovcnt].iov_len = size; 1515281d757SMark McLoughlin iovcnt++; 1525281d757SMark McLoughlin 1535281d757SMark McLoughlin return tap_write_packet(s, iov, iovcnt); 1545281d757SMark McLoughlin } 1555281d757SMark McLoughlin 1565281d757SMark McLoughlin static ssize_t tap_receive(VLANClientState *vc, const uint8_t *buf, size_t size) 1575281d757SMark McLoughlin { 1585281d757SMark McLoughlin TAPState *s = vc->opaque; 1595281d757SMark McLoughlin struct iovec iov[1]; 1605281d757SMark McLoughlin 1615281d757SMark McLoughlin if (s->has_vnet_hdr && !s->using_vnet_hdr) { 1625281d757SMark McLoughlin return tap_receive_raw(vc, buf, size); 1635281d757SMark McLoughlin } 1645281d757SMark McLoughlin 1655281d757SMark McLoughlin iov[0].iov_base = (char *)buf; 1665281d757SMark McLoughlin iov[0].iov_len = size; 1675281d757SMark McLoughlin 1685281d757SMark McLoughlin return tap_write_packet(s, iov, 1); 1695281d757SMark McLoughlin } 1705281d757SMark McLoughlin 1715281d757SMark McLoughlin static int tap_can_send(void *opaque) 1725281d757SMark McLoughlin { 1735281d757SMark McLoughlin TAPState *s = opaque; 1745281d757SMark McLoughlin 1755281d757SMark McLoughlin return qemu_can_send_packet(s->vc); 1765281d757SMark McLoughlin } 1775281d757SMark McLoughlin 178*966ea5ecSMark McLoughlin #ifndef __sun__ 179*966ea5ecSMark McLoughlin ssize_t tap_read_packet(int tapfd, uint8_t *buf, int maxlen) 1805281d757SMark McLoughlin { 1815281d757SMark McLoughlin return read(tapfd, buf, maxlen); 1825281d757SMark McLoughlin } 1835281d757SMark McLoughlin #endif 1845281d757SMark McLoughlin 1855281d757SMark McLoughlin static void tap_send_completed(VLANClientState *vc, ssize_t len) 1865281d757SMark McLoughlin { 1875281d757SMark McLoughlin TAPState *s = vc->opaque; 1885281d757SMark McLoughlin tap_read_poll(s, 1); 1895281d757SMark McLoughlin } 1905281d757SMark McLoughlin 1915281d757SMark McLoughlin static void tap_send(void *opaque) 1925281d757SMark McLoughlin { 1935281d757SMark McLoughlin TAPState *s = opaque; 1945281d757SMark McLoughlin int size; 1955281d757SMark McLoughlin 1965281d757SMark McLoughlin do { 1975281d757SMark McLoughlin uint8_t *buf = s->buf; 1985281d757SMark McLoughlin 1995281d757SMark McLoughlin size = tap_read_packet(s->fd, s->buf, sizeof(s->buf)); 2005281d757SMark McLoughlin if (size <= 0) { 2015281d757SMark McLoughlin break; 2025281d757SMark McLoughlin } 2035281d757SMark McLoughlin 2045281d757SMark McLoughlin if (s->has_vnet_hdr && !s->using_vnet_hdr) { 2055281d757SMark McLoughlin buf += sizeof(struct virtio_net_hdr); 2065281d757SMark McLoughlin size -= sizeof(struct virtio_net_hdr); 2075281d757SMark McLoughlin } 2085281d757SMark McLoughlin 2095281d757SMark McLoughlin size = qemu_send_packet_async(s->vc, buf, size, tap_send_completed); 2105281d757SMark McLoughlin if (size == 0) { 2115281d757SMark McLoughlin tap_read_poll(s, 0); 2125281d757SMark McLoughlin } 2135281d757SMark McLoughlin } while (size > 0); 2145281d757SMark McLoughlin } 2155281d757SMark McLoughlin 2165281d757SMark McLoughlin /* sndbuf should be set to a value lower than the tx queue 2175281d757SMark McLoughlin * capacity of any destination network interface. 2185281d757SMark McLoughlin * Ethernet NICs generally have txqueuelen=1000, so 1Mb is 2195281d757SMark McLoughlin * a good default, given a 1500 byte MTU. 2205281d757SMark McLoughlin */ 2215281d757SMark McLoughlin #define TAP_DEFAULT_SNDBUF 1024*1024 2225281d757SMark McLoughlin 2235281d757SMark McLoughlin static int tap_set_sndbuf(TAPState *s, QemuOpts *opts) 2245281d757SMark McLoughlin { 2255281d757SMark McLoughlin int sndbuf; 2265281d757SMark McLoughlin 2275281d757SMark McLoughlin sndbuf = qemu_opt_get_size(opts, "sndbuf", TAP_DEFAULT_SNDBUF); 2285281d757SMark McLoughlin if (!sndbuf) { 2295281d757SMark McLoughlin sndbuf = INT_MAX; 2305281d757SMark McLoughlin } 2315281d757SMark McLoughlin 2325281d757SMark McLoughlin if (ioctl(s->fd, TUNSETSNDBUF, &sndbuf) == -1 && qemu_opt_get(opts, "sndbuf")) { 2335281d757SMark McLoughlin qemu_error("TUNSETSNDBUF ioctl failed: %s\n", strerror(errno)); 2345281d757SMark McLoughlin return -1; 2355281d757SMark McLoughlin } 2365281d757SMark McLoughlin return 0; 2375281d757SMark McLoughlin } 2385281d757SMark McLoughlin 2395281d757SMark McLoughlin int tap_has_ufo(VLANClientState *vc) 2405281d757SMark McLoughlin { 2415281d757SMark McLoughlin TAPState *s = vc->opaque; 2425281d757SMark McLoughlin 2435281d757SMark McLoughlin assert(vc->type == NET_CLIENT_TYPE_TAP); 2445281d757SMark McLoughlin 2455281d757SMark McLoughlin return s->has_ufo; 2465281d757SMark McLoughlin } 2475281d757SMark McLoughlin 2485281d757SMark McLoughlin int tap_has_vnet_hdr(VLANClientState *vc) 2495281d757SMark McLoughlin { 2505281d757SMark McLoughlin TAPState *s = vc->opaque; 2515281d757SMark McLoughlin 2525281d757SMark McLoughlin assert(vc->type == NET_CLIENT_TYPE_TAP); 2535281d757SMark McLoughlin 2545281d757SMark McLoughlin return s->has_vnet_hdr; 2555281d757SMark McLoughlin } 2565281d757SMark McLoughlin 2575281d757SMark McLoughlin void tap_using_vnet_hdr(VLANClientState *vc, int using_vnet_hdr) 2585281d757SMark McLoughlin { 2595281d757SMark McLoughlin TAPState *s = vc->opaque; 2605281d757SMark McLoughlin 2615281d757SMark McLoughlin using_vnet_hdr = using_vnet_hdr != 0; 2625281d757SMark McLoughlin 2635281d757SMark McLoughlin assert(vc->type == NET_CLIENT_TYPE_TAP); 2645281d757SMark McLoughlin assert(s->has_vnet_hdr == using_vnet_hdr); 2655281d757SMark McLoughlin 2665281d757SMark McLoughlin s->using_vnet_hdr = using_vnet_hdr; 2675281d757SMark McLoughlin } 2685281d757SMark McLoughlin 2695281d757SMark McLoughlin static int tap_probe_vnet_hdr(int fd) 2705281d757SMark McLoughlin { 2715281d757SMark McLoughlin struct ifreq ifr; 2725281d757SMark McLoughlin 2735281d757SMark McLoughlin if (ioctl(fd, TUNGETIFF, &ifr) != 0) { 2745281d757SMark McLoughlin qemu_error("TUNGETIFF ioctl() failed: %s\n", strerror(errno)); 2755281d757SMark McLoughlin return 0; 2765281d757SMark McLoughlin } 2775281d757SMark McLoughlin 2785281d757SMark McLoughlin return ifr.ifr_flags & IFF_VNET_HDR; 2795281d757SMark McLoughlin } 2805281d757SMark McLoughlin 2815281d757SMark McLoughlin void tap_set_offload(VLANClientState *vc, int csum, int tso4, 2825281d757SMark McLoughlin int tso6, int ecn, int ufo) 2835281d757SMark McLoughlin { 2845281d757SMark McLoughlin TAPState *s = vc->opaque; 2855281d757SMark McLoughlin unsigned int offload = 0; 2865281d757SMark McLoughlin 2875281d757SMark McLoughlin if (csum) { 2885281d757SMark McLoughlin offload |= TUN_F_CSUM; 2895281d757SMark McLoughlin if (tso4) 2905281d757SMark McLoughlin offload |= TUN_F_TSO4; 2915281d757SMark McLoughlin if (tso6) 2925281d757SMark McLoughlin offload |= TUN_F_TSO6; 2935281d757SMark McLoughlin if ((tso4 || tso6) && ecn) 2945281d757SMark McLoughlin offload |= TUN_F_TSO_ECN; 2955281d757SMark McLoughlin if (ufo) 2965281d757SMark McLoughlin offload |= TUN_F_UFO; 2975281d757SMark McLoughlin } 2985281d757SMark McLoughlin 2995281d757SMark McLoughlin if (ioctl(s->fd, TUNSETOFFLOAD, offload) != 0) { 3005281d757SMark McLoughlin offload &= ~TUN_F_UFO; 3015281d757SMark McLoughlin if (ioctl(s->fd, TUNSETOFFLOAD, offload) != 0) { 3025281d757SMark McLoughlin fprintf(stderr, "TUNSETOFFLOAD ioctl() failed: %s\n", 3035281d757SMark McLoughlin strerror(errno)); 3045281d757SMark McLoughlin } 3055281d757SMark McLoughlin } 3065281d757SMark McLoughlin } 3075281d757SMark McLoughlin 3085281d757SMark McLoughlin static void tap_cleanup(VLANClientState *vc) 3095281d757SMark McLoughlin { 3105281d757SMark McLoughlin TAPState *s = vc->opaque; 3115281d757SMark McLoughlin 3125281d757SMark McLoughlin qemu_purge_queued_packets(vc); 3135281d757SMark McLoughlin 3145281d757SMark McLoughlin if (s->down_script[0]) 3155281d757SMark McLoughlin launch_script(s->down_script, s->down_script_arg, s->fd); 3165281d757SMark McLoughlin 3175281d757SMark McLoughlin tap_read_poll(s, 0); 3185281d757SMark McLoughlin tap_write_poll(s, 0); 3195281d757SMark McLoughlin close(s->fd); 3205281d757SMark McLoughlin qemu_free(s); 3215281d757SMark McLoughlin } 3225281d757SMark McLoughlin 3235281d757SMark McLoughlin /* fd support */ 3245281d757SMark McLoughlin 3255281d757SMark McLoughlin static TAPState *net_tap_fd_init(VLANState *vlan, 3265281d757SMark McLoughlin const char *model, 3275281d757SMark McLoughlin const char *name, 3285281d757SMark McLoughlin int fd, 3295281d757SMark McLoughlin int vnet_hdr) 3305281d757SMark McLoughlin { 3315281d757SMark McLoughlin TAPState *s; 3325281d757SMark McLoughlin unsigned int offload; 3335281d757SMark McLoughlin 3345281d757SMark McLoughlin s = qemu_mallocz(sizeof(TAPState)); 3355281d757SMark McLoughlin s->fd = fd; 3365281d757SMark McLoughlin s->has_vnet_hdr = vnet_hdr != 0; 3375281d757SMark McLoughlin s->using_vnet_hdr = 0; 3385281d757SMark McLoughlin s->vc = qemu_new_vlan_client(NET_CLIENT_TYPE_TAP, 3395281d757SMark McLoughlin vlan, NULL, model, name, NULL, 3405281d757SMark McLoughlin tap_receive, tap_receive_raw, 3415281d757SMark McLoughlin tap_receive_iov, tap_cleanup, s); 3425281d757SMark McLoughlin s->has_ufo = 0; 3435281d757SMark McLoughlin /* Check if tap supports UFO */ 3445281d757SMark McLoughlin offload = TUN_F_CSUM | TUN_F_UFO; 3455281d757SMark McLoughlin if (ioctl(s->fd, TUNSETOFFLOAD, offload) == 0) 3465281d757SMark McLoughlin s->has_ufo = 1; 3475281d757SMark McLoughlin tap_set_offload(s->vc, 0, 0, 0, 0, 0); 3485281d757SMark McLoughlin tap_read_poll(s, 1); 3495281d757SMark McLoughlin return s; 3505281d757SMark McLoughlin } 3515281d757SMark McLoughlin 352*966ea5ecSMark McLoughlin #ifdef _AIX 353e7e92325SMark McLoughlin int tap_open(char *ifname, int ifname_size, int *vnet_hdr, int vnet_hdr_required) 3545281d757SMark McLoughlin { 3555281d757SMark McLoughlin fprintf (stderr, "no tap on AIX\n"); 3565281d757SMark McLoughlin return -1; 3575281d757SMark McLoughlin } 3585281d757SMark McLoughlin #else 359e7e92325SMark McLoughlin int tap_open(char *ifname, int ifname_size, int *vnet_hdr, int vnet_hdr_required) 3605281d757SMark McLoughlin { 3615281d757SMark McLoughlin struct ifreq ifr; 3625281d757SMark McLoughlin int fd, ret; 3635281d757SMark McLoughlin 3645281d757SMark McLoughlin TFR(fd = open("/dev/net/tun", O_RDWR)); 3655281d757SMark McLoughlin if (fd < 0) { 3665281d757SMark McLoughlin fprintf(stderr, "warning: could not open /dev/net/tun: no virtual network emulation\n"); 3675281d757SMark McLoughlin return -1; 3685281d757SMark McLoughlin } 3695281d757SMark McLoughlin memset(&ifr, 0, sizeof(ifr)); 3705281d757SMark McLoughlin ifr.ifr_flags = IFF_TAP | IFF_NO_PI; 3715281d757SMark McLoughlin 3725281d757SMark McLoughlin if (*vnet_hdr) { 3735281d757SMark McLoughlin unsigned int features; 3745281d757SMark McLoughlin 3755281d757SMark McLoughlin if (ioctl(fd, TUNGETFEATURES, &features) == 0 && 3765281d757SMark McLoughlin features & IFF_VNET_HDR) { 3775281d757SMark McLoughlin *vnet_hdr = 1; 3785281d757SMark McLoughlin ifr.ifr_flags |= IFF_VNET_HDR; 3795281d757SMark McLoughlin } 3805281d757SMark McLoughlin 3815281d757SMark McLoughlin if (vnet_hdr_required && !*vnet_hdr) { 3825281d757SMark McLoughlin qemu_error("vnet_hdr=1 requested, but no kernel " 3835281d757SMark McLoughlin "support for IFF_VNET_HDR available"); 3845281d757SMark McLoughlin close(fd); 3855281d757SMark McLoughlin return -1; 3865281d757SMark McLoughlin } 3875281d757SMark McLoughlin } 3885281d757SMark McLoughlin 3895281d757SMark McLoughlin if (ifname[0] != '\0') 3905281d757SMark McLoughlin pstrcpy(ifr.ifr_name, IFNAMSIZ, ifname); 3915281d757SMark McLoughlin else 3925281d757SMark McLoughlin pstrcpy(ifr.ifr_name, IFNAMSIZ, "tap%d"); 3935281d757SMark McLoughlin ret = ioctl(fd, TUNSETIFF, (void *) &ifr); 3945281d757SMark McLoughlin if (ret != 0) { 3955281d757SMark McLoughlin fprintf(stderr, "warning: could not configure /dev/net/tun: no virtual network emulation\n"); 3965281d757SMark McLoughlin close(fd); 3975281d757SMark McLoughlin return -1; 3985281d757SMark McLoughlin } 3995281d757SMark McLoughlin pstrcpy(ifname, ifname_size, ifr.ifr_name); 4005281d757SMark McLoughlin fcntl(fd, F_SETFL, O_NONBLOCK); 4015281d757SMark McLoughlin return fd; 4025281d757SMark McLoughlin } 4035281d757SMark McLoughlin #endif 4045281d757SMark McLoughlin 4055281d757SMark McLoughlin static int launch_script(const char *setup_script, const char *ifname, int fd) 4065281d757SMark McLoughlin { 4075281d757SMark McLoughlin sigset_t oldmask, mask; 4085281d757SMark McLoughlin int pid, status; 4095281d757SMark McLoughlin char *args[3]; 4105281d757SMark McLoughlin char **parg; 4115281d757SMark McLoughlin 4125281d757SMark McLoughlin sigemptyset(&mask); 4135281d757SMark McLoughlin sigaddset(&mask, SIGCHLD); 4145281d757SMark McLoughlin sigprocmask(SIG_BLOCK, &mask, &oldmask); 4155281d757SMark McLoughlin 4165281d757SMark McLoughlin /* try to launch network script */ 4175281d757SMark McLoughlin pid = fork(); 4185281d757SMark McLoughlin if (pid == 0) { 4195281d757SMark McLoughlin int open_max = sysconf(_SC_OPEN_MAX), i; 4205281d757SMark McLoughlin 4215281d757SMark McLoughlin for (i = 0; i < open_max; i++) { 4225281d757SMark McLoughlin if (i != STDIN_FILENO && 4235281d757SMark McLoughlin i != STDOUT_FILENO && 4245281d757SMark McLoughlin i != STDERR_FILENO && 4255281d757SMark McLoughlin i != fd) { 4265281d757SMark McLoughlin close(i); 4275281d757SMark McLoughlin } 4285281d757SMark McLoughlin } 4295281d757SMark McLoughlin parg = args; 4305281d757SMark McLoughlin *parg++ = (char *)setup_script; 4315281d757SMark McLoughlin *parg++ = (char *)ifname; 4325281d757SMark McLoughlin *parg++ = NULL; 4335281d757SMark McLoughlin execv(setup_script, args); 4345281d757SMark McLoughlin _exit(1); 4355281d757SMark McLoughlin } else if (pid > 0) { 4365281d757SMark McLoughlin while (waitpid(pid, &status, 0) != pid) { 4375281d757SMark McLoughlin /* loop */ 4385281d757SMark McLoughlin } 4395281d757SMark McLoughlin sigprocmask(SIG_SETMASK, &oldmask, NULL); 4405281d757SMark McLoughlin 4415281d757SMark McLoughlin if (WIFEXITED(status) && WEXITSTATUS(status) == 0) { 4425281d757SMark McLoughlin return 0; 4435281d757SMark McLoughlin } 4445281d757SMark McLoughlin } 4455281d757SMark McLoughlin fprintf(stderr, "%s: could not launch network script\n", setup_script); 4465281d757SMark McLoughlin return -1; 4475281d757SMark McLoughlin } 4485281d757SMark McLoughlin 4495281d757SMark McLoughlin static int net_tap_init(QemuOpts *opts, int *vnet_hdr) 4505281d757SMark McLoughlin { 4515281d757SMark McLoughlin int fd, vnet_hdr_required; 4525281d757SMark McLoughlin char ifname[128] = {0,}; 4535281d757SMark McLoughlin const char *setup_script; 4545281d757SMark McLoughlin 4555281d757SMark McLoughlin if (qemu_opt_get(opts, "ifname")) { 4565281d757SMark McLoughlin pstrcpy(ifname, sizeof(ifname), qemu_opt_get(opts, "ifname")); 4575281d757SMark McLoughlin } 4585281d757SMark McLoughlin 4595281d757SMark McLoughlin *vnet_hdr = qemu_opt_get_bool(opts, "vnet_hdr", 1); 4605281d757SMark McLoughlin if (qemu_opt_get(opts, "vnet_hdr")) { 4615281d757SMark McLoughlin vnet_hdr_required = *vnet_hdr; 4625281d757SMark McLoughlin } else { 4635281d757SMark McLoughlin vnet_hdr_required = 0; 4645281d757SMark McLoughlin } 4655281d757SMark McLoughlin 4665281d757SMark McLoughlin TFR(fd = tap_open(ifname, sizeof(ifname), vnet_hdr, vnet_hdr_required)); 4675281d757SMark McLoughlin if (fd < 0) { 4685281d757SMark McLoughlin return -1; 4695281d757SMark McLoughlin } 4705281d757SMark McLoughlin 4715281d757SMark McLoughlin setup_script = qemu_opt_get(opts, "script"); 4725281d757SMark McLoughlin if (setup_script && 4735281d757SMark McLoughlin setup_script[0] != '\0' && 4745281d757SMark McLoughlin strcmp(setup_script, "no") != 0 && 4755281d757SMark McLoughlin launch_script(setup_script, ifname, fd)) { 4765281d757SMark McLoughlin close(fd); 4775281d757SMark McLoughlin return -1; 4785281d757SMark McLoughlin } 4795281d757SMark McLoughlin 4805281d757SMark McLoughlin qemu_opt_set(opts, "ifname", ifname); 4815281d757SMark McLoughlin 4825281d757SMark McLoughlin return fd; 4835281d757SMark McLoughlin } 4845281d757SMark McLoughlin 4855281d757SMark McLoughlin int net_init_tap(QemuOpts *opts, Monitor *mon, const char *name, VLANState *vlan) 4865281d757SMark McLoughlin { 4875281d757SMark McLoughlin TAPState *s; 4885281d757SMark McLoughlin int fd, vnet_hdr; 4895281d757SMark McLoughlin 4905281d757SMark McLoughlin if (qemu_opt_get(opts, "fd")) { 4915281d757SMark McLoughlin if (qemu_opt_get(opts, "ifname") || 4925281d757SMark McLoughlin qemu_opt_get(opts, "script") || 4935281d757SMark McLoughlin qemu_opt_get(opts, "downscript") || 4945281d757SMark McLoughlin qemu_opt_get(opts, "vnet_hdr")) { 4955281d757SMark McLoughlin qemu_error("ifname=, script=, downscript= and vnet_hdr= is invalid with fd=\n"); 4965281d757SMark McLoughlin return -1; 4975281d757SMark McLoughlin } 4985281d757SMark McLoughlin 4995281d757SMark McLoughlin fd = net_handle_fd_param(mon, qemu_opt_get(opts, "fd")); 5005281d757SMark McLoughlin if (fd == -1) { 5015281d757SMark McLoughlin return -1; 5025281d757SMark McLoughlin } 5035281d757SMark McLoughlin 5045281d757SMark McLoughlin fcntl(fd, F_SETFL, O_NONBLOCK); 5055281d757SMark McLoughlin 5065281d757SMark McLoughlin vnet_hdr = tap_probe_vnet_hdr(fd); 5075281d757SMark McLoughlin } else { 5085281d757SMark McLoughlin if (!qemu_opt_get(opts, "script")) { 5095281d757SMark McLoughlin qemu_opt_set(opts, "script", DEFAULT_NETWORK_SCRIPT); 5105281d757SMark McLoughlin } 5115281d757SMark McLoughlin 5125281d757SMark McLoughlin if (!qemu_opt_get(opts, "downscript")) { 5135281d757SMark McLoughlin qemu_opt_set(opts, "downscript", DEFAULT_NETWORK_DOWN_SCRIPT); 5145281d757SMark McLoughlin } 5155281d757SMark McLoughlin 5165281d757SMark McLoughlin fd = net_tap_init(opts, &vnet_hdr); 5175281d757SMark McLoughlin } 5185281d757SMark McLoughlin 5195281d757SMark McLoughlin s = net_tap_fd_init(vlan, "tap", name, fd, vnet_hdr); 5205281d757SMark McLoughlin if (!s) { 5215281d757SMark McLoughlin close(fd); 5225281d757SMark McLoughlin return -1; 5235281d757SMark McLoughlin } 5245281d757SMark McLoughlin 5255281d757SMark McLoughlin if (tap_set_sndbuf(s, opts) < 0) { 5265281d757SMark McLoughlin return -1; 5275281d757SMark McLoughlin } 5285281d757SMark McLoughlin 5295281d757SMark McLoughlin if (qemu_opt_get(opts, "fd")) { 5305281d757SMark McLoughlin snprintf(s->vc->info_str, sizeof(s->vc->info_str), "fd=%d", fd); 5315281d757SMark McLoughlin } else { 5325281d757SMark McLoughlin const char *ifname, *script, *downscript; 5335281d757SMark McLoughlin 5345281d757SMark McLoughlin ifname = qemu_opt_get(opts, "ifname"); 5355281d757SMark McLoughlin script = qemu_opt_get(opts, "script"); 5365281d757SMark McLoughlin downscript = qemu_opt_get(opts, "downscript"); 5375281d757SMark McLoughlin 5385281d757SMark McLoughlin snprintf(s->vc->info_str, sizeof(s->vc->info_str), 5395281d757SMark McLoughlin "ifname=%s,script=%s,downscript=%s", 5405281d757SMark McLoughlin ifname, script, downscript); 5415281d757SMark McLoughlin 5425281d757SMark McLoughlin if (strcmp(downscript, "no") != 0) { 5435281d757SMark McLoughlin snprintf(s->down_script, sizeof(s->down_script), "%s", downscript); 5445281d757SMark McLoughlin snprintf(s->down_script_arg, sizeof(s->down_script_arg), "%s", ifname); 5455281d757SMark McLoughlin } 5465281d757SMark McLoughlin } 5475281d757SMark McLoughlin 5485281d757SMark McLoughlin if (vlan) { 5495281d757SMark McLoughlin vlan->nb_host_devs++; 5505281d757SMark McLoughlin } 5515281d757SMark McLoughlin 5525281d757SMark McLoughlin return 0; 5535281d757SMark McLoughlin } 5545281d757SMark McLoughlin 5555281d757SMark McLoughlin #endif /* !defined(_AIX) */ 556