xref: /qemu/net/tap.c (revision 966ea5ec4fb14d4b420715e7aadc5dfd3ea5add2)
15281d757SMark McLoughlin /*
25281d757SMark McLoughlin  * QEMU System Emulator
35281d757SMark McLoughlin  *
45281d757SMark McLoughlin  * Copyright (c) 2003-2008 Fabrice Bellard
55281d757SMark McLoughlin  * Copyright (c) 2009 Red Hat, Inc.
65281d757SMark McLoughlin  *
75281d757SMark McLoughlin  * Permission is hereby granted, free of charge, to any person obtaining a copy
85281d757SMark McLoughlin  * of this software and associated documentation files (the "Software"), to deal
95281d757SMark McLoughlin  * in the Software without restriction, including without limitation the rights
105281d757SMark McLoughlin  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
115281d757SMark McLoughlin  * copies of the Software, and to permit persons to whom the Software is
125281d757SMark McLoughlin  * furnished to do so, subject to the following conditions:
135281d757SMark McLoughlin  *
145281d757SMark McLoughlin  * The above copyright notice and this permission notice shall be included in
155281d757SMark McLoughlin  * all copies or substantial portions of the Software.
165281d757SMark McLoughlin  *
175281d757SMark McLoughlin  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
185281d757SMark McLoughlin  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
195281d757SMark McLoughlin  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
205281d757SMark McLoughlin  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
215281d757SMark McLoughlin  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
225281d757SMark McLoughlin  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
235281d757SMark McLoughlin  * THE SOFTWARE.
245281d757SMark McLoughlin  */
255281d757SMark McLoughlin 
265281d757SMark McLoughlin #include "net/tap.h"
275281d757SMark McLoughlin 
285281d757SMark McLoughlin #include "config-host.h"
295281d757SMark McLoughlin 
305281d757SMark McLoughlin #include <signal.h>
315281d757SMark McLoughlin #include <sys/ioctl.h>
325281d757SMark McLoughlin #include <sys/stat.h>
335281d757SMark McLoughlin #include <sys/wait.h>
345281d757SMark McLoughlin #include <net/if.h>
355281d757SMark McLoughlin 
365281d757SMark McLoughlin #include "net.h"
375281d757SMark McLoughlin #include "sysemu.h"
385281d757SMark McLoughlin #include "qemu-char.h"
395281d757SMark McLoughlin #include "qemu-common.h"
405281d757SMark McLoughlin 
415281d757SMark McLoughlin #ifdef __linux__
425281d757SMark McLoughlin #include "net/tap-linux.h"
435281d757SMark McLoughlin #endif
445281d757SMark McLoughlin 
455281d757SMark McLoughlin #if !defined(_AIX)
465281d757SMark McLoughlin 
/* Size of the tap read buffer: the largest GSO packet (64k) together with
 * generous headroom for the ethernet and virtio_net headers.
 */
#define TAP_BUFSIZE (65536 + 4096)
515281d757SMark McLoughlin 
525281d757SMark McLoughlin typedef struct TAPState {
535281d757SMark McLoughlin     VLANClientState *vc;
545281d757SMark McLoughlin     int fd;
555281d757SMark McLoughlin     char down_script[1024];
565281d757SMark McLoughlin     char down_script_arg[128];
575281d757SMark McLoughlin     uint8_t buf[TAP_BUFSIZE];
585281d757SMark McLoughlin     unsigned int read_poll : 1;
595281d757SMark McLoughlin     unsigned int write_poll : 1;
605281d757SMark McLoughlin     unsigned int has_vnet_hdr : 1;
615281d757SMark McLoughlin     unsigned int using_vnet_hdr : 1;
625281d757SMark McLoughlin     unsigned int has_ufo: 1;
635281d757SMark McLoughlin } TAPState;
645281d757SMark McLoughlin 
655281d757SMark McLoughlin static int launch_script(const char *setup_script, const char *ifname, int fd);
665281d757SMark McLoughlin 
675281d757SMark McLoughlin static int tap_can_send(void *opaque);
685281d757SMark McLoughlin static void tap_send(void *opaque);
695281d757SMark McLoughlin static void tap_writable(void *opaque);
705281d757SMark McLoughlin 
715281d757SMark McLoughlin static void tap_update_fd_handler(TAPState *s)
725281d757SMark McLoughlin {
735281d757SMark McLoughlin     qemu_set_fd_handler2(s->fd,
745281d757SMark McLoughlin                          s->read_poll  ? tap_can_send : NULL,
755281d757SMark McLoughlin                          s->read_poll  ? tap_send     : NULL,
765281d757SMark McLoughlin                          s->write_poll ? tap_writable : NULL,
775281d757SMark McLoughlin                          s);
785281d757SMark McLoughlin }
795281d757SMark McLoughlin 
805281d757SMark McLoughlin static void tap_read_poll(TAPState *s, int enable)
815281d757SMark McLoughlin {
825281d757SMark McLoughlin     s->read_poll = !!enable;
835281d757SMark McLoughlin     tap_update_fd_handler(s);
845281d757SMark McLoughlin }
855281d757SMark McLoughlin 
865281d757SMark McLoughlin static void tap_write_poll(TAPState *s, int enable)
875281d757SMark McLoughlin {
885281d757SMark McLoughlin     s->write_poll = !!enable;
895281d757SMark McLoughlin     tap_update_fd_handler(s);
905281d757SMark McLoughlin }
915281d757SMark McLoughlin 
925281d757SMark McLoughlin static void tap_writable(void *opaque)
935281d757SMark McLoughlin {
945281d757SMark McLoughlin     TAPState *s = opaque;
955281d757SMark McLoughlin 
965281d757SMark McLoughlin     tap_write_poll(s, 0);
975281d757SMark McLoughlin 
985281d757SMark McLoughlin     qemu_flush_queued_packets(s->vc);
995281d757SMark McLoughlin }
1005281d757SMark McLoughlin 
1015281d757SMark McLoughlin static ssize_t tap_write_packet(TAPState *s, const struct iovec *iov, int iovcnt)
1025281d757SMark McLoughlin {
1035281d757SMark McLoughlin     ssize_t len;
1045281d757SMark McLoughlin 
1055281d757SMark McLoughlin     do {
1065281d757SMark McLoughlin         len = writev(s->fd, iov, iovcnt);
1075281d757SMark McLoughlin     } while (len == -1 && errno == EINTR);
1085281d757SMark McLoughlin 
1095281d757SMark McLoughlin     if (len == -1 && errno == EAGAIN) {
1105281d757SMark McLoughlin         tap_write_poll(s, 1);
1115281d757SMark McLoughlin         return 0;
1125281d757SMark McLoughlin     }
1135281d757SMark McLoughlin 
1145281d757SMark McLoughlin     return len;
1155281d757SMark McLoughlin }
1165281d757SMark McLoughlin 
1175281d757SMark McLoughlin static ssize_t tap_receive_iov(VLANClientState *vc, const struct iovec *iov,
1185281d757SMark McLoughlin                                int iovcnt)
1195281d757SMark McLoughlin {
1205281d757SMark McLoughlin     TAPState *s = vc->opaque;
1215281d757SMark McLoughlin     const struct iovec *iovp = iov;
1225281d757SMark McLoughlin     struct iovec iov_copy[iovcnt + 1];
1235281d757SMark McLoughlin     struct virtio_net_hdr hdr = { 0, };
1245281d757SMark McLoughlin 
1255281d757SMark McLoughlin     if (s->has_vnet_hdr && !s->using_vnet_hdr) {
1265281d757SMark McLoughlin         iov_copy[0].iov_base = &hdr;
1275281d757SMark McLoughlin         iov_copy[0].iov_len =  sizeof(hdr);
1285281d757SMark McLoughlin         memcpy(&iov_copy[1], iov, iovcnt * sizeof(*iov));
1295281d757SMark McLoughlin         iovp = iov_copy;
1305281d757SMark McLoughlin         iovcnt++;
1315281d757SMark McLoughlin     }
1325281d757SMark McLoughlin 
1335281d757SMark McLoughlin     return tap_write_packet(s, iovp, iovcnt);
1345281d757SMark McLoughlin }
1355281d757SMark McLoughlin 
1365281d757SMark McLoughlin static ssize_t tap_receive_raw(VLANClientState *vc, const uint8_t *buf, size_t size)
1375281d757SMark McLoughlin {
1385281d757SMark McLoughlin     TAPState *s = vc->opaque;
1395281d757SMark McLoughlin     struct iovec iov[2];
1405281d757SMark McLoughlin     int iovcnt = 0;
1415281d757SMark McLoughlin     struct virtio_net_hdr hdr = { 0, };
1425281d757SMark McLoughlin 
1435281d757SMark McLoughlin     if (s->has_vnet_hdr) {
1445281d757SMark McLoughlin         iov[iovcnt].iov_base = &hdr;
1455281d757SMark McLoughlin         iov[iovcnt].iov_len  = sizeof(hdr);
1465281d757SMark McLoughlin         iovcnt++;
1475281d757SMark McLoughlin     }
1485281d757SMark McLoughlin 
1495281d757SMark McLoughlin     iov[iovcnt].iov_base = (char *)buf;
1505281d757SMark McLoughlin     iov[iovcnt].iov_len  = size;
1515281d757SMark McLoughlin     iovcnt++;
1525281d757SMark McLoughlin 
1535281d757SMark McLoughlin     return tap_write_packet(s, iov, iovcnt);
1545281d757SMark McLoughlin }
1555281d757SMark McLoughlin 
1565281d757SMark McLoughlin static ssize_t tap_receive(VLANClientState *vc, const uint8_t *buf, size_t size)
1575281d757SMark McLoughlin {
1585281d757SMark McLoughlin     TAPState *s = vc->opaque;
1595281d757SMark McLoughlin     struct iovec iov[1];
1605281d757SMark McLoughlin 
1615281d757SMark McLoughlin     if (s->has_vnet_hdr && !s->using_vnet_hdr) {
1625281d757SMark McLoughlin         return tap_receive_raw(vc, buf, size);
1635281d757SMark McLoughlin     }
1645281d757SMark McLoughlin 
1655281d757SMark McLoughlin     iov[0].iov_base = (char *)buf;
1665281d757SMark McLoughlin     iov[0].iov_len  = size;
1675281d757SMark McLoughlin 
1685281d757SMark McLoughlin     return tap_write_packet(s, iov, 1);
1695281d757SMark McLoughlin }
1705281d757SMark McLoughlin 
1715281d757SMark McLoughlin static int tap_can_send(void *opaque)
1725281d757SMark McLoughlin {
1735281d757SMark McLoughlin     TAPState *s = opaque;
1745281d757SMark McLoughlin 
1755281d757SMark McLoughlin     return qemu_can_send_packet(s->vc);
1765281d757SMark McLoughlin }
1775281d757SMark McLoughlin 
#ifndef __sun__
/* Read up to maxlen bytes from tapfd into buf and return the read() result.
 * Compiled only when __sun__ is not defined.
 */
ssize_t tap_read_packet(int tapfd, uint8_t *buf, int maxlen)
{
    ssize_t nread = read(tapfd, buf, maxlen);

    return nread;
}
#endif
1845281d757SMark McLoughlin 
1855281d757SMark McLoughlin static void tap_send_completed(VLANClientState *vc, ssize_t len)
1865281d757SMark McLoughlin {
1875281d757SMark McLoughlin     TAPState *s = vc->opaque;
1885281d757SMark McLoughlin     tap_read_poll(s, 1);
1895281d757SMark McLoughlin }
1905281d757SMark McLoughlin 
1915281d757SMark McLoughlin static void tap_send(void *opaque)
1925281d757SMark McLoughlin {
1935281d757SMark McLoughlin     TAPState *s = opaque;
1945281d757SMark McLoughlin     int size;
1955281d757SMark McLoughlin 
1965281d757SMark McLoughlin     do {
1975281d757SMark McLoughlin         uint8_t *buf = s->buf;
1985281d757SMark McLoughlin 
1995281d757SMark McLoughlin         size = tap_read_packet(s->fd, s->buf, sizeof(s->buf));
2005281d757SMark McLoughlin         if (size <= 0) {
2015281d757SMark McLoughlin             break;
2025281d757SMark McLoughlin         }
2035281d757SMark McLoughlin 
2045281d757SMark McLoughlin         if (s->has_vnet_hdr && !s->using_vnet_hdr) {
2055281d757SMark McLoughlin             buf  += sizeof(struct virtio_net_hdr);
2065281d757SMark McLoughlin             size -= sizeof(struct virtio_net_hdr);
2075281d757SMark McLoughlin         }
2085281d757SMark McLoughlin 
2095281d757SMark McLoughlin         size = qemu_send_packet_async(s->vc, buf, size, tap_send_completed);
2105281d757SMark McLoughlin         if (size == 0) {
2115281d757SMark McLoughlin             tap_read_poll(s, 0);
2125281d757SMark McLoughlin         }
2135281d757SMark McLoughlin     } while (size > 0);
2145281d757SMark McLoughlin }
2155281d757SMark McLoughlin 
/* sndbuf should be set to a value lower than the tx queue
 * capacity of any destination network interface.
 * Ethernet NICs generally have txqueuelen=1000, so 1Mb is
 * a good default, given a 1500 byte MTU.
 *
 * The expansion is parenthesized so the macro evaluates as a single value
 * inside any larger expression.
 */
#define TAP_DEFAULT_SNDBUF (1024 * 1024)
2225281d757SMark McLoughlin 
2235281d757SMark McLoughlin static int tap_set_sndbuf(TAPState *s, QemuOpts *opts)
2245281d757SMark McLoughlin {
2255281d757SMark McLoughlin     int sndbuf;
2265281d757SMark McLoughlin 
2275281d757SMark McLoughlin     sndbuf = qemu_opt_get_size(opts, "sndbuf", TAP_DEFAULT_SNDBUF);
2285281d757SMark McLoughlin     if (!sndbuf) {
2295281d757SMark McLoughlin         sndbuf = INT_MAX;
2305281d757SMark McLoughlin     }
2315281d757SMark McLoughlin 
2325281d757SMark McLoughlin     if (ioctl(s->fd, TUNSETSNDBUF, &sndbuf) == -1 && qemu_opt_get(opts, "sndbuf")) {
2335281d757SMark McLoughlin         qemu_error("TUNSETSNDBUF ioctl failed: %s\n", strerror(errno));
2345281d757SMark McLoughlin         return -1;
2355281d757SMark McLoughlin     }
2365281d757SMark McLoughlin     return 0;
2375281d757SMark McLoughlin }
2385281d757SMark McLoughlin 
2395281d757SMark McLoughlin int tap_has_ufo(VLANClientState *vc)
2405281d757SMark McLoughlin {
2415281d757SMark McLoughlin     TAPState *s = vc->opaque;
2425281d757SMark McLoughlin 
2435281d757SMark McLoughlin     assert(vc->type == NET_CLIENT_TYPE_TAP);
2445281d757SMark McLoughlin 
2455281d757SMark McLoughlin     return s->has_ufo;
2465281d757SMark McLoughlin }
2475281d757SMark McLoughlin 
2485281d757SMark McLoughlin int tap_has_vnet_hdr(VLANClientState *vc)
2495281d757SMark McLoughlin {
2505281d757SMark McLoughlin     TAPState *s = vc->opaque;
2515281d757SMark McLoughlin 
2525281d757SMark McLoughlin     assert(vc->type == NET_CLIENT_TYPE_TAP);
2535281d757SMark McLoughlin 
2545281d757SMark McLoughlin     return s->has_vnet_hdr;
2555281d757SMark McLoughlin }
2565281d757SMark McLoughlin 
2575281d757SMark McLoughlin void tap_using_vnet_hdr(VLANClientState *vc, int using_vnet_hdr)
2585281d757SMark McLoughlin {
2595281d757SMark McLoughlin     TAPState *s = vc->opaque;
2605281d757SMark McLoughlin 
2615281d757SMark McLoughlin     using_vnet_hdr = using_vnet_hdr != 0;
2625281d757SMark McLoughlin 
2635281d757SMark McLoughlin     assert(vc->type == NET_CLIENT_TYPE_TAP);
2645281d757SMark McLoughlin     assert(s->has_vnet_hdr == using_vnet_hdr);
2655281d757SMark McLoughlin 
2665281d757SMark McLoughlin     s->using_vnet_hdr = using_vnet_hdr;
2675281d757SMark McLoughlin }
2685281d757SMark McLoughlin 
2695281d757SMark McLoughlin static int tap_probe_vnet_hdr(int fd)
2705281d757SMark McLoughlin {
2715281d757SMark McLoughlin     struct ifreq ifr;
2725281d757SMark McLoughlin 
2735281d757SMark McLoughlin     if (ioctl(fd, TUNGETIFF, &ifr) != 0) {
2745281d757SMark McLoughlin         qemu_error("TUNGETIFF ioctl() failed: %s\n", strerror(errno));
2755281d757SMark McLoughlin         return 0;
2765281d757SMark McLoughlin     }
2775281d757SMark McLoughlin 
2785281d757SMark McLoughlin     return ifr.ifr_flags & IFF_VNET_HDR;
2795281d757SMark McLoughlin }
2805281d757SMark McLoughlin 
2815281d757SMark McLoughlin void tap_set_offload(VLANClientState *vc, int csum, int tso4,
2825281d757SMark McLoughlin                      int tso6, int ecn, int ufo)
2835281d757SMark McLoughlin {
2845281d757SMark McLoughlin     TAPState *s = vc->opaque;
2855281d757SMark McLoughlin     unsigned int offload = 0;
2865281d757SMark McLoughlin 
2875281d757SMark McLoughlin     if (csum) {
2885281d757SMark McLoughlin         offload |= TUN_F_CSUM;
2895281d757SMark McLoughlin         if (tso4)
2905281d757SMark McLoughlin             offload |= TUN_F_TSO4;
2915281d757SMark McLoughlin         if (tso6)
2925281d757SMark McLoughlin             offload |= TUN_F_TSO6;
2935281d757SMark McLoughlin         if ((tso4 || tso6) && ecn)
2945281d757SMark McLoughlin             offload |= TUN_F_TSO_ECN;
2955281d757SMark McLoughlin         if (ufo)
2965281d757SMark McLoughlin             offload |= TUN_F_UFO;
2975281d757SMark McLoughlin     }
2985281d757SMark McLoughlin 
2995281d757SMark McLoughlin     if (ioctl(s->fd, TUNSETOFFLOAD, offload) != 0) {
3005281d757SMark McLoughlin         offload &= ~TUN_F_UFO;
3015281d757SMark McLoughlin         if (ioctl(s->fd, TUNSETOFFLOAD, offload) != 0) {
3025281d757SMark McLoughlin             fprintf(stderr, "TUNSETOFFLOAD ioctl() failed: %s\n",
3035281d757SMark McLoughlin                     strerror(errno));
3045281d757SMark McLoughlin         }
3055281d757SMark McLoughlin     }
3065281d757SMark McLoughlin }
3075281d757SMark McLoughlin 
3085281d757SMark McLoughlin static void tap_cleanup(VLANClientState *vc)
3095281d757SMark McLoughlin {
3105281d757SMark McLoughlin     TAPState *s = vc->opaque;
3115281d757SMark McLoughlin 
3125281d757SMark McLoughlin     qemu_purge_queued_packets(vc);
3135281d757SMark McLoughlin 
3145281d757SMark McLoughlin     if (s->down_script[0])
3155281d757SMark McLoughlin         launch_script(s->down_script, s->down_script_arg, s->fd);
3165281d757SMark McLoughlin 
3175281d757SMark McLoughlin     tap_read_poll(s, 0);
3185281d757SMark McLoughlin     tap_write_poll(s, 0);
3195281d757SMark McLoughlin     close(s->fd);
3205281d757SMark McLoughlin     qemu_free(s);
3215281d757SMark McLoughlin }
3225281d757SMark McLoughlin 
3235281d757SMark McLoughlin /* fd support */
3245281d757SMark McLoughlin 
3255281d757SMark McLoughlin static TAPState *net_tap_fd_init(VLANState *vlan,
3265281d757SMark McLoughlin                                  const char *model,
3275281d757SMark McLoughlin                                  const char *name,
3285281d757SMark McLoughlin                                  int fd,
3295281d757SMark McLoughlin                                  int vnet_hdr)
3305281d757SMark McLoughlin {
3315281d757SMark McLoughlin     TAPState *s;
3325281d757SMark McLoughlin     unsigned int offload;
3335281d757SMark McLoughlin 
3345281d757SMark McLoughlin     s = qemu_mallocz(sizeof(TAPState));
3355281d757SMark McLoughlin     s->fd = fd;
3365281d757SMark McLoughlin     s->has_vnet_hdr = vnet_hdr != 0;
3375281d757SMark McLoughlin     s->using_vnet_hdr = 0;
3385281d757SMark McLoughlin     s->vc = qemu_new_vlan_client(NET_CLIENT_TYPE_TAP,
3395281d757SMark McLoughlin                                  vlan, NULL, model, name, NULL,
3405281d757SMark McLoughlin                                  tap_receive, tap_receive_raw,
3415281d757SMark McLoughlin                                  tap_receive_iov, tap_cleanup, s);
3425281d757SMark McLoughlin     s->has_ufo = 0;
3435281d757SMark McLoughlin     /* Check if tap supports UFO */
3445281d757SMark McLoughlin     offload = TUN_F_CSUM | TUN_F_UFO;
3455281d757SMark McLoughlin     if (ioctl(s->fd, TUNSETOFFLOAD, offload) == 0)
3465281d757SMark McLoughlin        s->has_ufo = 1;
3475281d757SMark McLoughlin     tap_set_offload(s->vc, 0, 0, 0, 0, 0);
3485281d757SMark McLoughlin     tap_read_poll(s, 1);
3495281d757SMark McLoughlin     return s;
3505281d757SMark McLoughlin }
3515281d757SMark McLoughlin 
352*966ea5ecSMark McLoughlin #ifdef _AIX
353e7e92325SMark McLoughlin int tap_open(char *ifname, int ifname_size, int *vnet_hdr, int vnet_hdr_required)
3545281d757SMark McLoughlin {
3555281d757SMark McLoughlin     fprintf (stderr, "no tap on AIX\n");
3565281d757SMark McLoughlin     return -1;
3575281d757SMark McLoughlin }
3585281d757SMark McLoughlin #else
359e7e92325SMark McLoughlin int tap_open(char *ifname, int ifname_size, int *vnet_hdr, int vnet_hdr_required)
3605281d757SMark McLoughlin {
3615281d757SMark McLoughlin     struct ifreq ifr;
3625281d757SMark McLoughlin     int fd, ret;
3635281d757SMark McLoughlin 
3645281d757SMark McLoughlin     TFR(fd = open("/dev/net/tun", O_RDWR));
3655281d757SMark McLoughlin     if (fd < 0) {
3665281d757SMark McLoughlin         fprintf(stderr, "warning: could not open /dev/net/tun: no virtual network emulation\n");
3675281d757SMark McLoughlin         return -1;
3685281d757SMark McLoughlin     }
3695281d757SMark McLoughlin     memset(&ifr, 0, sizeof(ifr));
3705281d757SMark McLoughlin     ifr.ifr_flags = IFF_TAP | IFF_NO_PI;
3715281d757SMark McLoughlin 
3725281d757SMark McLoughlin     if (*vnet_hdr) {
3735281d757SMark McLoughlin         unsigned int features;
3745281d757SMark McLoughlin 
3755281d757SMark McLoughlin         if (ioctl(fd, TUNGETFEATURES, &features) == 0 &&
3765281d757SMark McLoughlin             features & IFF_VNET_HDR) {
3775281d757SMark McLoughlin             *vnet_hdr = 1;
3785281d757SMark McLoughlin             ifr.ifr_flags |= IFF_VNET_HDR;
3795281d757SMark McLoughlin         }
3805281d757SMark McLoughlin 
3815281d757SMark McLoughlin         if (vnet_hdr_required && !*vnet_hdr) {
3825281d757SMark McLoughlin             qemu_error("vnet_hdr=1 requested, but no kernel "
3835281d757SMark McLoughlin                        "support for IFF_VNET_HDR available");
3845281d757SMark McLoughlin             close(fd);
3855281d757SMark McLoughlin             return -1;
3865281d757SMark McLoughlin         }
3875281d757SMark McLoughlin     }
3885281d757SMark McLoughlin 
3895281d757SMark McLoughlin     if (ifname[0] != '\0')
3905281d757SMark McLoughlin         pstrcpy(ifr.ifr_name, IFNAMSIZ, ifname);
3915281d757SMark McLoughlin     else
3925281d757SMark McLoughlin         pstrcpy(ifr.ifr_name, IFNAMSIZ, "tap%d");
3935281d757SMark McLoughlin     ret = ioctl(fd, TUNSETIFF, (void *) &ifr);
3945281d757SMark McLoughlin     if (ret != 0) {
3955281d757SMark McLoughlin         fprintf(stderr, "warning: could not configure /dev/net/tun: no virtual network emulation\n");
3965281d757SMark McLoughlin         close(fd);
3975281d757SMark McLoughlin         return -1;
3985281d757SMark McLoughlin     }
3995281d757SMark McLoughlin     pstrcpy(ifname, ifname_size, ifr.ifr_name);
4005281d757SMark McLoughlin     fcntl(fd, F_SETFL, O_NONBLOCK);
4015281d757SMark McLoughlin     return fd;
4025281d757SMark McLoughlin }
4035281d757SMark McLoughlin #endif
4045281d757SMark McLoughlin 
4055281d757SMark McLoughlin static int launch_script(const char *setup_script, const char *ifname, int fd)
4065281d757SMark McLoughlin {
4075281d757SMark McLoughlin     sigset_t oldmask, mask;
4085281d757SMark McLoughlin     int pid, status;
4095281d757SMark McLoughlin     char *args[3];
4105281d757SMark McLoughlin     char **parg;
4115281d757SMark McLoughlin 
4125281d757SMark McLoughlin     sigemptyset(&mask);
4135281d757SMark McLoughlin     sigaddset(&mask, SIGCHLD);
4145281d757SMark McLoughlin     sigprocmask(SIG_BLOCK, &mask, &oldmask);
4155281d757SMark McLoughlin 
4165281d757SMark McLoughlin     /* try to launch network script */
4175281d757SMark McLoughlin     pid = fork();
4185281d757SMark McLoughlin     if (pid == 0) {
4195281d757SMark McLoughlin         int open_max = sysconf(_SC_OPEN_MAX), i;
4205281d757SMark McLoughlin 
4215281d757SMark McLoughlin         for (i = 0; i < open_max; i++) {
4225281d757SMark McLoughlin             if (i != STDIN_FILENO &&
4235281d757SMark McLoughlin                 i != STDOUT_FILENO &&
4245281d757SMark McLoughlin                 i != STDERR_FILENO &&
4255281d757SMark McLoughlin                 i != fd) {
4265281d757SMark McLoughlin                 close(i);
4275281d757SMark McLoughlin             }
4285281d757SMark McLoughlin         }
4295281d757SMark McLoughlin         parg = args;
4305281d757SMark McLoughlin         *parg++ = (char *)setup_script;
4315281d757SMark McLoughlin         *parg++ = (char *)ifname;
4325281d757SMark McLoughlin         *parg++ = NULL;
4335281d757SMark McLoughlin         execv(setup_script, args);
4345281d757SMark McLoughlin         _exit(1);
4355281d757SMark McLoughlin     } else if (pid > 0) {
4365281d757SMark McLoughlin         while (waitpid(pid, &status, 0) != pid) {
4375281d757SMark McLoughlin             /* loop */
4385281d757SMark McLoughlin         }
4395281d757SMark McLoughlin         sigprocmask(SIG_SETMASK, &oldmask, NULL);
4405281d757SMark McLoughlin 
4415281d757SMark McLoughlin         if (WIFEXITED(status) && WEXITSTATUS(status) == 0) {
4425281d757SMark McLoughlin             return 0;
4435281d757SMark McLoughlin         }
4445281d757SMark McLoughlin     }
4455281d757SMark McLoughlin     fprintf(stderr, "%s: could not launch network script\n", setup_script);
4465281d757SMark McLoughlin     return -1;
4475281d757SMark McLoughlin }
4485281d757SMark McLoughlin 
4495281d757SMark McLoughlin static int net_tap_init(QemuOpts *opts, int *vnet_hdr)
4505281d757SMark McLoughlin {
4515281d757SMark McLoughlin     int fd, vnet_hdr_required;
4525281d757SMark McLoughlin     char ifname[128] = {0,};
4535281d757SMark McLoughlin     const char *setup_script;
4545281d757SMark McLoughlin 
4555281d757SMark McLoughlin     if (qemu_opt_get(opts, "ifname")) {
4565281d757SMark McLoughlin         pstrcpy(ifname, sizeof(ifname), qemu_opt_get(opts, "ifname"));
4575281d757SMark McLoughlin     }
4585281d757SMark McLoughlin 
4595281d757SMark McLoughlin     *vnet_hdr = qemu_opt_get_bool(opts, "vnet_hdr", 1);
4605281d757SMark McLoughlin     if (qemu_opt_get(opts, "vnet_hdr")) {
4615281d757SMark McLoughlin         vnet_hdr_required = *vnet_hdr;
4625281d757SMark McLoughlin     } else {
4635281d757SMark McLoughlin         vnet_hdr_required = 0;
4645281d757SMark McLoughlin     }
4655281d757SMark McLoughlin 
4665281d757SMark McLoughlin     TFR(fd = tap_open(ifname, sizeof(ifname), vnet_hdr, vnet_hdr_required));
4675281d757SMark McLoughlin     if (fd < 0) {
4685281d757SMark McLoughlin         return -1;
4695281d757SMark McLoughlin     }
4705281d757SMark McLoughlin 
4715281d757SMark McLoughlin     setup_script = qemu_opt_get(opts, "script");
4725281d757SMark McLoughlin     if (setup_script &&
4735281d757SMark McLoughlin         setup_script[0] != '\0' &&
4745281d757SMark McLoughlin         strcmp(setup_script, "no") != 0 &&
4755281d757SMark McLoughlin         launch_script(setup_script, ifname, fd)) {
4765281d757SMark McLoughlin         close(fd);
4775281d757SMark McLoughlin         return -1;
4785281d757SMark McLoughlin     }
4795281d757SMark McLoughlin 
4805281d757SMark McLoughlin     qemu_opt_set(opts, "ifname", ifname);
4815281d757SMark McLoughlin 
4825281d757SMark McLoughlin     return fd;
4835281d757SMark McLoughlin }
4845281d757SMark McLoughlin 
4855281d757SMark McLoughlin int net_init_tap(QemuOpts *opts, Monitor *mon, const char *name, VLANState *vlan)
4865281d757SMark McLoughlin {
4875281d757SMark McLoughlin     TAPState *s;
4885281d757SMark McLoughlin     int fd, vnet_hdr;
4895281d757SMark McLoughlin 
4905281d757SMark McLoughlin     if (qemu_opt_get(opts, "fd")) {
4915281d757SMark McLoughlin         if (qemu_opt_get(opts, "ifname") ||
4925281d757SMark McLoughlin             qemu_opt_get(opts, "script") ||
4935281d757SMark McLoughlin             qemu_opt_get(opts, "downscript") ||
4945281d757SMark McLoughlin             qemu_opt_get(opts, "vnet_hdr")) {
4955281d757SMark McLoughlin             qemu_error("ifname=, script=, downscript= and vnet_hdr= is invalid with fd=\n");
4965281d757SMark McLoughlin             return -1;
4975281d757SMark McLoughlin         }
4985281d757SMark McLoughlin 
4995281d757SMark McLoughlin         fd = net_handle_fd_param(mon, qemu_opt_get(opts, "fd"));
5005281d757SMark McLoughlin         if (fd == -1) {
5015281d757SMark McLoughlin             return -1;
5025281d757SMark McLoughlin         }
5035281d757SMark McLoughlin 
5045281d757SMark McLoughlin         fcntl(fd, F_SETFL, O_NONBLOCK);
5055281d757SMark McLoughlin 
5065281d757SMark McLoughlin         vnet_hdr = tap_probe_vnet_hdr(fd);
5075281d757SMark McLoughlin     } else {
5085281d757SMark McLoughlin         if (!qemu_opt_get(opts, "script")) {
5095281d757SMark McLoughlin             qemu_opt_set(opts, "script", DEFAULT_NETWORK_SCRIPT);
5105281d757SMark McLoughlin         }
5115281d757SMark McLoughlin 
5125281d757SMark McLoughlin         if (!qemu_opt_get(opts, "downscript")) {
5135281d757SMark McLoughlin             qemu_opt_set(opts, "downscript", DEFAULT_NETWORK_DOWN_SCRIPT);
5145281d757SMark McLoughlin         }
5155281d757SMark McLoughlin 
5165281d757SMark McLoughlin         fd = net_tap_init(opts, &vnet_hdr);
5175281d757SMark McLoughlin     }
5185281d757SMark McLoughlin 
5195281d757SMark McLoughlin     s = net_tap_fd_init(vlan, "tap", name, fd, vnet_hdr);
5205281d757SMark McLoughlin     if (!s) {
5215281d757SMark McLoughlin         close(fd);
5225281d757SMark McLoughlin         return -1;
5235281d757SMark McLoughlin     }
5245281d757SMark McLoughlin 
5255281d757SMark McLoughlin     if (tap_set_sndbuf(s, opts) < 0) {
5265281d757SMark McLoughlin         return -1;
5275281d757SMark McLoughlin     }
5285281d757SMark McLoughlin 
5295281d757SMark McLoughlin     if (qemu_opt_get(opts, "fd")) {
5305281d757SMark McLoughlin         snprintf(s->vc->info_str, sizeof(s->vc->info_str), "fd=%d", fd);
5315281d757SMark McLoughlin     } else {
5325281d757SMark McLoughlin         const char *ifname, *script, *downscript;
5335281d757SMark McLoughlin 
5345281d757SMark McLoughlin         ifname     = qemu_opt_get(opts, "ifname");
5355281d757SMark McLoughlin         script     = qemu_opt_get(opts, "script");
5365281d757SMark McLoughlin         downscript = qemu_opt_get(opts, "downscript");
5375281d757SMark McLoughlin 
5385281d757SMark McLoughlin         snprintf(s->vc->info_str, sizeof(s->vc->info_str),
5395281d757SMark McLoughlin                  "ifname=%s,script=%s,downscript=%s",
5405281d757SMark McLoughlin                  ifname, script, downscript);
5415281d757SMark McLoughlin 
5425281d757SMark McLoughlin         if (strcmp(downscript, "no") != 0) {
5435281d757SMark McLoughlin             snprintf(s->down_script, sizeof(s->down_script), "%s", downscript);
5445281d757SMark McLoughlin             snprintf(s->down_script_arg, sizeof(s->down_script_arg), "%s", ifname);
5455281d757SMark McLoughlin         }
5465281d757SMark McLoughlin     }
5475281d757SMark McLoughlin 
5485281d757SMark McLoughlin     if (vlan) {
5495281d757SMark McLoughlin         vlan->nb_host_devs++;
5505281d757SMark McLoughlin     }
5515281d757SMark McLoughlin 
5525281d757SMark McLoughlin     return 0;
5535281d757SMark McLoughlin }
5545281d757SMark McLoughlin 
5555281d757SMark McLoughlin #endif /* !defined(_AIX) */
556