xref: /qemu/net/tap.c (revision 27a6375de3edece2e5d115847d54c01e52331f7e)
15281d757SMark McLoughlin /*
25281d757SMark McLoughlin  * QEMU System Emulator
35281d757SMark McLoughlin  *
45281d757SMark McLoughlin  * Copyright (c) 2003-2008 Fabrice Bellard
55281d757SMark McLoughlin  * Copyright (c) 2009 Red Hat, Inc.
65281d757SMark McLoughlin  *
75281d757SMark McLoughlin  * Permission is hereby granted, free of charge, to any person obtaining a copy
85281d757SMark McLoughlin  * of this software and associated documentation files (the "Software"), to deal
95281d757SMark McLoughlin  * in the Software without restriction, including without limitation the rights
105281d757SMark McLoughlin  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
115281d757SMark McLoughlin  * copies of the Software, and to permit persons to whom the Software is
125281d757SMark McLoughlin  * furnished to do so, subject to the following conditions:
135281d757SMark McLoughlin  *
145281d757SMark McLoughlin  * The above copyright notice and this permission notice shall be included in
155281d757SMark McLoughlin  * all copies or substantial portions of the Software.
165281d757SMark McLoughlin  *
175281d757SMark McLoughlin  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
185281d757SMark McLoughlin  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
195281d757SMark McLoughlin  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
205281d757SMark McLoughlin  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
215281d757SMark McLoughlin  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
225281d757SMark McLoughlin  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
235281d757SMark McLoughlin  * THE SOFTWARE.
245281d757SMark McLoughlin  */
255281d757SMark McLoughlin 
265281d757SMark McLoughlin #include "net/tap.h"
275281d757SMark McLoughlin 
285281d757SMark McLoughlin #include "config-host.h"
295281d757SMark McLoughlin 
305281d757SMark McLoughlin #include <signal.h>
315281d757SMark McLoughlin #include <sys/ioctl.h>
325281d757SMark McLoughlin #include <sys/stat.h>
335281d757SMark McLoughlin #include <sys/wait.h>
3471f4effcSAlexander Graf #include <sys/socket.h>
355281d757SMark McLoughlin #include <net/if.h>
365281d757SMark McLoughlin 
375281d757SMark McLoughlin #include "net.h"
385281d757SMark McLoughlin #include "sysemu.h"
395281d757SMark McLoughlin #include "qemu-char.h"
405281d757SMark McLoughlin #include "qemu-common.h"
412f792016SMarkus Armbruster #include "qemu-error.h"
425281d757SMark McLoughlin 
435281d757SMark McLoughlin #include "net/tap-linux.h"
445281d757SMark McLoughlin 
4582b0d80eSMichael S. Tsirkin #include "hw/vhost_net.h"
4682b0d80eSMichael S. Tsirkin 
/* Size of the per-device packet buffer: the largest GSO packet (64k)
 * plus generous headroom for the ethernet and virtio_net headers.
 */
#define TAP_BUFSIZE (65536 + 4096)
515281d757SMark McLoughlin 
525281d757SMark McLoughlin typedef struct TAPState {
533e35ba93SMark McLoughlin     VLANClientState nc;
545281d757SMark McLoughlin     int fd;
555281d757SMark McLoughlin     char down_script[1024];
565281d757SMark McLoughlin     char down_script_arg[128];
575281d757SMark McLoughlin     uint8_t buf[TAP_BUFSIZE];
585281d757SMark McLoughlin     unsigned int read_poll : 1;
595281d757SMark McLoughlin     unsigned int write_poll : 1;
605281d757SMark McLoughlin     unsigned int using_vnet_hdr : 1;
615281d757SMark McLoughlin     unsigned int has_ufo: 1;
6282b0d80eSMichael S. Tsirkin     VHostNetState *vhost_net;
63ef4252b1SMichael S. Tsirkin     unsigned host_vnet_hdr_len;
645281d757SMark McLoughlin } TAPState;
655281d757SMark McLoughlin 
/* fd handler callbacks installed by tap_update_fd_handler(). */
static void tap_writable(void *opaque);
static void tap_send(void *opaque);
static int tap_can_send(void *opaque);

/* Runs an external network script; defined after its first user. */
static int launch_script(const char *setup_script, const char *ifname, int fd);
715281d757SMark McLoughlin 
725281d757SMark McLoughlin static void tap_update_fd_handler(TAPState *s)
735281d757SMark McLoughlin {
745281d757SMark McLoughlin     qemu_set_fd_handler2(s->fd,
755281d757SMark McLoughlin                          s->read_poll  ? tap_can_send : NULL,
765281d757SMark McLoughlin                          s->read_poll  ? tap_send     : NULL,
775281d757SMark McLoughlin                          s->write_poll ? tap_writable : NULL,
785281d757SMark McLoughlin                          s);
795281d757SMark McLoughlin }
805281d757SMark McLoughlin 
815281d757SMark McLoughlin static void tap_read_poll(TAPState *s, int enable)
825281d757SMark McLoughlin {
835281d757SMark McLoughlin     s->read_poll = !!enable;
845281d757SMark McLoughlin     tap_update_fd_handler(s);
855281d757SMark McLoughlin }
865281d757SMark McLoughlin 
875281d757SMark McLoughlin static void tap_write_poll(TAPState *s, int enable)
885281d757SMark McLoughlin {
895281d757SMark McLoughlin     s->write_poll = !!enable;
905281d757SMark McLoughlin     tap_update_fd_handler(s);
915281d757SMark McLoughlin }
925281d757SMark McLoughlin 
935281d757SMark McLoughlin static void tap_writable(void *opaque)
945281d757SMark McLoughlin {
955281d757SMark McLoughlin     TAPState *s = opaque;
965281d757SMark McLoughlin 
975281d757SMark McLoughlin     tap_write_poll(s, 0);
985281d757SMark McLoughlin 
993e35ba93SMark McLoughlin     qemu_flush_queued_packets(&s->nc);
1005281d757SMark McLoughlin }
1015281d757SMark McLoughlin 
1025281d757SMark McLoughlin static ssize_t tap_write_packet(TAPState *s, const struct iovec *iov, int iovcnt)
1035281d757SMark McLoughlin {
1045281d757SMark McLoughlin     ssize_t len;
1055281d757SMark McLoughlin 
1065281d757SMark McLoughlin     do {
1075281d757SMark McLoughlin         len = writev(s->fd, iov, iovcnt);
1085281d757SMark McLoughlin     } while (len == -1 && errno == EINTR);
1095281d757SMark McLoughlin 
1105281d757SMark McLoughlin     if (len == -1 && errno == EAGAIN) {
1115281d757SMark McLoughlin         tap_write_poll(s, 1);
1125281d757SMark McLoughlin         return 0;
1135281d757SMark McLoughlin     }
1145281d757SMark McLoughlin 
1155281d757SMark McLoughlin     return len;
1165281d757SMark McLoughlin }
1175281d757SMark McLoughlin 
1183e35ba93SMark McLoughlin static ssize_t tap_receive_iov(VLANClientState *nc, const struct iovec *iov,
1195281d757SMark McLoughlin                                int iovcnt)
1205281d757SMark McLoughlin {
1213e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
1225281d757SMark McLoughlin     const struct iovec *iovp = iov;
1235281d757SMark McLoughlin     struct iovec iov_copy[iovcnt + 1];
124ef4252b1SMichael S. Tsirkin     struct virtio_net_hdr_mrg_rxbuf hdr = { };
1255281d757SMark McLoughlin 
126ef4252b1SMichael S. Tsirkin     if (s->host_vnet_hdr_len && !s->using_vnet_hdr) {
1275281d757SMark McLoughlin         iov_copy[0].iov_base = &hdr;
128ef4252b1SMichael S. Tsirkin         iov_copy[0].iov_len =  s->host_vnet_hdr_len;
1295281d757SMark McLoughlin         memcpy(&iov_copy[1], iov, iovcnt * sizeof(*iov));
1305281d757SMark McLoughlin         iovp = iov_copy;
1315281d757SMark McLoughlin         iovcnt++;
1325281d757SMark McLoughlin     }
1335281d757SMark McLoughlin 
1345281d757SMark McLoughlin     return tap_write_packet(s, iovp, iovcnt);
1355281d757SMark McLoughlin }
1365281d757SMark McLoughlin 
1373e35ba93SMark McLoughlin static ssize_t tap_receive_raw(VLANClientState *nc, const uint8_t *buf, size_t size)
1385281d757SMark McLoughlin {
1393e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
1405281d757SMark McLoughlin     struct iovec iov[2];
1415281d757SMark McLoughlin     int iovcnt = 0;
142ef4252b1SMichael S. Tsirkin     struct virtio_net_hdr_mrg_rxbuf hdr = { };
1435281d757SMark McLoughlin 
144ef4252b1SMichael S. Tsirkin     if (s->host_vnet_hdr_len) {
1455281d757SMark McLoughlin         iov[iovcnt].iov_base = &hdr;
146ef4252b1SMichael S. Tsirkin         iov[iovcnt].iov_len  = s->host_vnet_hdr_len;
1475281d757SMark McLoughlin         iovcnt++;
1485281d757SMark McLoughlin     }
1495281d757SMark McLoughlin 
1505281d757SMark McLoughlin     iov[iovcnt].iov_base = (char *)buf;
1515281d757SMark McLoughlin     iov[iovcnt].iov_len  = size;
1525281d757SMark McLoughlin     iovcnt++;
1535281d757SMark McLoughlin 
1545281d757SMark McLoughlin     return tap_write_packet(s, iov, iovcnt);
1555281d757SMark McLoughlin }
1565281d757SMark McLoughlin 
1573e35ba93SMark McLoughlin static ssize_t tap_receive(VLANClientState *nc, const uint8_t *buf, size_t size)
1585281d757SMark McLoughlin {
1593e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
1605281d757SMark McLoughlin     struct iovec iov[1];
1615281d757SMark McLoughlin 
162ef4252b1SMichael S. Tsirkin     if (s->host_vnet_hdr_len && !s->using_vnet_hdr) {
1633e35ba93SMark McLoughlin         return tap_receive_raw(nc, buf, size);
1645281d757SMark McLoughlin     }
1655281d757SMark McLoughlin 
1665281d757SMark McLoughlin     iov[0].iov_base = (char *)buf;
1675281d757SMark McLoughlin     iov[0].iov_len  = size;
1685281d757SMark McLoughlin 
1695281d757SMark McLoughlin     return tap_write_packet(s, iov, 1);
1705281d757SMark McLoughlin }
1715281d757SMark McLoughlin 
1725281d757SMark McLoughlin static int tap_can_send(void *opaque)
1735281d757SMark McLoughlin {
1745281d757SMark McLoughlin     TAPState *s = opaque;
1755281d757SMark McLoughlin 
1763e35ba93SMark McLoughlin     return qemu_can_send_packet(&s->nc);
1775281d757SMark McLoughlin }
1785281d757SMark McLoughlin 
#ifndef __sun__
/*
 * Read at most maxlen bytes from tapfd into buf.
 * Returns whatever read() returns.
 */
ssize_t tap_read_packet(int tapfd, uint8_t *buf, int maxlen)
{
    ssize_t nread = read(tapfd, buf, maxlen);

    return nread;
}
#endif
1855281d757SMark McLoughlin 
1863e35ba93SMark McLoughlin static void tap_send_completed(VLANClientState *nc, ssize_t len)
1875281d757SMark McLoughlin {
1883e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
1895281d757SMark McLoughlin     tap_read_poll(s, 1);
1905281d757SMark McLoughlin }
1915281d757SMark McLoughlin 
1925281d757SMark McLoughlin static void tap_send(void *opaque)
1935281d757SMark McLoughlin {
1945281d757SMark McLoughlin     TAPState *s = opaque;
195be1636b3SMark McLoughlin     int size;
1965281d757SMark McLoughlin 
1975819c918SMark McLoughlin     do {
1985819c918SMark McLoughlin         uint8_t *buf = s->buf;
1995819c918SMark McLoughlin 
2005281d757SMark McLoughlin         size = tap_read_packet(s->fd, s->buf, sizeof(s->buf));
2015281d757SMark McLoughlin         if (size <= 0) {
2025819c918SMark McLoughlin             break;
2035281d757SMark McLoughlin         }
2045281d757SMark McLoughlin 
205ef4252b1SMichael S. Tsirkin         if (s->host_vnet_hdr_len && !s->using_vnet_hdr) {
206ef4252b1SMichael S. Tsirkin             buf  += s->host_vnet_hdr_len;
207ef4252b1SMichael S. Tsirkin             size -= s->host_vnet_hdr_len;
2085281d757SMark McLoughlin         }
2095281d757SMark McLoughlin 
2103e35ba93SMark McLoughlin         size = qemu_send_packet_async(&s->nc, buf, size, tap_send_completed);
2115281d757SMark McLoughlin         if (size == 0) {
2125281d757SMark McLoughlin             tap_read_poll(s, 0);
2135281d757SMark McLoughlin         }
2143e35ba93SMark McLoughlin     } while (size > 0 && qemu_can_send_packet(&s->nc));
2155281d757SMark McLoughlin }
2165281d757SMark McLoughlin 
2173e35ba93SMark McLoughlin int tap_has_ufo(VLANClientState *nc)
2185281d757SMark McLoughlin {
2193e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
2205281d757SMark McLoughlin 
221665a3b07SMark McLoughlin     assert(nc->info->type == NET_CLIENT_TYPE_TAP);
2225281d757SMark McLoughlin 
2235281d757SMark McLoughlin     return s->has_ufo;
2245281d757SMark McLoughlin }
2255281d757SMark McLoughlin 
2263e35ba93SMark McLoughlin int tap_has_vnet_hdr(VLANClientState *nc)
2275281d757SMark McLoughlin {
2283e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
2295281d757SMark McLoughlin 
230665a3b07SMark McLoughlin     assert(nc->info->type == NET_CLIENT_TYPE_TAP);
2315281d757SMark McLoughlin 
232ef4252b1SMichael S. Tsirkin     return !!s->host_vnet_hdr_len;
2335281d757SMark McLoughlin }
2345281d757SMark McLoughlin 
235445d892fSMichael S. Tsirkin int tap_has_vnet_hdr_len(VLANClientState *nc, int len)
236445d892fSMichael S. Tsirkin {
237445d892fSMichael S. Tsirkin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
238445d892fSMichael S. Tsirkin 
239445d892fSMichael S. Tsirkin     assert(nc->info->type == NET_CLIENT_TYPE_TAP);
240445d892fSMichael S. Tsirkin 
241445d892fSMichael S. Tsirkin     return tap_probe_vnet_hdr_len(s->fd, len);
242445d892fSMichael S. Tsirkin }
243445d892fSMichael S. Tsirkin 
244445d892fSMichael S. Tsirkin void tap_set_vnet_hdr_len(VLANClientState *nc, int len)
245445d892fSMichael S. Tsirkin {
246445d892fSMichael S. Tsirkin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
247445d892fSMichael S. Tsirkin 
248445d892fSMichael S. Tsirkin     assert(nc->info->type == NET_CLIENT_TYPE_TAP);
249445d892fSMichael S. Tsirkin     assert(len == sizeof(struct virtio_net_hdr_mrg_rxbuf) ||
250445d892fSMichael S. Tsirkin            len == sizeof(struct virtio_net_hdr));
251445d892fSMichael S. Tsirkin 
252445d892fSMichael S. Tsirkin     tap_fd_set_vnet_hdr_len(s->fd, len);
253445d892fSMichael S. Tsirkin     s->host_vnet_hdr_len = len;
254445d892fSMichael S. Tsirkin }
255445d892fSMichael S. Tsirkin 
2563e35ba93SMark McLoughlin void tap_using_vnet_hdr(VLANClientState *nc, int using_vnet_hdr)
2575281d757SMark McLoughlin {
2583e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
2595281d757SMark McLoughlin 
2605281d757SMark McLoughlin     using_vnet_hdr = using_vnet_hdr != 0;
2615281d757SMark McLoughlin 
262665a3b07SMark McLoughlin     assert(nc->info->type == NET_CLIENT_TYPE_TAP);
263ef4252b1SMichael S. Tsirkin     assert(!!s->host_vnet_hdr_len == using_vnet_hdr);
2645281d757SMark McLoughlin 
2655281d757SMark McLoughlin     s->using_vnet_hdr = using_vnet_hdr;
2665281d757SMark McLoughlin }
2675281d757SMark McLoughlin 
2683e35ba93SMark McLoughlin void tap_set_offload(VLANClientState *nc, int csum, int tso4,
2695281d757SMark McLoughlin                      int tso6, int ecn, int ufo)
2705281d757SMark McLoughlin {
2713e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
272*27a6375dSMichael S. Tsirkin     if (s->fd < 0) {
273*27a6375dSMichael S. Tsirkin         return;
274*27a6375dSMichael S. Tsirkin     }
2755281d757SMark McLoughlin 
276*27a6375dSMichael S. Tsirkin     tap_fd_set_offload(s->fd, csum, tso4, tso6, ecn, ufo);
2775281d757SMark McLoughlin }
2785281d757SMark McLoughlin 
2793e35ba93SMark McLoughlin static void tap_cleanup(VLANClientState *nc)
2805281d757SMark McLoughlin {
2813e35ba93SMark McLoughlin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
2825281d757SMark McLoughlin 
28382b0d80eSMichael S. Tsirkin     if (s->vhost_net) {
28482b0d80eSMichael S. Tsirkin         vhost_net_cleanup(s->vhost_net);
28543849424SMichael S. Tsirkin         s->vhost_net = NULL;
28682b0d80eSMichael S. Tsirkin     }
28782b0d80eSMichael S. Tsirkin 
2883e35ba93SMark McLoughlin     qemu_purge_queued_packets(nc);
2895281d757SMark McLoughlin 
2905281d757SMark McLoughlin     if (s->down_script[0])
2915281d757SMark McLoughlin         launch_script(s->down_script, s->down_script_arg, s->fd);
2925281d757SMark McLoughlin 
2935281d757SMark McLoughlin     tap_read_poll(s, 0);
2945281d757SMark McLoughlin     tap_write_poll(s, 0);
2955281d757SMark McLoughlin     close(s->fd);
296*27a6375dSMichael S. Tsirkin     s->fd = -1;
2975281d757SMark McLoughlin }
2985281d757SMark McLoughlin 
299ceb69615SMichael S. Tsirkin static void tap_poll(VLANClientState *nc, bool enable)
300ceb69615SMichael S. Tsirkin {
301ceb69615SMichael S. Tsirkin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
302ceb69615SMichael S. Tsirkin     tap_read_poll(s, enable);
303ceb69615SMichael S. Tsirkin     tap_write_poll(s, enable);
304ceb69615SMichael S. Tsirkin }
305ceb69615SMichael S. Tsirkin 
30695d528a2SMichael S. Tsirkin int tap_get_fd(VLANClientState *nc)
30795d528a2SMichael S. Tsirkin {
30895d528a2SMichael S. Tsirkin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
30995d528a2SMichael S. Tsirkin     assert(nc->info->type == NET_CLIENT_TYPE_TAP);
31095d528a2SMichael S. Tsirkin     return s->fd;
31195d528a2SMichael S. Tsirkin }
31295d528a2SMichael S. Tsirkin 
3135281d757SMark McLoughlin /* fd support */
3145281d757SMark McLoughlin 
3153e35ba93SMark McLoughlin static NetClientInfo net_tap_info = {
3163e35ba93SMark McLoughlin     .type = NET_CLIENT_TYPE_TAP,
3173e35ba93SMark McLoughlin     .size = sizeof(TAPState),
3183e35ba93SMark McLoughlin     .receive = tap_receive,
3193e35ba93SMark McLoughlin     .receive_raw = tap_receive_raw,
3203e35ba93SMark McLoughlin     .receive_iov = tap_receive_iov,
321ceb69615SMichael S. Tsirkin     .poll = tap_poll,
3223e35ba93SMark McLoughlin     .cleanup = tap_cleanup,
3233e35ba93SMark McLoughlin };
3243e35ba93SMark McLoughlin 
3255281d757SMark McLoughlin static TAPState *net_tap_fd_init(VLANState *vlan,
3265281d757SMark McLoughlin                                  const char *model,
3275281d757SMark McLoughlin                                  const char *name,
3285281d757SMark McLoughlin                                  int fd,
3295281d757SMark McLoughlin                                  int vnet_hdr)
3305281d757SMark McLoughlin {
3313e35ba93SMark McLoughlin     VLANClientState *nc;
3325281d757SMark McLoughlin     TAPState *s;
3335281d757SMark McLoughlin 
3343e35ba93SMark McLoughlin     nc = qemu_new_net_client(&net_tap_info, vlan, NULL, model, name);
3353e35ba93SMark McLoughlin 
3363e35ba93SMark McLoughlin     s = DO_UPCAST(TAPState, nc, nc);
3373e35ba93SMark McLoughlin 
3385281d757SMark McLoughlin     s->fd = fd;
339ef4252b1SMichael S. Tsirkin     s->host_vnet_hdr_len = vnet_hdr ? sizeof(struct virtio_net_hdr) : 0;
3405281d757SMark McLoughlin     s->using_vnet_hdr = 0;
3419c282718SMark McLoughlin     s->has_ufo = tap_probe_has_ufo(s->fd);
3423e35ba93SMark McLoughlin     tap_set_offload(&s->nc, 0, 0, 0, 0, 0);
3435281d757SMark McLoughlin     tap_read_poll(s, 1);
34482b0d80eSMichael S. Tsirkin     s->vhost_net = NULL;
3455281d757SMark McLoughlin     return s;
3465281d757SMark McLoughlin }
3475281d757SMark McLoughlin 
3485281d757SMark McLoughlin static int launch_script(const char *setup_script, const char *ifname, int fd)
3495281d757SMark McLoughlin {
3505281d757SMark McLoughlin     sigset_t oldmask, mask;
3515281d757SMark McLoughlin     int pid, status;
3525281d757SMark McLoughlin     char *args[3];
3535281d757SMark McLoughlin     char **parg;
3545281d757SMark McLoughlin 
3555281d757SMark McLoughlin     sigemptyset(&mask);
3565281d757SMark McLoughlin     sigaddset(&mask, SIGCHLD);
3575281d757SMark McLoughlin     sigprocmask(SIG_BLOCK, &mask, &oldmask);
3585281d757SMark McLoughlin 
3595281d757SMark McLoughlin     /* try to launch network script */
3605281d757SMark McLoughlin     pid = fork();
3615281d757SMark McLoughlin     if (pid == 0) {
3625281d757SMark McLoughlin         int open_max = sysconf(_SC_OPEN_MAX), i;
3635281d757SMark McLoughlin 
3645281d757SMark McLoughlin         for (i = 0; i < open_max; i++) {
3655281d757SMark McLoughlin             if (i != STDIN_FILENO &&
3665281d757SMark McLoughlin                 i != STDOUT_FILENO &&
3675281d757SMark McLoughlin                 i != STDERR_FILENO &&
3685281d757SMark McLoughlin                 i != fd) {
3695281d757SMark McLoughlin                 close(i);
3705281d757SMark McLoughlin             }
3715281d757SMark McLoughlin         }
3725281d757SMark McLoughlin         parg = args;
3735281d757SMark McLoughlin         *parg++ = (char *)setup_script;
3745281d757SMark McLoughlin         *parg++ = (char *)ifname;
3759678d950SBlue Swirl         *parg = NULL;
3765281d757SMark McLoughlin         execv(setup_script, args);
3775281d757SMark McLoughlin         _exit(1);
3785281d757SMark McLoughlin     } else if (pid > 0) {
3795281d757SMark McLoughlin         while (waitpid(pid, &status, 0) != pid) {
3805281d757SMark McLoughlin             /* loop */
3815281d757SMark McLoughlin         }
3825281d757SMark McLoughlin         sigprocmask(SIG_SETMASK, &oldmask, NULL);
3835281d757SMark McLoughlin 
3845281d757SMark McLoughlin         if (WIFEXITED(status) && WEXITSTATUS(status) == 0) {
3855281d757SMark McLoughlin             return 0;
3865281d757SMark McLoughlin         }
3875281d757SMark McLoughlin     }
3885281d757SMark McLoughlin     fprintf(stderr, "%s: could not launch network script\n", setup_script);
3895281d757SMark McLoughlin     return -1;
3905281d757SMark McLoughlin }
3915281d757SMark McLoughlin 
3925281d757SMark McLoughlin static int net_tap_init(QemuOpts *opts, int *vnet_hdr)
3935281d757SMark McLoughlin {
3945281d757SMark McLoughlin     int fd, vnet_hdr_required;
3955281d757SMark McLoughlin     char ifname[128] = {0,};
3965281d757SMark McLoughlin     const char *setup_script;
3975281d757SMark McLoughlin 
3985281d757SMark McLoughlin     if (qemu_opt_get(opts, "ifname")) {
3995281d757SMark McLoughlin         pstrcpy(ifname, sizeof(ifname), qemu_opt_get(opts, "ifname"));
4005281d757SMark McLoughlin     }
4015281d757SMark McLoughlin 
4025281d757SMark McLoughlin     *vnet_hdr = qemu_opt_get_bool(opts, "vnet_hdr", 1);
4035281d757SMark McLoughlin     if (qemu_opt_get(opts, "vnet_hdr")) {
4045281d757SMark McLoughlin         vnet_hdr_required = *vnet_hdr;
4055281d757SMark McLoughlin     } else {
4065281d757SMark McLoughlin         vnet_hdr_required = 0;
4075281d757SMark McLoughlin     }
4085281d757SMark McLoughlin 
4095281d757SMark McLoughlin     TFR(fd = tap_open(ifname, sizeof(ifname), vnet_hdr, vnet_hdr_required));
4105281d757SMark McLoughlin     if (fd < 0) {
4115281d757SMark McLoughlin         return -1;
4125281d757SMark McLoughlin     }
4135281d757SMark McLoughlin 
4145281d757SMark McLoughlin     setup_script = qemu_opt_get(opts, "script");
4155281d757SMark McLoughlin     if (setup_script &&
4165281d757SMark McLoughlin         setup_script[0] != '\0' &&
4175281d757SMark McLoughlin         strcmp(setup_script, "no") != 0 &&
4185281d757SMark McLoughlin         launch_script(setup_script, ifname, fd)) {
4195281d757SMark McLoughlin         close(fd);
4205281d757SMark McLoughlin         return -1;
4215281d757SMark McLoughlin     }
4225281d757SMark McLoughlin 
4235281d757SMark McLoughlin     qemu_opt_set(opts, "ifname", ifname);
4245281d757SMark McLoughlin 
4255281d757SMark McLoughlin     return fd;
4265281d757SMark McLoughlin }
4275281d757SMark McLoughlin 
4285281d757SMark McLoughlin int net_init_tap(QemuOpts *opts, Monitor *mon, const char *name, VLANState *vlan)
4295281d757SMark McLoughlin {
4305281d757SMark McLoughlin     TAPState *s;
431df6c2a0fSMark McLoughlin     int fd, vnet_hdr = 0;
4325281d757SMark McLoughlin 
4335281d757SMark McLoughlin     if (qemu_opt_get(opts, "fd")) {
4345281d757SMark McLoughlin         if (qemu_opt_get(opts, "ifname") ||
4355281d757SMark McLoughlin             qemu_opt_get(opts, "script") ||
4365281d757SMark McLoughlin             qemu_opt_get(opts, "downscript") ||
4375281d757SMark McLoughlin             qemu_opt_get(opts, "vnet_hdr")) {
4381ecda02bSMarkus Armbruster             error_report("ifname=, script=, downscript= and vnet_hdr= is invalid with fd=");
4395281d757SMark McLoughlin             return -1;
4405281d757SMark McLoughlin         }
4415281d757SMark McLoughlin 
4425281d757SMark McLoughlin         fd = net_handle_fd_param(mon, qemu_opt_get(opts, "fd"));
4435281d757SMark McLoughlin         if (fd == -1) {
4445281d757SMark McLoughlin             return -1;
4455281d757SMark McLoughlin         }
4465281d757SMark McLoughlin 
4475281d757SMark McLoughlin         fcntl(fd, F_SETFL, O_NONBLOCK);
4485281d757SMark McLoughlin 
4495281d757SMark McLoughlin         vnet_hdr = tap_probe_vnet_hdr(fd);
4505281d757SMark McLoughlin     } else {
4515281d757SMark McLoughlin         if (!qemu_opt_get(opts, "script")) {
4525281d757SMark McLoughlin             qemu_opt_set(opts, "script", DEFAULT_NETWORK_SCRIPT);
4535281d757SMark McLoughlin         }
4545281d757SMark McLoughlin 
4555281d757SMark McLoughlin         if (!qemu_opt_get(opts, "downscript")) {
4565281d757SMark McLoughlin             qemu_opt_set(opts, "downscript", DEFAULT_NETWORK_DOWN_SCRIPT);
4575281d757SMark McLoughlin         }
4585281d757SMark McLoughlin 
4595281d757SMark McLoughlin         fd = net_tap_init(opts, &vnet_hdr);
460929fe497SJuergen Lock         if (fd == -1) {
461929fe497SJuergen Lock             return -1;
462929fe497SJuergen Lock         }
4635281d757SMark McLoughlin     }
4645281d757SMark McLoughlin 
4655281d757SMark McLoughlin     s = net_tap_fd_init(vlan, "tap", name, fd, vnet_hdr);
4665281d757SMark McLoughlin     if (!s) {
4675281d757SMark McLoughlin         close(fd);
4685281d757SMark McLoughlin         return -1;
4695281d757SMark McLoughlin     }
4705281d757SMark McLoughlin 
47115ac913bSMark McLoughlin     if (tap_set_sndbuf(s->fd, opts) < 0) {
4725281d757SMark McLoughlin         return -1;
4735281d757SMark McLoughlin     }
4745281d757SMark McLoughlin 
4755281d757SMark McLoughlin     if (qemu_opt_get(opts, "fd")) {
4763e35ba93SMark McLoughlin         snprintf(s->nc.info_str, sizeof(s->nc.info_str), "fd=%d", fd);
4775281d757SMark McLoughlin     } else {
4785281d757SMark McLoughlin         const char *ifname, *script, *downscript;
4795281d757SMark McLoughlin 
4805281d757SMark McLoughlin         ifname     = qemu_opt_get(opts, "ifname");
4815281d757SMark McLoughlin         script     = qemu_opt_get(opts, "script");
4825281d757SMark McLoughlin         downscript = qemu_opt_get(opts, "downscript");
4835281d757SMark McLoughlin 
4843e35ba93SMark McLoughlin         snprintf(s->nc.info_str, sizeof(s->nc.info_str),
4855281d757SMark McLoughlin                  "ifname=%s,script=%s,downscript=%s",
4865281d757SMark McLoughlin                  ifname, script, downscript);
4875281d757SMark McLoughlin 
4885281d757SMark McLoughlin         if (strcmp(downscript, "no") != 0) {
4895281d757SMark McLoughlin             snprintf(s->down_script, sizeof(s->down_script), "%s", downscript);
4905281d757SMark McLoughlin             snprintf(s->down_script_arg, sizeof(s->down_script_arg), "%s", ifname);
4915281d757SMark McLoughlin         }
4925281d757SMark McLoughlin     }
4935281d757SMark McLoughlin 
49482b0d80eSMichael S. Tsirkin     if (qemu_opt_get_bool(opts, "vhost", !!qemu_opt_get(opts, "vhostfd"))) {
49582b0d80eSMichael S. Tsirkin         int vhostfd, r;
49682b0d80eSMichael S. Tsirkin         if (qemu_opt_get(opts, "vhostfd")) {
49782b0d80eSMichael S. Tsirkin             r = net_handle_fd_param(mon, qemu_opt_get(opts, "vhostfd"));
49882b0d80eSMichael S. Tsirkin             if (r == -1) {
49982b0d80eSMichael S. Tsirkin                 return -1;
50082b0d80eSMichael S. Tsirkin             }
50182b0d80eSMichael S. Tsirkin             vhostfd = r;
50282b0d80eSMichael S. Tsirkin         } else {
50382b0d80eSMichael S. Tsirkin             vhostfd = -1;
50482b0d80eSMichael S. Tsirkin         }
50582b0d80eSMichael S. Tsirkin         s->vhost_net = vhost_net_init(&s->nc, vhostfd);
50682b0d80eSMichael S. Tsirkin         if (!s->vhost_net) {
50782b0d80eSMichael S. Tsirkin             error_report("vhost-net requested but could not be initialized");
50882b0d80eSMichael S. Tsirkin             return -1;
50982b0d80eSMichael S. Tsirkin         }
51082b0d80eSMichael S. Tsirkin     } else if (qemu_opt_get(opts, "vhostfd")) {
51182b0d80eSMichael S. Tsirkin         error_report("vhostfd= is not valid without vhost");
51282b0d80eSMichael S. Tsirkin         return -1;
51382b0d80eSMichael S. Tsirkin     }
51482b0d80eSMichael S. Tsirkin 
5155281d757SMark McLoughlin     return 0;
5165281d757SMark McLoughlin }
517b202554cSMichael S. Tsirkin 
518b202554cSMichael S. Tsirkin VHostNetState *tap_get_vhost_net(VLANClientState *nc)
519b202554cSMichael S. Tsirkin {
520b202554cSMichael S. Tsirkin     TAPState *s = DO_UPCAST(TAPState, nc, nc);
521b202554cSMichael S. Tsirkin     assert(nc->info->type == NET_CLIENT_TYPE_TAP);
522b202554cSMichael S. Tsirkin     return s->vhost_net;
523b202554cSMichael S. Tsirkin }
524