131638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h" 2b5ee1ea7SAsias He #include "kvm/virtio-net.h" 34f56d42cSAsias He #include "kvm/virtio.h" 44f56d42cSAsias He #include "kvm/types.h" 54f56d42cSAsias He #include "kvm/mutex.h" 64f56d42cSAsias He #include "kvm/util.h" 74f56d42cSAsias He #include "kvm/kvm.h" 82449f6e3SSasha Levin #include "kvm/irq.h" 9b5ee1ea7SAsias He #include "kvm/uip.h" 10cb83de6fSSasha Levin #include "kvm/guest_compat.h" 114f56d42cSAsias He 129ed67cdcSSasha Levin #include <linux/vhost.h> 134f56d42cSAsias He #include <linux/virtio_net.h> 144f56d42cSAsias He #include <linux/if_tun.h> 1578a2a3e2SSasha Levin #include <linux/types.h> 16c229370aSIngo Molnar 17c229370aSIngo Molnar #include <arpa/inet.h> 184f56d42cSAsias He #include <net/if.h> 19c229370aSIngo Molnar 20c229370aSIngo Molnar #include <unistd.h> 214f56d42cSAsias He #include <fcntl.h> 22c229370aSIngo Molnar 23cb7202c1SSasha Levin #include <sys/socket.h> 24c229370aSIngo Molnar #include <sys/ioctl.h> 25c229370aSIngo Molnar #include <sys/types.h> 2673b7d038SAmos Kong #include <sys/wait.h> 279ed67cdcSSasha Levin #include <sys/eventfd.h> 284f56d42cSAsias He 294059ad8bSAsias He #define VIRTIO_NET_QUEUE_SIZE 256 304f56d42cSAsias He #define VIRTIO_NET_NUM_QUEUES 2 314f56d42cSAsias He #define VIRTIO_NET_RX_QUEUE 0 324f56d42cSAsias He #define VIRTIO_NET_TX_QUEUE 1 334f56d42cSAsias He 34b4fdde6dSAsias He struct net_dev; 35b4fdde6dSAsias He 36b4fdde6dSAsias He struct net_dev_operations { 37b4fdde6dSAsias He int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev); 38b4fdde6dSAsias He int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev); 39b4fdde6dSAsias He }; 40b4fdde6dSAsias He 418626798bSAsias He struct net_dev { 424f56d42cSAsias He pthread_mutex_t mutex; 4302eca50cSAsias He struct virtio_device vdev; 449a6d73f1SSasha Levin struct list_head list; 454f56d42cSAsias He 464f56d42cSAsias He struct virt_queue vqs[VIRTIO_NET_NUM_QUEUES]; 47c229370aSIngo Molnar struct virtio_net_config config; 4878a2a3e2SSasha Levin u32 features; 494f56d42cSAsias He 50c4aa7c02SPekka Enberg pthread_t io_rx_thread; 51c229370aSIngo Molnar pthread_mutex_t io_rx_lock; 52c4aa7c02SPekka Enberg pthread_cond_t io_rx_cond; 53c4aa7c02SPekka Enberg 54c4aa7c02SPekka Enberg pthread_t io_tx_thread; 55c229370aSIngo Molnar pthread_mutex_t io_tx_lock; 56c4aa7c02SPekka Enberg pthread_cond_t io_tx_cond; 57c4aa7c02SPekka Enberg 589ed67cdcSSasha Levin int vhost_fd; 594f56d42cSAsias He int tap_fd; 604f56d42cSAsias He char tap_name[IFNAMSIZ]; 61bb1a32f1SAsias He 62bb1a32f1SAsias He int mode; 63bb1a32f1SAsias He 64b5ee1ea7SAsias He struct uip_info info; 65b4fdde6dSAsias He struct net_dev_operations *ops; 669a6d73f1SSasha Levin struct kvm *kvm; 674f56d42cSAsias He }; 684f56d42cSAsias He 699a6d73f1SSasha Levin static LIST_HEAD(ndevs); 70312c62d1SSasha Levin static int compat_id = -1; 714f56d42cSAsias He 72c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p) 734f56d42cSAsias He { 744f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 754f56d42cSAsias He struct virt_queue *vq; 7643835ac9SSasha Levin struct kvm *kvm; 779a6d73f1SSasha Levin struct net_dev *ndev = p; 783fdf659dSSasha Levin u16 out, in; 793fdf659dSSasha Levin u16 head; 804f56d42cSAsias He int len; 814f56d42cSAsias He 829a6d73f1SSasha Levin kvm = ndev->kvm; 839a6d73f1SSasha Levin vq = &ndev->vqs[VIRTIO_NET_RX_QUEUE]; 84c4aa7c02SPekka Enberg 85c4aa7c02SPekka Enberg while (1) { 869a6d73f1SSasha Levin mutex_lock(&ndev->io_rx_lock); 87c4aa7c02SPekka Enberg if (!virt_queue__available(vq)) 889a6d73f1SSasha Levin pthread_cond_wait(&ndev->io_rx_cond, &ndev->io_rx_lock); 899a6d73f1SSasha Levin mutex_unlock(&ndev->io_rx_lock); 904f56d42cSAsias He 914f56d42cSAsias He while (virt_queue__available(vq)) { 9243835ac9SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 939a6d73f1SSasha Levin len = ndev->ops->rx(iov, in, ndev); 94246c8347SAsias He virt_queue__set_used_elem(vq, head, len); 957f5ffaf5SAsias He 96c4aa7c02SPekka Enberg /* We should interrupt guest right now, otherwise latency is huge. */ 9792c1f37bSSasha Levin if (virtio_queue__should_signal(&ndev->vqs[VIRTIO_NET_RX_QUEUE])) 9802eca50cSAsias He ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, 9992c1f37bSSasha Levin VIRTIO_NET_RX_QUEUE); 1004f56d42cSAsias He } 101c4aa7c02SPekka Enberg } 102c4aa7c02SPekka Enberg 103c4aa7c02SPekka Enberg pthread_exit(NULL); 104c4aa7c02SPekka Enberg return NULL; 105c4aa7c02SPekka Enberg 106c4aa7c02SPekka Enberg } 107c4aa7c02SPekka Enberg 108c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p) 1094f56d42cSAsias He { 1104f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 1114f56d42cSAsias He struct virt_queue *vq; 11243835ac9SSasha Levin struct kvm *kvm; 1139a6d73f1SSasha Levin struct net_dev *ndev = p; 1143fdf659dSSasha Levin u16 out, in; 1153fdf659dSSasha Levin u16 head; 1164f56d42cSAsias He int len; 1174f56d42cSAsias He 1189a6d73f1SSasha Levin kvm = ndev->kvm; 1199a6d73f1SSasha Levin vq = &ndev->vqs[VIRTIO_NET_TX_QUEUE]; 120c4aa7c02SPekka Enberg 121c4aa7c02SPekka Enberg while (1) { 1229a6d73f1SSasha Levin mutex_lock(&ndev->io_tx_lock); 123c4aa7c02SPekka Enberg if (!virt_queue__available(vq)) 1249a6d73f1SSasha Levin pthread_cond_wait(&ndev->io_tx_cond, &ndev->io_tx_lock); 1259a6d73f1SSasha Levin mutex_unlock(&ndev->io_tx_lock); 1264f56d42cSAsias He 1274f56d42cSAsias He while (virt_queue__available(vq)) { 12843835ac9SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1299a6d73f1SSasha Levin len = ndev->ops->tx(iov, out, ndev); 1304f56d42cSAsias He virt_queue__set_used_elem(vq, head, len); 1314f56d42cSAsias He } 1324f56d42cSAsias He 13392c1f37bSSasha Levin if (virtio_queue__should_signal(&ndev->vqs[VIRTIO_NET_TX_QUEUE])) 13402eca50cSAsias He ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, VIRTIO_NET_TX_QUEUE); 1354f56d42cSAsias He } 1364f56d42cSAsias He 137c4aa7c02SPekka Enberg pthread_exit(NULL); 138407475bfSPekka Enberg 139c4aa7c02SPekka Enberg return NULL; 140c4aa7c02SPekka Enberg 141c4aa7c02SPekka Enberg } 142407475bfSPekka Enberg 1439a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue) 1444f56d42cSAsias He { 1459a6d73f1SSasha Levin switch (queue) { 146b5ee1ea7SAsias He case VIRTIO_NET_TX_QUEUE: 1479a6d73f1SSasha Levin mutex_lock(&ndev->io_tx_lock); 1489a6d73f1SSasha Levin pthread_cond_signal(&ndev->io_tx_cond); 1499a6d73f1SSasha Levin mutex_unlock(&ndev->io_tx_lock); 150407475bfSPekka Enberg break; 151b5ee1ea7SAsias He case VIRTIO_NET_RX_QUEUE: 1529a6d73f1SSasha Levin mutex_lock(&ndev->io_rx_lock); 1539a6d73f1SSasha Levin pthread_cond_signal(&ndev->io_rx_cond); 1549a6d73f1SSasha Levin mutex_unlock(&ndev->io_rx_lock); 155407475bfSPekka Enberg break; 156407475bfSPekka Enberg default: 1579a6d73f1SSasha Levin pr_warning("Unknown queue index %u", queue); 158c4aa7c02SPekka Enberg } 1594f56d42cSAsias He } 1604f56d42cSAsias He 1619a6d73f1SSasha Levin static bool virtio_net__tap_init(const struct virtio_net_params *params, 1629a6d73f1SSasha Levin struct net_dev *ndev) 1634f56d42cSAsias He { 164cb7202c1SSasha Levin int sock = socket(AF_INET, SOCK_STREAM, 0); 165f715177dSAsias He int pid, status, offload, hdr_len; 166cb7202c1SSasha Levin struct sockaddr_in sin = {0}; 167246c8347SAsias He struct ifreq ifr; 1684f56d42cSAsias He 169f19edd1eSSasha Levin /* Did the user already gave us the FD? */ 170f19edd1eSSasha Levin if (params->fd) { 171f19edd1eSSasha Levin ndev->tap_fd = params->fd; 172f19edd1eSSasha Levin return 1; 173f19edd1eSSasha Levin } 174f19edd1eSSasha Levin 1759a6d73f1SSasha Levin ndev->tap_fd = open("/dev/net/tun", O_RDWR); 1769a6d73f1SSasha Levin if (ndev->tap_fd < 0) { 1774542f276SCyrill Gorcunov pr_warning("Unable to open /dev/net/tun"); 1783b02f580SSasha Levin goto fail; 1793b02f580SSasha Levin } 1804f56d42cSAsias He 1814f56d42cSAsias He memset(&ifr, 0, sizeof(ifr)); 182246c8347SAsias He ifr.ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR; 1839a6d73f1SSasha Levin if (ioctl(ndev->tap_fd, TUNSETIFF, &ifr) < 0) { 1844542f276SCyrill Gorcunov pr_warning("Config tap device error. Are you root?"); 1853b02f580SSasha Levin goto fail; 1863b02f580SSasha Levin } 1874f56d42cSAsias He 1889a6d73f1SSasha Levin strncpy(ndev->tap_name, ifr.ifr_name, sizeof(ndev->tap_name)); 1894f56d42cSAsias He 1909a6d73f1SSasha Levin if (ioctl(ndev->tap_fd, TUNSETNOCSUM, 1) < 0) { 1914542f276SCyrill Gorcunov pr_warning("Config tap device TUNSETNOCSUM error"); 192246c8347SAsias He goto fail; 193246c8347SAsias He } 194246c8347SAsias He 195246c8347SAsias He hdr_len = sizeof(struct virtio_net_hdr); 1969a6d73f1SSasha Levin if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0) 1974542f276SCyrill Gorcunov pr_warning("Config tap device TUNSETVNETHDRSZ error"); 198246c8347SAsias He 199246c8347SAsias He offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO; 2009a6d73f1SSasha Levin if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) { 2014542f276SCyrill Gorcunov pr_warning("Config tap device TUNSETOFFLOAD error"); 202246c8347SAsias He goto fail; 203246c8347SAsias He } 2044f56d42cSAsias He 20573b7d038SAmos Kong if (strcmp(params->script, "none")) { 20673b7d038SAmos Kong pid = fork(); 20773b7d038SAmos Kong if (pid == 0) { 2089a6d73f1SSasha Levin execl(params->script, params->script, ndev->tap_name, NULL); 20973b7d038SAmos Kong _exit(1); 21073b7d038SAmos Kong } else { 21173b7d038SAmos Kong waitpid(pid, &status, 0); 21273b7d038SAmos Kong if (WIFEXITED(status) && WEXITSTATUS(status) != 0) { 2134542f276SCyrill Gorcunov pr_warning("Fail to setup tap by %s", params->script); 21473b7d038SAmos Kong goto fail; 21573b7d038SAmos Kong } 21673b7d038SAmos Kong } 21773b7d038SAmos Kong } else { 218cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr)); 2199a6d73f1SSasha Levin strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name)); 220bdfcfca6SSasha Levin sin.sin_addr.s_addr = inet_addr(params->host_ip); 221cb7202c1SSasha Levin memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr)); 222cb7202c1SSasha Levin ifr.ifr_addr.sa_family = AF_INET; 2233b02f580SSasha Levin if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) { 2244542f276SCyrill Gorcunov pr_warning("Could not set ip address on tap device"); 2253b02f580SSasha Levin goto fail; 2263b02f580SSasha Levin } 22773b7d038SAmos Kong } 228cb7202c1SSasha Levin 229cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr)); 2309a6d73f1SSasha Levin strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name)); 231cb7202c1SSasha Levin ioctl(sock, SIOCGIFFLAGS, &ifr); 232cb7202c1SSasha Levin ifr.ifr_flags |= IFF_UP | IFF_RUNNING; 233cb7202c1SSasha Levin if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0) 2344542f276SCyrill Gorcunov pr_warning("Could not bring tap device up"); 235cb7202c1SSasha Levin 236cb7202c1SSasha Levin close(sock); 2373b02f580SSasha Levin 2383b02f580SSasha Levin return 1; 2393b02f580SSasha Levin 2403b02f580SSasha Levin fail: 2413b02f580SSasha Levin if (sock >= 0) 2423b02f580SSasha Levin close(sock); 2439a6d73f1SSasha Levin if (ndev->tap_fd >= 0) 2449a6d73f1SSasha Levin close(ndev->tap_fd); 2453b02f580SSasha Levin 2463b02f580SSasha Levin return 0; 2474f56d42cSAsias He } 2484f56d42cSAsias He 2499a6d73f1SSasha Levin static void virtio_net__io_thread_init(struct kvm *kvm, struct net_dev *ndev) 250c4aa7c02SPekka Enberg { 25106e5512fSAsias He pthread_mutex_init(&ndev->io_tx_lock, NULL); 2529a6d73f1SSasha Levin pthread_mutex_init(&ndev->io_rx_lock, NULL); 253c4aa7c02SPekka Enberg 2549a6d73f1SSasha Levin pthread_cond_init(&ndev->io_tx_cond, NULL); 25506e5512fSAsias He pthread_cond_init(&ndev->io_rx_cond, NULL); 256c4aa7c02SPekka Enberg 2579a6d73f1SSasha Levin pthread_create(&ndev->io_tx_thread, NULL, virtio_net_tx_thread, ndev); 25806e5512fSAsias He pthread_create(&ndev->io_rx_thread, NULL, virtio_net_rx_thread, ndev); 259c4aa7c02SPekka Enberg } 260c4aa7c02SPekka Enberg 261b4fdde6dSAsias He static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev) 262b4fdde6dSAsias He { 263b4fdde6dSAsias He return writev(ndev->tap_fd, iov, out); 264b4fdde6dSAsias He } 265b4fdde6dSAsias He 266b4fdde6dSAsias He static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev) 267b4fdde6dSAsias He { 268b4fdde6dSAsias He return readv(ndev->tap_fd, iov, in); 269b4fdde6dSAsias He } 270b4fdde6dSAsias He 271b4fdde6dSAsias He static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev) 272b4fdde6dSAsias He { 273b4fdde6dSAsias He return uip_tx(iov, out, &ndev->info); 274b4fdde6dSAsias He } 275b4fdde6dSAsias He 276b4fdde6dSAsias He static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev) 277b4fdde6dSAsias He { 278b4fdde6dSAsias He return uip_rx(iov, in, &ndev->info); 279b4fdde6dSAsias He } 280b4fdde6dSAsias He 281b4fdde6dSAsias He static struct net_dev_operations tap_ops = { 282b4fdde6dSAsias He .rx = tap_ops_rx, 283b4fdde6dSAsias He .tx = tap_ops_tx, 284b4fdde6dSAsias He }; 285b4fdde6dSAsias He 286b4fdde6dSAsias He static struct net_dev_operations uip_ops = { 287b4fdde6dSAsias He .rx = uip_ops_rx, 288b4fdde6dSAsias He .tx = uip_ops_tx, 289b4fdde6dSAsias He }; 290b4fdde6dSAsias He 291c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev) 29278a2a3e2SSasha Levin { 29378a2a3e2SSasha Levin struct net_dev *ndev = dev; 29478a2a3e2SSasha Levin 295c5ae742bSSasha Levin return ((u8 *)(&ndev->config)); 29678a2a3e2SSasha Levin } 29778a2a3e2SSasha Levin 29878a2a3e2SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev) 29978a2a3e2SSasha Levin { 30078a2a3e2SSasha Levin return 1UL << VIRTIO_NET_F_MAC 30178a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_CSUM 30278a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_UFO 30378a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO4 30478a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO6 30578a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_GUEST_UFO 30678a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO4 30792c1f37bSSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO6 308754c8ce3SSasha Levin | 1UL << VIRTIO_RING_F_EVENT_IDX 309754c8ce3SSasha Levin | 1UL << VIRTIO_RING_F_INDIRECT_DESC; 31078a2a3e2SSasha Levin } 31178a2a3e2SSasha Levin 31278a2a3e2SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features) 31378a2a3e2SSasha Levin { 31478a2a3e2SSasha Levin struct net_dev *ndev = dev; 31578a2a3e2SSasha Levin 31678a2a3e2SSasha Levin ndev->features = features; 31778a2a3e2SSasha Levin } 31878a2a3e2SSasha Levin 31978a2a3e2SSasha Levin static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 pfn) 32078a2a3e2SSasha Levin { 3219ed67cdcSSasha Levin struct vhost_vring_state state = { .index = vq }; 3229ed67cdcSSasha Levin struct vhost_vring_addr addr; 32378a2a3e2SSasha Levin struct net_dev *ndev = dev; 32478a2a3e2SSasha Levin struct virt_queue *queue; 32578a2a3e2SSasha Levin void *p; 3269ed67cdcSSasha Levin int r; 32778a2a3e2SSasha Levin 328312c62d1SSasha Levin compat__remove_message(compat_id); 32978a2a3e2SSasha Levin 33078a2a3e2SSasha Levin queue = &ndev->vqs[vq]; 33178a2a3e2SSasha Levin queue->pfn = pfn; 33278a2a3e2SSasha Levin p = guest_pfn_to_host(kvm, queue->pfn); 33378a2a3e2SSasha Levin 3340f4f51a8SAsias He /* FIXME: respect pci and mmio vring alignment */ 33578a2a3e2SSasha Levin vring_init(&queue->vring, VIRTIO_NET_QUEUE_SIZE, p, VIRTIO_PCI_VRING_ALIGN); 33678a2a3e2SSasha Levin 3379ed67cdcSSasha Levin if (ndev->vhost_fd == 0) 33878a2a3e2SSasha Levin return 0; 3399ed67cdcSSasha Levin 3409ed67cdcSSasha Levin state.num = queue->vring.num; 3419ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_NUM, &state); 3429ed67cdcSSasha Levin if (r < 0) 3439ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_NUM failed"); 3449ed67cdcSSasha Levin state.num = 0; 3459ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_BASE, &state); 3469ed67cdcSSasha Levin if (r < 0) 3479ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_BASE failed"); 3489ed67cdcSSasha Levin 3499ed67cdcSSasha Levin addr = (struct vhost_vring_addr) { 3509ed67cdcSSasha Levin .index = vq, 3519ed67cdcSSasha Levin .desc_user_addr = (u64)(unsigned long)queue->vring.desc, 3529ed67cdcSSasha Levin .avail_user_addr = (u64)(unsigned long)queue->vring.avail, 3539ed67cdcSSasha Levin .used_user_addr = (u64)(unsigned long)queue->vring.used, 3549ed67cdcSSasha Levin }; 3559ed67cdcSSasha Levin 3569ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_ADDR, &addr); 3579ed67cdcSSasha Levin if (r < 0) 3589ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_ADDR failed"); 3599ed67cdcSSasha Levin 3609ed67cdcSSasha Levin return 0; 3619ed67cdcSSasha Levin } 3629ed67cdcSSasha Levin 3639ed67cdcSSasha Levin static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi) 3649ed67cdcSSasha Levin { 3659ed67cdcSSasha Levin struct net_dev *ndev = dev; 3669ed67cdcSSasha Levin struct kvm_irqfd irq; 3679ed67cdcSSasha Levin struct vhost_vring_file file; 3689ed67cdcSSasha Levin int r; 3699ed67cdcSSasha Levin 3709ed67cdcSSasha Levin if (ndev->vhost_fd == 0) 3719ed67cdcSSasha Levin return; 3729ed67cdcSSasha Levin 3739ed67cdcSSasha Levin irq = (struct kvm_irqfd) { 3749ed67cdcSSasha Levin .gsi = gsi, 3759ed67cdcSSasha Levin .fd = eventfd(0, 0), 3769ed67cdcSSasha Levin }; 3779ed67cdcSSasha Levin file = (struct vhost_vring_file) { 3789ed67cdcSSasha Levin .index = vq, 3799ed67cdcSSasha Levin .fd = irq.fd, 3809ed67cdcSSasha Levin }; 3819ed67cdcSSasha Levin 3829ed67cdcSSasha Levin r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq); 3839ed67cdcSSasha Levin if (r < 0) 3849ed67cdcSSasha Levin die_perror("KVM_IRQFD failed"); 3859ed67cdcSSasha Levin 3869ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_CALL, &file); 3879ed67cdcSSasha Levin if (r < 0) 3889ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_CALL failed"); 3899ed67cdcSSasha Levin file.fd = ndev->tap_fd; 3909ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file); 3919ed67cdcSSasha Levin if (r != 0) 3929ed67cdcSSasha Levin die("VHOST_NET_SET_BACKEND failed %d", errno); 3939ed67cdcSSasha Levin 3949ed67cdcSSasha Levin } 3959ed67cdcSSasha Levin 3969ed67cdcSSasha Levin static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd) 3979ed67cdcSSasha Levin { 3989ed67cdcSSasha Levin struct net_dev *ndev = dev; 3999ed67cdcSSasha Levin struct vhost_vring_file file = { 4009ed67cdcSSasha Levin .index = vq, 4019ed67cdcSSasha Levin .fd = efd, 4029ed67cdcSSasha Levin }; 4039ed67cdcSSasha Levin int r; 4049ed67cdcSSasha Levin 4059ed67cdcSSasha Levin if (ndev->vhost_fd == 0) 4069ed67cdcSSasha Levin return; 4079ed67cdcSSasha Levin 4089ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_KICK, &file); 4099ed67cdcSSasha Levin if (r < 0) 4109ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_KICK failed"); 41178a2a3e2SSasha Levin } 41278a2a3e2SSasha Levin 41378a2a3e2SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 41478a2a3e2SSasha Levin { 4159a6d73f1SSasha Levin struct net_dev *ndev = dev; 4169a6d73f1SSasha Levin 4179a6d73f1SSasha Levin virtio_net_handle_callback(kvm, ndev, vq); 41878a2a3e2SSasha Levin 41978a2a3e2SSasha Levin return 0; 42078a2a3e2SSasha Levin } 42178a2a3e2SSasha Levin 42278a2a3e2SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq) 42378a2a3e2SSasha Levin { 42478a2a3e2SSasha Levin struct net_dev *ndev = dev; 42578a2a3e2SSasha Levin 42678a2a3e2SSasha Levin return ndev->vqs[vq].pfn; 42778a2a3e2SSasha Levin } 42878a2a3e2SSasha Levin 42978a2a3e2SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 43078a2a3e2SSasha Levin { 4310f4f51a8SAsias He /* FIXME: dynamic */ 43278a2a3e2SSasha Levin return VIRTIO_NET_QUEUE_SIZE; 43378a2a3e2SSasha Levin } 43478a2a3e2SSasha Levin 4350f4f51a8SAsias He static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size) 4360f4f51a8SAsias He { 4370f4f51a8SAsias He /* FIXME: dynamic */ 4380f4f51a8SAsias He return size; 4390f4f51a8SAsias He } 4400f4f51a8SAsias He 4411c47ce69SSasha Levin static struct virtio_ops net_dev_virtio_ops = (struct virtio_ops) { 4421c47ce69SSasha Levin .get_config = get_config, 4431c47ce69SSasha Levin .get_host_features = get_host_features, 4441c47ce69SSasha Levin .set_guest_features = set_guest_features, 4451c47ce69SSasha Levin .init_vq = init_vq, 4461c47ce69SSasha Levin .get_pfn_vq = get_pfn_vq, 4471c47ce69SSasha Levin .get_size_vq = get_size_vq, 4480f4f51a8SAsias He .set_size_vq = set_size_vq, 4490f4f51a8SAsias He .notify_vq = notify_vq, 4509ed67cdcSSasha Levin .notify_vq_gsi = notify_vq_gsi, 4519ed67cdcSSasha Levin .notify_vq_eventfd = notify_vq_eventfd, 4521c47ce69SSasha Levin }; 4531c47ce69SSasha Levin 4549ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev) 4559ed67cdcSSasha Levin { 45692c1f37bSSasha Levin u64 features = 1UL << VIRTIO_RING_F_EVENT_IDX; 4579ed67cdcSSasha Levin struct vhost_memory *mem; 4589ed67cdcSSasha Levin int r; 4599ed67cdcSSasha Levin 4609ed67cdcSSasha Levin ndev->vhost_fd = open("/dev/vhost-net", O_RDWR); 4619ed67cdcSSasha Levin if (ndev->vhost_fd < 0) 4629ed67cdcSSasha Levin die_perror("Failed openning vhost-net device"); 4639ed67cdcSSasha Levin 4648b795457SAsias He mem = calloc(1, sizeof(*mem) + sizeof(struct vhost_memory_region)); 4659ed67cdcSSasha Levin if (mem == NULL) 4669ed67cdcSSasha Levin die("Failed allocating memory for vhost memory map"); 4679ed67cdcSSasha Levin 4689ed67cdcSSasha Levin mem->nregions = 1; 4699ed67cdcSSasha Levin mem->regions[0] = (struct vhost_memory_region) { 4709ed67cdcSSasha Levin .guest_phys_addr = 0, 4719ed67cdcSSasha Levin .memory_size = kvm->ram_size, 472b4108023SAsias He .userspace_addr = (unsigned long)kvm->ram_start, 4739ed67cdcSSasha Levin }; 4749ed67cdcSSasha Levin 4759ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_OWNER); 4769ed67cdcSSasha Levin if (r != 0) 4779ed67cdcSSasha Levin die_perror("VHOST_SET_OWNER failed"); 4789ed67cdcSSasha Levin 4799ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_FEATURES, &features); 4809ed67cdcSSasha Levin if (r != 0) 4819ed67cdcSSasha Levin die_perror("VHOST_SET_FEATURES failed"); 4829ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_MEM_TABLE, mem); 4839ed67cdcSSasha Levin if (r != 0) 4849ed67cdcSSasha Levin die_perror("VHOST_SET_MEM_TABLE failed"); 485627d6874SAsias He 486627d6874SAsias He ndev->vdev.use_vhost = true; 487627d6874SAsias He 4889ed67cdcSSasha Levin free(mem); 4899ed67cdcSSasha Levin } 4909ed67cdcSSasha Levin 4915f225124SSasha Levin static inline void str_to_mac(const char *str, char *mac) 4925f225124SSasha Levin { 4935f225124SSasha Levin sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx", 4945f225124SSasha Levin mac, mac+1, mac+2, mac+3, mac+4, mac+5); 4955f225124SSasha Levin } 496*4346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p, 497*4346fd8fSSasha Levin const char *param, const char *val) 4985f225124SSasha Levin { 4995f225124SSasha Levin if (strcmp(param, "guest_mac") == 0) { 5005f225124SSasha Levin str_to_mac(val, p->guest_mac); 5015f225124SSasha Levin } else if (strcmp(param, "mode") == 0) { 5025f225124SSasha Levin if (!strncmp(val, "user", 4)) { 5035f225124SSasha Levin int i; 5045f225124SSasha Levin 5055f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) 5065f225124SSasha Levin if (kvm->cfg.net_params[i].mode == NET_MODE_USER) 5075f225124SSasha Levin die("Only one usermode network device allowed at a time"); 5085f225124SSasha Levin p->mode = NET_MODE_USER; 5095f225124SSasha Levin } else if (!strncmp(val, "tap", 3)) { 5105f225124SSasha Levin p->mode = NET_MODE_TAP; 5115f225124SSasha Levin } else if (!strncmp(val, "none", 4)) { 5125f225124SSasha Levin kvm->cfg.no_net = 1; 5135f225124SSasha Levin return -1; 5145f225124SSasha Levin } else 5155f225124SSasha Levin die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network); 5165f225124SSasha Levin } else if (strcmp(param, "script") == 0) { 5175f225124SSasha Levin p->script = strdup(val); 5185f225124SSasha Levin } else if (strcmp(param, "guest_ip") == 0) { 5195f225124SSasha Levin p->guest_ip = strdup(val); 5205f225124SSasha Levin } else if (strcmp(param, "host_ip") == 0) { 5215f225124SSasha Levin p->host_ip = strdup(val); 5225f225124SSasha Levin } else if (strcmp(param, "trans") == 0) { 5235f225124SSasha Levin p->trans = strdup(val); 5245f225124SSasha Levin } else if (strcmp(param, "vhost") == 0) { 5255f225124SSasha Levin p->vhost = atoi(val); 5265f225124SSasha Levin } else if (strcmp(param, "fd") == 0) { 5275f225124SSasha Levin p->fd = atoi(val); 5285f225124SSasha Levin } else 5295f225124SSasha Levin die("Unknown network parameter %s", param); 5305f225124SSasha Levin 5315f225124SSasha Levin return 0; 5325f225124SSasha Levin } 5335f225124SSasha Levin 5345f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset) 5355f225124SSasha Levin { 5365f225124SSasha Levin struct virtio_net_params p; 5375f225124SSasha Levin char *buf = NULL, *cmd = NULL, *cur = NULL; 5385f225124SSasha Levin bool on_cmd = true; 5395f225124SSasha Levin struct kvm *kvm = opt->ptr; 5405f225124SSasha Levin 5415f225124SSasha Levin if (arg) { 5425f225124SSasha Levin buf = strdup(arg); 5435f225124SSasha Levin if (buf == NULL) 5445f225124SSasha Levin die("Failed allocating new net buffer"); 5455f225124SSasha Levin cur = strtok(buf, ",="); 5465f225124SSasha Levin } 5475f225124SSasha Levin 5485f225124SSasha Levin p = (struct virtio_net_params) { 5495f225124SSasha Levin .guest_ip = DEFAULT_GUEST_ADDR, 5505f225124SSasha Levin .host_ip = DEFAULT_HOST_ADDR, 5515f225124SSasha Levin .script = DEFAULT_SCRIPT, 5525f225124SSasha Levin .mode = NET_MODE_TAP, 5535f225124SSasha Levin }; 5545f225124SSasha Levin 5555f225124SSasha Levin str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac); 5565f225124SSasha Levin p.guest_mac[5] += kvm->cfg.num_net_devices; 5575f225124SSasha Levin 5585f225124SSasha Levin while (cur) { 5595f225124SSasha Levin if (on_cmd) { 5605f225124SSasha Levin cmd = cur; 5615f225124SSasha Levin } else { 562*4346fd8fSSasha Levin if (set_net_param(kvm, &p, cmd, cur) < 0) 5635f225124SSasha Levin goto done; 5645f225124SSasha Levin } 5655f225124SSasha Levin on_cmd = !on_cmd; 5665f225124SSasha Levin 5675f225124SSasha Levin cur = strtok(NULL, ",="); 5685f225124SSasha Levin }; 5695f225124SSasha Levin 5705f225124SSasha Levin kvm->cfg.num_net_devices++; 5715f225124SSasha Levin 5725f225124SSasha Levin kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params)); 5735f225124SSasha Levin if (kvm->cfg.net_params == NULL) 5745f225124SSasha Levin die("Failed adding new network device"); 5755f225124SSasha Levin 5765f225124SSasha Levin kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p; 5775f225124SSasha Levin 5785f225124SSasha Levin done: 5795f225124SSasha Levin free(buf); 5805f225124SSasha Levin return 0; 5815f225124SSasha Levin } 5825f225124SSasha Levin 5835f225124SSasha Levin static int virtio_net__init_one(struct virtio_net_params *params) 5844f56d42cSAsias He { 585b5ee1ea7SAsias He int i; 5869a6d73f1SSasha Levin struct net_dev *ndev; 5879a6d73f1SSasha Levin 5889a6d73f1SSasha Levin ndev = calloc(1, sizeof(struct net_dev)); 5899a6d73f1SSasha Levin if (ndev == NULL) 5905f225124SSasha Levin return -ENOMEM; 5919a6d73f1SSasha Levin 5929a6d73f1SSasha Levin list_add_tail(&ndev->list, &ndevs); 5939a6d73f1SSasha Levin 5949a6d73f1SSasha Levin ndev->kvm = params->kvm; 5959a6d73f1SSasha Levin 5969a6d73f1SSasha Levin mutex_init(&ndev->mutex); 5979a6d73f1SSasha Levin ndev->config.status = VIRTIO_NET_S_LINK_UP; 5982449f6e3SSasha Levin 5990c54698eSAsias He for (i = 0 ; i < 6 ; i++) { 6009a6d73f1SSasha Levin ndev->config.mac[i] = params->guest_mac[i]; 6019a6d73f1SSasha Levin ndev->info.guest_mac.addr[i] = params->guest_mac[i]; 6029a6d73f1SSasha Levin ndev->info.host_mac.addr[i] = params->host_mac[i]; 6030c54698eSAsias He } 604f715177dSAsias He 6059a6d73f1SSasha Levin ndev->mode = params->mode; 6069a6d73f1SSasha Levin if (ndev->mode == NET_MODE_TAP) { 6079a6d73f1SSasha Levin if (!virtio_net__tap_init(params, ndev)) 608db051127SMichael Ellerman die_perror("You have requested a TAP device, but creation of one has failed because"); 6099a6d73f1SSasha Levin ndev->ops = &tap_ops; 610b4fdde6dSAsias He } else { 6119a6d73f1SSasha Levin ndev->info.host_ip = ntohl(inet_addr(params->host_ip)); 6129a6d73f1SSasha Levin ndev->info.guest_ip = ntohl(inet_addr(params->guest_ip)); 6139a6d73f1SSasha Levin ndev->info.guest_netmask = ntohl(inet_addr("255.255.255.0")); 6149a6d73f1SSasha Levin ndev->info.buf_nr = 20, 6159a6d73f1SSasha Levin uip_init(&ndev->info); 6169a6d73f1SSasha Levin ndev->ops = &uip_ops; 617b4fdde6dSAsias He } 618b5ee1ea7SAsias He 61969205aa1SAsias He if (params->trans && strcmp(params->trans, "mmio") == 0) 620*4346fd8fSSasha Levin virtio_init(params->kvm, ndev, &ndev->vdev, &net_dev_virtio_ops, 62169205aa1SAsias He VIRTIO_MMIO, PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET); 62269205aa1SAsias He else 623*4346fd8fSSasha Levin virtio_init(params->kvm, ndev, &ndev->vdev, &net_dev_virtio_ops, 62402eca50cSAsias He VIRTIO_PCI, PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET); 62527ab67f5SSasha Levin 6269ed67cdcSSasha Levin if (params->vhost) 6279ed67cdcSSasha Levin virtio_net__vhost_init(params->kvm, ndev); 6289ed67cdcSSasha Levin else 6299a6d73f1SSasha Levin virtio_net__io_thread_init(params->kvm, ndev); 630cb83de6fSSasha Levin 631d278197dSAsias He if (compat_id == -1) 63252f34d2cSAsias He compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET"); 6335f225124SSasha Levin 6345f225124SSasha Levin return 0; 6355f225124SSasha Levin } 6365f225124SSasha Levin 6375f225124SSasha Levin int virtio_net__init(struct kvm *kvm) 6385f225124SSasha Levin { 6395f225124SSasha Levin int i; 6405f225124SSasha Levin 6415f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) { 6425f225124SSasha Levin kvm->cfg.net_params[i].kvm = kvm; 6435f225124SSasha Levin virtio_net__init_one(&kvm->cfg.net_params[i]); 6445f225124SSasha Levin } 6455f225124SSasha Levin 6465f225124SSasha Levin if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) { 6475f225124SSasha Levin struct virtio_net_params net_params; 6485f225124SSasha Levin 6495f225124SSasha Levin net_params = (struct virtio_net_params) { 6505f225124SSasha Levin .guest_ip = kvm->cfg.guest_ip, 6515f225124SSasha Levin .host_ip = kvm->cfg.host_ip, 6525f225124SSasha Levin .kvm = kvm, 6535f225124SSasha Levin .script = kvm->cfg.script, 6545f225124SSasha Levin .mode = NET_MODE_USER, 6555f225124SSasha Levin }; 6565f225124SSasha Levin str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac); 6575f225124SSasha Levin str_to_mac(kvm->cfg.host_mac, net_params.host_mac); 6585f225124SSasha Levin 6595f225124SSasha Levin virtio_net__init_one(&net_params); 6605f225124SSasha Levin } 6615f225124SSasha Levin 6625f225124SSasha Levin return 0; 6635f225124SSasha Levin } 66449a8afd1SSasha Levin virtio_dev_init(virtio_net__init); 6655f225124SSasha Levin 6665f225124SSasha Levin int virtio_net__exit(struct kvm *kvm) 6675f225124SSasha Levin { 6685f225124SSasha Levin return 0; 6694f56d42cSAsias He } 67049a8afd1SSasha Levin virtio_dev_exit(virtio_net__exit); 671