131638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h" 2b5ee1ea7SAsias He #include "kvm/virtio-net.h" 34f56d42cSAsias He #include "kvm/virtio.h" 44f56d42cSAsias He #include "kvm/mutex.h" 54f56d42cSAsias He #include "kvm/util.h" 64f56d42cSAsias He #include "kvm/kvm.h" 72449f6e3SSasha Levin #include "kvm/irq.h" 8b5ee1ea7SAsias He #include "kvm/uip.h" 9cb83de6fSSasha Levin #include "kvm/guest_compat.h" 107668c3a6SSasha Levin #include "kvm/iovec.h" 114f56d42cSAsias He 129ed67cdcSSasha Levin #include <linux/vhost.h> 134f56d42cSAsias He #include <linux/virtio_net.h> 144f56d42cSAsias He #include <linux/if_tun.h> 1578a2a3e2SSasha Levin #include <linux/types.h> 16c229370aSIngo Molnar 17c229370aSIngo Molnar #include <arpa/inet.h> 184f56d42cSAsias He #include <net/if.h> 19c229370aSIngo Molnar 20c229370aSIngo Molnar #include <unistd.h> 214f56d42cSAsias He #include <fcntl.h> 22c229370aSIngo Molnar 23cb7202c1SSasha Levin #include <sys/socket.h> 24c229370aSIngo Molnar #include <sys/ioctl.h> 25c229370aSIngo Molnar #include <sys/types.h> 2673b7d038SAmos Kong #include <sys/wait.h> 279ed67cdcSSasha Levin #include <sys/eventfd.h> 284f56d42cSAsias He 294059ad8bSAsias He #define VIRTIO_NET_QUEUE_SIZE 256 306585ffb7SSasha Levin #define VIRTIO_NET_NUM_QUEUES 8 314f56d42cSAsias He 32b4fdde6dSAsias He struct net_dev; 33b4fdde6dSAsias He 34b4fdde6dSAsias He struct net_dev_operations { 35b4fdde6dSAsias He int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev); 36b4fdde6dSAsias He int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev); 37b4fdde6dSAsias He }; 38b4fdde6dSAsias He 398626798bSAsias He struct net_dev { 40d3476f7dSSasha Levin struct mutex mutex; 4102eca50cSAsias He struct virtio_device vdev; 429a6d73f1SSasha Levin struct list_head list; 434f56d42cSAsias He 446585ffb7SSasha Levin struct virt_queue vqs[VIRTIO_NET_NUM_QUEUES * 2 + 1]; 45c229370aSIngo Molnar struct virtio_net_config config; 4679052597SSasha Levin u32 features, rx_vqs, tx_vqs, queue_pairs; 474f56d42cSAsias He 486585ffb7SSasha Levin pthread_t io_thread[VIRTIO_NET_NUM_QUEUES * 2 + 1]; 496585ffb7SSasha Levin struct mutex io_lock[VIRTIO_NET_NUM_QUEUES * 2 + 1]; 506585ffb7SSasha Levin pthread_cond_t io_cond[VIRTIO_NET_NUM_QUEUES * 2 + 1]; 51c4aa7c02SPekka Enberg 529ed67cdcSSasha Levin int vhost_fd; 534f56d42cSAsias He int tap_fd; 544f56d42cSAsias He char tap_name[IFNAMSIZ]; 5559ee54ebSWei Chen bool tap_ufo; 56bb1a32f1SAsias He 57bb1a32f1SAsias He int mode; 58bb1a32f1SAsias He 59b5ee1ea7SAsias He struct uip_info info; 60b4fdde6dSAsias He struct net_dev_operations *ops; 619a6d73f1SSasha Levin struct kvm *kvm; 628c0ae74dSSasha Levin 638c0ae74dSSasha Levin struct virtio_net_params *params; 644f56d42cSAsias He }; 654f56d42cSAsias He 669a6d73f1SSasha Levin static LIST_HEAD(ndevs); 67312c62d1SSasha Levin static int compat_id = -1; 684f56d42cSAsias He 697668c3a6SSasha Levin #define MAX_PACKET_SIZE 65550 707668c3a6SSasha Levin 717668c3a6SSasha Levin static bool has_virtio_feature(struct net_dev *ndev, u32 feature) 727668c3a6SSasha Levin { 737668c3a6SSasha Levin return ndev->features & (1 << feature); 747668c3a6SSasha Levin } 757668c3a6SSasha Levin 768ed60bbeSMarc Zyngier static void virtio_net_fix_tx_hdr(struct virtio_net_hdr *hdr, struct net_dev *ndev) 778ed60bbeSMarc Zyngier { 788ed60bbeSMarc Zyngier hdr->hdr_len = virtio_guest_to_host_u16(&ndev->vdev, hdr->hdr_len); 798ed60bbeSMarc Zyngier hdr->gso_size = virtio_guest_to_host_u16(&ndev->vdev, hdr->gso_size); 808ed60bbeSMarc Zyngier hdr->csum_start = virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_start); 818ed60bbeSMarc Zyngier hdr->csum_offset = virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_offset); 828ed60bbeSMarc Zyngier } 838ed60bbeSMarc Zyngier 843fea89a9SWill Deacon static void virtio_net_fix_rx_hdr(struct virtio_net_hdr *hdr, struct net_dev *ndev) 858ed60bbeSMarc Zyngier { 863fea89a9SWill Deacon hdr->hdr_len = virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr_len); 873fea89a9SWill Deacon hdr->gso_size = virtio_host_to_guest_u16(&ndev->vdev, hdr->gso_size); 883fea89a9SWill Deacon hdr->csum_start = virtio_host_to_guest_u16(&ndev->vdev, hdr->csum_start); 893fea89a9SWill Deacon hdr->csum_offset = virtio_host_to_guest_u16(&ndev->vdev, hdr->csum_offset); 908ed60bbeSMarc Zyngier } 918ed60bbeSMarc Zyngier 92c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p) 934f56d42cSAsias He { 944f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 954f56d42cSAsias He struct virt_queue *vq; 9643835ac9SSasha Levin struct kvm *kvm; 979a6d73f1SSasha Levin struct net_dev *ndev = p; 983fdf659dSSasha Levin u16 out, in; 993fdf659dSSasha Levin u16 head; 1006d6cc14bSWill Deacon int len, copied; 1016585ffb7SSasha Levin u32 id; 1026585ffb7SSasha Levin 1036585ffb7SSasha Levin mutex_lock(&ndev->mutex); 1046585ffb7SSasha Levin id = ndev->rx_vqs++ * 2; 1056585ffb7SSasha Levin mutex_unlock(&ndev->mutex); 1064f56d42cSAsias He 107a4d8c55eSSasha Levin kvm__set_thread_name("virtio-net-rx"); 108a4d8c55eSSasha Levin 1099a6d73f1SSasha Levin kvm = ndev->kvm; 1106585ffb7SSasha Levin vq = &ndev->vqs[id]; 111c4aa7c02SPekka Enberg 112c4aa7c02SPekka Enberg while (1) { 1136585ffb7SSasha Levin mutex_lock(&ndev->io_lock[id]); 114c4aa7c02SPekka Enberg if (!virt_queue__available(vq)) 1156585ffb7SSasha Levin pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex); 1166585ffb7SSasha Levin mutex_unlock(&ndev->io_lock[id]); 1174f56d42cSAsias He 1184f56d42cSAsias He while (virt_queue__available(vq)) { 1197668c3a6SSasha Levin unsigned char buffer[MAX_PACKET_SIZE + sizeof(struct virtio_net_hdr_mrg_rxbuf)]; 1207668c3a6SSasha Levin struct iovec dummy_iov = { 1217668c3a6SSasha Levin .iov_base = buffer, 1227668c3a6SSasha Levin .iov_len = sizeof(buffer), 1237668c3a6SSasha Levin }; 1247668c3a6SSasha Levin struct virtio_net_hdr_mrg_rxbuf *hdr; 1253fea89a9SWill Deacon u16 num_buffers; 1267f5ffaf5SAsias He 1277668c3a6SSasha Levin len = ndev->ops->rx(&dummy_iov, 1, ndev); 1286d6cc14bSWill Deacon if (len < 0) { 1296d6cc14bSWill Deacon pr_warning("%s: rx on vq %u failed (%d), exiting thread\n", 1306d6cc14bSWill Deacon __func__, id, len); 1316d6cc14bSWill Deacon goto out_err; 1326d6cc14bSWill Deacon } 1336d6cc14bSWill Deacon 1343fea89a9SWill Deacon copied = num_buffers = 0; 1357668c3a6SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1368ed60bbeSMarc Zyngier hdr = iov[0].iov_base; 1377668c3a6SSasha Levin while (copied < len) { 1386d6cc14bSWill Deacon size_t iovsize = min_t(size_t, len - copied, iov_size(iov, in)); 1397668c3a6SSasha Levin 140e2493047SAsias He memcpy_toiovec(iov, buffer + copied, iovsize); 1417668c3a6SSasha Levin copied += iovsize; 1423fea89a9SWill Deacon virt_queue__set_used_elem_no_update(vq, head, iovsize, num_buffers++); 1437668c3a6SSasha Levin if (copied == len) 1447668c3a6SSasha Levin break; 1457668c3a6SSasha Levin while (!virt_queue__available(vq)) 1467668c3a6SSasha Levin sleep(0); 1477668c3a6SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1487668c3a6SSasha Levin } 1493fea89a9SWill Deacon 1503fea89a9SWill Deacon virtio_net_fix_rx_hdr(&hdr->hdr, ndev); 1513fea89a9SWill Deacon if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF)) 1523fea89a9SWill Deacon hdr->num_buffers = virtio_host_to_guest_u16(vq, num_buffers); 1533fea89a9SWill Deacon 1543fea89a9SWill Deacon virt_queue__used_idx_advance(vq, num_buffers); 1553fea89a9SWill Deacon 156c4aa7c02SPekka Enberg /* We should interrupt guest right now, otherwise latency is huge. */ 1576585ffb7SSasha Levin if (virtio_queue__should_signal(vq)) 1586585ffb7SSasha Levin ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id); 1594f56d42cSAsias He } 160c4aa7c02SPekka Enberg } 161c4aa7c02SPekka Enberg 1626d6cc14bSWill Deacon out_err: 163c4aa7c02SPekka Enberg pthread_exit(NULL); 164c4aa7c02SPekka Enberg return NULL; 165c4aa7c02SPekka Enberg 166c4aa7c02SPekka Enberg } 167c4aa7c02SPekka Enberg 168c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p) 1694f56d42cSAsias He { 1704f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 1714f56d42cSAsias He struct virt_queue *vq; 17243835ac9SSasha Levin struct kvm *kvm; 1739a6d73f1SSasha Levin struct net_dev *ndev = p; 1743fdf659dSSasha Levin u16 out, in; 1753fdf659dSSasha Levin u16 head; 1764f56d42cSAsias He int len; 1776585ffb7SSasha Levin u32 id; 1786585ffb7SSasha Levin 1796585ffb7SSasha Levin mutex_lock(&ndev->mutex); 1806585ffb7SSasha Levin id = ndev->tx_vqs++ * 2 + 1; 1816585ffb7SSasha Levin mutex_unlock(&ndev->mutex); 1824f56d42cSAsias He 183a4d8c55eSSasha Levin kvm__set_thread_name("virtio-net-tx"); 184a4d8c55eSSasha Levin 1859a6d73f1SSasha Levin kvm = ndev->kvm; 1866585ffb7SSasha Levin vq = &ndev->vqs[id]; 187c4aa7c02SPekka Enberg 188c4aa7c02SPekka Enberg while (1) { 1896585ffb7SSasha Levin mutex_lock(&ndev->io_lock[id]); 190c4aa7c02SPekka Enberg if (!virt_queue__available(vq)) 1916585ffb7SSasha Levin pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex); 1926585ffb7SSasha Levin mutex_unlock(&ndev->io_lock[id]); 1934f56d42cSAsias He 1944f56d42cSAsias He while (virt_queue__available(vq)) { 1958ed60bbeSMarc Zyngier struct virtio_net_hdr *hdr; 19643835ac9SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1978ed60bbeSMarc Zyngier hdr = iov[0].iov_base; 1988ed60bbeSMarc Zyngier virtio_net_fix_tx_hdr(hdr, ndev); 1999a6d73f1SSasha Levin len = ndev->ops->tx(iov, out, ndev); 2006d6cc14bSWill Deacon if (len < 0) { 2016d6cc14bSWill Deacon pr_warning("%s: tx on vq %u failed (%d)\n", 2028ed60bbeSMarc Zyngier __func__, id, errno); 2036d6cc14bSWill Deacon goto out_err; 2046d6cc14bSWill Deacon } 2056d6cc14bSWill Deacon 2064f56d42cSAsias He virt_queue__set_used_elem(vq, head, len); 2074f56d42cSAsias He } 2084f56d42cSAsias He 2096585ffb7SSasha Levin if (virtio_queue__should_signal(vq)) 2106585ffb7SSasha Levin ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id); 2114f56d42cSAsias He } 2124f56d42cSAsias He 2136d6cc14bSWill Deacon out_err: 214c4aa7c02SPekka Enberg pthread_exit(NULL); 215c4aa7c02SPekka Enberg return NULL; 216c4aa7c02SPekka Enberg } 217407475bfSPekka Enberg 2186585ffb7SSasha Levin static virtio_net_ctrl_ack virtio_net_handle_mq(struct kvm* kvm, struct net_dev *ndev, struct virtio_net_ctrl_hdr *ctrl) 2196585ffb7SSasha Levin { 2206585ffb7SSasha Levin /* Not much to do here */ 2216585ffb7SSasha Levin return VIRTIO_NET_OK; 2226585ffb7SSasha Levin } 2236585ffb7SSasha Levin 2246585ffb7SSasha Levin static void *virtio_net_ctrl_thread(void *p) 225abd4a801SSasha Levin { 226abd4a801SSasha Levin struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 227abd4a801SSasha Levin u16 out, in, head; 2286585ffb7SSasha Levin struct net_dev *ndev = p; 2296585ffb7SSasha Levin struct kvm *kvm = ndev->kvm; 23079052597SSasha Levin u32 id = ndev->queue_pairs * 2; 2316585ffb7SSasha Levin struct virt_queue *vq = &ndev->vqs[id]; 232abd4a801SSasha Levin struct virtio_net_ctrl_hdr *ctrl; 233abd4a801SSasha Levin virtio_net_ctrl_ack *ack; 234abd4a801SSasha Levin 235edb4a8a0SSuzuki K. Poulose kvm__set_thread_name("virtio-net-ctrl"); 236edb4a8a0SSuzuki K. Poulose 2376585ffb7SSasha Levin while (1) { 2386585ffb7SSasha Levin mutex_lock(&ndev->io_lock[id]); 2396585ffb7SSasha Levin if (!virt_queue__available(vq)) 2406585ffb7SSasha Levin pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex); 2416585ffb7SSasha Levin mutex_unlock(&ndev->io_lock[id]); 2426585ffb7SSasha Levin 2436585ffb7SSasha Levin while (virt_queue__available(vq)) { 2446585ffb7SSasha Levin head = virt_queue__get_iov(&ndev->vqs[id], iov, &out, &in, kvm); 245abd4a801SSasha Levin ctrl = iov[0].iov_base; 246abd4a801SSasha Levin ack = iov[out].iov_base; 247abd4a801SSasha Levin 248abd4a801SSasha Levin switch (ctrl->class) { 2496585ffb7SSasha Levin case VIRTIO_NET_CTRL_MQ: 2506585ffb7SSasha Levin *ack = virtio_net_handle_mq(kvm, ndev, ctrl); 2516585ffb7SSasha Levin break; 252abd4a801SSasha Levin default: 253abd4a801SSasha Levin *ack = VIRTIO_NET_ERR; 254abd4a801SSasha Levin break; 255abd4a801SSasha Levin } 2566585ffb7SSasha Levin virt_queue__set_used_elem(&ndev->vqs[id], head, iov[out].iov_len); 2576585ffb7SSasha Levin } 258abd4a801SSasha Levin 2596585ffb7SSasha Levin if (virtio_queue__should_signal(&ndev->vqs[id])) 2606585ffb7SSasha Levin ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id); 2616585ffb7SSasha Levin } 262abd4a801SSasha Levin 2636585ffb7SSasha Levin pthread_exit(NULL); 264abd4a801SSasha Levin 2656585ffb7SSasha Levin return NULL; 266abd4a801SSasha Levin } 267abd4a801SSasha Levin 2689a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue) 2694f56d42cSAsias He { 27079052597SSasha Levin if ((u32)queue >= (ndev->queue_pairs * 2 + 1)) { 2719a6d73f1SSasha Levin pr_warning("Unknown queue index %u", queue); 2726585ffb7SSasha Levin return; 273c4aa7c02SPekka Enberg } 2746585ffb7SSasha Levin 2756585ffb7SSasha Levin mutex_lock(&ndev->io_lock[queue]); 2766585ffb7SSasha Levin pthread_cond_signal(&ndev->io_cond[queue]); 2776585ffb7SSasha Levin mutex_unlock(&ndev->io_lock[queue]); 2784f56d42cSAsias He } 2794f56d42cSAsias He 280d2a7ddffSMarc Zyngier static int virtio_net_request_tap(struct net_dev *ndev, struct ifreq *ifr, 281d2a7ddffSMarc Zyngier const char *tapname) 282d2a7ddffSMarc Zyngier { 283d2a7ddffSMarc Zyngier int ret; 284d2a7ddffSMarc Zyngier 285d2a7ddffSMarc Zyngier memset(ifr, 0, sizeof(*ifr)); 286d2a7ddffSMarc Zyngier ifr->ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR; 287d2a7ddffSMarc Zyngier if (tapname) 288d2a7ddffSMarc Zyngier strncpy(ifr->ifr_name, tapname, sizeof(ifr->ifr_name)); 289d2a7ddffSMarc Zyngier 290f83dc816SAndreas Herrmann ret = ioctl(ndev->tap_fd, TUNSETIFF, ifr); 291d2a7ddffSMarc Zyngier 292d2a7ddffSMarc Zyngier if (ret >= 0) 293d2a7ddffSMarc Zyngier strncpy(ndev->tap_name, ifr->ifr_name, sizeof(ndev->tap_name)); 294d2a7ddffSMarc Zyngier return ret; 295d2a7ddffSMarc Zyngier } 296d2a7ddffSMarc Zyngier 297eef27ae3SFan Du static int virtio_net_exec_script(const char* script, const char *tap_name) 298eef27ae3SFan Du { 299eef27ae3SFan Du pid_t pid; 300eef27ae3SFan Du int status; 301eef27ae3SFan Du 302eef27ae3SFan Du pid = fork(); 303eef27ae3SFan Du if (pid == 0) { 304eef27ae3SFan Du execl(script, script, tap_name, NULL); 305eef27ae3SFan Du _exit(1); 306eef27ae3SFan Du } else { 307eef27ae3SFan Du waitpid(pid, &status, 0); 308eef27ae3SFan Du if (WIFEXITED(status) && WEXITSTATUS(status) != 0) { 309eef27ae3SFan Du pr_warning("Fail to setup tap by %s", script); 310eef27ae3SFan Du return -1; 311eef27ae3SFan Du } 312eef27ae3SFan Du } 313eef27ae3SFan Du return 0; 314eef27ae3SFan Du } 315eef27ae3SFan Du 3168c0ae74dSSasha Levin static bool virtio_net__tap_init(struct net_dev *ndev) 3174f56d42cSAsias He { 318cb7202c1SSasha Levin int sock = socket(AF_INET, SOCK_STREAM, 0); 31959ee54ebSWei Chen int hdr_len; 320cb7202c1SSasha Levin struct sockaddr_in sin = {0}; 321246c8347SAsias He struct ifreq ifr; 3228c0ae74dSSasha Levin const struct virtio_net_params *params = ndev->params; 3231dfc7c24SMarc Zyngier bool skipconf = !!params->tapif; 3244f56d42cSAsias He 3257668c3a6SSasha Levin hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ? 32648c6b47aSSasha Levin sizeof(struct virtio_net_hdr_mrg_rxbuf) : 32748c6b47aSSasha Levin sizeof(struct virtio_net_hdr); 3289a6d73f1SSasha Levin if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0) 3294542f276SCyrill Gorcunov pr_warning("Config tap device TUNSETVNETHDRSZ error"); 330246c8347SAsias He 33173b7d038SAmos Kong if (strcmp(params->script, "none")) { 332eef27ae3SFan Du if (virtio_net_exec_script(params->script, ndev->tap_name) < 0) 33373b7d038SAmos Kong goto fail; 3341dfc7c24SMarc Zyngier } else if (!skipconf) { 335cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr)); 3369a6d73f1SSasha Levin strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name)); 337bdfcfca6SSasha Levin sin.sin_addr.s_addr = inet_addr(params->host_ip); 338cb7202c1SSasha Levin memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr)); 339cb7202c1SSasha Levin ifr.ifr_addr.sa_family = AF_INET; 3403b02f580SSasha Levin if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) { 3414542f276SCyrill Gorcunov pr_warning("Could not set ip address on tap device"); 3423b02f580SSasha Levin goto fail; 3433b02f580SSasha Levin } 34473b7d038SAmos Kong } 345cb7202c1SSasha Levin 3461dfc7c24SMarc Zyngier if (!skipconf) { 347cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr)); 3489a6d73f1SSasha Levin strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name)); 349cb7202c1SSasha Levin ioctl(sock, SIOCGIFFLAGS, &ifr); 350cb7202c1SSasha Levin ifr.ifr_flags |= IFF_UP | IFF_RUNNING; 351cb7202c1SSasha Levin if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0) 3524542f276SCyrill Gorcunov pr_warning("Could not bring tap device up"); 3531dfc7c24SMarc Zyngier } 354cb7202c1SSasha Levin 355cb7202c1SSasha Levin close(sock); 3563b02f580SSasha Levin 3573b02f580SSasha Levin return 1; 3583b02f580SSasha Levin 3593b02f580SSasha Levin fail: 3603b02f580SSasha Levin if (sock >= 0) 3613b02f580SSasha Levin close(sock); 3629a6d73f1SSasha Levin if (ndev->tap_fd >= 0) 3639a6d73f1SSasha Levin close(ndev->tap_fd); 3643b02f580SSasha Levin 3653b02f580SSasha Levin return 0; 3664f56d42cSAsias He } 3674f56d42cSAsias He 36859ee54ebSWei Chen static bool virtio_net__tap_create(struct net_dev *ndev) 36959ee54ebSWei Chen { 37059ee54ebSWei Chen int offload; 37159ee54ebSWei Chen struct ifreq ifr; 37259ee54ebSWei Chen const struct virtio_net_params *params = ndev->params; 37359ee54ebSWei Chen bool macvtap = (!!params->tapif) && (params->tapif[0] == '/'); 37459ee54ebSWei Chen 37559ee54ebSWei Chen /* Did the user already gave us the FD? */ 37659ee54ebSWei Chen if (params->fd) 37759ee54ebSWei Chen ndev->tap_fd = params->fd; 37859ee54ebSWei Chen else { 37959ee54ebSWei Chen const char *tap_file = "/dev/net/tun"; 38059ee54ebSWei Chen 38159ee54ebSWei Chen /* Did the user ask us to use macvtap? */ 38259ee54ebSWei Chen if (macvtap) 38359ee54ebSWei Chen tap_file = params->tapif; 38459ee54ebSWei Chen 38559ee54ebSWei Chen ndev->tap_fd = open(tap_file, O_RDWR); 38659ee54ebSWei Chen if (ndev->tap_fd < 0) { 38759ee54ebSWei Chen pr_warning("Unable to open %s", tap_file); 38859ee54ebSWei Chen return 0; 38959ee54ebSWei Chen } 39059ee54ebSWei Chen } 39159ee54ebSWei Chen 39259ee54ebSWei Chen if (!macvtap && 39359ee54ebSWei Chen virtio_net_request_tap(ndev, &ifr, params->tapif) < 0) { 39459ee54ebSWei Chen pr_warning("Config tap device error. Are you root?"); 39559ee54ebSWei Chen goto fail; 39659ee54ebSWei Chen } 39759ee54ebSWei Chen 39859ee54ebSWei Chen /* 39959ee54ebSWei Chen * The UFO support had been removed from kernel in commit: 40059ee54ebSWei Chen * ID: fb652fdfe83710da0ca13448a41b7ed027d0a984 40159ee54ebSWei Chen * https://www.spinics.net/lists/netdev/msg443562.html 40259ee54ebSWei Chen * In oder to support the older kernels without this commit, 40359ee54ebSWei Chen * we set the TUN_F_UFO to offload by default to test the status of 40459ee54ebSWei Chen * UFO kernel support. 40559ee54ebSWei Chen */ 40659ee54ebSWei Chen ndev->tap_ufo = true; 40759ee54ebSWei Chen offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO; 40859ee54ebSWei Chen if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) { 40959ee54ebSWei Chen /* 41059ee54ebSWei Chen * Is this failure caused by kernel remove the UFO support? 41159ee54ebSWei Chen * Try TUNSETOFFLOAD without TUN_F_UFO. 41259ee54ebSWei Chen */ 41359ee54ebSWei Chen offload &= ~TUN_F_UFO; 41459ee54ebSWei Chen if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) { 41559ee54ebSWei Chen pr_warning("Config tap device TUNSETOFFLOAD error"); 41659ee54ebSWei Chen goto fail; 41759ee54ebSWei Chen } 41859ee54ebSWei Chen ndev->tap_ufo = false; 41959ee54ebSWei Chen } 42059ee54ebSWei Chen 42159ee54ebSWei Chen return 1; 42259ee54ebSWei Chen 42359ee54ebSWei Chen fail: 42459ee54ebSWei Chen if ((ndev->tap_fd >= 0) || (!params->fd) ) 42559ee54ebSWei Chen close(ndev->tap_fd); 42659ee54ebSWei Chen 42759ee54ebSWei Chen return 0; 42859ee54ebSWei Chen } 42959ee54ebSWei Chen 430b4fdde6dSAsias He static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev) 431b4fdde6dSAsias He { 432b4fdde6dSAsias He return writev(ndev->tap_fd, iov, out); 433b4fdde6dSAsias He } 434b4fdde6dSAsias He 435b4fdde6dSAsias He static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev) 436b4fdde6dSAsias He { 437b4fdde6dSAsias He return readv(ndev->tap_fd, iov, in); 438b4fdde6dSAsias He } 439b4fdde6dSAsias He 440b4fdde6dSAsias He static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev) 441b4fdde6dSAsias He { 442b4fdde6dSAsias He return uip_tx(iov, out, &ndev->info); 443b4fdde6dSAsias He } 444b4fdde6dSAsias He 445b4fdde6dSAsias He static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev) 446b4fdde6dSAsias He { 447b4fdde6dSAsias He return uip_rx(iov, in, &ndev->info); 448b4fdde6dSAsias He } 449b4fdde6dSAsias He 450b4fdde6dSAsias He static struct net_dev_operations tap_ops = { 451b4fdde6dSAsias He .rx = tap_ops_rx, 452b4fdde6dSAsias He .tx = tap_ops_tx, 453b4fdde6dSAsias He }; 454b4fdde6dSAsias He 455b4fdde6dSAsias He static struct net_dev_operations uip_ops = { 456b4fdde6dSAsias He .rx = uip_ops_rx, 457b4fdde6dSAsias He .tx = uip_ops_tx, 458b4fdde6dSAsias He }; 459b4fdde6dSAsias He 460c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev) 46178a2a3e2SSasha Levin { 46278a2a3e2SSasha Levin struct net_dev *ndev = dev; 46378a2a3e2SSasha Levin 464c5ae742bSSasha Levin return ((u8 *)(&ndev->config)); 46578a2a3e2SSasha Levin } 46678a2a3e2SSasha Levin 46778a2a3e2SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev) 46878a2a3e2SSasha Levin { 46959ee54ebSWei Chen u32 features; 47079052597SSasha Levin struct net_dev *ndev = dev; 47179052597SSasha Levin 47259ee54ebSWei Chen features = 1UL << VIRTIO_NET_F_MAC 47378a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_CSUM 47478a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO4 47578a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO6 47678a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO4 47792c1f37bSSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO6 478754c8ce3SSasha Levin | 1UL << VIRTIO_RING_F_EVENT_IDX 479abd4a801SSasha Levin | 1UL << VIRTIO_RING_F_INDIRECT_DESC 4806585ffb7SSasha Levin | 1UL << VIRTIO_NET_F_CTRL_VQ 4817668c3a6SSasha Levin | 1UL << VIRTIO_NET_F_MRG_RXBUF 48279052597SSasha Levin | 1UL << (ndev->queue_pairs > 1 ? VIRTIO_NET_F_MQ : 0); 48359ee54ebSWei Chen 48459ee54ebSWei Chen /* 48559ee54ebSWei Chen * The UFO feature for host and guest only can be enabled when the 48659ee54ebSWei Chen * kernel has TAP UFO support. 48759ee54ebSWei Chen */ 48859ee54ebSWei Chen if (ndev->tap_ufo) 48959ee54ebSWei Chen features |= (1UL << VIRTIO_NET_F_HOST_UFO 49059ee54ebSWei Chen | 1UL << VIRTIO_NET_F_GUEST_UFO); 49159ee54ebSWei Chen 49259ee54ebSWei Chen return features; 49378a2a3e2SSasha Levin } 49478a2a3e2SSasha Levin 49515636d5eSYing-Shiuan Pan static int virtio_net__vhost_set_features(struct net_dev *ndev) 49615636d5eSYing-Shiuan Pan { 49715636d5eSYing-Shiuan Pan u64 features = 1UL << VIRTIO_RING_F_EVENT_IDX; 49815636d5eSYing-Shiuan Pan u64 vhost_features; 49915636d5eSYing-Shiuan Pan 50015636d5eSYing-Shiuan Pan if (ioctl(ndev->vhost_fd, VHOST_GET_FEATURES, &vhost_features) != 0) 50115636d5eSYing-Shiuan Pan die_perror("VHOST_GET_FEATURES failed"); 50215636d5eSYing-Shiuan Pan 50315636d5eSYing-Shiuan Pan /* make sure both side support mergable rx buffers */ 50415636d5eSYing-Shiuan Pan if (vhost_features & 1UL << VIRTIO_NET_F_MRG_RXBUF && 50515636d5eSYing-Shiuan Pan has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF)) 50615636d5eSYing-Shiuan Pan features |= 1UL << VIRTIO_NET_F_MRG_RXBUF; 50715636d5eSYing-Shiuan Pan 50815636d5eSYing-Shiuan Pan return ioctl(ndev->vhost_fd, VHOST_SET_FEATURES, &features); 50915636d5eSYing-Shiuan Pan } 51015636d5eSYing-Shiuan Pan 51178a2a3e2SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features) 51278a2a3e2SSasha Levin { 51378a2a3e2SSasha Levin struct net_dev *ndev = dev; 5148ed60bbeSMarc Zyngier struct virtio_net_config *conf = &ndev->config; 51578a2a3e2SSasha Levin 51678a2a3e2SSasha Levin ndev->features = features; 5178aa155c4SYing-Shiuan Pan 5188ed60bbeSMarc Zyngier conf->status = virtio_host_to_guest_u16(&ndev->vdev, conf->status); 5198ed60bbeSMarc Zyngier conf->max_virtqueue_pairs = virtio_host_to_guest_u16(&ndev->vdev, 5208ed60bbeSMarc Zyngier conf->max_virtqueue_pairs); 5218ed60bbeSMarc Zyngier 5228aa155c4SYing-Shiuan Pan if (ndev->mode == NET_MODE_TAP) { 5238aa155c4SYing-Shiuan Pan if (!virtio_net__tap_init(ndev)) 52459ee54ebSWei Chen die_perror("TAP device initialized failed because"); 52559ee54ebSWei Chen 52615636d5eSYing-Shiuan Pan if (ndev->vhost_fd && 52715636d5eSYing-Shiuan Pan virtio_net__vhost_set_features(ndev) != 0) 52815636d5eSYing-Shiuan Pan die_perror("VHOST_SET_FEATURES failed"); 5298aa155c4SYing-Shiuan Pan } else { 5308aa155c4SYing-Shiuan Pan ndev->info.vnet_hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ? 5318aa155c4SYing-Shiuan Pan sizeof(struct virtio_net_hdr_mrg_rxbuf) : 5328aa155c4SYing-Shiuan Pan sizeof(struct virtio_net_hdr); 5338aa155c4SYing-Shiuan Pan uip_init(&ndev->info); 5348aa155c4SYing-Shiuan Pan } 53578a2a3e2SSasha Levin } 53678a2a3e2SSasha Levin 5379e56ec14SSasha Levin static bool is_ctrl_vq(struct net_dev *ndev, u32 vq) 5389e56ec14SSasha Levin { 5399e56ec14SSasha Levin return vq == (u32)(ndev->queue_pairs * 2); 5409e56ec14SSasha Levin } 5419e56ec14SSasha Levin 542c59ba304SWill Deacon static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 page_size, u32 align, 543c59ba304SWill Deacon u32 pfn) 54478a2a3e2SSasha Levin { 5459ed67cdcSSasha Levin struct vhost_vring_state state = { .index = vq }; 5469ed67cdcSSasha Levin struct vhost_vring_addr addr; 54778a2a3e2SSasha Levin struct net_dev *ndev = dev; 54878a2a3e2SSasha Levin struct virt_queue *queue; 54978a2a3e2SSasha Levin void *p; 5509ed67cdcSSasha Levin int r; 55178a2a3e2SSasha Levin 552312c62d1SSasha Levin compat__remove_message(compat_id); 55378a2a3e2SSasha Levin 55478a2a3e2SSasha Levin queue = &ndev->vqs[vq]; 55578a2a3e2SSasha Levin queue->pfn = pfn; 556e7e2950aSSasha Levin p = virtio_get_vq(kvm, queue->pfn, page_size); 55778a2a3e2SSasha Levin 558c59ba304SWill Deacon vring_init(&queue->vring, VIRTIO_NET_QUEUE_SIZE, p, align); 5598ed60bbeSMarc Zyngier virtio_init_device_vq(&ndev->vdev, queue); 56078a2a3e2SSasha Levin 5616585ffb7SSasha Levin mutex_init(&ndev->io_lock[vq]); 5626585ffb7SSasha Levin pthread_cond_init(&ndev->io_cond[vq], NULL); 5639e56ec14SSasha Levin if (is_ctrl_vq(ndev, vq)) { 5646585ffb7SSasha Levin pthread_create(&ndev->io_thread[vq], NULL, virtio_net_ctrl_thread, ndev); 5659e56ec14SSasha Levin 5669e56ec14SSasha Levin return 0; 5679e56ec14SSasha Levin } else if (ndev->vhost_fd == 0 ) { 5689e56ec14SSasha Levin if (vq & 1) 5696585ffb7SSasha Levin pthread_create(&ndev->io_thread[vq], NULL, virtio_net_tx_thread, ndev); 5706585ffb7SSasha Levin else 5716585ffb7SSasha Levin pthread_create(&ndev->io_thread[vq], NULL, virtio_net_rx_thread, ndev); 5726585ffb7SSasha Levin 57378a2a3e2SSasha Levin return 0; 5746585ffb7SSasha Levin } 5759ed67cdcSSasha Levin 5768ed60bbeSMarc Zyngier if (queue->endian != VIRTIO_ENDIAN_HOST) 577b960f243SAndre Przywara die_perror("VHOST requires the same endianness in guest and host"); 5788ed60bbeSMarc Zyngier 5799ed67cdcSSasha Levin state.num = queue->vring.num; 5809ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_NUM, &state); 5819ed67cdcSSasha Levin if (r < 0) 5829ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_NUM failed"); 5839ed67cdcSSasha Levin state.num = 0; 5849ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_BASE, &state); 5859ed67cdcSSasha Levin if (r < 0) 5869ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_BASE failed"); 5879ed67cdcSSasha Levin 5889ed67cdcSSasha Levin addr = (struct vhost_vring_addr) { 5899ed67cdcSSasha Levin .index = vq, 5909ed67cdcSSasha Levin .desc_user_addr = (u64)(unsigned long)queue->vring.desc, 5919ed67cdcSSasha Levin .avail_user_addr = (u64)(unsigned long)queue->vring.avail, 5929ed67cdcSSasha Levin .used_user_addr = (u64)(unsigned long)queue->vring.used, 5939ed67cdcSSasha Levin }; 5949ed67cdcSSasha Levin 5959ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_ADDR, &addr); 5969ed67cdcSSasha Levin if (r < 0) 5979ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_ADDR failed"); 5989ed67cdcSSasha Levin 5999ed67cdcSSasha Levin return 0; 6009ed67cdcSSasha Levin } 6019ed67cdcSSasha Levin 6029ed67cdcSSasha Levin static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi) 6039ed67cdcSSasha Levin { 6049ed67cdcSSasha Levin struct net_dev *ndev = dev; 6059ed67cdcSSasha Levin struct vhost_vring_file file; 6069ed67cdcSSasha Levin int r; 6079ed67cdcSSasha Levin 6089ed67cdcSSasha Levin if (ndev->vhost_fd == 0) 6099ed67cdcSSasha Levin return; 6109ed67cdcSSasha Levin 6119ed67cdcSSasha Levin file = (struct vhost_vring_file) { 6129ed67cdcSSasha Levin .index = vq, 613*e59679d2SJean-Philippe Brucker .fd = eventfd(0, 0), 6149ed67cdcSSasha Levin }; 6159ed67cdcSSasha Levin 616*e59679d2SJean-Philippe Brucker r = irq__add_irqfd(kvm, gsi, file.fd, -1); 6179ed67cdcSSasha Levin if (r < 0) 6189ed67cdcSSasha Levin die_perror("KVM_IRQFD failed"); 6199ed67cdcSSasha Levin 6209ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_CALL, &file); 6219ed67cdcSSasha Levin if (r < 0) 6229ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_CALL failed"); 6239ed67cdcSSasha Levin file.fd = ndev->tap_fd; 6249ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file); 6259ed67cdcSSasha Levin if (r != 0) 6269ed67cdcSSasha Levin die("VHOST_NET_SET_BACKEND failed %d", errno); 6279ed67cdcSSasha Levin 6289ed67cdcSSasha Levin } 6299ed67cdcSSasha Levin 6309ed67cdcSSasha Levin static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd) 6319ed67cdcSSasha Levin { 6329ed67cdcSSasha Levin struct net_dev *ndev = dev; 6339ed67cdcSSasha Levin struct vhost_vring_file file = { 6349ed67cdcSSasha Levin .index = vq, 6359ed67cdcSSasha Levin .fd = efd, 6369ed67cdcSSasha Levin }; 6379ed67cdcSSasha Levin int r; 6389ed67cdcSSasha Levin 6399e56ec14SSasha Levin if (ndev->vhost_fd == 0 || is_ctrl_vq(ndev, vq)) 6409ed67cdcSSasha Levin return; 6419ed67cdcSSasha Levin 6429ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_KICK, &file); 6439ed67cdcSSasha Levin if (r < 0) 6449ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_KICK failed"); 64578a2a3e2SSasha Levin } 64678a2a3e2SSasha Levin 64778a2a3e2SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 64878a2a3e2SSasha Levin { 6499a6d73f1SSasha Levin struct net_dev *ndev = dev; 6509a6d73f1SSasha Levin 6519a6d73f1SSasha Levin virtio_net_handle_callback(kvm, ndev, vq); 65278a2a3e2SSasha Levin 65378a2a3e2SSasha Levin return 0; 65478a2a3e2SSasha Levin } 65578a2a3e2SSasha Levin 65678a2a3e2SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq) 65778a2a3e2SSasha Levin { 65878a2a3e2SSasha Levin struct net_dev *ndev = dev; 65978a2a3e2SSasha Levin 66078a2a3e2SSasha Levin return ndev->vqs[vq].pfn; 66178a2a3e2SSasha Levin } 66278a2a3e2SSasha Levin 66378a2a3e2SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 66478a2a3e2SSasha Levin { 6650f4f51a8SAsias He /* FIXME: dynamic */ 66678a2a3e2SSasha Levin return VIRTIO_NET_QUEUE_SIZE; 66778a2a3e2SSasha Levin } 66878a2a3e2SSasha Levin 6690f4f51a8SAsias He static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size) 6700f4f51a8SAsias He { 6710f4f51a8SAsias He /* FIXME: dynamic */ 6720f4f51a8SAsias He return size; 6730f4f51a8SAsias He } 6740f4f51a8SAsias He 67515542babSAndre Przywara static struct virtio_ops net_dev_virtio_ops = { 6761c47ce69SSasha Levin .get_config = get_config, 6771c47ce69SSasha Levin .get_host_features = get_host_features, 6781c47ce69SSasha Levin .set_guest_features = set_guest_features, 6791c47ce69SSasha Levin .init_vq = init_vq, 6801c47ce69SSasha Levin .get_pfn_vq = get_pfn_vq, 6811c47ce69SSasha Levin .get_size_vq = get_size_vq, 6820f4f51a8SAsias He .set_size_vq = set_size_vq, 6830f4f51a8SAsias He .notify_vq = notify_vq, 6849ed67cdcSSasha Levin .notify_vq_gsi = notify_vq_gsi, 6859ed67cdcSSasha Levin .notify_vq_eventfd = notify_vq_eventfd, 6861c47ce69SSasha Levin }; 6871c47ce69SSasha Levin 6889ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev) 6899ed67cdcSSasha Levin { 6907f9733c2SAndreas Herrmann struct kvm_mem_bank *bank; 6919ed67cdcSSasha Levin struct vhost_memory *mem; 6927f9733c2SAndreas Herrmann int r, i; 6939ed67cdcSSasha Levin 6949ed67cdcSSasha Levin ndev->vhost_fd = open("/dev/vhost-net", O_RDWR); 6959ed67cdcSSasha Levin if (ndev->vhost_fd < 0) 6969ed67cdcSSasha Levin die_perror("Failed openning vhost-net device"); 6979ed67cdcSSasha Levin 6987f9733c2SAndreas Herrmann mem = calloc(1, sizeof(*mem) + kvm->mem_slots * sizeof(struct vhost_memory_region)); 6999ed67cdcSSasha Levin if (mem == NULL) 7009ed67cdcSSasha Levin die("Failed allocating memory for vhost memory map"); 7019ed67cdcSSasha Levin 7027f9733c2SAndreas Herrmann i = 0; 7037f9733c2SAndreas Herrmann list_for_each_entry(bank, &kvm->mem_banks, list) { 7047f9733c2SAndreas Herrmann mem->regions[i] = (struct vhost_memory_region) { 7057f9733c2SAndreas Herrmann .guest_phys_addr = bank->guest_phys_addr, 7067f9733c2SAndreas Herrmann .memory_size = bank->size, 7077f9733c2SAndreas Herrmann .userspace_addr = (unsigned long)bank->host_addr, 7089ed67cdcSSasha Levin }; 7097f9733c2SAndreas Herrmann i++; 7107f9733c2SAndreas Herrmann } 7117f9733c2SAndreas Herrmann mem->nregions = i; 7129ed67cdcSSasha Levin 7139ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_OWNER); 7149ed67cdcSSasha Levin if (r != 0) 7159ed67cdcSSasha Levin die_perror("VHOST_SET_OWNER failed"); 7169ed67cdcSSasha Levin 7179ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_MEM_TABLE, mem); 7189ed67cdcSSasha Levin if (r != 0) 7199ed67cdcSSasha Levin die_perror("VHOST_SET_MEM_TABLE failed"); 720627d6874SAsias He 721627d6874SAsias He ndev->vdev.use_vhost = true; 722627d6874SAsias He 7239ed67cdcSSasha Levin free(mem); 7249ed67cdcSSasha Levin } 7259ed67cdcSSasha Levin 7265f225124SSasha Levin static inline void str_to_mac(const char *str, char *mac) 7275f225124SSasha Levin { 7285f225124SSasha Levin sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx", 7295f225124SSasha Levin mac, mac+1, mac+2, mac+3, mac+4, mac+5); 7305f225124SSasha Levin } 7314346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p, 7324346fd8fSSasha Levin const char *param, const char *val) 7335f225124SSasha Levin { 7345f225124SSasha Levin if (strcmp(param, "guest_mac") == 0) { 7355f225124SSasha Levin str_to_mac(val, p->guest_mac); 7365f225124SSasha Levin } else if (strcmp(param, "mode") == 0) { 7375f225124SSasha Levin if (!strncmp(val, "user", 4)) { 7385f225124SSasha Levin int i; 7395f225124SSasha Levin 7405f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) 7415f225124SSasha Levin if (kvm->cfg.net_params[i].mode == NET_MODE_USER) 7425f225124SSasha Levin die("Only one usermode network device allowed at a time"); 7435f225124SSasha Levin p->mode = NET_MODE_USER; 7445f225124SSasha Levin } else if (!strncmp(val, "tap", 3)) { 7455f225124SSasha Levin p->mode = NET_MODE_TAP; 7465f225124SSasha Levin } else if (!strncmp(val, "none", 4)) { 7475f225124SSasha Levin kvm->cfg.no_net = 1; 7485f225124SSasha Levin return -1; 7495f225124SSasha Levin } else 7505f225124SSasha Levin die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network); 7515f225124SSasha Levin } else if (strcmp(param, "script") == 0) { 7525f225124SSasha Levin p->script = strdup(val); 753eef27ae3SFan Du } else if (strcmp(param, "downscript") == 0) { 754eef27ae3SFan Du p->downscript = strdup(val); 7555f225124SSasha Levin } else if (strcmp(param, "guest_ip") == 0) { 7565f225124SSasha Levin p->guest_ip = strdup(val); 7575f225124SSasha Levin } else if (strcmp(param, "host_ip") == 0) { 7585f225124SSasha Levin p->host_ip = strdup(val); 7595f225124SSasha Levin } else if (strcmp(param, "trans") == 0) { 7605f225124SSasha Levin p->trans = strdup(val); 7611dfc7c24SMarc Zyngier } else if (strcmp(param, "tapif") == 0) { 7621dfc7c24SMarc Zyngier p->tapif = strdup(val); 7635f225124SSasha Levin } else if (strcmp(param, "vhost") == 0) { 7645f225124SSasha Levin p->vhost = atoi(val); 7655f225124SSasha Levin } else if (strcmp(param, "fd") == 0) { 7665f225124SSasha Levin p->fd = atoi(val); 76779052597SSasha Levin } else if (strcmp(param, "mq") == 0) { 76879052597SSasha Levin p->mq = atoi(val); 7695f225124SSasha Levin } else 7705f225124SSasha Levin die("Unknown network parameter %s", param); 7715f225124SSasha Levin 7725f225124SSasha Levin return 0; 7735f225124SSasha Levin } 7745f225124SSasha Levin 7755f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset) 7765f225124SSasha Levin { 7775f225124SSasha Levin struct virtio_net_params p; 7785f225124SSasha Levin char *buf = NULL, *cmd = NULL, *cur = NULL; 7795f225124SSasha Levin bool on_cmd = true; 7805f225124SSasha Levin struct kvm *kvm = opt->ptr; 7815f225124SSasha Levin 7825f225124SSasha Levin if (arg) { 7835f225124SSasha Levin buf = strdup(arg); 7845f225124SSasha Levin if (buf == NULL) 7855f225124SSasha Levin die("Failed allocating new net buffer"); 7865f225124SSasha Levin cur = strtok(buf, ",="); 7875f225124SSasha Levin } 7885f225124SSasha Levin 7895f225124SSasha Levin p = (struct virtio_net_params) { 7905f225124SSasha Levin .guest_ip = DEFAULT_GUEST_ADDR, 7915f225124SSasha Levin .host_ip = DEFAULT_HOST_ADDR, 7925f225124SSasha Levin .script = DEFAULT_SCRIPT, 793eef27ae3SFan Du .downscript = DEFAULT_SCRIPT, 7945f225124SSasha Levin .mode = NET_MODE_TAP, 7955f225124SSasha Levin }; 7965f225124SSasha Levin 7975f225124SSasha Levin str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac); 7985f225124SSasha Levin p.guest_mac[5] += kvm->cfg.num_net_devices; 7995f225124SSasha Levin 8005f225124SSasha Levin while (cur) { 8015f225124SSasha Levin if (on_cmd) { 8025f225124SSasha Levin cmd = cur; 8035f225124SSasha Levin } else { 8044346fd8fSSasha Levin if (set_net_param(kvm, &p, cmd, cur) < 0) 8055f225124SSasha Levin goto done; 8065f225124SSasha Levin } 8075f225124SSasha Levin on_cmd = !on_cmd; 8085f225124SSasha Levin 8095f225124SSasha Levin cur = strtok(NULL, ",="); 8105f225124SSasha Levin }; 8115f225124SSasha Levin 8125f225124SSasha Levin kvm->cfg.num_net_devices++; 8135f225124SSasha Levin 8145f225124SSasha Levin kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params)); 8155f225124SSasha Levin if (kvm->cfg.net_params == NULL) 8165f225124SSasha Levin die("Failed adding new network device"); 8175f225124SSasha Levin 8185f225124SSasha Levin kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p; 8195f225124SSasha Levin 8205f225124SSasha Levin done: 8215f225124SSasha Levin free(buf); 8225f225124SSasha Levin return 0; 8235f225124SSasha Levin } 8245f225124SSasha Levin 8255f225124SSasha Levin static int virtio_net__init_one(struct virtio_net_params *params) 8264f56d42cSAsias He { 82776a4aac6SWill Deacon int i, err; 8289a6d73f1SSasha Levin struct net_dev *ndev; 82976a4aac6SWill Deacon struct virtio_ops *ops; 830dc7a55d6SSuzuki K. Poulose enum virtio_trans trans = VIRTIO_DEFAULT_TRANS(params->kvm); 8319a6d73f1SSasha Levin 8329a6d73f1SSasha Levin ndev = calloc(1, sizeof(struct net_dev)); 8339a6d73f1SSasha Levin if (ndev == NULL) 8345f225124SSasha Levin return -ENOMEM; 8359a6d73f1SSasha Levin 83676a4aac6SWill Deacon ops = malloc(sizeof(*ops)); 83776a4aac6SWill Deacon if (ops == NULL) { 83876a4aac6SWill Deacon err = -ENOMEM; 83976a4aac6SWill Deacon goto err_free_ndev; 84076a4aac6SWill Deacon } 84176a4aac6SWill Deacon 8429a6d73f1SSasha Levin list_add_tail(&ndev->list, &ndevs); 8439a6d73f1SSasha Levin 8449a6d73f1SSasha Levin ndev->kvm = params->kvm; 8458c0ae74dSSasha Levin ndev->params = params; 8469a6d73f1SSasha Levin 8479a6d73f1SSasha Levin mutex_init(&ndev->mutex); 84879052597SSasha Levin ndev->queue_pairs = max(1, min(VIRTIO_NET_NUM_QUEUES, params->mq)); 8499a6d73f1SSasha Levin ndev->config.status = VIRTIO_NET_S_LINK_UP; 85079052597SSasha Levin if (ndev->queue_pairs > 1) 85179052597SSasha Levin ndev->config.max_virtqueue_pairs = ndev->queue_pairs; 85279052597SSasha Levin 8530c54698eSAsias He for (i = 0 ; i < 6 ; i++) { 8549a6d73f1SSasha Levin ndev->config.mac[i] = params->guest_mac[i]; 8559a6d73f1SSasha Levin ndev->info.guest_mac.addr[i] = params->guest_mac[i]; 8569a6d73f1SSasha Levin ndev->info.host_mac.addr[i] = params->host_mac[i]; 8570c54698eSAsias He } 858f715177dSAsias He 8599a6d73f1SSasha Levin ndev->mode = params->mode; 8609a6d73f1SSasha Levin if (ndev->mode == NET_MODE_TAP) { 8619a6d73f1SSasha Levin ndev->ops = &tap_ops; 86259ee54ebSWei Chen if (!virtio_net__tap_create(ndev)) 86359ee54ebSWei Chen die_perror("You have requested a TAP device, but creation of one has failed because"); 864b4fdde6dSAsias He } else { 8659a6d73f1SSasha Levin ndev->info.host_ip = ntohl(inet_addr(params->host_ip)); 8669a6d73f1SSasha Levin ndev->info.guest_ip = ntohl(inet_addr(params->guest_ip)); 8679a6d73f1SSasha Levin ndev->info.guest_netmask = ntohl(inet_addr("255.255.255.0")); 8689a6d73f1SSasha Levin ndev->info.buf_nr = 20, 8699a6d73f1SSasha Levin ndev->ops = &uip_ops; 8705f3aaf22SMarc Zyngier uip_static_init(&ndev->info); 871b4fdde6dSAsias He } 872b5ee1ea7SAsias He 87376a4aac6SWill Deacon *ops = net_dev_virtio_ops; 874dc7a55d6SSuzuki K. Poulose 875dc7a55d6SSuzuki K. Poulose if (params->trans) { 876dc7a55d6SSuzuki K. Poulose if (strcmp(params->trans, "mmio") == 0) 877dc7a55d6SSuzuki K. Poulose trans = VIRTIO_MMIO; 878dc7a55d6SSuzuki K. Poulose else if (strcmp(params->trans, "pci") == 0) 879dc7a55d6SSuzuki K. Poulose trans = VIRTIO_PCI; 88069205aa1SAsias He else 881dc7a55d6SSuzuki K. Poulose pr_warning("virtio-net: Unknown transport method : %s, " 882dc7a55d6SSuzuki K. Poulose "falling back to %s.", params->trans, 883dc7a55d6SSuzuki K. Poulose virtio_trans_name(trans)); 884dc7a55d6SSuzuki K. Poulose } 885dc7a55d6SSuzuki K. Poulose 886dc7a55d6SSuzuki K. Poulose virtio_init(params->kvm, ndev, &ndev->vdev, ops, trans, 88776a4aac6SWill Deacon PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET); 88827ab67f5SSasha Levin 8899ed67cdcSSasha Levin if (params->vhost) 8909ed67cdcSSasha Levin virtio_net__vhost_init(params->kvm, ndev); 891cb83de6fSSasha Levin 892d278197dSAsias He if (compat_id == -1) 89352f34d2cSAsias He compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET"); 8945f225124SSasha Levin 8955f225124SSasha Levin return 0; 89676a4aac6SWill Deacon 89776a4aac6SWill Deacon err_free_ndev: 89876a4aac6SWill Deacon free(ndev); 89976a4aac6SWill Deacon return err; 9005f225124SSasha Levin } 9015f225124SSasha Levin 9025f225124SSasha Levin int virtio_net__init(struct kvm *kvm) 9035f225124SSasha Levin { 9045f225124SSasha Levin int i; 9055f225124SSasha Levin 9065f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) { 9075f225124SSasha Levin kvm->cfg.net_params[i].kvm = kvm; 9085f225124SSasha Levin virtio_net__init_one(&kvm->cfg.net_params[i]); 9095f225124SSasha Levin } 9105f225124SSasha Levin 9115f225124SSasha Levin if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) { 9128c0ae74dSSasha Levin static struct virtio_net_params net_params; 9135f225124SSasha Levin 9145f225124SSasha Levin net_params = (struct virtio_net_params) { 9155f225124SSasha Levin .guest_ip = kvm->cfg.guest_ip, 9165f225124SSasha Levin .host_ip = kvm->cfg.host_ip, 9175f225124SSasha Levin .kvm = kvm, 9185f225124SSasha Levin .script = kvm->cfg.script, 9195f225124SSasha Levin .mode = NET_MODE_USER, 9205f225124SSasha Levin }; 9215f225124SSasha Levin str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac); 9225f225124SSasha Levin str_to_mac(kvm->cfg.host_mac, net_params.host_mac); 9235f225124SSasha Levin 9245f225124SSasha Levin virtio_net__init_one(&net_params); 9255f225124SSasha Levin } 9265f225124SSasha Levin 9275f225124SSasha Levin return 0; 9285f225124SSasha Levin } 92949a8afd1SSasha Levin virtio_dev_init(virtio_net__init); 9305f225124SSasha Levin 9315f225124SSasha Levin int virtio_net__exit(struct kvm *kvm) 9325f225124SSasha Levin { 933eef27ae3SFan Du struct virtio_net_params *params; 934eef27ae3SFan Du struct net_dev *ndev; 935eef27ae3SFan Du struct list_head *ptr; 936eef27ae3SFan Du 937eef27ae3SFan Du list_for_each(ptr, &ndevs) { 938eef27ae3SFan Du ndev = list_entry(ptr, struct net_dev, list); 939eef27ae3SFan Du params = ndev->params; 940eef27ae3SFan Du /* Cleanup any tap device which attached to bridge */ 941eef27ae3SFan Du if (ndev->mode == NET_MODE_TAP && 942eef27ae3SFan Du strcmp(params->downscript, "none")) 943eef27ae3SFan Du virtio_net_exec_script(params->downscript, ndev->tap_name); 944eef27ae3SFan Du } 9455f225124SSasha Levin return 0; 9464f56d42cSAsias He } 94749a8afd1SSasha Levin virtio_dev_exit(virtio_net__exit); 948