131638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h" 2b5ee1ea7SAsias He #include "kvm/virtio-net.h" 34f56d42cSAsias He #include "kvm/virtio.h" 44f56d42cSAsias He #include "kvm/mutex.h" 54f56d42cSAsias He #include "kvm/util.h" 64f56d42cSAsias He #include "kvm/kvm.h" 72449f6e3SSasha Levin #include "kvm/irq.h" 8b5ee1ea7SAsias He #include "kvm/uip.h" 9cb83de6fSSasha Levin #include "kvm/guest_compat.h" 107668c3a6SSasha Levin #include "kvm/iovec.h" 1105755b29SAndre Przywara #include "kvm/strbuf.h" 124f56d42cSAsias He 139ed67cdcSSasha Levin #include <linux/vhost.h> 144f56d42cSAsias He #include <linux/virtio_net.h> 154f56d42cSAsias He #include <linux/if_tun.h> 1678a2a3e2SSasha Levin #include <linux/types.h> 17c229370aSIngo Molnar 18c229370aSIngo Molnar #include <arpa/inet.h> 194f56d42cSAsias He #include <net/if.h> 20c229370aSIngo Molnar 21c229370aSIngo Molnar #include <unistd.h> 224f56d42cSAsias He #include <fcntl.h> 23c229370aSIngo Molnar 24cb7202c1SSasha Levin #include <sys/socket.h> 25c229370aSIngo Molnar #include <sys/ioctl.h> 26c229370aSIngo Molnar #include <sys/types.h> 2773b7d038SAmos Kong #include <sys/wait.h> 289ed67cdcSSasha Levin #include <sys/eventfd.h> 294f56d42cSAsias He 304059ad8bSAsias He #define VIRTIO_NET_QUEUE_SIZE 256 316585ffb7SSasha Levin #define VIRTIO_NET_NUM_QUEUES 8 324f56d42cSAsias He 33b4fdde6dSAsias He struct net_dev; 34b4fdde6dSAsias He 35b4fdde6dSAsias He struct net_dev_operations { 36b4fdde6dSAsias He int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev); 37b4fdde6dSAsias He int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev); 38b4fdde6dSAsias He }; 39b4fdde6dSAsias He 40ad96e867SJean-Philippe Brucker struct net_dev_queue { 41ad96e867SJean-Philippe Brucker int id; 42ad96e867SJean-Philippe Brucker struct net_dev *ndev; 43ad96e867SJean-Philippe Brucker struct virt_queue vq; 44ad96e867SJean-Philippe Brucker pthread_t thread; 45ad96e867SJean-Philippe Brucker struct mutex lock; 46ad96e867SJean-Philippe Brucker pthread_cond_t cond; 4749bada43SJean-Philippe Brucker int gsi; 4849bada43SJean-Philippe Brucker int irqfd; 49ad96e867SJean-Philippe Brucker }; 50ad96e867SJean-Philippe Brucker 518626798bSAsias He struct net_dev { 52d3476f7dSSasha Levin struct mutex mutex; 5302eca50cSAsias He struct virtio_device vdev; 549a6d73f1SSasha Levin struct list_head list; 554f56d42cSAsias He 56ad96e867SJean-Philippe Brucker struct net_dev_queue queues[VIRTIO_NET_NUM_QUEUES * 2 + 1]; 57c229370aSIngo Molnar struct virtio_net_config config; 58ad96e867SJean-Philippe Brucker u32 features, queue_pairs; 59c4aa7c02SPekka Enberg 609ed67cdcSSasha Levin int vhost_fd; 614f56d42cSAsias He int tap_fd; 624f56d42cSAsias He char tap_name[IFNAMSIZ]; 6359ee54ebSWei Chen bool tap_ufo; 64bb1a32f1SAsias He 65bb1a32f1SAsias He int mode; 66bb1a32f1SAsias He 67b5ee1ea7SAsias He struct uip_info info; 68b4fdde6dSAsias He struct net_dev_operations *ops; 699a6d73f1SSasha Levin struct kvm *kvm; 708c0ae74dSSasha Levin 718c0ae74dSSasha Levin struct virtio_net_params *params; 724f56d42cSAsias He }; 734f56d42cSAsias He 749a6d73f1SSasha Levin static LIST_HEAD(ndevs); 75312c62d1SSasha Levin static int compat_id = -1; 764f56d42cSAsias He 777668c3a6SSasha Levin #define MAX_PACKET_SIZE 65550 787668c3a6SSasha Levin 797668c3a6SSasha Levin static bool has_virtio_feature(struct net_dev *ndev, u32 feature) 807668c3a6SSasha Levin { 817668c3a6SSasha Levin return ndev->features & (1 << feature); 827668c3a6SSasha Levin } 837668c3a6SSasha Levin 848ed60bbeSMarc Zyngier static void virtio_net_fix_tx_hdr(struct virtio_net_hdr *hdr, struct net_dev *ndev) 858ed60bbeSMarc Zyngier { 868ed60bbeSMarc Zyngier hdr->hdr_len = virtio_guest_to_host_u16(&ndev->vdev, hdr->hdr_len); 878ed60bbeSMarc Zyngier hdr->gso_size = virtio_guest_to_host_u16(&ndev->vdev, hdr->gso_size); 888ed60bbeSMarc Zyngier hdr->csum_start = virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_start); 898ed60bbeSMarc Zyngier hdr->csum_offset = virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_offset); 908ed60bbeSMarc Zyngier } 918ed60bbeSMarc Zyngier 923fea89a9SWill Deacon static void virtio_net_fix_rx_hdr(struct virtio_net_hdr *hdr, struct net_dev *ndev) 938ed60bbeSMarc Zyngier { 943fea89a9SWill Deacon hdr->hdr_len = virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr_len); 953fea89a9SWill Deacon hdr->gso_size = virtio_host_to_guest_u16(&ndev->vdev, hdr->gso_size); 963fea89a9SWill Deacon hdr->csum_start = virtio_host_to_guest_u16(&ndev->vdev, hdr->csum_start); 973fea89a9SWill Deacon hdr->csum_offset = virtio_host_to_guest_u16(&ndev->vdev, hdr->csum_offset); 988ed60bbeSMarc Zyngier } 998ed60bbeSMarc Zyngier 100c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p) 1014f56d42cSAsias He { 1024f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 103ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p; 104ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq; 105ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev; 10643835ac9SSasha Levin struct kvm *kvm; 1073fdf659dSSasha Levin u16 out, in; 1083fdf659dSSasha Levin u16 head; 1096d6cc14bSWill Deacon int len, copied; 1104f56d42cSAsias He 111a4d8c55eSSasha Levin kvm__set_thread_name("virtio-net-rx"); 112a4d8c55eSSasha Levin 1139a6d73f1SSasha Levin kvm = ndev->kvm; 114c4aa7c02SPekka Enberg while (1) { 115ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock); 116c4aa7c02SPekka Enberg if (!virt_queue__available(vq)) 117ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex); 118ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock); 1194f56d42cSAsias He 1204f56d42cSAsias He while (virt_queue__available(vq)) { 1217668c3a6SSasha Levin unsigned char buffer[MAX_PACKET_SIZE + sizeof(struct virtio_net_hdr_mrg_rxbuf)]; 1227668c3a6SSasha Levin struct iovec dummy_iov = { 1237668c3a6SSasha Levin .iov_base = buffer, 1247668c3a6SSasha Levin .iov_len = sizeof(buffer), 1257668c3a6SSasha Levin }; 1267668c3a6SSasha Levin struct virtio_net_hdr_mrg_rxbuf *hdr; 1273fea89a9SWill Deacon u16 num_buffers; 1287f5ffaf5SAsias He 1297668c3a6SSasha Levin len = ndev->ops->rx(&dummy_iov, 1, ndev); 1306d6cc14bSWill Deacon if (len < 0) { 1316d6cc14bSWill Deacon pr_warning("%s: rx on vq %u failed (%d), exiting thread\n", 132ad96e867SJean-Philippe Brucker __func__, queue->id, len); 1336d6cc14bSWill Deacon goto out_err; 1346d6cc14bSWill Deacon } 1356d6cc14bSWill Deacon 1363fea89a9SWill Deacon copied = num_buffers = 0; 1377668c3a6SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1388ed60bbeSMarc Zyngier hdr = iov[0].iov_base; 1397668c3a6SSasha Levin while (copied < len) { 1406d6cc14bSWill Deacon size_t iovsize = min_t(size_t, len - copied, iov_size(iov, in)); 1417668c3a6SSasha Levin 142e2493047SAsias He memcpy_toiovec(iov, buffer + copied, iovsize); 1437668c3a6SSasha Levin copied += iovsize; 1443fea89a9SWill Deacon virt_queue__set_used_elem_no_update(vq, head, iovsize, num_buffers++); 1457668c3a6SSasha Levin if (copied == len) 1467668c3a6SSasha Levin break; 1477668c3a6SSasha Levin while (!virt_queue__available(vq)) 1487668c3a6SSasha Levin sleep(0); 1497668c3a6SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1507668c3a6SSasha Levin } 1513fea89a9SWill Deacon 1523fea89a9SWill Deacon virtio_net_fix_rx_hdr(&hdr->hdr, ndev); 1533fea89a9SWill Deacon if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF)) 1543fea89a9SWill Deacon hdr->num_buffers = virtio_host_to_guest_u16(vq, num_buffers); 1553fea89a9SWill Deacon 1563fea89a9SWill Deacon virt_queue__used_idx_advance(vq, num_buffers); 1573fea89a9SWill Deacon 158c4aa7c02SPekka Enberg /* We should interrupt guest right now, otherwise latency is huge. */ 1596585ffb7SSasha Levin if (virtio_queue__should_signal(vq)) 160ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id); 1614f56d42cSAsias He } 162c4aa7c02SPekka Enberg } 163c4aa7c02SPekka Enberg 1646d6cc14bSWill Deacon out_err: 165c4aa7c02SPekka Enberg pthread_exit(NULL); 166c4aa7c02SPekka Enberg return NULL; 167c4aa7c02SPekka Enberg 168c4aa7c02SPekka Enberg } 169c4aa7c02SPekka Enberg 170c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p) 1714f56d42cSAsias He { 1724f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 173ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p; 174ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq; 175ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev; 17643835ac9SSasha Levin struct kvm *kvm; 1773fdf659dSSasha Levin u16 out, in; 1783fdf659dSSasha Levin u16 head; 1794f56d42cSAsias He int len; 1804f56d42cSAsias He 181a4d8c55eSSasha Levin kvm__set_thread_name("virtio-net-tx"); 182a4d8c55eSSasha Levin 1839a6d73f1SSasha Levin kvm = ndev->kvm; 184c4aa7c02SPekka Enberg 185c4aa7c02SPekka Enberg while (1) { 186ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock); 187c4aa7c02SPekka Enberg if (!virt_queue__available(vq)) 188ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex); 189ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock); 1904f56d42cSAsias He 1914f56d42cSAsias He while (virt_queue__available(vq)) { 1928ed60bbeSMarc Zyngier struct virtio_net_hdr *hdr; 19343835ac9SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1948ed60bbeSMarc Zyngier hdr = iov[0].iov_base; 1958ed60bbeSMarc Zyngier virtio_net_fix_tx_hdr(hdr, ndev); 1969a6d73f1SSasha Levin len = ndev->ops->tx(iov, out, ndev); 1976d6cc14bSWill Deacon if (len < 0) { 1986d6cc14bSWill Deacon pr_warning("%s: tx on vq %u failed (%d)\n", 199ad96e867SJean-Philippe Brucker __func__, queue->id, errno); 2006d6cc14bSWill Deacon goto out_err; 2016d6cc14bSWill Deacon } 2026d6cc14bSWill Deacon 2034f56d42cSAsias He virt_queue__set_used_elem(vq, head, len); 2044f56d42cSAsias He } 2054f56d42cSAsias He 2066585ffb7SSasha Levin if (virtio_queue__should_signal(vq)) 207ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id); 2084f56d42cSAsias He } 2094f56d42cSAsias He 2106d6cc14bSWill Deacon out_err: 211c4aa7c02SPekka Enberg pthread_exit(NULL); 212c4aa7c02SPekka Enberg return NULL; 213c4aa7c02SPekka Enberg } 214407475bfSPekka Enberg 2156585ffb7SSasha Levin static virtio_net_ctrl_ack virtio_net_handle_mq(struct kvm* kvm, struct net_dev *ndev, struct virtio_net_ctrl_hdr *ctrl) 2166585ffb7SSasha Levin { 2176585ffb7SSasha Levin /* Not much to do here */ 2186585ffb7SSasha Levin return VIRTIO_NET_OK; 2196585ffb7SSasha Levin } 2206585ffb7SSasha Levin 2216585ffb7SSasha Levin static void *virtio_net_ctrl_thread(void *p) 222abd4a801SSasha Levin { 223abd4a801SSasha Levin struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 224ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p; 225ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq; 226ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev; 227abd4a801SSasha Levin u16 out, in, head; 2286585ffb7SSasha Levin struct kvm *kvm = ndev->kvm; 229abd4a801SSasha Levin struct virtio_net_ctrl_hdr *ctrl; 230abd4a801SSasha Levin virtio_net_ctrl_ack *ack; 231abd4a801SSasha Levin 232edb4a8a0SSuzuki K. Poulose kvm__set_thread_name("virtio-net-ctrl"); 233edb4a8a0SSuzuki K. Poulose 2346585ffb7SSasha Levin while (1) { 235ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock); 2366585ffb7SSasha Levin if (!virt_queue__available(vq)) 237ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex); 238ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock); 2396585ffb7SSasha Levin 2406585ffb7SSasha Levin while (virt_queue__available(vq)) { 241ad96e867SJean-Philippe Brucker head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 242abd4a801SSasha Levin ctrl = iov[0].iov_base; 243abd4a801SSasha Levin ack = iov[out].iov_base; 244abd4a801SSasha Levin 245abd4a801SSasha Levin switch (ctrl->class) { 2466585ffb7SSasha Levin case VIRTIO_NET_CTRL_MQ: 2476585ffb7SSasha Levin *ack = virtio_net_handle_mq(kvm, ndev, ctrl); 2486585ffb7SSasha Levin break; 249abd4a801SSasha Levin default: 250abd4a801SSasha Levin *ack = VIRTIO_NET_ERR; 251abd4a801SSasha Levin break; 252abd4a801SSasha Levin } 253ad96e867SJean-Philippe Brucker virt_queue__set_used_elem(vq, head, iov[out].iov_len); 2546585ffb7SSasha Levin } 255abd4a801SSasha Levin 256ad96e867SJean-Philippe Brucker if (virtio_queue__should_signal(vq)) 257ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id); 2586585ffb7SSasha Levin } 259abd4a801SSasha Levin 2606585ffb7SSasha Levin pthread_exit(NULL); 261abd4a801SSasha Levin 2626585ffb7SSasha Levin return NULL; 263abd4a801SSasha Levin } 264abd4a801SSasha Levin 2659a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue) 2664f56d42cSAsias He { 267ad96e867SJean-Philippe Brucker struct net_dev_queue *net_queue = &ndev->queues[queue]; 268ad96e867SJean-Philippe Brucker 26979052597SSasha Levin if ((u32)queue >= (ndev->queue_pairs * 2 + 1)) { 2709a6d73f1SSasha Levin pr_warning("Unknown queue index %u", queue); 2716585ffb7SSasha Levin return; 272c4aa7c02SPekka Enberg } 2736585ffb7SSasha Levin 274ad96e867SJean-Philippe Brucker mutex_lock(&net_queue->lock); 275ad96e867SJean-Philippe Brucker pthread_cond_signal(&net_queue->cond); 276ad96e867SJean-Philippe Brucker mutex_unlock(&net_queue->lock); 2774f56d42cSAsias He } 2784f56d42cSAsias He 279d2a7ddffSMarc Zyngier static int virtio_net_request_tap(struct net_dev *ndev, struct ifreq *ifr, 280d2a7ddffSMarc Zyngier const char *tapname) 281d2a7ddffSMarc Zyngier { 282d2a7ddffSMarc Zyngier int ret; 283d2a7ddffSMarc Zyngier 284d2a7ddffSMarc Zyngier memset(ifr, 0, sizeof(*ifr)); 285d2a7ddffSMarc Zyngier ifr->ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR; 286d2a7ddffSMarc Zyngier if (tapname) 28705755b29SAndre Przywara strlcpy(ifr->ifr_name, tapname, sizeof(ifr->ifr_name)); 288d2a7ddffSMarc Zyngier 289f83dc816SAndreas Herrmann ret = ioctl(ndev->tap_fd, TUNSETIFF, ifr); 290d2a7ddffSMarc Zyngier 291d2a7ddffSMarc Zyngier if (ret >= 0) 29205755b29SAndre Przywara strlcpy(ndev->tap_name, ifr->ifr_name, sizeof(ndev->tap_name)); 293d2a7ddffSMarc Zyngier return ret; 294d2a7ddffSMarc Zyngier } 295d2a7ddffSMarc Zyngier 296eef27ae3SFan Du static int virtio_net_exec_script(const char* script, const char *tap_name) 297eef27ae3SFan Du { 298eef27ae3SFan Du pid_t pid; 299eef27ae3SFan Du int status; 300eef27ae3SFan Du 301eef27ae3SFan Du pid = fork(); 302eef27ae3SFan Du if (pid == 0) { 303eef27ae3SFan Du execl(script, script, tap_name, NULL); 304eef27ae3SFan Du _exit(1); 305eef27ae3SFan Du } else { 306eef27ae3SFan Du waitpid(pid, &status, 0); 307eef27ae3SFan Du if (WIFEXITED(status) && WEXITSTATUS(status) != 0) { 308eef27ae3SFan Du pr_warning("Fail to setup tap by %s", script); 309eef27ae3SFan Du return -1; 310eef27ae3SFan Du } 311eef27ae3SFan Du } 312eef27ae3SFan Du return 0; 313eef27ae3SFan Du } 314eef27ae3SFan Du 3158c0ae74dSSasha Levin static bool virtio_net__tap_init(struct net_dev *ndev) 3164f56d42cSAsias He { 317cb7202c1SSasha Levin int sock = socket(AF_INET, SOCK_STREAM, 0); 31859ee54ebSWei Chen int hdr_len; 319cb7202c1SSasha Levin struct sockaddr_in sin = {0}; 320246c8347SAsias He struct ifreq ifr; 3218c0ae74dSSasha Levin const struct virtio_net_params *params = ndev->params; 3221dfc7c24SMarc Zyngier bool skipconf = !!params->tapif; 3234f56d42cSAsias He 3247668c3a6SSasha Levin hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ? 32548c6b47aSSasha Levin sizeof(struct virtio_net_hdr_mrg_rxbuf) : 32648c6b47aSSasha Levin sizeof(struct virtio_net_hdr); 3279a6d73f1SSasha Levin if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0) 3284542f276SCyrill Gorcunov pr_warning("Config tap device TUNSETVNETHDRSZ error"); 329246c8347SAsias He 33073b7d038SAmos Kong if (strcmp(params->script, "none")) { 331eef27ae3SFan Du if (virtio_net_exec_script(params->script, ndev->tap_name) < 0) 33273b7d038SAmos Kong goto fail; 3331dfc7c24SMarc Zyngier } else if (!skipconf) { 334cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr)); 33516509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name)); 336bdfcfca6SSasha Levin sin.sin_addr.s_addr = inet_addr(params->host_ip); 337cb7202c1SSasha Levin memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr)); 338cb7202c1SSasha Levin ifr.ifr_addr.sa_family = AF_INET; 3393b02f580SSasha Levin if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) { 3404542f276SCyrill Gorcunov pr_warning("Could not set ip address on tap device"); 3413b02f580SSasha Levin goto fail; 3423b02f580SSasha Levin } 34373b7d038SAmos Kong } 344cb7202c1SSasha Levin 3451dfc7c24SMarc Zyngier if (!skipconf) { 346cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr)); 34716509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name)); 348cb7202c1SSasha Levin ioctl(sock, SIOCGIFFLAGS, &ifr); 349cb7202c1SSasha Levin ifr.ifr_flags |= IFF_UP | IFF_RUNNING; 350cb7202c1SSasha Levin if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0) 3514542f276SCyrill Gorcunov pr_warning("Could not bring tap device up"); 3521dfc7c24SMarc Zyngier } 353cb7202c1SSasha Levin 354cb7202c1SSasha Levin close(sock); 3553b02f580SSasha Levin 3563b02f580SSasha Levin return 1; 3573b02f580SSasha Levin 3583b02f580SSasha Levin fail: 3593b02f580SSasha Levin if (sock >= 0) 3603b02f580SSasha Levin close(sock); 3619a6d73f1SSasha Levin if (ndev->tap_fd >= 0) 3629a6d73f1SSasha Levin close(ndev->tap_fd); 3633b02f580SSasha Levin 3643b02f580SSasha Levin return 0; 3654f56d42cSAsias He } 3664f56d42cSAsias He 36749bada43SJean-Philippe Brucker static void virtio_net__tap_exit(struct net_dev *ndev) 36849bada43SJean-Philippe Brucker { 36949bada43SJean-Philippe Brucker int sock; 37049bada43SJean-Philippe Brucker struct ifreq ifr; 37149bada43SJean-Philippe Brucker 37249bada43SJean-Philippe Brucker if (ndev->params->tapif) 37349bada43SJean-Philippe Brucker return; 37449bada43SJean-Philippe Brucker 37549bada43SJean-Philippe Brucker sock = socket(AF_INET, SOCK_STREAM, 0); 37616509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name)); 37749bada43SJean-Philippe Brucker ioctl(sock, SIOCGIFFLAGS, &ifr); 37849bada43SJean-Philippe Brucker ifr.ifr_flags &= ~(IFF_UP | IFF_RUNNING); 37949bada43SJean-Philippe Brucker if (ioctl(sock, SIOCGIFFLAGS, &ifr) < 0) 38049bada43SJean-Philippe Brucker pr_warning("Count not bring tap device down"); 38149bada43SJean-Philippe Brucker close(sock); 38249bada43SJean-Philippe Brucker } 38349bada43SJean-Philippe Brucker 38459ee54ebSWei Chen static bool virtio_net__tap_create(struct net_dev *ndev) 38559ee54ebSWei Chen { 38659ee54ebSWei Chen int offload; 38759ee54ebSWei Chen struct ifreq ifr; 38859ee54ebSWei Chen const struct virtio_net_params *params = ndev->params; 38959ee54ebSWei Chen bool macvtap = (!!params->tapif) && (params->tapif[0] == '/'); 39059ee54ebSWei Chen 39159ee54ebSWei Chen /* Did the user already gave us the FD? */ 39259ee54ebSWei Chen if (params->fd) 39359ee54ebSWei Chen ndev->tap_fd = params->fd; 39459ee54ebSWei Chen else { 39559ee54ebSWei Chen const char *tap_file = "/dev/net/tun"; 39659ee54ebSWei Chen 39759ee54ebSWei Chen /* Did the user ask us to use macvtap? */ 39859ee54ebSWei Chen if (macvtap) 39959ee54ebSWei Chen tap_file = params->tapif; 40059ee54ebSWei Chen 40159ee54ebSWei Chen ndev->tap_fd = open(tap_file, O_RDWR); 40259ee54ebSWei Chen if (ndev->tap_fd < 0) { 40359ee54ebSWei Chen pr_warning("Unable to open %s", tap_file); 40459ee54ebSWei Chen return 0; 40559ee54ebSWei Chen } 40659ee54ebSWei Chen } 40759ee54ebSWei Chen 40859ee54ebSWei Chen if (!macvtap && 40959ee54ebSWei Chen virtio_net_request_tap(ndev, &ifr, params->tapif) < 0) { 41059ee54ebSWei Chen pr_warning("Config tap device error. Are you root?"); 41159ee54ebSWei Chen goto fail; 41259ee54ebSWei Chen } 41359ee54ebSWei Chen 41459ee54ebSWei Chen /* 41559ee54ebSWei Chen * The UFO support had been removed from kernel in commit: 41659ee54ebSWei Chen * ID: fb652fdfe83710da0ca13448a41b7ed027d0a984 41759ee54ebSWei Chen * https://www.spinics.net/lists/netdev/msg443562.html 41859ee54ebSWei Chen * In oder to support the older kernels without this commit, 41959ee54ebSWei Chen * we set the TUN_F_UFO to offload by default to test the status of 42059ee54ebSWei Chen * UFO kernel support. 42159ee54ebSWei Chen */ 42259ee54ebSWei Chen ndev->tap_ufo = true; 42359ee54ebSWei Chen offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO; 42459ee54ebSWei Chen if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) { 42559ee54ebSWei Chen /* 42659ee54ebSWei Chen * Is this failure caused by kernel remove the UFO support? 42759ee54ebSWei Chen * Try TUNSETOFFLOAD without TUN_F_UFO. 42859ee54ebSWei Chen */ 42959ee54ebSWei Chen offload &= ~TUN_F_UFO; 43059ee54ebSWei Chen if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) { 43159ee54ebSWei Chen pr_warning("Config tap device TUNSETOFFLOAD error"); 43259ee54ebSWei Chen goto fail; 43359ee54ebSWei Chen } 43459ee54ebSWei Chen ndev->tap_ufo = false; 43559ee54ebSWei Chen } 43659ee54ebSWei Chen 43759ee54ebSWei Chen return 1; 43859ee54ebSWei Chen 43959ee54ebSWei Chen fail: 44059ee54ebSWei Chen if ((ndev->tap_fd >= 0) || (!params->fd) ) 44159ee54ebSWei Chen close(ndev->tap_fd); 44259ee54ebSWei Chen 44359ee54ebSWei Chen return 0; 44459ee54ebSWei Chen } 44559ee54ebSWei Chen 446b4fdde6dSAsias He static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev) 447b4fdde6dSAsias He { 448b4fdde6dSAsias He return writev(ndev->tap_fd, iov, out); 449b4fdde6dSAsias He } 450b4fdde6dSAsias He 451b4fdde6dSAsias He static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev) 452b4fdde6dSAsias He { 453b4fdde6dSAsias He return readv(ndev->tap_fd, iov, in); 454b4fdde6dSAsias He } 455b4fdde6dSAsias He 456b4fdde6dSAsias He static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev) 457b4fdde6dSAsias He { 458b4fdde6dSAsias He return uip_tx(iov, out, &ndev->info); 459b4fdde6dSAsias He } 460b4fdde6dSAsias He 461b4fdde6dSAsias He static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev) 462b4fdde6dSAsias He { 463b4fdde6dSAsias He return uip_rx(iov, in, &ndev->info); 464b4fdde6dSAsias He } 465b4fdde6dSAsias He 466b4fdde6dSAsias He static struct net_dev_operations tap_ops = { 467b4fdde6dSAsias He .rx = tap_ops_rx, 468b4fdde6dSAsias He .tx = tap_ops_tx, 469b4fdde6dSAsias He }; 470b4fdde6dSAsias He 471b4fdde6dSAsias He static struct net_dev_operations uip_ops = { 472b4fdde6dSAsias He .rx = uip_ops_rx, 473b4fdde6dSAsias He .tx = uip_ops_tx, 474b4fdde6dSAsias He }; 475b4fdde6dSAsias He 476c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev) 47778a2a3e2SSasha Levin { 47878a2a3e2SSasha Levin struct net_dev *ndev = dev; 47978a2a3e2SSasha Levin 480c5ae742bSSasha Levin return ((u8 *)(&ndev->config)); 48178a2a3e2SSasha Levin } 48278a2a3e2SSasha Levin 483e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev) 484e4730284SMartin Radev { 485e4730284SMartin Radev struct net_dev *ndev = dev; 486e4730284SMartin Radev 487e4730284SMartin Radev return sizeof(ndev->config); 488e4730284SMartin Radev } 489e4730284SMartin Radev 49078a2a3e2SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev) 49178a2a3e2SSasha Levin { 49259ee54ebSWei Chen u32 features; 49379052597SSasha Levin struct net_dev *ndev = dev; 49479052597SSasha Levin 49559ee54ebSWei Chen features = 1UL << VIRTIO_NET_F_MAC 49678a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_CSUM 49778a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO4 49878a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO6 49978a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO4 50092c1f37bSSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO6 501754c8ce3SSasha Levin | 1UL << VIRTIO_RING_F_EVENT_IDX 502abd4a801SSasha Levin | 1UL << VIRTIO_RING_F_INDIRECT_DESC 5036585ffb7SSasha Levin | 1UL << VIRTIO_NET_F_CTRL_VQ 5047668c3a6SSasha Levin | 1UL << VIRTIO_NET_F_MRG_RXBUF 50579052597SSasha Levin | 1UL << (ndev->queue_pairs > 1 ? VIRTIO_NET_F_MQ : 0); 50659ee54ebSWei Chen 50759ee54ebSWei Chen /* 50859ee54ebSWei Chen * The UFO feature for host and guest only can be enabled when the 50959ee54ebSWei Chen * kernel has TAP UFO support. 51059ee54ebSWei Chen */ 51159ee54ebSWei Chen if (ndev->tap_ufo) 51259ee54ebSWei Chen features |= (1UL << VIRTIO_NET_F_HOST_UFO 51359ee54ebSWei Chen | 1UL << VIRTIO_NET_F_GUEST_UFO); 51459ee54ebSWei Chen 51559ee54ebSWei Chen return features; 51678a2a3e2SSasha Levin } 51778a2a3e2SSasha Levin 51815636d5eSYing-Shiuan Pan static int virtio_net__vhost_set_features(struct net_dev *ndev) 51915636d5eSYing-Shiuan Pan { 52015636d5eSYing-Shiuan Pan u64 features = 1UL << VIRTIO_RING_F_EVENT_IDX; 52115636d5eSYing-Shiuan Pan u64 vhost_features; 52215636d5eSYing-Shiuan Pan 52315636d5eSYing-Shiuan Pan if (ioctl(ndev->vhost_fd, VHOST_GET_FEATURES, &vhost_features) != 0) 52415636d5eSYing-Shiuan Pan die_perror("VHOST_GET_FEATURES failed"); 52515636d5eSYing-Shiuan Pan 52615636d5eSYing-Shiuan Pan /* make sure both side support mergable rx buffers */ 52715636d5eSYing-Shiuan Pan if (vhost_features & 1UL << VIRTIO_NET_F_MRG_RXBUF && 52815636d5eSYing-Shiuan Pan has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF)) 52915636d5eSYing-Shiuan Pan features |= 1UL << VIRTIO_NET_F_MRG_RXBUF; 53015636d5eSYing-Shiuan Pan 53115636d5eSYing-Shiuan Pan return ioctl(ndev->vhost_fd, VHOST_SET_FEATURES, &features); 53215636d5eSYing-Shiuan Pan } 53315636d5eSYing-Shiuan Pan 53478a2a3e2SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features) 53578a2a3e2SSasha Levin { 53678a2a3e2SSasha Levin struct net_dev *ndev = dev; 53778a2a3e2SSasha Levin 53878a2a3e2SSasha Levin ndev->features = features; 53995242e44SJean-Philippe Brucker } 5408ed60bbeSMarc Zyngier 54195242e44SJean-Philippe Brucker static void virtio_net_start(struct net_dev *ndev) 54295242e44SJean-Philippe Brucker { 5438aa155c4SYing-Shiuan Pan if (ndev->mode == NET_MODE_TAP) { 5448aa155c4SYing-Shiuan Pan if (!virtio_net__tap_init(ndev)) 54559ee54ebSWei Chen die_perror("TAP device initialized failed because"); 54659ee54ebSWei Chen 54715636d5eSYing-Shiuan Pan if (ndev->vhost_fd && 54815636d5eSYing-Shiuan Pan virtio_net__vhost_set_features(ndev) != 0) 54915636d5eSYing-Shiuan Pan die_perror("VHOST_SET_FEATURES failed"); 5508aa155c4SYing-Shiuan Pan } else { 5518aa155c4SYing-Shiuan Pan ndev->info.vnet_hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ? 5528aa155c4SYing-Shiuan Pan sizeof(struct virtio_net_hdr_mrg_rxbuf) : 5538aa155c4SYing-Shiuan Pan sizeof(struct virtio_net_hdr); 5548aa155c4SYing-Shiuan Pan uip_init(&ndev->info); 5558aa155c4SYing-Shiuan Pan } 55678a2a3e2SSasha Levin } 55778a2a3e2SSasha Levin 55849bada43SJean-Philippe Brucker static void virtio_net_stop(struct net_dev *ndev) 55949bada43SJean-Philippe Brucker { 56049bada43SJean-Philippe Brucker /* Undo whatever start() did */ 56149bada43SJean-Philippe Brucker if (ndev->mode == NET_MODE_TAP) 56249bada43SJean-Philippe Brucker virtio_net__tap_exit(ndev); 56349bada43SJean-Philippe Brucker else 56449bada43SJean-Philippe Brucker uip_exit(&ndev->info); 56549bada43SJean-Philippe Brucker } 56649bada43SJean-Philippe Brucker 567*867b15ccSJean-Philippe Brucker static void virtio_net_update_endian(struct net_dev *ndev) 568*867b15ccSJean-Philippe Brucker { 569*867b15ccSJean-Philippe Brucker struct virtio_net_config *conf = &ndev->config; 570*867b15ccSJean-Philippe Brucker 571*867b15ccSJean-Philippe Brucker conf->status = virtio_host_to_guest_u16(&ndev->vdev, 572*867b15ccSJean-Philippe Brucker VIRTIO_NET_S_LINK_UP); 573*867b15ccSJean-Philippe Brucker conf->max_virtqueue_pairs = virtio_host_to_guest_u16(&ndev->vdev, 574*867b15ccSJean-Philippe Brucker ndev->queue_pairs); 575*867b15ccSJean-Philippe Brucker } 576*867b15ccSJean-Philippe Brucker 57795242e44SJean-Philippe Brucker static void notify_status(struct kvm *kvm, void *dev, u32 status) 57895242e44SJean-Philippe Brucker { 579*867b15ccSJean-Philippe Brucker struct net_dev *ndev = dev; 580*867b15ccSJean-Philippe Brucker 581*867b15ccSJean-Philippe Brucker if (status & VIRTIO__STATUS_CONFIG) 582*867b15ccSJean-Philippe Brucker virtio_net_update_endian(ndev); 583*867b15ccSJean-Philippe Brucker 58495242e44SJean-Philippe Brucker if (status & VIRTIO__STATUS_START) 58595242e44SJean-Philippe Brucker virtio_net_start(dev); 58649bada43SJean-Philippe Brucker else if (status & VIRTIO__STATUS_STOP) 58749bada43SJean-Philippe Brucker virtio_net_stop(dev); 58895242e44SJean-Philippe Brucker } 58995242e44SJean-Philippe Brucker 5909e56ec14SSasha Levin static bool is_ctrl_vq(struct net_dev *ndev, u32 vq) 5919e56ec14SSasha Levin { 5929e56ec14SSasha Levin return vq == (u32)(ndev->queue_pairs * 2); 5939e56ec14SSasha Levin } 5949e56ec14SSasha Levin 595609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq) 59678a2a3e2SSasha Levin { 5979ed67cdcSSasha Levin struct vhost_vring_state state = { .index = vq }; 598ad96e867SJean-Philippe Brucker struct net_dev_queue *net_queue; 5999ed67cdcSSasha Levin struct vhost_vring_addr addr; 60078a2a3e2SSasha Levin struct net_dev *ndev = dev; 60178a2a3e2SSasha Levin struct virt_queue *queue; 6029ed67cdcSSasha Levin int r; 60378a2a3e2SSasha Levin 604312c62d1SSasha Levin compat__remove_message(compat_id); 60578a2a3e2SSasha Levin 606ad96e867SJean-Philippe Brucker net_queue = &ndev->queues[vq]; 607ad96e867SJean-Philippe Brucker net_queue->id = vq; 608ad96e867SJean-Philippe Brucker net_queue->ndev = ndev; 609ad96e867SJean-Philippe Brucker queue = &net_queue->vq; 610609ee906SJean-Philippe Brucker virtio_init_device_vq(kvm, &ndev->vdev, queue, VIRTIO_NET_QUEUE_SIZE); 61178a2a3e2SSasha Levin 612ad96e867SJean-Philippe Brucker mutex_init(&net_queue->lock); 613ad96e867SJean-Philippe Brucker pthread_cond_init(&net_queue->cond, NULL); 6149e56ec14SSasha Levin if (is_ctrl_vq(ndev, vq)) { 615ad96e867SJean-Philippe Brucker pthread_create(&net_queue->thread, NULL, virtio_net_ctrl_thread, 616ad96e867SJean-Philippe Brucker net_queue); 6179e56ec14SSasha Levin 6189e56ec14SSasha Levin return 0; 6199e56ec14SSasha Levin } else if (ndev->vhost_fd == 0 ) { 6209e56ec14SSasha Levin if (vq & 1) 621ad96e867SJean-Philippe Brucker pthread_create(&net_queue->thread, NULL, 622ad96e867SJean-Philippe Brucker virtio_net_tx_thread, net_queue); 6236585ffb7SSasha Levin else 624ad96e867SJean-Philippe Brucker pthread_create(&net_queue->thread, NULL, 625ad96e867SJean-Philippe Brucker virtio_net_rx_thread, net_queue); 6266585ffb7SSasha Levin 62778a2a3e2SSasha Levin return 0; 6286585ffb7SSasha Levin } 6299ed67cdcSSasha Levin 6308ed60bbeSMarc Zyngier if (queue->endian != VIRTIO_ENDIAN_HOST) 631b960f243SAndre Przywara die_perror("VHOST requires the same endianness in guest and host"); 6328ed60bbeSMarc Zyngier 6339ed67cdcSSasha Levin state.num = queue->vring.num; 6349ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_NUM, &state); 6359ed67cdcSSasha Levin if (r < 0) 6369ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_NUM failed"); 6379ed67cdcSSasha Levin state.num = 0; 6389ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_BASE, &state); 6399ed67cdcSSasha Levin if (r < 0) 6409ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_BASE failed"); 6419ed67cdcSSasha Levin 6429ed67cdcSSasha Levin addr = (struct vhost_vring_addr) { 6439ed67cdcSSasha Levin .index = vq, 6449ed67cdcSSasha Levin .desc_user_addr = (u64)(unsigned long)queue->vring.desc, 6459ed67cdcSSasha Levin .avail_user_addr = (u64)(unsigned long)queue->vring.avail, 6469ed67cdcSSasha Levin .used_user_addr = (u64)(unsigned long)queue->vring.used, 6479ed67cdcSSasha Levin }; 6489ed67cdcSSasha Levin 6499ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_ADDR, &addr); 6509ed67cdcSSasha Levin if (r < 0) 6519ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_ADDR failed"); 6529ed67cdcSSasha Levin 6539ed67cdcSSasha Levin return 0; 6549ed67cdcSSasha Levin } 6559ed67cdcSSasha Levin 65649bada43SJean-Philippe Brucker static void exit_vq(struct kvm *kvm, void *dev, u32 vq) 65749bada43SJean-Philippe Brucker { 65849bada43SJean-Philippe Brucker struct net_dev *ndev = dev; 65949bada43SJean-Philippe Brucker struct net_dev_queue *queue = &ndev->queues[vq]; 66049bada43SJean-Philippe Brucker 66149bada43SJean-Philippe Brucker if (!is_ctrl_vq(ndev, vq) && queue->gsi) { 66249bada43SJean-Philippe Brucker irq__del_irqfd(kvm, queue->gsi, queue->irqfd); 66349bada43SJean-Philippe Brucker close(queue->irqfd); 66449bada43SJean-Philippe Brucker queue->gsi = queue->irqfd = 0; 66549bada43SJean-Philippe Brucker } 66649bada43SJean-Philippe Brucker 66749bada43SJean-Philippe Brucker /* 66849bada43SJean-Philippe Brucker * TODO: vhost reset owner. It's the only way to cleanly stop vhost, but 66949bada43SJean-Philippe Brucker * we can't restart it at the moment. 67049bada43SJean-Philippe Brucker */ 67149bada43SJean-Philippe Brucker if (ndev->vhost_fd && !is_ctrl_vq(ndev, vq)) { 67249bada43SJean-Philippe Brucker pr_warning("Cannot reset VHOST queue"); 67349bada43SJean-Philippe Brucker ioctl(ndev->vhost_fd, VHOST_RESET_OWNER); 67449bada43SJean-Philippe Brucker return; 67549bada43SJean-Philippe Brucker } 67649bada43SJean-Philippe Brucker 67749bada43SJean-Philippe Brucker /* 67849bada43SJean-Philippe Brucker * Threads are waiting on cancellation points (readv or 67949bada43SJean-Philippe Brucker * pthread_cond_wait) and should stop gracefully. 68049bada43SJean-Philippe Brucker */ 68149bada43SJean-Philippe Brucker pthread_cancel(queue->thread); 68249bada43SJean-Philippe Brucker pthread_join(queue->thread, NULL); 68349bada43SJean-Philippe Brucker } 68449bada43SJean-Philippe Brucker 6859ed67cdcSSasha Levin static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi) 6869ed67cdcSSasha Levin { 6879ed67cdcSSasha Levin struct net_dev *ndev = dev; 688ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = &ndev->queues[vq]; 6899ed67cdcSSasha Levin struct vhost_vring_file file; 6909ed67cdcSSasha Levin int r; 6919ed67cdcSSasha Levin 6929ed67cdcSSasha Levin if (ndev->vhost_fd == 0) 6939ed67cdcSSasha Levin return; 6949ed67cdcSSasha Levin 6959ed67cdcSSasha Levin file = (struct vhost_vring_file) { 6969ed67cdcSSasha Levin .index = vq, 697e59679d2SJean-Philippe Brucker .fd = eventfd(0, 0), 6989ed67cdcSSasha Levin }; 6999ed67cdcSSasha Levin 700e59679d2SJean-Philippe Brucker r = irq__add_irqfd(kvm, gsi, file.fd, -1); 7019ed67cdcSSasha Levin if (r < 0) 7029ed67cdcSSasha Levin die_perror("KVM_IRQFD failed"); 7039ed67cdcSSasha Levin 70449bada43SJean-Philippe Brucker queue->irqfd = file.fd; 70549bada43SJean-Philippe Brucker queue->gsi = gsi; 70649bada43SJean-Philippe Brucker 7079ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_CALL, &file); 7089ed67cdcSSasha Levin if (r < 0) 7099ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_CALL failed"); 7109ed67cdcSSasha Levin file.fd = ndev->tap_fd; 7119ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file); 7129ed67cdcSSasha Levin if (r != 0) 7139ed67cdcSSasha Levin die("VHOST_NET_SET_BACKEND failed %d", errno); 7149ed67cdcSSasha Levin 7159ed67cdcSSasha Levin } 7169ed67cdcSSasha Levin 7179ed67cdcSSasha Levin static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd) 7189ed67cdcSSasha Levin { 7199ed67cdcSSasha Levin struct net_dev *ndev = dev; 7209ed67cdcSSasha Levin struct vhost_vring_file file = { 7219ed67cdcSSasha Levin .index = vq, 7229ed67cdcSSasha Levin .fd = efd, 7239ed67cdcSSasha Levin }; 7249ed67cdcSSasha Levin int r; 7259ed67cdcSSasha Levin 7269e56ec14SSasha Levin if (ndev->vhost_fd == 0 || is_ctrl_vq(ndev, vq)) 7279ed67cdcSSasha Levin return; 7289ed67cdcSSasha Levin 7299ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_KICK, &file); 7309ed67cdcSSasha Levin if (r < 0) 7319ed67cdcSSasha Levin die_perror("VHOST_SET_VRING_KICK failed"); 73278a2a3e2SSasha Levin } 73378a2a3e2SSasha Levin 73478a2a3e2SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 73578a2a3e2SSasha Levin { 7369a6d73f1SSasha Levin struct net_dev *ndev = dev; 7379a6d73f1SSasha Levin 7389a6d73f1SSasha Levin virtio_net_handle_callback(kvm, ndev, vq); 73978a2a3e2SSasha Levin 74078a2a3e2SSasha Levin return 0; 74178a2a3e2SSasha Levin } 74278a2a3e2SSasha Levin 74353fbb17bSJean-Philippe Brucker static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq) 74478a2a3e2SSasha Levin { 74578a2a3e2SSasha Levin struct net_dev *ndev = dev; 74678a2a3e2SSasha Levin 747ad96e867SJean-Philippe Brucker return &ndev->queues[vq].vq; 74878a2a3e2SSasha Levin } 74978a2a3e2SSasha Levin 75078a2a3e2SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 75178a2a3e2SSasha Levin { 7520f4f51a8SAsias He /* FIXME: dynamic */ 75378a2a3e2SSasha Levin return VIRTIO_NET_QUEUE_SIZE; 75478a2a3e2SSasha Levin } 75578a2a3e2SSasha Levin 7560f4f51a8SAsias He static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size) 7570f4f51a8SAsias He { 7580f4f51a8SAsias He /* FIXME: dynamic */ 7590f4f51a8SAsias He return size; 7600f4f51a8SAsias He } 7610f4f51a8SAsias He 76231e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev) 763b98ac591SJean-Philippe Brucker { 764b98ac591SJean-Philippe Brucker struct net_dev *ndev = dev; 765b98ac591SJean-Philippe Brucker 766b98ac591SJean-Philippe Brucker return ndev->queue_pairs * 2 + 1; 767b98ac591SJean-Philippe Brucker } 768b98ac591SJean-Philippe Brucker 76915542babSAndre Przywara static struct virtio_ops net_dev_virtio_ops = { 7701c47ce69SSasha Levin .get_config = get_config, 771e4730284SMartin Radev .get_config_size = get_config_size, 7721c47ce69SSasha Levin .get_host_features = get_host_features, 7731c47ce69SSasha Levin .set_guest_features = set_guest_features, 774b98ac591SJean-Philippe Brucker .get_vq_count = get_vq_count, 7751c47ce69SSasha Levin .init_vq = init_vq, 77649bada43SJean-Philippe Brucker .exit_vq = exit_vq, 77753fbb17bSJean-Philippe Brucker .get_vq = get_vq, 7781c47ce69SSasha Levin .get_size_vq = get_size_vq, 7790f4f51a8SAsias He .set_size_vq = set_size_vq, 7800f4f51a8SAsias He .notify_vq = notify_vq, 7819ed67cdcSSasha Levin .notify_vq_gsi = notify_vq_gsi, 7829ed67cdcSSasha Levin .notify_vq_eventfd = notify_vq_eventfd, 78395242e44SJean-Philippe Brucker .notify_status = notify_status, 7841c47ce69SSasha Levin }; 7851c47ce69SSasha Levin 7869ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev) 7879ed67cdcSSasha Levin { 7887f9733c2SAndreas Herrmann struct kvm_mem_bank *bank; 7899ed67cdcSSasha Levin struct vhost_memory *mem; 7907f9733c2SAndreas Herrmann int r, i; 7919ed67cdcSSasha Levin 7929ed67cdcSSasha Levin ndev->vhost_fd = open("/dev/vhost-net", O_RDWR); 7939ed67cdcSSasha Levin if (ndev->vhost_fd < 0) 7949ed67cdcSSasha Levin die_perror("Failed openning vhost-net device"); 7959ed67cdcSSasha Levin 7967f9733c2SAndreas Herrmann mem = calloc(1, sizeof(*mem) + kvm->mem_slots * sizeof(struct vhost_memory_region)); 7979ed67cdcSSasha Levin if (mem == NULL) 7989ed67cdcSSasha Levin die("Failed allocating memory for vhost memory map"); 7999ed67cdcSSasha Levin 8007f9733c2SAndreas Herrmann i = 0; 8017f9733c2SAndreas Herrmann list_for_each_entry(bank, &kvm->mem_banks, list) { 8027f9733c2SAndreas Herrmann mem->regions[i] = (struct vhost_memory_region) { 8037f9733c2SAndreas Herrmann .guest_phys_addr = bank->guest_phys_addr, 8047f9733c2SAndreas Herrmann .memory_size = bank->size, 8057f9733c2SAndreas Herrmann .userspace_addr = (unsigned long)bank->host_addr, 8069ed67cdcSSasha Levin }; 8077f9733c2SAndreas Herrmann i++; 8087f9733c2SAndreas Herrmann } 8097f9733c2SAndreas Herrmann mem->nregions = i; 8109ed67cdcSSasha Levin 8119ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_OWNER); 8129ed67cdcSSasha Levin if (r != 0) 8139ed67cdcSSasha Levin die_perror("VHOST_SET_OWNER failed"); 8149ed67cdcSSasha Levin 8159ed67cdcSSasha Levin r = ioctl(ndev->vhost_fd, VHOST_SET_MEM_TABLE, mem); 8169ed67cdcSSasha Levin if (r != 0) 8179ed67cdcSSasha Levin die_perror("VHOST_SET_MEM_TABLE failed"); 818627d6874SAsias He 819627d6874SAsias He ndev->vdev.use_vhost = true; 820627d6874SAsias He 8219ed67cdcSSasha Levin free(mem); 8229ed67cdcSSasha Levin } 8239ed67cdcSSasha Levin 8245f225124SSasha Levin static inline void str_to_mac(const char *str, char *mac) 8255f225124SSasha Levin { 8265f225124SSasha Levin sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx", 8275f225124SSasha Levin mac, mac+1, mac+2, mac+3, mac+4, mac+5); 8285f225124SSasha Levin } 8294346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p, 8304346fd8fSSasha Levin const char *param, const char *val) 8315f225124SSasha Levin { 8325f225124SSasha Levin if (strcmp(param, "guest_mac") == 0) { 8335f225124SSasha Levin str_to_mac(val, p->guest_mac); 8345f225124SSasha Levin } else if (strcmp(param, "mode") == 0) { 8355f225124SSasha Levin if (!strncmp(val, "user", 4)) { 8365f225124SSasha Levin int i; 8375f225124SSasha Levin 8385f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) 8395f225124SSasha Levin if (kvm->cfg.net_params[i].mode == NET_MODE_USER) 8405f225124SSasha Levin die("Only one usermode network device allowed at a time"); 8415f225124SSasha Levin p->mode = NET_MODE_USER; 8425f225124SSasha Levin } else if (!strncmp(val, "tap", 3)) { 8435f225124SSasha Levin p->mode = NET_MODE_TAP; 8445f225124SSasha Levin } else if (!strncmp(val, "none", 4)) { 8455f225124SSasha Levin kvm->cfg.no_net = 1; 8465f225124SSasha Levin return -1; 8475f225124SSasha Levin } else 8485f225124SSasha Levin die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network); 8495f225124SSasha Levin } else if (strcmp(param, "script") == 0) { 8505f225124SSasha Levin p->script = strdup(val); 851eef27ae3SFan Du } else if (strcmp(param, "downscript") == 0) { 852eef27ae3SFan Du p->downscript = strdup(val); 8535f225124SSasha Levin } else if (strcmp(param, "guest_ip") == 0) { 8545f225124SSasha Levin p->guest_ip = strdup(val); 8555f225124SSasha Levin } else if (strcmp(param, "host_ip") == 0) { 8565f225124SSasha Levin p->host_ip = strdup(val); 8575f225124SSasha Levin } else if (strcmp(param, "trans") == 0) { 8585f225124SSasha Levin p->trans = strdup(val); 8591dfc7c24SMarc Zyngier } else if (strcmp(param, "tapif") == 0) { 8601dfc7c24SMarc Zyngier p->tapif = strdup(val); 8615f225124SSasha Levin } else if (strcmp(param, "vhost") == 0) { 8625f225124SSasha Levin p->vhost = atoi(val); 8635f225124SSasha Levin } else if (strcmp(param, "fd") == 0) { 8645f225124SSasha Levin p->fd = atoi(val); 86579052597SSasha Levin } else if (strcmp(param, "mq") == 0) { 86679052597SSasha Levin p->mq = atoi(val); 8675f225124SSasha Levin } else 8685f225124SSasha Levin die("Unknown network parameter %s", param); 8695f225124SSasha Levin 8705f225124SSasha Levin return 0; 8715f225124SSasha Levin } 8725f225124SSasha Levin 8735f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset) 8745f225124SSasha Levin { 8755f225124SSasha Levin struct virtio_net_params p; 8765f225124SSasha Levin char *buf = NULL, *cmd = NULL, *cur = NULL; 8775f225124SSasha Levin bool on_cmd = true; 8785f225124SSasha Levin struct kvm *kvm = opt->ptr; 8795f225124SSasha Levin 8805f225124SSasha Levin if (arg) { 8815f225124SSasha Levin buf = strdup(arg); 8825f225124SSasha Levin if (buf == NULL) 8835f225124SSasha Levin die("Failed allocating new net buffer"); 8845f225124SSasha Levin cur = strtok(buf, ",="); 8855f225124SSasha Levin } 8865f225124SSasha Levin 8875f225124SSasha Levin p = (struct virtio_net_params) { 8885f225124SSasha Levin .guest_ip = DEFAULT_GUEST_ADDR, 8895f225124SSasha Levin .host_ip = DEFAULT_HOST_ADDR, 8905f225124SSasha Levin .script = DEFAULT_SCRIPT, 891eef27ae3SFan Du .downscript = DEFAULT_SCRIPT, 8925f225124SSasha Levin .mode = NET_MODE_TAP, 8935f225124SSasha Levin }; 8945f225124SSasha Levin 8955f225124SSasha Levin str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac); 8965f225124SSasha Levin p.guest_mac[5] += kvm->cfg.num_net_devices; 8975f225124SSasha Levin 8985f225124SSasha Levin while (cur) { 8995f225124SSasha Levin if (on_cmd) { 9005f225124SSasha Levin cmd = cur; 9015f225124SSasha Levin } else { 9024346fd8fSSasha Levin if (set_net_param(kvm, &p, cmd, cur) < 0) 9035f225124SSasha Levin goto done; 9045f225124SSasha Levin } 9055f225124SSasha Levin on_cmd = !on_cmd; 9065f225124SSasha Levin 9075f225124SSasha Levin cur = strtok(NULL, ",="); 9085f225124SSasha Levin }; 9095f225124SSasha Levin 9105f225124SSasha Levin kvm->cfg.num_net_devices++; 9115f225124SSasha Levin 9125f225124SSasha Levin kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params)); 9135f225124SSasha Levin if (kvm->cfg.net_params == NULL) 9145f225124SSasha Levin die("Failed adding new network device"); 9155f225124SSasha Levin 9165f225124SSasha Levin kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p; 9175f225124SSasha Levin 9185f225124SSasha Levin done: 9195f225124SSasha Levin free(buf); 9205f225124SSasha Levin return 0; 9215f225124SSasha Levin } 9225f225124SSasha Levin 9235f225124SSasha Levin static int virtio_net__init_one(struct virtio_net_params *params) 9244f56d42cSAsias He { 925db927775SAlexandru Elisei int i, r; 9269a6d73f1SSasha Levin struct net_dev *ndev; 92776a4aac6SWill Deacon struct virtio_ops *ops; 928dc7a55d6SSuzuki K. Poulose enum virtio_trans trans = VIRTIO_DEFAULT_TRANS(params->kvm); 9299a6d73f1SSasha Levin 9309a6d73f1SSasha Levin ndev = calloc(1, sizeof(struct net_dev)); 9319a6d73f1SSasha Levin if (ndev == NULL) 9325f225124SSasha Levin return -ENOMEM; 9339a6d73f1SSasha Levin 9349a6d73f1SSasha Levin list_add_tail(&ndev->list, &ndevs); 9359a6d73f1SSasha Levin 936db927775SAlexandru Elisei ops = malloc(sizeof(*ops)); 937db927775SAlexandru Elisei if (ops == NULL) 938db927775SAlexandru Elisei return -ENOMEM; 939db927775SAlexandru Elisei 9409a6d73f1SSasha Levin ndev->kvm = params->kvm; 9418c0ae74dSSasha Levin ndev->params = params; 9429a6d73f1SSasha Levin 9439a6d73f1SSasha Levin mutex_init(&ndev->mutex); 94479052597SSasha Levin ndev->queue_pairs = max(1, min(VIRTIO_NET_NUM_QUEUES, params->mq)); 94579052597SSasha Levin 9460c54698eSAsias He for (i = 0 ; i < 6 ; i++) { 9479a6d73f1SSasha Levin ndev->config.mac[i] = params->guest_mac[i]; 9489a6d73f1SSasha Levin ndev->info.guest_mac.addr[i] = params->guest_mac[i]; 9499a6d73f1SSasha Levin ndev->info.host_mac.addr[i] = params->host_mac[i]; 9500c54698eSAsias He } 951f715177dSAsias He 9529a6d73f1SSasha Levin ndev->mode = params->mode; 9539a6d73f1SSasha Levin if (ndev->mode == NET_MODE_TAP) { 9549a6d73f1SSasha Levin ndev->ops = &tap_ops; 95559ee54ebSWei Chen if (!virtio_net__tap_create(ndev)) 95659ee54ebSWei Chen die_perror("You have requested a TAP device, but creation of one has failed because"); 957b4fdde6dSAsias He } else { 9589a6d73f1SSasha Levin ndev->info.host_ip = ntohl(inet_addr(params->host_ip)); 9599a6d73f1SSasha Levin ndev->info.guest_ip = ntohl(inet_addr(params->guest_ip)); 9609a6d73f1SSasha Levin ndev->info.guest_netmask = ntohl(inet_addr("255.255.255.0")); 9619a6d73f1SSasha Levin ndev->info.buf_nr = 20, 9629a6d73f1SSasha Levin ndev->ops = &uip_ops; 9635f3aaf22SMarc Zyngier uip_static_init(&ndev->info); 964b4fdde6dSAsias He } 965b5ee1ea7SAsias He 96676a4aac6SWill Deacon *ops = net_dev_virtio_ops; 967dc7a55d6SSuzuki K. Poulose 968dc7a55d6SSuzuki K. Poulose if (params->trans) { 969dc7a55d6SSuzuki K. Poulose if (strcmp(params->trans, "mmio") == 0) 970dc7a55d6SSuzuki K. Poulose trans = VIRTIO_MMIO; 971dc7a55d6SSuzuki K. Poulose else if (strcmp(params->trans, "pci") == 0) 972dc7a55d6SSuzuki K. Poulose trans = VIRTIO_PCI; 97369205aa1SAsias He else 974dc7a55d6SSuzuki K. Poulose pr_warning("virtio-net: Unknown transport method : %s, " 975dc7a55d6SSuzuki K. Poulose "falling back to %s.", params->trans, 976dc7a55d6SSuzuki K. Poulose virtio_trans_name(trans)); 977dc7a55d6SSuzuki K. Poulose } 978dc7a55d6SSuzuki K. Poulose 979db927775SAlexandru Elisei r = virtio_init(params->kvm, ndev, &ndev->vdev, ops, trans, 98076a4aac6SWill Deacon PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET); 981db927775SAlexandru Elisei if (r < 0) { 982db927775SAlexandru Elisei free(ops); 983db927775SAlexandru Elisei return r; 984db927775SAlexandru Elisei } 98527ab67f5SSasha Levin 9869ed67cdcSSasha Levin if (params->vhost) 9879ed67cdcSSasha Levin virtio_net__vhost_init(params->kvm, ndev); 988cb83de6fSSasha Levin 989d278197dSAsias He if (compat_id == -1) 99052f34d2cSAsias He compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET"); 9915f225124SSasha Levin 9925f225124SSasha Levin return 0; 9935f225124SSasha Levin } 9945f225124SSasha Levin 9955f225124SSasha Levin int virtio_net__init(struct kvm *kvm) 9965f225124SSasha Levin { 997db927775SAlexandru Elisei int i, r; 9985f225124SSasha Levin 9995f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) { 10005f225124SSasha Levin kvm->cfg.net_params[i].kvm = kvm; 1001db927775SAlexandru Elisei r = virtio_net__init_one(&kvm->cfg.net_params[i]); 1002db927775SAlexandru Elisei if (r < 0) 1003db927775SAlexandru Elisei goto cleanup; 10045f225124SSasha Levin } 10055f225124SSasha Levin 10065f225124SSasha Levin if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) { 10078c0ae74dSSasha Levin static struct virtio_net_params net_params; 10085f225124SSasha Levin 10095f225124SSasha Levin net_params = (struct virtio_net_params) { 10105f225124SSasha Levin .guest_ip = kvm->cfg.guest_ip, 10115f225124SSasha Levin .host_ip = kvm->cfg.host_ip, 10125f225124SSasha Levin .kvm = kvm, 10135f225124SSasha Levin .script = kvm->cfg.script, 10145f225124SSasha Levin .mode = NET_MODE_USER, 10155f225124SSasha Levin }; 10165f225124SSasha Levin str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac); 10175f225124SSasha Levin str_to_mac(kvm->cfg.host_mac, net_params.host_mac); 10185f225124SSasha Levin 1019db927775SAlexandru Elisei r = virtio_net__init_one(&net_params); 1020db927775SAlexandru Elisei if (r < 0) 1021db927775SAlexandru Elisei goto cleanup; 10225f225124SSasha Levin } 10235f225124SSasha Levin 10245f225124SSasha Levin return 0; 1025db927775SAlexandru Elisei 1026db927775SAlexandru Elisei cleanup: 1027db927775SAlexandru Elisei virtio_net__exit(kvm); 1028db927775SAlexandru Elisei return r; 10295f225124SSasha Levin } 103049a8afd1SSasha Levin virtio_dev_init(virtio_net__init); 10315f225124SSasha Levin 10325f225124SSasha Levin int virtio_net__exit(struct kvm *kvm) 10335f225124SSasha Levin { 1034eef27ae3SFan Du struct virtio_net_params *params; 1035eef27ae3SFan Du struct net_dev *ndev; 1036db927775SAlexandru Elisei struct list_head *ptr, *n; 1037eef27ae3SFan Du 1038db927775SAlexandru Elisei list_for_each_safe(ptr, n, &ndevs) { 1039eef27ae3SFan Du ndev = list_entry(ptr, struct net_dev, list); 1040eef27ae3SFan Du params = ndev->params; 1041eef27ae3SFan Du /* Cleanup any tap device which attached to bridge */ 1042eef27ae3SFan Du if (ndev->mode == NET_MODE_TAP && 1043eef27ae3SFan Du strcmp(params->downscript, "none")) 1044eef27ae3SFan Du virtio_net_exec_script(params->downscript, ndev->tap_name); 1045db927775SAlexandru Elisei 1046db927775SAlexandru Elisei list_del(&ndev->list); 1047db927775SAlexandru Elisei free(ndev); 1048eef27ae3SFan Du } 10495f225124SSasha Levin return 0; 10504f56d42cSAsias He } 105149a8afd1SSasha Levin virtio_dev_exit(virtio_net__exit); 1052