131638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h" 2b5ee1ea7SAsias He #include "kvm/virtio-net.h" 34f56d42cSAsias He #include "kvm/virtio.h" 44f56d42cSAsias He #include "kvm/mutex.h" 54f56d42cSAsias He #include "kvm/util.h" 64f56d42cSAsias He #include "kvm/kvm.h" 7b5ee1ea7SAsias He #include "kvm/uip.h" 8cb83de6fSSasha Levin #include "kvm/guest_compat.h" 97668c3a6SSasha Levin #include "kvm/iovec.h" 1005755b29SAndre Przywara #include "kvm/strbuf.h" 114f56d42cSAsias He 12029cd2bbSJean-Philippe Brucker #include <linux/list.h> 139ed67cdcSSasha Levin #include <linux/vhost.h> 144f56d42cSAsias He #include <linux/virtio_net.h> 154f56d42cSAsias He #include <linux/if_tun.h> 1678a2a3e2SSasha Levin #include <linux/types.h> 17c229370aSIngo Molnar 18c229370aSIngo Molnar #include <arpa/inet.h> 194f56d42cSAsias He #include <net/if.h> 20c229370aSIngo Molnar 21c229370aSIngo Molnar #include <unistd.h> 224f56d42cSAsias He #include <fcntl.h> 23c229370aSIngo Molnar 24cb7202c1SSasha Levin #include <sys/socket.h> 25c229370aSIngo Molnar #include <sys/ioctl.h> 26c229370aSIngo Molnar #include <sys/types.h> 2773b7d038SAmos Kong #include <sys/wait.h> 284f56d42cSAsias He 294059ad8bSAsias He #define VIRTIO_NET_QUEUE_SIZE 256 306585ffb7SSasha Levin #define VIRTIO_NET_NUM_QUEUES 8 314f56d42cSAsias He 32b4fdde6dSAsias He struct net_dev; 33b4fdde6dSAsias He 34b4fdde6dSAsias He struct net_dev_operations { 35b4fdde6dSAsias He int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev); 36b4fdde6dSAsias He int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev); 37b4fdde6dSAsias He }; 38b4fdde6dSAsias He 39ad96e867SJean-Philippe Brucker struct net_dev_queue { 40ad96e867SJean-Philippe Brucker int id; 41ad96e867SJean-Philippe Brucker struct net_dev *ndev; 42ad96e867SJean-Philippe Brucker struct virt_queue vq; 43ad96e867SJean-Philippe Brucker pthread_t thread; 44ad96e867SJean-Philippe Brucker struct mutex lock; 45ad96e867SJean-Philippe Brucker pthread_cond_t cond; 46ad96e867SJean-Philippe Brucker }; 47ad96e867SJean-Philippe Brucker 488626798bSAsias He struct net_dev { 49d3476f7dSSasha Levin struct mutex mutex; 5002eca50cSAsias He struct virtio_device vdev; 519a6d73f1SSasha Levin struct list_head list; 524f56d42cSAsias He 53ad96e867SJean-Philippe Brucker struct net_dev_queue queues[VIRTIO_NET_NUM_QUEUES * 2 + 1]; 54c229370aSIngo Molnar struct virtio_net_config config; 55902a8ecbSJean-Philippe Brucker u32 queue_pairs; 56c4aa7c02SPekka Enberg 579ed67cdcSSasha Levin int vhost_fd; 584f56d42cSAsias He int tap_fd; 594f56d42cSAsias He char tap_name[IFNAMSIZ]; 6059ee54ebSWei Chen bool tap_ufo; 61bb1a32f1SAsias He 62bb1a32f1SAsias He int mode; 63bb1a32f1SAsias He 64b5ee1ea7SAsias He struct uip_info info; 65b4fdde6dSAsias He struct net_dev_operations *ops; 669a6d73f1SSasha Levin struct kvm *kvm; 678c0ae74dSSasha Levin 688c0ae74dSSasha Levin struct virtio_net_params *params; 694f56d42cSAsias He }; 704f56d42cSAsias He 719a6d73f1SSasha Levin static LIST_HEAD(ndevs); 72312c62d1SSasha Levin static int compat_id = -1; 734f56d42cSAsias He 747668c3a6SSasha Levin #define MAX_PACKET_SIZE 65550 757668c3a6SSasha Levin 767668c3a6SSasha Levin static bool has_virtio_feature(struct net_dev *ndev, u32 feature) 777668c3a6SSasha Levin { 78902a8ecbSJean-Philippe Brucker return ndev->vdev.features & (1 << feature); 797668c3a6SSasha Levin } 807668c3a6SSasha Levin 81b231683cSJean-Philippe Brucker static int virtio_net_hdr_len(struct net_dev *ndev) 82b231683cSJean-Philippe Brucker { 83b231683cSJean-Philippe Brucker if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) || 84b231683cSJean-Philippe Brucker !ndev->vdev.legacy) 85b231683cSJean-Philippe Brucker return sizeof(struct virtio_net_hdr_mrg_rxbuf); 86b231683cSJean-Philippe Brucker 87b231683cSJean-Philippe Brucker return sizeof(struct virtio_net_hdr); 88b231683cSJean-Philippe Brucker } 89b231683cSJean-Philippe Brucker 90c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p) 914f56d42cSAsias He { 924f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 93ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p; 94ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq; 95ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev; 9643835ac9SSasha Levin struct kvm *kvm; 973fdf659dSSasha Levin u16 out, in; 983fdf659dSSasha Levin u16 head; 996d6cc14bSWill Deacon int len, copied; 1004f56d42cSAsias He 101a4d8c55eSSasha Levin kvm__set_thread_name("virtio-net-rx"); 102a4d8c55eSSasha Levin 1039a6d73f1SSasha Levin kvm = ndev->kvm; 104c4aa7c02SPekka Enberg while (1) { 105ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock); 106c4aa7c02SPekka Enberg if (!virt_queue__available(vq)) 107ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex); 108ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock); 1094f56d42cSAsias He 1104f56d42cSAsias He while (virt_queue__available(vq)) { 1117668c3a6SSasha Levin unsigned char buffer[MAX_PACKET_SIZE + sizeof(struct virtio_net_hdr_mrg_rxbuf)]; 1127668c3a6SSasha Levin struct iovec dummy_iov = { 1137668c3a6SSasha Levin .iov_base = buffer, 1147668c3a6SSasha Levin .iov_len = sizeof(buffer), 1157668c3a6SSasha Levin }; 1167668c3a6SSasha Levin struct virtio_net_hdr_mrg_rxbuf *hdr; 1173fea89a9SWill Deacon u16 num_buffers; 1187f5ffaf5SAsias He 1197668c3a6SSasha Levin len = ndev->ops->rx(&dummy_iov, 1, ndev); 1206d6cc14bSWill Deacon if (len < 0) { 1216d6cc14bSWill Deacon pr_warning("%s: rx on vq %u failed (%d), exiting thread\n", 122ad96e867SJean-Philippe Brucker __func__, queue->id, len); 1236d6cc14bSWill Deacon goto out_err; 1246d6cc14bSWill Deacon } 1256d6cc14bSWill Deacon 1263fea89a9SWill Deacon copied = num_buffers = 0; 1277668c3a6SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1288ed60bbeSMarc Zyngier hdr = iov[0].iov_base; 1297668c3a6SSasha Levin while (copied < len) { 1306d6cc14bSWill Deacon size_t iovsize = min_t(size_t, len - copied, iov_size(iov, in)); 1317668c3a6SSasha Levin 132e2493047SAsias He memcpy_toiovec(iov, buffer + copied, iovsize); 1337668c3a6SSasha Levin copied += iovsize; 1343fea89a9SWill Deacon virt_queue__set_used_elem_no_update(vq, head, iovsize, num_buffers++); 1357668c3a6SSasha Levin if (copied == len) 1367668c3a6SSasha Levin break; 1377668c3a6SSasha Levin while (!virt_queue__available(vq)) 1387668c3a6SSasha Levin sleep(0); 1397668c3a6SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1407668c3a6SSasha Levin } 1413fea89a9SWill Deacon 142b231683cSJean-Philippe Brucker /* 143b231683cSJean-Philippe Brucker * The device MUST set num_buffers, except in the case 144b231683cSJean-Philippe Brucker * where the legacy driver did not negotiate 145b231683cSJean-Philippe Brucker * VIRTIO_NET_F_MRG_RXBUF and the field does not exist. 146b231683cSJean-Philippe Brucker */ 147b231683cSJean-Philippe Brucker if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) || 148b231683cSJean-Philippe Brucker !ndev->vdev.legacy) 149b17552eeSAndre Przywara hdr->num_buffers = virtio_host_to_guest_u16(vq->endian, num_buffers); 1503fea89a9SWill Deacon 1513fea89a9SWill Deacon virt_queue__used_idx_advance(vq, num_buffers); 1523fea89a9SWill Deacon 153c4aa7c02SPekka Enberg /* We should interrupt guest right now, otherwise latency is huge. */ 1546585ffb7SSasha Levin if (virtio_queue__should_signal(vq)) 155ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id); 1564f56d42cSAsias He } 157c4aa7c02SPekka Enberg } 158c4aa7c02SPekka Enberg 1596d6cc14bSWill Deacon out_err: 160c4aa7c02SPekka Enberg pthread_exit(NULL); 161c4aa7c02SPekka Enberg return NULL; 162c4aa7c02SPekka Enberg 163c4aa7c02SPekka Enberg } 164c4aa7c02SPekka Enberg 165c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p) 1664f56d42cSAsias He { 1674f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 168ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p; 169ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq; 170ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev; 17143835ac9SSasha Levin struct kvm *kvm; 1723fdf659dSSasha Levin u16 out, in; 1733fdf659dSSasha Levin u16 head; 1744f56d42cSAsias He int len; 1754f56d42cSAsias He 176a4d8c55eSSasha Levin kvm__set_thread_name("virtio-net-tx"); 177a4d8c55eSSasha Levin 1789a6d73f1SSasha Levin kvm = ndev->kvm; 179c4aa7c02SPekka Enberg 180c4aa7c02SPekka Enberg while (1) { 181ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock); 182c4aa7c02SPekka Enberg if (!virt_queue__available(vq)) 183ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex); 184ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock); 1854f56d42cSAsias He 1864f56d42cSAsias He while (virt_queue__available(vq)) { 18743835ac9SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 1889a6d73f1SSasha Levin len = ndev->ops->tx(iov, out, ndev); 1896d6cc14bSWill Deacon if (len < 0) { 1906d6cc14bSWill Deacon pr_warning("%s: tx on vq %u failed (%d)\n", 191ad96e867SJean-Philippe Brucker __func__, queue->id, errno); 1926d6cc14bSWill Deacon goto out_err; 1936d6cc14bSWill Deacon } 1946d6cc14bSWill Deacon 1954f56d42cSAsias He virt_queue__set_used_elem(vq, head, len); 1964f56d42cSAsias He } 1974f56d42cSAsias He 1986585ffb7SSasha Levin if (virtio_queue__should_signal(vq)) 199ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id); 2004f56d42cSAsias He } 2014f56d42cSAsias He 2026d6cc14bSWill Deacon out_err: 203c4aa7c02SPekka Enberg pthread_exit(NULL); 204c4aa7c02SPekka Enberg return NULL; 205c4aa7c02SPekka Enberg } 206407475bfSPekka Enberg 2076585ffb7SSasha Levin static virtio_net_ctrl_ack virtio_net_handle_mq(struct kvm* kvm, struct net_dev *ndev, struct virtio_net_ctrl_hdr *ctrl) 2086585ffb7SSasha Levin { 2096585ffb7SSasha Levin /* Not much to do here */ 2106585ffb7SSasha Levin return VIRTIO_NET_OK; 2116585ffb7SSasha Levin } 2126585ffb7SSasha Levin 2136585ffb7SSasha Levin static void *virtio_net_ctrl_thread(void *p) 214abd4a801SSasha Levin { 215abd4a801SSasha Levin struct iovec iov[VIRTIO_NET_QUEUE_SIZE]; 216ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p; 217ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq; 218ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev; 219abd4a801SSasha Levin u16 out, in, head; 2206585ffb7SSasha Levin struct kvm *kvm = ndev->kvm; 2216daffe57SJean-Philippe Brucker struct virtio_net_ctrl_hdr ctrl; 2226daffe57SJean-Philippe Brucker virtio_net_ctrl_ack ack; 2236daffe57SJean-Philippe Brucker size_t len; 224abd4a801SSasha Levin 225edb4a8a0SSuzuki K. Poulose kvm__set_thread_name("virtio-net-ctrl"); 226edb4a8a0SSuzuki K. Poulose 2276585ffb7SSasha Levin while (1) { 228ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock); 2296585ffb7SSasha Levin if (!virt_queue__available(vq)) 230ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex); 231ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock); 2326585ffb7SSasha Levin 2336585ffb7SSasha Levin while (virt_queue__available(vq)) { 234ad96e867SJean-Philippe Brucker head = virt_queue__get_iov(vq, iov, &out, &in, kvm); 2356daffe57SJean-Philippe Brucker len = min(iov_size(iov, in), sizeof(ctrl)); 2366daffe57SJean-Philippe Brucker memcpy_fromiovec((void *)&ctrl, iov, len); 237abd4a801SSasha Levin 2386daffe57SJean-Philippe Brucker switch (ctrl.class) { 2396585ffb7SSasha Levin case VIRTIO_NET_CTRL_MQ: 2406daffe57SJean-Philippe Brucker ack = virtio_net_handle_mq(kvm, ndev, &ctrl); 2416585ffb7SSasha Levin break; 242abd4a801SSasha Levin default: 2436daffe57SJean-Philippe Brucker ack = VIRTIO_NET_ERR; 244abd4a801SSasha Levin break; 245abd4a801SSasha Levin } 2466daffe57SJean-Philippe Brucker memcpy_toiovec(iov + in, &ack, sizeof(ack)); 2476daffe57SJean-Philippe Brucker virt_queue__set_used_elem(vq, head, sizeof(ack)); 2486585ffb7SSasha Levin } 249abd4a801SSasha Levin 250ad96e867SJean-Philippe Brucker if (virtio_queue__should_signal(vq)) 251ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id); 2526585ffb7SSasha Levin } 253abd4a801SSasha Levin 2546585ffb7SSasha Levin pthread_exit(NULL); 255abd4a801SSasha Levin 2566585ffb7SSasha Levin return NULL; 257abd4a801SSasha Levin } 258abd4a801SSasha Levin 2599a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue) 2604f56d42cSAsias He { 261ad96e867SJean-Philippe Brucker struct net_dev_queue *net_queue = &ndev->queues[queue]; 262ad96e867SJean-Philippe Brucker 26379052597SSasha Levin if ((u32)queue >= (ndev->queue_pairs * 2 + 1)) { 2649a6d73f1SSasha Levin pr_warning("Unknown queue index %u", queue); 2656585ffb7SSasha Levin return; 266c4aa7c02SPekka Enberg } 2676585ffb7SSasha Levin 268ad96e867SJean-Philippe Brucker mutex_lock(&net_queue->lock); 269ad96e867SJean-Philippe Brucker pthread_cond_signal(&net_queue->cond); 270ad96e867SJean-Philippe Brucker mutex_unlock(&net_queue->lock); 2714f56d42cSAsias He } 2724f56d42cSAsias He 273d2a7ddffSMarc Zyngier static int virtio_net_request_tap(struct net_dev *ndev, struct ifreq *ifr, 274d2a7ddffSMarc Zyngier const char *tapname) 275d2a7ddffSMarc Zyngier { 276d2a7ddffSMarc Zyngier int ret; 277d2a7ddffSMarc Zyngier 278d2a7ddffSMarc Zyngier memset(ifr, 0, sizeof(*ifr)); 279d2a7ddffSMarc Zyngier ifr->ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR; 280d2a7ddffSMarc Zyngier if (tapname) 28105755b29SAndre Przywara strlcpy(ifr->ifr_name, tapname, sizeof(ifr->ifr_name)); 282d2a7ddffSMarc Zyngier 283f83dc816SAndreas Herrmann ret = ioctl(ndev->tap_fd, TUNSETIFF, ifr); 284d2a7ddffSMarc Zyngier 285d2a7ddffSMarc Zyngier if (ret >= 0) 28605755b29SAndre Przywara strlcpy(ndev->tap_name, ifr->ifr_name, sizeof(ndev->tap_name)); 287d2a7ddffSMarc Zyngier return ret; 288d2a7ddffSMarc Zyngier } 289d2a7ddffSMarc Zyngier 290eef27ae3SFan Du static int virtio_net_exec_script(const char* script, const char *tap_name) 291eef27ae3SFan Du { 292eef27ae3SFan Du pid_t pid; 293eef27ae3SFan Du int status; 294eef27ae3SFan Du 2959987a37cSSuzuki K Poulose pid = vfork(); 296eef27ae3SFan Du if (pid == 0) { 297eef27ae3SFan Du execl(script, script, tap_name, NULL); 298eef27ae3SFan Du _exit(1); 299eef27ae3SFan Du } else { 300eef27ae3SFan Du waitpid(pid, &status, 0); 301eef27ae3SFan Du if (WIFEXITED(status) && WEXITSTATUS(status) != 0) { 302eef27ae3SFan Du pr_warning("Fail to setup tap by %s", script); 303eef27ae3SFan Du return -1; 304eef27ae3SFan Du } 305eef27ae3SFan Du } 306eef27ae3SFan Du return 0; 307eef27ae3SFan Du } 308eef27ae3SFan Du 3098c0ae74dSSasha Levin static bool virtio_net__tap_init(struct net_dev *ndev) 3104f56d42cSAsias He { 311cb7202c1SSasha Levin int sock = socket(AF_INET, SOCK_STREAM, 0); 31259ee54ebSWei Chen int hdr_len; 313cb7202c1SSasha Levin struct sockaddr_in sin = {0}; 314246c8347SAsias He struct ifreq ifr; 3158c0ae74dSSasha Levin const struct virtio_net_params *params = ndev->params; 3161dfc7c24SMarc Zyngier bool skipconf = !!params->tapif; 3174f56d42cSAsias He 318b231683cSJean-Philippe Brucker hdr_len = virtio_net_hdr_len(ndev); 3199a6d73f1SSasha Levin if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0) 3204542f276SCyrill Gorcunov pr_warning("Config tap device TUNSETVNETHDRSZ error"); 321246c8347SAsias He 32273b7d038SAmos Kong if (strcmp(params->script, "none")) { 323eef27ae3SFan Du if (virtio_net_exec_script(params->script, ndev->tap_name) < 0) 32473b7d038SAmos Kong goto fail; 3251dfc7c24SMarc Zyngier } else if (!skipconf) { 326cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr)); 32716509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name)); 328bdfcfca6SSasha Levin sin.sin_addr.s_addr = inet_addr(params->host_ip); 329cb7202c1SSasha Levin memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr)); 330cb7202c1SSasha Levin ifr.ifr_addr.sa_family = AF_INET; 3313b02f580SSasha Levin if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) { 3324542f276SCyrill Gorcunov pr_warning("Could not set ip address on tap device"); 3333b02f580SSasha Levin goto fail; 3343b02f580SSasha Levin } 33573b7d038SAmos Kong } 336cb7202c1SSasha Levin 3371dfc7c24SMarc Zyngier if (!skipconf) { 338cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr)); 33916509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name)); 340cb7202c1SSasha Levin ioctl(sock, SIOCGIFFLAGS, &ifr); 341cb7202c1SSasha Levin ifr.ifr_flags |= IFF_UP | IFF_RUNNING; 342cb7202c1SSasha Levin if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0) 3434542f276SCyrill Gorcunov pr_warning("Could not bring tap device up"); 3441dfc7c24SMarc Zyngier } 345cb7202c1SSasha Levin 346cb7202c1SSasha Levin close(sock); 3473b02f580SSasha Levin 3483b02f580SSasha Levin return 1; 3493b02f580SSasha Levin 3503b02f580SSasha Levin fail: 3513b02f580SSasha Levin if (sock >= 0) 3523b02f580SSasha Levin close(sock); 3539a6d73f1SSasha Levin if (ndev->tap_fd >= 0) 3549a6d73f1SSasha Levin close(ndev->tap_fd); 3553b02f580SSasha Levin 3563b02f580SSasha Levin return 0; 3574f56d42cSAsias He } 3584f56d42cSAsias He 35949bada43SJean-Philippe Brucker static void virtio_net__tap_exit(struct net_dev *ndev) 36049bada43SJean-Philippe Brucker { 36149bada43SJean-Philippe Brucker int sock; 36249bada43SJean-Philippe Brucker struct ifreq ifr; 36349bada43SJean-Philippe Brucker 36449bada43SJean-Philippe Brucker if (ndev->params->tapif) 36549bada43SJean-Philippe Brucker return; 36649bada43SJean-Philippe Brucker 36749bada43SJean-Philippe Brucker sock = socket(AF_INET, SOCK_STREAM, 0); 36816509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name)); 36949bada43SJean-Philippe Brucker ioctl(sock, SIOCGIFFLAGS, &ifr); 37049bada43SJean-Philippe Brucker ifr.ifr_flags &= ~(IFF_UP | IFF_RUNNING); 37149bada43SJean-Philippe Brucker if (ioctl(sock, SIOCGIFFLAGS, &ifr) < 0) 37249bada43SJean-Philippe Brucker pr_warning("Count not bring tap device down"); 37349bada43SJean-Philippe Brucker close(sock); 37449bada43SJean-Philippe Brucker } 37549bada43SJean-Philippe Brucker 37659ee54ebSWei Chen static bool virtio_net__tap_create(struct net_dev *ndev) 37759ee54ebSWei Chen { 37859ee54ebSWei Chen int offload; 37959ee54ebSWei Chen struct ifreq ifr; 38059ee54ebSWei Chen const struct virtio_net_params *params = ndev->params; 38159ee54ebSWei Chen bool macvtap = (!!params->tapif) && (params->tapif[0] == '/'); 38259ee54ebSWei Chen 38359ee54ebSWei Chen /* Did the user already gave us the FD? */ 38459ee54ebSWei Chen if (params->fd) 38559ee54ebSWei Chen ndev->tap_fd = params->fd; 38659ee54ebSWei Chen else { 38759ee54ebSWei Chen const char *tap_file = "/dev/net/tun"; 38859ee54ebSWei Chen 38959ee54ebSWei Chen /* Did the user ask us to use macvtap? */ 39059ee54ebSWei Chen if (macvtap) 39159ee54ebSWei Chen tap_file = params->tapif; 39259ee54ebSWei Chen 39359ee54ebSWei Chen ndev->tap_fd = open(tap_file, O_RDWR); 39459ee54ebSWei Chen if (ndev->tap_fd < 0) { 39559ee54ebSWei Chen pr_warning("Unable to open %s", tap_file); 39659ee54ebSWei Chen return 0; 39759ee54ebSWei Chen } 39859ee54ebSWei Chen } 39959ee54ebSWei Chen 40059ee54ebSWei Chen if (!macvtap && 40159ee54ebSWei Chen virtio_net_request_tap(ndev, &ifr, params->tapif) < 0) { 40259ee54ebSWei Chen pr_warning("Config tap device error. Are you root?"); 40359ee54ebSWei Chen goto fail; 40459ee54ebSWei Chen } 40559ee54ebSWei Chen 40659ee54ebSWei Chen /* 40759ee54ebSWei Chen * The UFO support had been removed from kernel in commit: 40859ee54ebSWei Chen * ID: fb652fdfe83710da0ca13448a41b7ed027d0a984 40959ee54ebSWei Chen * https://www.spinics.net/lists/netdev/msg443562.html 41059ee54ebSWei Chen * In oder to support the older kernels without this commit, 41159ee54ebSWei Chen * we set the TUN_F_UFO to offload by default to test the status of 41259ee54ebSWei Chen * UFO kernel support. 41359ee54ebSWei Chen */ 41459ee54ebSWei Chen ndev->tap_ufo = true; 41559ee54ebSWei Chen offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO; 41659ee54ebSWei Chen if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) { 41759ee54ebSWei Chen /* 41859ee54ebSWei Chen * Is this failure caused by kernel remove the UFO support? 41959ee54ebSWei Chen * Try TUNSETOFFLOAD without TUN_F_UFO. 42059ee54ebSWei Chen */ 42159ee54ebSWei Chen offload &= ~TUN_F_UFO; 42259ee54ebSWei Chen if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) { 42359ee54ebSWei Chen pr_warning("Config tap device TUNSETOFFLOAD error"); 42459ee54ebSWei Chen goto fail; 42559ee54ebSWei Chen } 42659ee54ebSWei Chen ndev->tap_ufo = false; 42759ee54ebSWei Chen } 42859ee54ebSWei Chen 42959ee54ebSWei Chen return 1; 43059ee54ebSWei Chen 43159ee54ebSWei Chen fail: 43259ee54ebSWei Chen if ((ndev->tap_fd >= 0) || (!params->fd) ) 43359ee54ebSWei Chen close(ndev->tap_fd); 43459ee54ebSWei Chen 43559ee54ebSWei Chen return 0; 43659ee54ebSWei Chen } 43759ee54ebSWei Chen 438b4fdde6dSAsias He static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev) 439b4fdde6dSAsias He { 440b4fdde6dSAsias He return writev(ndev->tap_fd, iov, out); 441b4fdde6dSAsias He } 442b4fdde6dSAsias He 443b4fdde6dSAsias He static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev) 444b4fdde6dSAsias He { 445b4fdde6dSAsias He return readv(ndev->tap_fd, iov, in); 446b4fdde6dSAsias He } 447b4fdde6dSAsias He 448b4fdde6dSAsias He static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev) 449b4fdde6dSAsias He { 450b4fdde6dSAsias He return uip_tx(iov, out, &ndev->info); 451b4fdde6dSAsias He } 452b4fdde6dSAsias He 453b4fdde6dSAsias He static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev) 454b4fdde6dSAsias He { 455b4fdde6dSAsias He return uip_rx(iov, in, &ndev->info); 456b4fdde6dSAsias He } 457b4fdde6dSAsias He 458b4fdde6dSAsias He static struct net_dev_operations tap_ops = { 459b4fdde6dSAsias He .rx = tap_ops_rx, 460b4fdde6dSAsias He .tx = tap_ops_tx, 461b4fdde6dSAsias He }; 462b4fdde6dSAsias He 463b4fdde6dSAsias He static struct net_dev_operations uip_ops = { 464b4fdde6dSAsias He .rx = uip_ops_rx, 465b4fdde6dSAsias He .tx = uip_ops_tx, 466b4fdde6dSAsias He }; 467b4fdde6dSAsias He 468c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev) 46978a2a3e2SSasha Levin { 47078a2a3e2SSasha Levin struct net_dev *ndev = dev; 47178a2a3e2SSasha Levin 472c5ae742bSSasha Levin return ((u8 *)(&ndev->config)); 47378a2a3e2SSasha Levin } 47478a2a3e2SSasha Levin 475e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev) 476e4730284SMartin Radev { 477e4730284SMartin Radev struct net_dev *ndev = dev; 478e4730284SMartin Radev 479e4730284SMartin Radev return sizeof(ndev->config); 480e4730284SMartin Radev } 481e4730284SMartin Radev 4823c8f82b8SJean-Philippe Brucker static u64 get_host_features(struct kvm *kvm, void *dev) 48378a2a3e2SSasha Levin { 4843c8f82b8SJean-Philippe Brucker u64 features; 48579052597SSasha Levin struct net_dev *ndev = dev; 48679052597SSasha Levin 48759ee54ebSWei Chen features = 1UL << VIRTIO_NET_F_MAC 48878a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_CSUM 48978a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO4 49078a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO6 49178a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO4 49292c1f37bSSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO6 493754c8ce3SSasha Levin | 1UL << VIRTIO_RING_F_EVENT_IDX 494abd4a801SSasha Levin | 1UL << VIRTIO_RING_F_INDIRECT_DESC 4956585ffb7SSasha Levin | 1UL << VIRTIO_NET_F_CTRL_VQ 4967668c3a6SSasha Levin | 1UL << VIRTIO_NET_F_MRG_RXBUF 4976daffe57SJean-Philippe Brucker | 1UL << (ndev->queue_pairs > 1 ? VIRTIO_NET_F_MQ : 0) 4986daffe57SJean-Philippe Brucker | 1UL << VIRTIO_F_ANY_LAYOUT; 49959ee54ebSWei Chen 50059ee54ebSWei Chen /* 50159ee54ebSWei Chen * The UFO feature for host and guest only can be enabled when the 50259ee54ebSWei Chen * kernel has TAP UFO support. 50359ee54ebSWei Chen */ 50459ee54ebSWei Chen if (ndev->tap_ufo) 50559ee54ebSWei Chen features |= (1UL << VIRTIO_NET_F_HOST_UFO 50659ee54ebSWei Chen | 1UL << VIRTIO_NET_F_GUEST_UFO); 50759ee54ebSWei Chen 508*53171d59SJean-Philippe Brucker if (ndev->vhost_fd) { 50915636d5eSYing-Shiuan Pan u64 vhost_features; 51015636d5eSYing-Shiuan Pan 51115636d5eSYing-Shiuan Pan if (ioctl(ndev->vhost_fd, VHOST_GET_FEATURES, &vhost_features) != 0) 51215636d5eSYing-Shiuan Pan die_perror("VHOST_GET_FEATURES failed"); 51315636d5eSYing-Shiuan Pan 514*53171d59SJean-Philippe Brucker features &= vhost_features; 515*53171d59SJean-Philippe Brucker } 516*53171d59SJean-Philippe Brucker 517*53171d59SJean-Philippe Brucker return features; 518*53171d59SJean-Philippe Brucker } 519*53171d59SJean-Philippe Brucker 520*53171d59SJean-Philippe Brucker static int virtio_net__vhost_set_features(struct net_dev *ndev) 521*53171d59SJean-Philippe Brucker { 522*53171d59SJean-Philippe Brucker /* VHOST_NET_F_VIRTIO_NET_HDR clashes with VIRTIO_F_ANY_LAYOUT! */ 523*53171d59SJean-Philippe Brucker u64 features = ndev->vdev.features & 524*53171d59SJean-Philippe Brucker ~(1UL << VHOST_NET_F_VIRTIO_NET_HDR); 52515636d5eSYing-Shiuan Pan 52615636d5eSYing-Shiuan Pan return ioctl(ndev->vhost_fd, VHOST_SET_FEATURES, &features); 52715636d5eSYing-Shiuan Pan } 52815636d5eSYing-Shiuan Pan 52995242e44SJean-Philippe Brucker static void virtio_net_start(struct net_dev *ndev) 53095242e44SJean-Philippe Brucker { 5318aa155c4SYing-Shiuan Pan if (ndev->mode == NET_MODE_TAP) { 5328aa155c4SYing-Shiuan Pan if (!virtio_net__tap_init(ndev)) 53359ee54ebSWei Chen die_perror("TAP device initialized failed because"); 53459ee54ebSWei Chen 53515636d5eSYing-Shiuan Pan if (ndev->vhost_fd && 53615636d5eSYing-Shiuan Pan virtio_net__vhost_set_features(ndev) != 0) 53715636d5eSYing-Shiuan Pan die_perror("VHOST_SET_FEATURES failed"); 5388aa155c4SYing-Shiuan Pan } else { 539b231683cSJean-Philippe Brucker ndev->info.vnet_hdr_len = virtio_net_hdr_len(ndev); 5408aa155c4SYing-Shiuan Pan uip_init(&ndev->info); 5418aa155c4SYing-Shiuan Pan } 54278a2a3e2SSasha Levin } 54378a2a3e2SSasha Levin 54449bada43SJean-Philippe Brucker static void virtio_net_stop(struct net_dev *ndev) 54549bada43SJean-Philippe Brucker { 54649bada43SJean-Philippe Brucker /* Undo whatever start() did */ 54749bada43SJean-Philippe Brucker if (ndev->mode == NET_MODE_TAP) 54849bada43SJean-Philippe Brucker virtio_net__tap_exit(ndev); 54949bada43SJean-Philippe Brucker else 55049bada43SJean-Philippe Brucker uip_exit(&ndev->info); 55149bada43SJean-Philippe Brucker } 55249bada43SJean-Philippe Brucker 553867b15ccSJean-Philippe Brucker static void virtio_net_update_endian(struct net_dev *ndev) 554867b15ccSJean-Philippe Brucker { 555867b15ccSJean-Philippe Brucker struct virtio_net_config *conf = &ndev->config; 556867b15ccSJean-Philippe Brucker 557b17552eeSAndre Przywara conf->status = virtio_host_to_guest_u16(ndev->vdev.endian, 558867b15ccSJean-Philippe Brucker VIRTIO_NET_S_LINK_UP); 559b17552eeSAndre Przywara conf->max_virtqueue_pairs = virtio_host_to_guest_u16(ndev->vdev.endian, 560867b15ccSJean-Philippe Brucker ndev->queue_pairs); 5618b27bcffSJean-Philippe Brucker 5628b27bcffSJean-Philippe Brucker /* Let TAP know about vnet header endianness */ 5638b27bcffSJean-Philippe Brucker if (ndev->mode == NET_MODE_TAP && 5648b27bcffSJean-Philippe Brucker ndev->vdev.endian != VIRTIO_ENDIAN_HOST) { 5658b27bcffSJean-Philippe Brucker int enable_val = 1, disable_val = 0; 5668b27bcffSJean-Philippe Brucker int enable_req, disable_req; 5678b27bcffSJean-Philippe Brucker 5688b27bcffSJean-Philippe Brucker if (ndev->vdev.endian == VIRTIO_ENDIAN_LE) { 5698b27bcffSJean-Philippe Brucker enable_req = TUNSETVNETLE; 5708b27bcffSJean-Philippe Brucker disable_req = TUNSETVNETBE; 5718b27bcffSJean-Philippe Brucker } else { 5728b27bcffSJean-Philippe Brucker enable_req = TUNSETVNETBE; 5738b27bcffSJean-Philippe Brucker disable_req = TUNSETVNETLE; 5748b27bcffSJean-Philippe Brucker } 5758b27bcffSJean-Philippe Brucker 5768b27bcffSJean-Philippe Brucker ioctl(ndev->tap_fd, disable_req, &disable_val); 5778b27bcffSJean-Philippe Brucker if (ioctl(ndev->tap_fd, enable_req, &enable_val) < 0) 5788b27bcffSJean-Philippe Brucker pr_err("Config tap device TUNSETVNETLE/BE error"); 5798b27bcffSJean-Philippe Brucker } 580867b15ccSJean-Philippe Brucker } 581867b15ccSJean-Philippe Brucker 58295242e44SJean-Philippe Brucker static void notify_status(struct kvm *kvm, void *dev, u32 status) 58395242e44SJean-Philippe Brucker { 584867b15ccSJean-Philippe Brucker struct net_dev *ndev = dev; 585867b15ccSJean-Philippe Brucker 586867b15ccSJean-Philippe Brucker if (status & VIRTIO__STATUS_CONFIG) 587867b15ccSJean-Philippe Brucker virtio_net_update_endian(ndev); 588867b15ccSJean-Philippe Brucker 58995242e44SJean-Philippe Brucker if (status & VIRTIO__STATUS_START) 59095242e44SJean-Philippe Brucker virtio_net_start(dev); 59149bada43SJean-Philippe Brucker else if (status & VIRTIO__STATUS_STOP) 59249bada43SJean-Philippe Brucker virtio_net_stop(dev); 59395242e44SJean-Philippe Brucker } 59495242e44SJean-Philippe Brucker 5959e56ec14SSasha Levin static bool is_ctrl_vq(struct net_dev *ndev, u32 vq) 5969e56ec14SSasha Levin { 5979e56ec14SSasha Levin return vq == (u32)(ndev->queue_pairs * 2); 5989e56ec14SSasha Levin } 5999e56ec14SSasha Levin 600609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq) 60178a2a3e2SSasha Levin { 602de166e5fSJean-Philippe Brucker struct vhost_vring_file file = { .index = vq }; 603ad96e867SJean-Philippe Brucker struct net_dev_queue *net_queue; 60478a2a3e2SSasha Levin struct net_dev *ndev = dev; 60578a2a3e2SSasha Levin struct virt_queue *queue; 6069ed67cdcSSasha Levin int r; 60778a2a3e2SSasha Levin 608312c62d1SSasha Levin compat__remove_message(compat_id); 60978a2a3e2SSasha Levin 610ad96e867SJean-Philippe Brucker net_queue = &ndev->queues[vq]; 611ad96e867SJean-Philippe Brucker net_queue->id = vq; 612ad96e867SJean-Philippe Brucker net_queue->ndev = ndev; 613ad96e867SJean-Philippe Brucker queue = &net_queue->vq; 614609ee906SJean-Philippe Brucker virtio_init_device_vq(kvm, &ndev->vdev, queue, VIRTIO_NET_QUEUE_SIZE); 61578a2a3e2SSasha Levin 616ad96e867SJean-Philippe Brucker mutex_init(&net_queue->lock); 617ad96e867SJean-Philippe Brucker pthread_cond_init(&net_queue->cond, NULL); 6189e56ec14SSasha Levin if (is_ctrl_vq(ndev, vq)) { 619ad96e867SJean-Philippe Brucker pthread_create(&net_queue->thread, NULL, virtio_net_ctrl_thread, 620ad96e867SJean-Philippe Brucker net_queue); 6219e56ec14SSasha Levin 6229e56ec14SSasha Levin return 0; 6239e56ec14SSasha Levin } else if (ndev->vhost_fd == 0 ) { 6249e56ec14SSasha Levin if (vq & 1) 625ad96e867SJean-Philippe Brucker pthread_create(&net_queue->thread, NULL, 626ad96e867SJean-Philippe Brucker virtio_net_tx_thread, net_queue); 6276585ffb7SSasha Levin else 628ad96e867SJean-Philippe Brucker pthread_create(&net_queue->thread, NULL, 629ad96e867SJean-Philippe Brucker virtio_net_rx_thread, net_queue); 6306585ffb7SSasha Levin 63178a2a3e2SSasha Levin return 0; 6326585ffb7SSasha Levin } 6339ed67cdcSSasha Levin 634745221e5SJean-Philippe Brucker virtio_vhost_set_vring(kvm, ndev->vhost_fd, vq, queue); 6359ed67cdcSSasha Levin 636de166e5fSJean-Philippe Brucker file.fd = ndev->tap_fd; 637de166e5fSJean-Philippe Brucker r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file); 638de166e5fSJean-Philippe Brucker if (r < 0) 639de166e5fSJean-Philippe Brucker die_perror("VHOST_NET_SET_BACKEND failed"); 640de166e5fSJean-Philippe Brucker 6419ed67cdcSSasha Levin return 0; 6429ed67cdcSSasha Levin } 6439ed67cdcSSasha Levin 64449bada43SJean-Philippe Brucker static void exit_vq(struct kvm *kvm, void *dev, u32 vq) 64549bada43SJean-Philippe Brucker { 64649bada43SJean-Philippe Brucker struct net_dev *ndev = dev; 64749bada43SJean-Philippe Brucker struct net_dev_queue *queue = &ndev->queues[vq]; 64849bada43SJean-Philippe Brucker 649029cd2bbSJean-Philippe Brucker virtio_vhost_reset_vring(kvm, ndev->vhost_fd, vq, &queue->vq); 65049bada43SJean-Philippe Brucker 65149bada43SJean-Philippe Brucker /* 65249bada43SJean-Philippe Brucker * TODO: vhost reset owner. It's the only way to cleanly stop vhost, but 65349bada43SJean-Philippe Brucker * we can't restart it at the moment. 65449bada43SJean-Philippe Brucker */ 65549bada43SJean-Philippe Brucker if (ndev->vhost_fd && !is_ctrl_vq(ndev, vq)) { 65649bada43SJean-Philippe Brucker pr_warning("Cannot reset VHOST queue"); 65749bada43SJean-Philippe Brucker ioctl(ndev->vhost_fd, VHOST_RESET_OWNER); 65849bada43SJean-Philippe Brucker return; 65949bada43SJean-Philippe Brucker } 66049bada43SJean-Philippe Brucker 66149bada43SJean-Philippe Brucker /* 66249bada43SJean-Philippe Brucker * Threads are waiting on cancellation points (readv or 66349bada43SJean-Philippe Brucker * pthread_cond_wait) and should stop gracefully. 66449bada43SJean-Philippe Brucker */ 66549bada43SJean-Philippe Brucker pthread_cancel(queue->thread); 66649bada43SJean-Philippe Brucker pthread_join(queue->thread, NULL); 66749bada43SJean-Philippe Brucker } 66849bada43SJean-Philippe Brucker 6699ed67cdcSSasha Levin static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi) 6709ed67cdcSSasha Levin { 6719ed67cdcSSasha Levin struct net_dev *ndev = dev; 672ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = &ndev->queues[vq]; 6739ed67cdcSSasha Levin 674029cd2bbSJean-Philippe Brucker if (ndev->vhost_fd == 0 || is_ctrl_vq(ndev, vq)) 6759ed67cdcSSasha Levin return; 6769ed67cdcSSasha Levin 677029cd2bbSJean-Philippe Brucker virtio_vhost_set_vring_call(kvm, ndev->vhost_fd, vq, gsi, 678029cd2bbSJean-Philippe Brucker &queue->vq); 6799ed67cdcSSasha Levin } 6809ed67cdcSSasha Levin 6819ed67cdcSSasha Levin static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd) 6829ed67cdcSSasha Levin { 6839ed67cdcSSasha Levin struct net_dev *ndev = dev; 6849ed67cdcSSasha Levin 6859e56ec14SSasha Levin if (ndev->vhost_fd == 0 || is_ctrl_vq(ndev, vq)) 6869ed67cdcSSasha Levin return; 6879ed67cdcSSasha Levin 688676c0c8aSJean-Philippe Brucker virtio_vhost_set_vring_kick(kvm, ndev->vhost_fd, vq, efd); 68978a2a3e2SSasha Levin } 69078a2a3e2SSasha Levin 69178a2a3e2SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 69278a2a3e2SSasha Levin { 6939a6d73f1SSasha Levin struct net_dev *ndev = dev; 6949a6d73f1SSasha Levin 6959a6d73f1SSasha Levin virtio_net_handle_callback(kvm, ndev, vq); 69678a2a3e2SSasha Levin 69778a2a3e2SSasha Levin return 0; 69878a2a3e2SSasha Levin } 69978a2a3e2SSasha Levin 70053fbb17bSJean-Philippe Brucker static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq) 70178a2a3e2SSasha Levin { 70278a2a3e2SSasha Levin struct net_dev *ndev = dev; 70378a2a3e2SSasha Levin 704ad96e867SJean-Philippe Brucker return &ndev->queues[vq].vq; 70578a2a3e2SSasha Levin } 70678a2a3e2SSasha Levin 70778a2a3e2SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 70878a2a3e2SSasha Levin { 7090f4f51a8SAsias He /* FIXME: dynamic */ 71078a2a3e2SSasha Levin return VIRTIO_NET_QUEUE_SIZE; 71178a2a3e2SSasha Levin } 71278a2a3e2SSasha Levin 7130f4f51a8SAsias He static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size) 7140f4f51a8SAsias He { 7150f4f51a8SAsias He /* FIXME: dynamic */ 7160f4f51a8SAsias He return size; 7170f4f51a8SAsias He } 7180f4f51a8SAsias He 71931e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev) 720b98ac591SJean-Philippe Brucker { 721b98ac591SJean-Philippe Brucker struct net_dev *ndev = dev; 722b98ac591SJean-Philippe Brucker 723b98ac591SJean-Philippe Brucker return ndev->queue_pairs * 2 + 1; 724b98ac591SJean-Philippe Brucker } 725b98ac591SJean-Philippe Brucker 72615542babSAndre Przywara static struct virtio_ops net_dev_virtio_ops = { 7271c47ce69SSasha Levin .get_config = get_config, 728e4730284SMartin Radev .get_config_size = get_config_size, 7291c47ce69SSasha Levin .get_host_features = get_host_features, 730b98ac591SJean-Philippe Brucker .get_vq_count = get_vq_count, 7311c47ce69SSasha Levin .init_vq = init_vq, 73249bada43SJean-Philippe Brucker .exit_vq = exit_vq, 73353fbb17bSJean-Philippe Brucker .get_vq = get_vq, 7341c47ce69SSasha Levin .get_size_vq = get_size_vq, 7350f4f51a8SAsias He .set_size_vq = set_size_vq, 7360f4f51a8SAsias He .notify_vq = notify_vq, 7379ed67cdcSSasha Levin .notify_vq_gsi = notify_vq_gsi, 7389ed67cdcSSasha Levin .notify_vq_eventfd = notify_vq_eventfd, 73995242e44SJean-Philippe Brucker .notify_status = notify_status, 7401c47ce69SSasha Levin }; 7411c47ce69SSasha Levin 7429ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev) 7439ed67cdcSSasha Levin { 7449ed67cdcSSasha Levin ndev->vhost_fd = open("/dev/vhost-net", O_RDWR); 7459ed67cdcSSasha Levin if (ndev->vhost_fd < 0) 7469ed67cdcSSasha Levin die_perror("Failed openning vhost-net device"); 7479ed67cdcSSasha Levin 748f84ab9ebSJean-Philippe Brucker virtio_vhost_init(kvm, ndev->vhost_fd); 749627d6874SAsias He 750627d6874SAsias He ndev->vdev.use_vhost = true; 7519ed67cdcSSasha Levin } 7529ed67cdcSSasha Levin 7535f225124SSasha Levin static inline void str_to_mac(const char *str, char *mac) 7545f225124SSasha Levin { 7555f225124SSasha Levin sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx", 7565f225124SSasha Levin mac, mac+1, mac+2, mac+3, mac+4, mac+5); 7575f225124SSasha Levin } 7584346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p, 7594346fd8fSSasha Levin const char *param, const char *val) 7605f225124SSasha Levin { 7615f225124SSasha Levin if (strcmp(param, "guest_mac") == 0) { 7625f225124SSasha Levin str_to_mac(val, p->guest_mac); 7635f225124SSasha Levin } else if (strcmp(param, "mode") == 0) { 7645f225124SSasha Levin if (!strncmp(val, "user", 4)) { 7655f225124SSasha Levin int i; 7665f225124SSasha Levin 7675f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) 7685f225124SSasha Levin if (kvm->cfg.net_params[i].mode == NET_MODE_USER) 7695f225124SSasha Levin die("Only one usermode network device allowed at a time"); 7705f225124SSasha Levin p->mode = NET_MODE_USER; 7715f225124SSasha Levin } else if (!strncmp(val, "tap", 3)) { 7725f225124SSasha Levin p->mode = NET_MODE_TAP; 7735f225124SSasha Levin } else if (!strncmp(val, "none", 4)) { 7745f225124SSasha Levin kvm->cfg.no_net = 1; 7755f225124SSasha Levin return -1; 7765f225124SSasha Levin } else 7775f225124SSasha Levin die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network); 7785f225124SSasha Levin } else if (strcmp(param, "script") == 0) { 7795f225124SSasha Levin p->script = strdup(val); 780eef27ae3SFan Du } else if (strcmp(param, "downscript") == 0) { 781eef27ae3SFan Du p->downscript = strdup(val); 7825f225124SSasha Levin } else if (strcmp(param, "guest_ip") == 0) { 7835f225124SSasha Levin p->guest_ip = strdup(val); 7845f225124SSasha Levin } else if (strcmp(param, "host_ip") == 0) { 7855f225124SSasha Levin p->host_ip = strdup(val); 7865f225124SSasha Levin } else if (strcmp(param, "trans") == 0) { 7875f225124SSasha Levin p->trans = strdup(val); 7881dfc7c24SMarc Zyngier } else if (strcmp(param, "tapif") == 0) { 7891dfc7c24SMarc Zyngier p->tapif = strdup(val); 7905f225124SSasha Levin } else if (strcmp(param, "vhost") == 0) { 7915f225124SSasha Levin p->vhost = atoi(val); 7925f225124SSasha Levin } else if (strcmp(param, "fd") == 0) { 7935f225124SSasha Levin p->fd = atoi(val); 79479052597SSasha Levin } else if (strcmp(param, "mq") == 0) { 79579052597SSasha Levin p->mq = atoi(val); 7965f225124SSasha Levin } else 7975f225124SSasha Levin die("Unknown network parameter %s", param); 7985f225124SSasha Levin 7995f225124SSasha Levin return 0; 8005f225124SSasha Levin } 8015f225124SSasha Levin 8025f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset) 8035f225124SSasha Levin { 8045f225124SSasha Levin struct virtio_net_params p; 8055f225124SSasha Levin char *buf = NULL, *cmd = NULL, *cur = NULL; 8065f225124SSasha Levin bool on_cmd = true; 8075f225124SSasha Levin struct kvm *kvm = opt->ptr; 8085f225124SSasha Levin 8095f225124SSasha Levin if (arg) { 8105f225124SSasha Levin buf = strdup(arg); 8115f225124SSasha Levin if (buf == NULL) 8125f225124SSasha Levin die("Failed allocating new net buffer"); 8135f225124SSasha Levin cur = strtok(buf, ",="); 8145f225124SSasha Levin } 8155f225124SSasha Levin 8165f225124SSasha Levin p = (struct virtio_net_params) { 8175f225124SSasha Levin .guest_ip = DEFAULT_GUEST_ADDR, 8185f225124SSasha Levin .host_ip = DEFAULT_HOST_ADDR, 8195f225124SSasha Levin .script = DEFAULT_SCRIPT, 820eef27ae3SFan Du .downscript = DEFAULT_SCRIPT, 8215f225124SSasha Levin .mode = NET_MODE_TAP, 8225f225124SSasha Levin }; 8235f225124SSasha Levin 8245f225124SSasha Levin str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac); 8255f225124SSasha Levin p.guest_mac[5] += kvm->cfg.num_net_devices; 8265f225124SSasha Levin 8275f225124SSasha Levin while (cur) { 8285f225124SSasha Levin if (on_cmd) { 8295f225124SSasha Levin cmd = cur; 8305f225124SSasha Levin } else { 8314346fd8fSSasha Levin if (set_net_param(kvm, &p, cmd, cur) < 0) 8325f225124SSasha Levin goto done; 8335f225124SSasha Levin } 8345f225124SSasha Levin on_cmd = !on_cmd; 8355f225124SSasha Levin 8365f225124SSasha Levin cur = strtok(NULL, ",="); 8375f225124SSasha Levin }; 8385f225124SSasha Levin 8395f225124SSasha Levin kvm->cfg.num_net_devices++; 8405f225124SSasha Levin 8415f225124SSasha Levin kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params)); 8425f225124SSasha Levin if (kvm->cfg.net_params == NULL) 8435f225124SSasha Levin die("Failed adding new network device"); 8445f225124SSasha Levin 8455f225124SSasha Levin kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p; 8465f225124SSasha Levin 8475f225124SSasha Levin done: 8485f225124SSasha Levin free(buf); 8495f225124SSasha Levin return 0; 8505f225124SSasha Levin } 8515f225124SSasha Levin 8525f225124SSasha Levin static int virtio_net__init_one(struct virtio_net_params *params) 8534f56d42cSAsias He { 8549b46ebc5SRajnesh Kanwal enum virtio_trans trans = params->kvm->cfg.virtio_transport; 8559a6d73f1SSasha Levin struct net_dev *ndev; 85676a4aac6SWill Deacon struct virtio_ops *ops; 8579b46ebc5SRajnesh Kanwal int i, r; 8589a6d73f1SSasha Levin 8599a6d73f1SSasha Levin ndev = calloc(1, sizeof(struct net_dev)); 8609a6d73f1SSasha Levin if (ndev == NULL) 8615f225124SSasha Levin return -ENOMEM; 8629a6d73f1SSasha Levin 8639a6d73f1SSasha Levin list_add_tail(&ndev->list, &ndevs); 8649a6d73f1SSasha Levin 865db927775SAlexandru Elisei ops = malloc(sizeof(*ops)); 866db927775SAlexandru Elisei if (ops == NULL) 867db927775SAlexandru Elisei return -ENOMEM; 868db927775SAlexandru Elisei 8699a6d73f1SSasha Levin ndev->kvm = params->kvm; 8708c0ae74dSSasha Levin ndev->params = params; 8719a6d73f1SSasha Levin 8729a6d73f1SSasha Levin mutex_init(&ndev->mutex); 87379052597SSasha Levin ndev->queue_pairs = max(1, min(VIRTIO_NET_NUM_QUEUES, params->mq)); 87479052597SSasha Levin 8750c54698eSAsias He for (i = 0 ; i < 6 ; i++) { 8769a6d73f1SSasha Levin ndev->config.mac[i] = params->guest_mac[i]; 8779a6d73f1SSasha Levin ndev->info.guest_mac.addr[i] = params->guest_mac[i]; 8789a6d73f1SSasha Levin ndev->info.host_mac.addr[i] = params->host_mac[i]; 8790c54698eSAsias He } 880f715177dSAsias He 8819a6d73f1SSasha Levin ndev->mode = params->mode; 8829a6d73f1SSasha Levin if (ndev->mode == NET_MODE_TAP) { 8839a6d73f1SSasha Levin ndev->ops = &tap_ops; 88459ee54ebSWei Chen if (!virtio_net__tap_create(ndev)) 88559ee54ebSWei Chen die_perror("You have requested a TAP device, but creation of one has failed because"); 886b4fdde6dSAsias He } else { 8879a6d73f1SSasha Levin ndev->info.host_ip = ntohl(inet_addr(params->host_ip)); 8889a6d73f1SSasha Levin ndev->info.guest_ip = ntohl(inet_addr(params->guest_ip)); 8899a6d73f1SSasha Levin ndev->info.guest_netmask = ntohl(inet_addr("255.255.255.0")); 8909a6d73f1SSasha Levin ndev->info.buf_nr = 20, 8919a6d73f1SSasha Levin ndev->ops = &uip_ops; 8925f3aaf22SMarc Zyngier uip_static_init(&ndev->info); 893b4fdde6dSAsias He } 894b5ee1ea7SAsias He 89576a4aac6SWill Deacon *ops = net_dev_virtio_ops; 896dc7a55d6SSuzuki K. Poulose 897dc7a55d6SSuzuki K. Poulose if (params->trans) { 898dc7a55d6SSuzuki K. Poulose if (strcmp(params->trans, "mmio") == 0) 899dc7a55d6SSuzuki K. Poulose trans = VIRTIO_MMIO; 900dc7a55d6SSuzuki K. Poulose else if (strcmp(params->trans, "pci") == 0) 901dc7a55d6SSuzuki K. Poulose trans = VIRTIO_PCI; 90269205aa1SAsias He else 903dc7a55d6SSuzuki K. Poulose pr_warning("virtio-net: Unknown transport method : %s, " 904dc7a55d6SSuzuki K. Poulose "falling back to %s.", params->trans, 905dc7a55d6SSuzuki K. Poulose virtio_trans_name(trans)); 906dc7a55d6SSuzuki K. Poulose } 907dc7a55d6SSuzuki K. Poulose 908db927775SAlexandru Elisei r = virtio_init(params->kvm, ndev, &ndev->vdev, ops, trans, 90976a4aac6SWill Deacon PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET); 910db927775SAlexandru Elisei if (r < 0) { 911db927775SAlexandru Elisei free(ops); 912db927775SAlexandru Elisei return r; 913db927775SAlexandru Elisei } 91427ab67f5SSasha Levin 9159ed67cdcSSasha Levin if (params->vhost) 9169ed67cdcSSasha Levin virtio_net__vhost_init(params->kvm, ndev); 917cb83de6fSSasha Levin 918d278197dSAsias He if (compat_id == -1) 91952f34d2cSAsias He compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET"); 9205f225124SSasha Levin 9215f225124SSasha Levin return 0; 9225f225124SSasha Levin } 9235f225124SSasha Levin 9245f225124SSasha Levin int virtio_net__init(struct kvm *kvm) 9255f225124SSasha Levin { 926db927775SAlexandru Elisei int i, r; 9275f225124SSasha Levin 9285f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) { 9295f225124SSasha Levin kvm->cfg.net_params[i].kvm = kvm; 930db927775SAlexandru Elisei r = virtio_net__init_one(&kvm->cfg.net_params[i]); 931db927775SAlexandru Elisei if (r < 0) 932db927775SAlexandru Elisei goto cleanup; 9335f225124SSasha Levin } 9345f225124SSasha Levin 9355f225124SSasha Levin if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) { 9368c0ae74dSSasha Levin static struct virtio_net_params net_params; 9375f225124SSasha Levin 9385f225124SSasha Levin net_params = (struct virtio_net_params) { 9395f225124SSasha Levin .guest_ip = kvm->cfg.guest_ip, 9405f225124SSasha Levin .host_ip = kvm->cfg.host_ip, 9415f225124SSasha Levin .kvm = kvm, 9425f225124SSasha Levin .script = kvm->cfg.script, 9435f225124SSasha Levin .mode = NET_MODE_USER, 9445f225124SSasha Levin }; 9455f225124SSasha Levin str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac); 9465f225124SSasha Levin str_to_mac(kvm->cfg.host_mac, net_params.host_mac); 9475f225124SSasha Levin 948db927775SAlexandru Elisei r = virtio_net__init_one(&net_params); 949db927775SAlexandru Elisei if (r < 0) 950db927775SAlexandru Elisei goto cleanup; 9515f225124SSasha Levin } 9525f225124SSasha Levin 9535f225124SSasha Levin return 0; 954db927775SAlexandru Elisei 955db927775SAlexandru Elisei cleanup: 956db927775SAlexandru Elisei virtio_net__exit(kvm); 957db927775SAlexandru Elisei return r; 9585f225124SSasha Levin } 95949a8afd1SSasha Levin virtio_dev_init(virtio_net__init); 9605f225124SSasha Levin 9615f225124SSasha Levin int virtio_net__exit(struct kvm *kvm) 9625f225124SSasha Levin { 963eef27ae3SFan Du struct virtio_net_params *params; 964eef27ae3SFan Du struct net_dev *ndev; 965db927775SAlexandru Elisei struct list_head *ptr, *n; 966eef27ae3SFan Du 967db927775SAlexandru Elisei list_for_each_safe(ptr, n, &ndevs) { 968eef27ae3SFan Du ndev = list_entry(ptr, struct net_dev, list); 969eef27ae3SFan Du params = ndev->params; 970eef27ae3SFan Du /* Cleanup any tap device which attached to bridge */ 971eef27ae3SFan Du if (ndev->mode == NET_MODE_TAP && 972eef27ae3SFan Du strcmp(params->downscript, "none")) 973eef27ae3SFan Du virtio_net_exec_script(params->downscript, ndev->tap_name); 974db927775SAlexandru Elisei 975db927775SAlexandru Elisei list_del(&ndev->list); 976db927775SAlexandru Elisei free(ndev); 977eef27ae3SFan Du } 9785f225124SSasha Levin return 0; 9794f56d42cSAsias He } 98049a8afd1SSasha Levin virtio_dev_exit(virtio_net__exit); 981