1117d6495STianjia Zhang #include "kvm/virtio-vsock.h" 2117d6495STianjia Zhang #include "kvm/virtio-pci-dev.h" 3117d6495STianjia Zhang #include "kvm/kvm.h" 4117d6495STianjia Zhang #include "kvm/pci.h" 5117d6495STianjia Zhang #include "kvm/ioeventfd.h" 6117d6495STianjia Zhang #include "kvm/guest_compat.h" 7117d6495STianjia Zhang #include "kvm/virtio-pci.h" 8117d6495STianjia Zhang #include "kvm/virtio.h" 9117d6495STianjia Zhang 10867b15ccSJean-Philippe Brucker #include <linux/byteorder.h> 11117d6495STianjia Zhang #include <linux/kernel.h> 12117d6495STianjia Zhang #include <linux/virtio_vsock.h> 13117d6495STianjia Zhang #include <linux/vhost.h> 14117d6495STianjia Zhang 15117d6495STianjia Zhang #define VIRTIO_VSOCK_QUEUE_SIZE 128 16117d6495STianjia Zhang 17117d6495STianjia Zhang static LIST_HEAD(vdevs); 18117d6495STianjia Zhang static int compat_id = -1; 19117d6495STianjia Zhang 20117d6495STianjia Zhang enum { 21117d6495STianjia Zhang VSOCK_VQ_RX = 0, /* for host to guest data */ 22117d6495STianjia Zhang VSOCK_VQ_TX = 1, /* for guest to host data */ 23117d6495STianjia Zhang VSOCK_VQ_EVENT = 2, 24117d6495STianjia Zhang VSOCK_VQ_MAX = 3, 25117d6495STianjia Zhang }; 26117d6495STianjia Zhang 27117d6495STianjia Zhang struct vsock_dev { 28117d6495STianjia Zhang struct virt_queue vqs[VSOCK_VQ_MAX]; 29117d6495STianjia Zhang struct virtio_vsock_config config; 30867b15ccSJean-Philippe Brucker u64 guest_cid; 31117d6495STianjia Zhang u32 features; 32117d6495STianjia Zhang int vhost_fd; 33117d6495STianjia Zhang struct virtio_device vdev; 34117d6495STianjia Zhang struct list_head list; 35117d6495STianjia Zhang struct kvm *kvm; 36117d6495STianjia Zhang }; 37117d6495STianjia Zhang 38117d6495STianjia Zhang static u8 *get_config(struct kvm *kvm, void *dev) 39117d6495STianjia Zhang { 40117d6495STianjia Zhang struct vsock_dev *vdev = dev; 41117d6495STianjia Zhang 42117d6495STianjia Zhang return ((u8 *)(&vdev->config)); 43117d6495STianjia Zhang } 44117d6495STianjia Zhang 45e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev) 46e4730284SMartin Radev { 47e4730284SMartin Radev struct vsock_dev *vdev = dev; 48e4730284SMartin Radev 49e4730284SMartin Radev return sizeof(vdev->config); 50e4730284SMartin Radev } 51e4730284SMartin Radev 523c8f82b8SJean-Philippe Brucker static u64 get_host_features(struct kvm *kvm, void *dev) 53117d6495STianjia Zhang { 54117d6495STianjia Zhang return 1UL << VIRTIO_RING_F_EVENT_IDX 55117d6495STianjia Zhang | 1UL << VIRTIO_RING_F_INDIRECT_DESC; 56117d6495STianjia Zhang } 57117d6495STianjia Zhang 58117d6495STianjia Zhang static bool is_event_vq(u32 vq) 59117d6495STianjia Zhang { 60117d6495STianjia Zhang return vq == VSOCK_VQ_EVENT; 61117d6495STianjia Zhang } 62117d6495STianjia Zhang 63609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq) 64117d6495STianjia Zhang { 65117d6495STianjia Zhang struct vhost_vring_state state = { .index = vq }; 66117d6495STianjia Zhang struct vhost_vring_addr addr; 67117d6495STianjia Zhang struct vsock_dev *vdev = dev; 68117d6495STianjia Zhang struct virt_queue *queue; 69117d6495STianjia Zhang int r; 70117d6495STianjia Zhang 71117d6495STianjia Zhang compat__remove_message(compat_id); 72117d6495STianjia Zhang 73117d6495STianjia Zhang queue = &vdev->vqs[vq]; 74609ee906SJean-Philippe Brucker virtio_init_device_vq(kvm, &vdev->vdev, queue, VIRTIO_VSOCK_QUEUE_SIZE); 75117d6495STianjia Zhang 76117d6495STianjia Zhang if (vdev->vhost_fd == -1) 77117d6495STianjia Zhang return 0; 78117d6495STianjia Zhang 79117d6495STianjia Zhang if (is_event_vq(vq)) 80117d6495STianjia Zhang return 0; 81117d6495STianjia Zhang 82117d6495STianjia Zhang state.num = queue->vring.num; 83117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_NUM, &state); 84117d6495STianjia Zhang if (r < 0) 85117d6495STianjia Zhang die_perror("VHOST_SET_VRING_NUM failed"); 86117d6495STianjia Zhang 87117d6495STianjia Zhang state.num = 0; 88117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_BASE, &state); 89117d6495STianjia Zhang if (r < 0) 90117d6495STianjia Zhang die_perror("VHOST_SET_VRING_BASE failed"); 91117d6495STianjia Zhang 92117d6495STianjia Zhang addr = (struct vhost_vring_addr) { 93117d6495STianjia Zhang .index = vq, 94117d6495STianjia Zhang .desc_user_addr = (u64)(unsigned long)queue->vring.desc, 95117d6495STianjia Zhang .avail_user_addr = (u64)(unsigned long)queue->vring.avail, 96117d6495STianjia Zhang .used_user_addr = (u64)(unsigned long)queue->vring.used, 97117d6495STianjia Zhang }; 98117d6495STianjia Zhang 99117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_ADDR, &addr); 100117d6495STianjia Zhang if (r < 0) 101117d6495STianjia Zhang die_perror("VHOST_SET_VRING_ADDR failed"); 102117d6495STianjia Zhang 103117d6495STianjia Zhang return 0; 104117d6495STianjia Zhang } 105117d6495STianjia Zhang 106117d6495STianjia Zhang static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd) 107117d6495STianjia Zhang { 108117d6495STianjia Zhang struct vsock_dev *vdev = dev; 109117d6495STianjia Zhang struct vhost_vring_file file = { 110117d6495STianjia Zhang .index = vq, 111117d6495STianjia Zhang .fd = efd, 112117d6495STianjia Zhang }; 113117d6495STianjia Zhang int r; 114117d6495STianjia Zhang 115117d6495STianjia Zhang if (is_event_vq(vq)) 116117d6495STianjia Zhang return; 117117d6495STianjia Zhang 118117d6495STianjia Zhang if (vdev->vhost_fd == -1) 119117d6495STianjia Zhang return; 120117d6495STianjia Zhang 121117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_KICK, &file); 122117d6495STianjia Zhang if (r < 0) 123117d6495STianjia Zhang die_perror("VHOST_SET_VRING_KICK failed"); 124117d6495STianjia Zhang } 125117d6495STianjia Zhang 126117d6495STianjia Zhang static void notify_status(struct kvm *kvm, void *dev, u32 status) 127117d6495STianjia Zhang { 128117d6495STianjia Zhang struct vsock_dev *vdev = dev; 129117d6495STianjia Zhang int r, start; 130117d6495STianjia Zhang 131867b15ccSJean-Philippe Brucker if (status & VIRTIO__STATUS_CONFIG) 132867b15ccSJean-Philippe Brucker vdev->config.guest_cid = cpu_to_le64(vdev->guest_cid); 133867b15ccSJean-Philippe Brucker 134a8e397bbSJean-Philippe Brucker if (status & VIRTIO__STATUS_START) 135a8e397bbSJean-Philippe Brucker start = 1; 136a8e397bbSJean-Philippe Brucker else if (status & VIRTIO__STATUS_STOP) 137a8e397bbSJean-Philippe Brucker start = 0; 138a8e397bbSJean-Philippe Brucker else 139117d6495STianjia Zhang return; 140117d6495STianjia Zhang 141117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_RUNNING, &start); 142117d6495STianjia Zhang if (r != 0) 143117d6495STianjia Zhang die("VHOST_VSOCK_SET_RUNNING failed %d", errno); 144117d6495STianjia Zhang } 145117d6495STianjia Zhang 146117d6495STianjia Zhang static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 147117d6495STianjia Zhang { 148117d6495STianjia Zhang return 0; 149117d6495STianjia Zhang } 150117d6495STianjia Zhang 151117d6495STianjia Zhang static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq) 152117d6495STianjia Zhang { 153117d6495STianjia Zhang struct vsock_dev *vdev = dev; 154117d6495STianjia Zhang 155117d6495STianjia Zhang return &vdev->vqs[vq]; 156117d6495STianjia Zhang } 157117d6495STianjia Zhang 158117d6495STianjia Zhang static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 159117d6495STianjia Zhang { 160117d6495STianjia Zhang return VIRTIO_VSOCK_QUEUE_SIZE; 161117d6495STianjia Zhang } 162117d6495STianjia Zhang 163117d6495STianjia Zhang static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size) 164117d6495STianjia Zhang { 165117d6495STianjia Zhang return size; 166117d6495STianjia Zhang } 167117d6495STianjia Zhang 168117d6495STianjia Zhang static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi) 169117d6495STianjia Zhang { 170117d6495STianjia Zhang struct vhost_vring_file file; 171117d6495STianjia Zhang struct vsock_dev *vdev = dev; 172117d6495STianjia Zhang struct kvm_irqfd irq; 173117d6495STianjia Zhang int r; 174117d6495STianjia Zhang 175117d6495STianjia Zhang if (vdev->vhost_fd == -1) 176117d6495STianjia Zhang return; 177117d6495STianjia Zhang 178117d6495STianjia Zhang if (is_event_vq(vq)) 179117d6495STianjia Zhang return; 180117d6495STianjia Zhang 181117d6495STianjia Zhang irq = (struct kvm_irqfd) { 182117d6495STianjia Zhang .gsi = gsi, 183117d6495STianjia Zhang .fd = eventfd(0, 0), 184117d6495STianjia Zhang }; 185117d6495STianjia Zhang file = (struct vhost_vring_file) { 186117d6495STianjia Zhang .index = vq, 187117d6495STianjia Zhang .fd = irq.fd, 188117d6495STianjia Zhang }; 189117d6495STianjia Zhang 190117d6495STianjia Zhang r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq); 191117d6495STianjia Zhang if (r < 0) 192117d6495STianjia Zhang die_perror("KVM_IRQFD failed"); 193117d6495STianjia Zhang 194117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_CALL, &file); 195117d6495STianjia Zhang if (r < 0) 196117d6495STianjia Zhang die_perror("VHOST_SET_VRING_CALL failed"); 197117d6495STianjia Zhang } 198117d6495STianjia Zhang 19931e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev) 200117d6495STianjia Zhang { 201117d6495STianjia Zhang return VSOCK_VQ_MAX; 202117d6495STianjia Zhang } 203117d6495STianjia Zhang 204117d6495STianjia Zhang static struct virtio_ops vsock_dev_virtio_ops = { 205117d6495STianjia Zhang .get_config = get_config, 206e4730284SMartin Radev .get_config_size = get_config_size, 207117d6495STianjia Zhang .get_host_features = get_host_features, 208117d6495STianjia Zhang .init_vq = init_vq, 209117d6495STianjia Zhang .get_vq = get_vq, 210117d6495STianjia Zhang .get_size_vq = get_size_vq, 211117d6495STianjia Zhang .set_size_vq = set_size_vq, 212117d6495STianjia Zhang .notify_vq_eventfd = notify_vq_eventfd, 213117d6495STianjia Zhang .notify_status = notify_status, 214117d6495STianjia Zhang .notify_vq_gsi = notify_vq_gsi, 215117d6495STianjia Zhang .notify_vq = notify_vq, 216117d6495STianjia Zhang .get_vq_count = get_vq_count, 217117d6495STianjia Zhang }; 218117d6495STianjia Zhang 219117d6495STianjia Zhang static void virtio_vhost_vsock_init(struct kvm *kvm, struct vsock_dev *vdev) 220117d6495STianjia Zhang { 221117d6495STianjia Zhang u64 features; 222*f84ab9ebSJean-Philippe Brucker int r; 223117d6495STianjia Zhang 224117d6495STianjia Zhang vdev->vhost_fd = open("/dev/vhost-vsock", O_RDWR); 225117d6495STianjia Zhang if (vdev->vhost_fd < 0) 226117d6495STianjia Zhang die_perror("Failed opening vhost-vsock device"); 227117d6495STianjia Zhang 228*f84ab9ebSJean-Philippe Brucker virtio_vhost_init(kvm, vdev->vhost_fd); 229117d6495STianjia Zhang 230117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_GET_FEATURES, &features); 231117d6495STianjia Zhang if (r != 0) 232117d6495STianjia Zhang die_perror("VHOST_GET_FEATURES failed"); 233117d6495STianjia Zhang 234117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_FEATURES, &features); 235117d6495STianjia Zhang if (r != 0) 236117d6495STianjia Zhang die_perror("VHOST_SET_FEATURES failed"); 237117d6495STianjia Zhang 238867b15ccSJean-Philippe Brucker r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_GUEST_CID, &vdev->guest_cid); 239117d6495STianjia Zhang if (r != 0) 240117d6495STianjia Zhang die_perror("VHOST_VSOCK_SET_GUEST_CID failed"); 241117d6495STianjia Zhang 242117d6495STianjia Zhang vdev->vdev.use_vhost = true; 243117d6495STianjia Zhang } 244117d6495STianjia Zhang 245117d6495STianjia Zhang static int virtio_vsock_init_one(struct kvm *kvm, u64 guest_cid) 246117d6495STianjia Zhang { 247117d6495STianjia Zhang struct vsock_dev *vdev; 248117d6495STianjia Zhang int r; 249117d6495STianjia Zhang 250117d6495STianjia Zhang vdev = calloc(1, sizeof(struct vsock_dev)); 251117d6495STianjia Zhang if (vdev == NULL) 252117d6495STianjia Zhang return -ENOMEM; 253117d6495STianjia Zhang 254117d6495STianjia Zhang *vdev = (struct vsock_dev) { 255117d6495STianjia Zhang .guest_cid = guest_cid, 256117d6495STianjia Zhang .vhost_fd = -1, 257117d6495STianjia Zhang .kvm = kvm, 258117d6495STianjia Zhang }; 259117d6495STianjia Zhang 260117d6495STianjia Zhang list_add_tail(&vdev->list, &vdevs); 261117d6495STianjia Zhang 262117d6495STianjia Zhang r = virtio_init(kvm, vdev, &vdev->vdev, &vsock_dev_virtio_ops, 2639b46ebc5SRajnesh Kanwal kvm->cfg.virtio_transport, PCI_DEVICE_ID_VIRTIO_VSOCK, 264117d6495STianjia Zhang VIRTIO_ID_VSOCK, PCI_CLASS_VSOCK); 265117d6495STianjia Zhang if (r < 0) 266117d6495STianjia Zhang return r; 267117d6495STianjia Zhang 268117d6495STianjia Zhang virtio_vhost_vsock_init(kvm, vdev); 269117d6495STianjia Zhang 270117d6495STianjia Zhang if (compat_id == -1) 271117d6495STianjia Zhang compat_id = virtio_compat_add_message("virtio-vsock", "CONFIG_VIRTIO_VSOCK"); 272117d6495STianjia Zhang 273117d6495STianjia Zhang return 0; 274117d6495STianjia Zhang } 275117d6495STianjia Zhang 276117d6495STianjia Zhang static int virtio_vsock_exit_one(struct kvm *kvm, struct vsock_dev *vdev) 277117d6495STianjia Zhang { 278117d6495STianjia Zhang list_del(&vdev->list); 279117d6495STianjia Zhang free(vdev); 280117d6495STianjia Zhang 281117d6495STianjia Zhang return 0; 282117d6495STianjia Zhang } 283117d6495STianjia Zhang 284117d6495STianjia Zhang int virtio_vsock_init(struct kvm *kvm) 285117d6495STianjia Zhang { 286117d6495STianjia Zhang int r; 287117d6495STianjia Zhang 288117d6495STianjia Zhang if (kvm->cfg.vsock_cid == 0) 289117d6495STianjia Zhang return 0; 290117d6495STianjia Zhang 291117d6495STianjia Zhang r = virtio_vsock_init_one(kvm, kvm->cfg.vsock_cid); 292117d6495STianjia Zhang if (r < 0) 293117d6495STianjia Zhang goto cleanup; 294117d6495STianjia Zhang 295117d6495STianjia Zhang return 0; 296117d6495STianjia Zhang cleanup: 297117d6495STianjia Zhang return virtio_vsock_exit(kvm); 298117d6495STianjia Zhang } 299117d6495STianjia Zhang virtio_dev_init(virtio_vsock_init); 300117d6495STianjia Zhang 301117d6495STianjia Zhang int virtio_vsock_exit(struct kvm *kvm) 302117d6495STianjia Zhang { 303117d6495STianjia Zhang while (!list_empty(&vdevs)) { 304117d6495STianjia Zhang struct vsock_dev *vdev; 305117d6495STianjia Zhang 306117d6495STianjia Zhang vdev = list_first_entry(&vdevs, struct vsock_dev, list); 307117d6495STianjia Zhang virtio_vsock_exit_one(kvm, vdev); 308117d6495STianjia Zhang } 309117d6495STianjia Zhang 310117d6495STianjia Zhang return 0; 311117d6495STianjia Zhang } 312117d6495STianjia Zhang virtio_dev_exit(virtio_vsock_exit); 313