1117d6495STianjia Zhang #include "kvm/virtio-vsock.h" 2117d6495STianjia Zhang #include "kvm/virtio-pci-dev.h" 3117d6495STianjia Zhang #include "kvm/kvm.h" 4117d6495STianjia Zhang #include "kvm/pci.h" 5117d6495STianjia Zhang #include "kvm/ioeventfd.h" 6117d6495STianjia Zhang #include "kvm/guest_compat.h" 7117d6495STianjia Zhang #include "kvm/virtio-pci.h" 8117d6495STianjia Zhang #include "kvm/virtio.h" 9117d6495STianjia Zhang 10867b15ccSJean-Philippe Brucker #include <linux/byteorder.h> 11117d6495STianjia Zhang #include <linux/kernel.h> 12117d6495STianjia Zhang #include <linux/virtio_vsock.h> 13117d6495STianjia Zhang #include <linux/vhost.h> 14117d6495STianjia Zhang 15117d6495STianjia Zhang #define VIRTIO_VSOCK_QUEUE_SIZE 128 16117d6495STianjia Zhang 17117d6495STianjia Zhang static LIST_HEAD(vdevs); 18117d6495STianjia Zhang static int compat_id = -1; 19117d6495STianjia Zhang 20117d6495STianjia Zhang enum { 21117d6495STianjia Zhang VSOCK_VQ_RX = 0, /* for host to guest data */ 22117d6495STianjia Zhang VSOCK_VQ_TX = 1, /* for guest to host data */ 23117d6495STianjia Zhang VSOCK_VQ_EVENT = 2, 24117d6495STianjia Zhang VSOCK_VQ_MAX = 3, 25117d6495STianjia Zhang }; 26117d6495STianjia Zhang 27117d6495STianjia Zhang struct vsock_dev { 28117d6495STianjia Zhang struct virt_queue vqs[VSOCK_VQ_MAX]; 29117d6495STianjia Zhang struct virtio_vsock_config config; 30867b15ccSJean-Philippe Brucker u64 guest_cid; 31117d6495STianjia Zhang u32 features; 32117d6495STianjia Zhang int vhost_fd; 33117d6495STianjia Zhang struct virtio_device vdev; 34117d6495STianjia Zhang struct list_head list; 35117d6495STianjia Zhang struct kvm *kvm; 36117d6495STianjia Zhang }; 37117d6495STianjia Zhang 38117d6495STianjia Zhang static u8 *get_config(struct kvm *kvm, void *dev) 39117d6495STianjia Zhang { 40117d6495STianjia Zhang struct vsock_dev *vdev = dev; 41117d6495STianjia Zhang 42117d6495STianjia Zhang return ((u8 *)(&vdev->config)); 43117d6495STianjia Zhang } 44117d6495STianjia Zhang 45e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev) 46e4730284SMartin Radev { 47e4730284SMartin Radev struct vsock_dev *vdev = dev; 48e4730284SMartin Radev 49e4730284SMartin Radev return sizeof(vdev->config); 50e4730284SMartin Radev } 51e4730284SMartin Radev 523c8f82b8SJean-Philippe Brucker static u64 get_host_features(struct kvm *kvm, void *dev) 53117d6495STianjia Zhang { 54117d6495STianjia Zhang return 1UL << VIRTIO_RING_F_EVENT_IDX 55117d6495STianjia Zhang | 1UL << VIRTIO_RING_F_INDIRECT_DESC; 56117d6495STianjia Zhang } 57117d6495STianjia Zhang 58117d6495STianjia Zhang static bool is_event_vq(u32 vq) 59117d6495STianjia Zhang { 60117d6495STianjia Zhang return vq == VSOCK_VQ_EVENT; 61117d6495STianjia Zhang } 62117d6495STianjia Zhang 63609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq) 64117d6495STianjia Zhang { 65117d6495STianjia Zhang struct vhost_vring_state state = { .index = vq }; 66117d6495STianjia Zhang struct vhost_vring_addr addr; 67117d6495STianjia Zhang struct vsock_dev *vdev = dev; 68117d6495STianjia Zhang struct virt_queue *queue; 69117d6495STianjia Zhang int r; 70117d6495STianjia Zhang 71117d6495STianjia Zhang compat__remove_message(compat_id); 72117d6495STianjia Zhang 73117d6495STianjia Zhang queue = &vdev->vqs[vq]; 74609ee906SJean-Philippe Brucker virtio_init_device_vq(kvm, &vdev->vdev, queue, VIRTIO_VSOCK_QUEUE_SIZE); 75117d6495STianjia Zhang 76117d6495STianjia Zhang if (vdev->vhost_fd == -1) 77117d6495STianjia Zhang return 0; 78117d6495STianjia Zhang 79117d6495STianjia Zhang if (is_event_vq(vq)) 80117d6495STianjia Zhang return 0; 81117d6495STianjia Zhang 82117d6495STianjia Zhang state.num = queue->vring.num; 83117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_NUM, &state); 84117d6495STianjia Zhang if (r < 0) 85117d6495STianjia Zhang die_perror("VHOST_SET_VRING_NUM failed"); 86117d6495STianjia Zhang 87117d6495STianjia Zhang state.num = 0; 88117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_BASE, &state); 89117d6495STianjia Zhang if (r < 0) 90117d6495STianjia Zhang die_perror("VHOST_SET_VRING_BASE failed"); 91117d6495STianjia Zhang 92117d6495STianjia Zhang addr = (struct vhost_vring_addr) { 93117d6495STianjia Zhang .index = vq, 94117d6495STianjia Zhang .desc_user_addr = (u64)(unsigned long)queue->vring.desc, 95117d6495STianjia Zhang .avail_user_addr = (u64)(unsigned long)queue->vring.avail, 96117d6495STianjia Zhang .used_user_addr = (u64)(unsigned long)queue->vring.used, 97117d6495STianjia Zhang }; 98117d6495STianjia Zhang 99117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_ADDR, &addr); 100117d6495STianjia Zhang if (r < 0) 101117d6495STianjia Zhang die_perror("VHOST_SET_VRING_ADDR failed"); 102117d6495STianjia Zhang 103117d6495STianjia Zhang return 0; 104117d6495STianjia Zhang } 105117d6495STianjia Zhang 106117d6495STianjia Zhang static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd) 107117d6495STianjia Zhang { 108117d6495STianjia Zhang struct vsock_dev *vdev = dev; 109117d6495STianjia Zhang struct vhost_vring_file file = { 110117d6495STianjia Zhang .index = vq, 111117d6495STianjia Zhang .fd = efd, 112117d6495STianjia Zhang }; 113117d6495STianjia Zhang int r; 114117d6495STianjia Zhang 115117d6495STianjia Zhang if (is_event_vq(vq)) 116117d6495STianjia Zhang return; 117117d6495STianjia Zhang 118117d6495STianjia Zhang if (vdev->vhost_fd == -1) 119117d6495STianjia Zhang return; 120117d6495STianjia Zhang 121117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_KICK, &file); 122117d6495STianjia Zhang if (r < 0) 123117d6495STianjia Zhang die_perror("VHOST_SET_VRING_KICK failed"); 124117d6495STianjia Zhang } 125117d6495STianjia Zhang 126117d6495STianjia Zhang static void notify_status(struct kvm *kvm, void *dev, u32 status) 127117d6495STianjia Zhang { 128117d6495STianjia Zhang struct vsock_dev *vdev = dev; 129117d6495STianjia Zhang int r, start; 130117d6495STianjia Zhang 131867b15ccSJean-Philippe Brucker if (status & VIRTIO__STATUS_CONFIG) 132867b15ccSJean-Philippe Brucker vdev->config.guest_cid = cpu_to_le64(vdev->guest_cid); 133867b15ccSJean-Philippe Brucker 134a8e397bbSJean-Philippe Brucker if (status & VIRTIO__STATUS_START) 135a8e397bbSJean-Philippe Brucker start = 1; 136a8e397bbSJean-Philippe Brucker else if (status & VIRTIO__STATUS_STOP) 137a8e397bbSJean-Philippe Brucker start = 0; 138a8e397bbSJean-Philippe Brucker else 139117d6495STianjia Zhang return; 140117d6495STianjia Zhang 141117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_RUNNING, &start); 142117d6495STianjia Zhang if (r != 0) 143117d6495STianjia Zhang die("VHOST_VSOCK_SET_RUNNING failed %d", errno); 144117d6495STianjia Zhang } 145117d6495STianjia Zhang 146117d6495STianjia Zhang static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 147117d6495STianjia Zhang { 148117d6495STianjia Zhang return 0; 149117d6495STianjia Zhang } 150117d6495STianjia Zhang 151117d6495STianjia Zhang static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq) 152117d6495STianjia Zhang { 153117d6495STianjia Zhang struct vsock_dev *vdev = dev; 154117d6495STianjia Zhang 155117d6495STianjia Zhang return &vdev->vqs[vq]; 156117d6495STianjia Zhang } 157117d6495STianjia Zhang 158117d6495STianjia Zhang static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 159117d6495STianjia Zhang { 160117d6495STianjia Zhang return VIRTIO_VSOCK_QUEUE_SIZE; 161117d6495STianjia Zhang } 162117d6495STianjia Zhang 163117d6495STianjia Zhang static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size) 164117d6495STianjia Zhang { 165117d6495STianjia Zhang return size; 166117d6495STianjia Zhang } 167117d6495STianjia Zhang 168117d6495STianjia Zhang static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi) 169117d6495STianjia Zhang { 170117d6495STianjia Zhang struct vhost_vring_file file; 171117d6495STianjia Zhang struct vsock_dev *vdev = dev; 172117d6495STianjia Zhang struct kvm_irqfd irq; 173117d6495STianjia Zhang int r; 174117d6495STianjia Zhang 175117d6495STianjia Zhang if (vdev->vhost_fd == -1) 176117d6495STianjia Zhang return; 177117d6495STianjia Zhang 178117d6495STianjia Zhang if (is_event_vq(vq)) 179117d6495STianjia Zhang return; 180117d6495STianjia Zhang 181117d6495STianjia Zhang irq = (struct kvm_irqfd) { 182117d6495STianjia Zhang .gsi = gsi, 183117d6495STianjia Zhang .fd = eventfd(0, 0), 184117d6495STianjia Zhang }; 185117d6495STianjia Zhang file = (struct vhost_vring_file) { 186117d6495STianjia Zhang .index = vq, 187117d6495STianjia Zhang .fd = irq.fd, 188117d6495STianjia Zhang }; 189117d6495STianjia Zhang 190117d6495STianjia Zhang r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq); 191117d6495STianjia Zhang if (r < 0) 192117d6495STianjia Zhang die_perror("KVM_IRQFD failed"); 193117d6495STianjia Zhang 194117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_CALL, &file); 195117d6495STianjia Zhang if (r < 0) 196117d6495STianjia Zhang die_perror("VHOST_SET_VRING_CALL failed"); 197117d6495STianjia Zhang } 198117d6495STianjia Zhang 19931e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev) 200117d6495STianjia Zhang { 201117d6495STianjia Zhang return VSOCK_VQ_MAX; 202117d6495STianjia Zhang } 203117d6495STianjia Zhang 204117d6495STianjia Zhang static struct virtio_ops vsock_dev_virtio_ops = { 205117d6495STianjia Zhang .get_config = get_config, 206e4730284SMartin Radev .get_config_size = get_config_size, 207117d6495STianjia Zhang .get_host_features = get_host_features, 208117d6495STianjia Zhang .init_vq = init_vq, 209117d6495STianjia Zhang .get_vq = get_vq, 210117d6495STianjia Zhang .get_size_vq = get_size_vq, 211117d6495STianjia Zhang .set_size_vq = set_size_vq, 212117d6495STianjia Zhang .notify_vq_eventfd = notify_vq_eventfd, 213117d6495STianjia Zhang .notify_status = notify_status, 214117d6495STianjia Zhang .notify_vq_gsi = notify_vq_gsi, 215117d6495STianjia Zhang .notify_vq = notify_vq, 216117d6495STianjia Zhang .get_vq_count = get_vq_count, 217117d6495STianjia Zhang }; 218117d6495STianjia Zhang 219117d6495STianjia Zhang static void virtio_vhost_vsock_init(struct kvm *kvm, struct vsock_dev *vdev) 220117d6495STianjia Zhang { 221117d6495STianjia Zhang struct kvm_mem_bank *bank; 222117d6495STianjia Zhang struct vhost_memory *mem; 223117d6495STianjia Zhang u64 features; 224117d6495STianjia Zhang int r, i; 225117d6495STianjia Zhang 226117d6495STianjia Zhang vdev->vhost_fd = open("/dev/vhost-vsock", O_RDWR); 227117d6495STianjia Zhang if (vdev->vhost_fd < 0) 228117d6495STianjia Zhang die_perror("Failed opening vhost-vsock device"); 229117d6495STianjia Zhang 230117d6495STianjia Zhang mem = calloc(1, sizeof(*mem) + sizeof(struct vhost_memory_region)); 231117d6495STianjia Zhang if (mem == NULL) 232117d6495STianjia Zhang die("Failed allocating memory for vhost memory map"); 233117d6495STianjia Zhang 234117d6495STianjia Zhang i = 0; 235117d6495STianjia Zhang list_for_each_entry(bank, &kvm->mem_banks, list) { 236117d6495STianjia Zhang mem->regions[i] = (struct vhost_memory_region) { 237117d6495STianjia Zhang .guest_phys_addr = bank->guest_phys_addr, 238117d6495STianjia Zhang .memory_size = bank->size, 239117d6495STianjia Zhang .userspace_addr = (unsigned long)bank->host_addr, 240117d6495STianjia Zhang }; 241117d6495STianjia Zhang i++; 242117d6495STianjia Zhang } 243117d6495STianjia Zhang mem->nregions = i; 244117d6495STianjia Zhang 245117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_OWNER); 246117d6495STianjia Zhang if (r != 0) 247117d6495STianjia Zhang die_perror("VHOST_SET_OWNER failed"); 248117d6495STianjia Zhang 249117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_MEM_TABLE, mem); 250117d6495STianjia Zhang if (r != 0) 251117d6495STianjia Zhang die_perror("VHOST_SET_MEM_TABLE failed"); 252117d6495STianjia Zhang 253117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_GET_FEATURES, &features); 254117d6495STianjia Zhang if (r != 0) 255117d6495STianjia Zhang die_perror("VHOST_GET_FEATURES failed"); 256117d6495STianjia Zhang 257117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_FEATURES, &features); 258117d6495STianjia Zhang if (r != 0) 259117d6495STianjia Zhang die_perror("VHOST_SET_FEATURES failed"); 260117d6495STianjia Zhang 261867b15ccSJean-Philippe Brucker r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_GUEST_CID, &vdev->guest_cid); 262117d6495STianjia Zhang if (r != 0) 263117d6495STianjia Zhang die_perror("VHOST_VSOCK_SET_GUEST_CID failed"); 264117d6495STianjia Zhang 265117d6495STianjia Zhang vdev->vdev.use_vhost = true; 266117d6495STianjia Zhang 267117d6495STianjia Zhang free(mem); 268117d6495STianjia Zhang } 269117d6495STianjia Zhang 270117d6495STianjia Zhang static int virtio_vsock_init_one(struct kvm *kvm, u64 guest_cid) 271117d6495STianjia Zhang { 272117d6495STianjia Zhang struct vsock_dev *vdev; 273117d6495STianjia Zhang int r; 274117d6495STianjia Zhang 275117d6495STianjia Zhang vdev = calloc(1, sizeof(struct vsock_dev)); 276117d6495STianjia Zhang if (vdev == NULL) 277117d6495STianjia Zhang return -ENOMEM; 278117d6495STianjia Zhang 279117d6495STianjia Zhang *vdev = (struct vsock_dev) { 280117d6495STianjia Zhang .guest_cid = guest_cid, 281117d6495STianjia Zhang .vhost_fd = -1, 282117d6495STianjia Zhang .kvm = kvm, 283117d6495STianjia Zhang }; 284117d6495STianjia Zhang 285117d6495STianjia Zhang list_add_tail(&vdev->list, &vdevs); 286117d6495STianjia Zhang 287117d6495STianjia Zhang r = virtio_init(kvm, vdev, &vdev->vdev, &vsock_dev_virtio_ops, 288*9b46ebc5SRajnesh Kanwal kvm->cfg.virtio_transport, PCI_DEVICE_ID_VIRTIO_VSOCK, 289117d6495STianjia Zhang VIRTIO_ID_VSOCK, PCI_CLASS_VSOCK); 290117d6495STianjia Zhang if (r < 0) 291117d6495STianjia Zhang return r; 292117d6495STianjia Zhang 293117d6495STianjia Zhang virtio_vhost_vsock_init(kvm, vdev); 294117d6495STianjia Zhang 295117d6495STianjia Zhang if (compat_id == -1) 296117d6495STianjia Zhang compat_id = virtio_compat_add_message("virtio-vsock", "CONFIG_VIRTIO_VSOCK"); 297117d6495STianjia Zhang 298117d6495STianjia Zhang return 0; 299117d6495STianjia Zhang } 300117d6495STianjia Zhang 301117d6495STianjia Zhang static int virtio_vsock_exit_one(struct kvm *kvm, struct vsock_dev *vdev) 302117d6495STianjia Zhang { 303117d6495STianjia Zhang list_del(&vdev->list); 304117d6495STianjia Zhang free(vdev); 305117d6495STianjia Zhang 306117d6495STianjia Zhang return 0; 307117d6495STianjia Zhang } 308117d6495STianjia Zhang 309117d6495STianjia Zhang int virtio_vsock_init(struct kvm *kvm) 310117d6495STianjia Zhang { 311117d6495STianjia Zhang int r; 312117d6495STianjia Zhang 313117d6495STianjia Zhang if (kvm->cfg.vsock_cid == 0) 314117d6495STianjia Zhang return 0; 315117d6495STianjia Zhang 316117d6495STianjia Zhang r = virtio_vsock_init_one(kvm, kvm->cfg.vsock_cid); 317117d6495STianjia Zhang if (r < 0) 318117d6495STianjia Zhang goto cleanup; 319117d6495STianjia Zhang 320117d6495STianjia Zhang return 0; 321117d6495STianjia Zhang cleanup: 322117d6495STianjia Zhang return virtio_vsock_exit(kvm); 323117d6495STianjia Zhang } 324117d6495STianjia Zhang virtio_dev_init(virtio_vsock_init); 325117d6495STianjia Zhang 326117d6495STianjia Zhang int virtio_vsock_exit(struct kvm *kvm) 327117d6495STianjia Zhang { 328117d6495STianjia Zhang while (!list_empty(&vdevs)) { 329117d6495STianjia Zhang struct vsock_dev *vdev; 330117d6495STianjia Zhang 331117d6495STianjia Zhang vdev = list_first_entry(&vdevs, struct vsock_dev, list); 332117d6495STianjia Zhang virtio_vsock_exit_one(kvm, vdev); 333117d6495STianjia Zhang } 334117d6495STianjia Zhang 335117d6495STianjia Zhang return 0; 336117d6495STianjia Zhang } 337117d6495STianjia Zhang virtio_dev_exit(virtio_vsock_exit); 338