1117d6495STianjia Zhang #include "kvm/virtio-vsock.h" 2117d6495STianjia Zhang #include "kvm/virtio-pci-dev.h" 3117d6495STianjia Zhang #include "kvm/kvm.h" 4117d6495STianjia Zhang #include "kvm/pci.h" 5117d6495STianjia Zhang #include "kvm/ioeventfd.h" 6117d6495STianjia Zhang #include "kvm/guest_compat.h" 7117d6495STianjia Zhang #include "kvm/virtio-pci.h" 8117d6495STianjia Zhang #include "kvm/virtio.h" 9117d6495STianjia Zhang 10*867b15ccSJean-Philippe Brucker #include <linux/byteorder.h> 11117d6495STianjia Zhang #include <linux/kernel.h> 12117d6495STianjia Zhang #include <linux/virtio_vsock.h> 13117d6495STianjia Zhang #include <linux/vhost.h> 14117d6495STianjia Zhang 15117d6495STianjia Zhang #define VIRTIO_VSOCK_QUEUE_SIZE 128 16117d6495STianjia Zhang 17117d6495STianjia Zhang static LIST_HEAD(vdevs); 18117d6495STianjia Zhang static int compat_id = -1; 19117d6495STianjia Zhang 20117d6495STianjia Zhang enum { 21117d6495STianjia Zhang VSOCK_VQ_RX = 0, /* for host to guest data */ 22117d6495STianjia Zhang VSOCK_VQ_TX = 1, /* for guest to host data */ 23117d6495STianjia Zhang VSOCK_VQ_EVENT = 2, 24117d6495STianjia Zhang VSOCK_VQ_MAX = 3, 25117d6495STianjia Zhang }; 26117d6495STianjia Zhang 27117d6495STianjia Zhang struct vsock_dev { 28117d6495STianjia Zhang struct virt_queue vqs[VSOCK_VQ_MAX]; 29117d6495STianjia Zhang struct virtio_vsock_config config; 30*867b15ccSJean-Philippe Brucker u64 guest_cid; 31117d6495STianjia Zhang u32 features; 32117d6495STianjia Zhang int vhost_fd; 33117d6495STianjia Zhang struct virtio_device vdev; 34117d6495STianjia Zhang struct list_head list; 35117d6495STianjia Zhang struct kvm *kvm; 36117d6495STianjia Zhang }; 37117d6495STianjia Zhang 38117d6495STianjia Zhang static u8 *get_config(struct kvm *kvm, void *dev) 39117d6495STianjia Zhang { 40117d6495STianjia Zhang struct vsock_dev *vdev = dev; 41117d6495STianjia Zhang 42117d6495STianjia Zhang return ((u8 *)(&vdev->config)); 43117d6495STianjia Zhang } 44117d6495STianjia Zhang 45e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev) 46e4730284SMartin Radev { 47e4730284SMartin Radev struct vsock_dev *vdev = dev; 48e4730284SMartin Radev 49e4730284SMartin Radev return sizeof(vdev->config); 50e4730284SMartin Radev } 51e4730284SMartin Radev 52117d6495STianjia Zhang static u32 get_host_features(struct kvm *kvm, void *dev) 53117d6495STianjia Zhang { 54117d6495STianjia Zhang return 1UL << VIRTIO_RING_F_EVENT_IDX 55117d6495STianjia Zhang | 1UL << VIRTIO_RING_F_INDIRECT_DESC; 56117d6495STianjia Zhang } 57117d6495STianjia Zhang 58117d6495STianjia Zhang static void set_guest_features(struct kvm *kvm, void *dev, u32 features) 59117d6495STianjia Zhang { 60117d6495STianjia Zhang struct vsock_dev *vdev = dev; 61117d6495STianjia Zhang 62117d6495STianjia Zhang vdev->features = features; 63117d6495STianjia Zhang } 64117d6495STianjia Zhang 65117d6495STianjia Zhang static bool is_event_vq(u32 vq) 66117d6495STianjia Zhang { 67117d6495STianjia Zhang return vq == VSOCK_VQ_EVENT; 68117d6495STianjia Zhang } 69117d6495STianjia Zhang 70609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq) 71117d6495STianjia Zhang { 72117d6495STianjia Zhang struct vhost_vring_state state = { .index = vq }; 73117d6495STianjia Zhang struct vhost_vring_addr addr; 74117d6495STianjia Zhang struct vsock_dev *vdev = dev; 75117d6495STianjia Zhang struct virt_queue *queue; 76117d6495STianjia Zhang int r; 77117d6495STianjia Zhang 78117d6495STianjia Zhang compat__remove_message(compat_id); 79117d6495STianjia Zhang 80117d6495STianjia Zhang queue = &vdev->vqs[vq]; 81609ee906SJean-Philippe Brucker virtio_init_device_vq(kvm, &vdev->vdev, queue, VIRTIO_VSOCK_QUEUE_SIZE); 82117d6495STianjia Zhang 83117d6495STianjia Zhang if (vdev->vhost_fd == -1) 84117d6495STianjia Zhang return 0; 85117d6495STianjia Zhang 86117d6495STianjia Zhang if (is_event_vq(vq)) 87117d6495STianjia Zhang return 0; 88117d6495STianjia Zhang 89117d6495STianjia Zhang state.num = queue->vring.num; 90117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_NUM, &state); 91117d6495STianjia Zhang if (r < 0) 92117d6495STianjia Zhang die_perror("VHOST_SET_VRING_NUM failed"); 93117d6495STianjia Zhang 94117d6495STianjia Zhang state.num = 0; 95117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_BASE, &state); 96117d6495STianjia Zhang if (r < 0) 97117d6495STianjia Zhang die_perror("VHOST_SET_VRING_BASE failed"); 98117d6495STianjia Zhang 99117d6495STianjia Zhang addr = (struct vhost_vring_addr) { 100117d6495STianjia Zhang .index = vq, 101117d6495STianjia Zhang .desc_user_addr = (u64)(unsigned long)queue->vring.desc, 102117d6495STianjia Zhang .avail_user_addr = (u64)(unsigned long)queue->vring.avail, 103117d6495STianjia Zhang .used_user_addr = (u64)(unsigned long)queue->vring.used, 104117d6495STianjia Zhang }; 105117d6495STianjia Zhang 106117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_ADDR, &addr); 107117d6495STianjia Zhang if (r < 0) 108117d6495STianjia Zhang die_perror("VHOST_SET_VRING_ADDR failed"); 109117d6495STianjia Zhang 110117d6495STianjia Zhang return 0; 111117d6495STianjia Zhang } 112117d6495STianjia Zhang 113117d6495STianjia Zhang static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd) 114117d6495STianjia Zhang { 115117d6495STianjia Zhang struct vsock_dev *vdev = dev; 116117d6495STianjia Zhang struct vhost_vring_file file = { 117117d6495STianjia Zhang .index = vq, 118117d6495STianjia Zhang .fd = efd, 119117d6495STianjia Zhang }; 120117d6495STianjia Zhang int r; 121117d6495STianjia Zhang 122117d6495STianjia Zhang if (is_event_vq(vq)) 123117d6495STianjia Zhang return; 124117d6495STianjia Zhang 125117d6495STianjia Zhang if (vdev->vhost_fd == -1) 126117d6495STianjia Zhang return; 127117d6495STianjia Zhang 128117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_KICK, &file); 129117d6495STianjia Zhang if (r < 0) 130117d6495STianjia Zhang die_perror("VHOST_SET_VRING_KICK failed"); 131117d6495STianjia Zhang } 132117d6495STianjia Zhang 133117d6495STianjia Zhang static void notify_status(struct kvm *kvm, void *dev, u32 status) 134117d6495STianjia Zhang { 135117d6495STianjia Zhang struct vsock_dev *vdev = dev; 136117d6495STianjia Zhang int r, start; 137117d6495STianjia Zhang 138*867b15ccSJean-Philippe Brucker if (status & VIRTIO__STATUS_CONFIG) 139*867b15ccSJean-Philippe Brucker vdev->config.guest_cid = cpu_to_le64(vdev->guest_cid); 140*867b15ccSJean-Philippe Brucker 141a8e397bbSJean-Philippe Brucker if (status & VIRTIO__STATUS_START) 142a8e397bbSJean-Philippe Brucker start = 1; 143a8e397bbSJean-Philippe Brucker else if (status & VIRTIO__STATUS_STOP) 144a8e397bbSJean-Philippe Brucker start = 0; 145a8e397bbSJean-Philippe Brucker else 146117d6495STianjia Zhang return; 147117d6495STianjia Zhang 148117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_RUNNING, &start); 149117d6495STianjia Zhang if (r != 0) 150117d6495STianjia Zhang die("VHOST_VSOCK_SET_RUNNING failed %d", errno); 151117d6495STianjia Zhang } 152117d6495STianjia Zhang 153117d6495STianjia Zhang static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 154117d6495STianjia Zhang { 155117d6495STianjia Zhang return 0; 156117d6495STianjia Zhang } 157117d6495STianjia Zhang 158117d6495STianjia Zhang static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq) 159117d6495STianjia Zhang { 160117d6495STianjia Zhang struct vsock_dev *vdev = dev; 161117d6495STianjia Zhang 162117d6495STianjia Zhang return &vdev->vqs[vq]; 163117d6495STianjia Zhang } 164117d6495STianjia Zhang 165117d6495STianjia Zhang static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 166117d6495STianjia Zhang { 167117d6495STianjia Zhang return VIRTIO_VSOCK_QUEUE_SIZE; 168117d6495STianjia Zhang } 169117d6495STianjia Zhang 170117d6495STianjia Zhang static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size) 171117d6495STianjia Zhang { 172117d6495STianjia Zhang return size; 173117d6495STianjia Zhang } 174117d6495STianjia Zhang 175117d6495STianjia Zhang static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi) 176117d6495STianjia Zhang { 177117d6495STianjia Zhang struct vhost_vring_file file; 178117d6495STianjia Zhang struct vsock_dev *vdev = dev; 179117d6495STianjia Zhang struct kvm_irqfd irq; 180117d6495STianjia Zhang int r; 181117d6495STianjia Zhang 182117d6495STianjia Zhang if (vdev->vhost_fd == -1) 183117d6495STianjia Zhang return; 184117d6495STianjia Zhang 185117d6495STianjia Zhang if (is_event_vq(vq)) 186117d6495STianjia Zhang return; 187117d6495STianjia Zhang 188117d6495STianjia Zhang irq = (struct kvm_irqfd) { 189117d6495STianjia Zhang .gsi = gsi, 190117d6495STianjia Zhang .fd = eventfd(0, 0), 191117d6495STianjia Zhang }; 192117d6495STianjia Zhang file = (struct vhost_vring_file) { 193117d6495STianjia Zhang .index = vq, 194117d6495STianjia Zhang .fd = irq.fd, 195117d6495STianjia Zhang }; 196117d6495STianjia Zhang 197117d6495STianjia Zhang r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq); 198117d6495STianjia Zhang if (r < 0) 199117d6495STianjia Zhang die_perror("KVM_IRQFD failed"); 200117d6495STianjia Zhang 201117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_CALL, &file); 202117d6495STianjia Zhang if (r < 0) 203117d6495STianjia Zhang die_perror("VHOST_SET_VRING_CALL failed"); 204117d6495STianjia Zhang } 205117d6495STianjia Zhang 20631e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev) 207117d6495STianjia Zhang { 208117d6495STianjia Zhang return VSOCK_VQ_MAX; 209117d6495STianjia Zhang } 210117d6495STianjia Zhang 211117d6495STianjia Zhang static struct virtio_ops vsock_dev_virtio_ops = { 212117d6495STianjia Zhang .get_config = get_config, 213e4730284SMartin Radev .get_config_size = get_config_size, 214117d6495STianjia Zhang .get_host_features = get_host_features, 215117d6495STianjia Zhang .set_guest_features = set_guest_features, 216117d6495STianjia Zhang .init_vq = init_vq, 217117d6495STianjia Zhang .get_vq = get_vq, 218117d6495STianjia Zhang .get_size_vq = get_size_vq, 219117d6495STianjia Zhang .set_size_vq = set_size_vq, 220117d6495STianjia Zhang .notify_vq_eventfd = notify_vq_eventfd, 221117d6495STianjia Zhang .notify_status = notify_status, 222117d6495STianjia Zhang .notify_vq_gsi = notify_vq_gsi, 223117d6495STianjia Zhang .notify_vq = notify_vq, 224117d6495STianjia Zhang .get_vq_count = get_vq_count, 225117d6495STianjia Zhang }; 226117d6495STianjia Zhang 227117d6495STianjia Zhang static void virtio_vhost_vsock_init(struct kvm *kvm, struct vsock_dev *vdev) 228117d6495STianjia Zhang { 229117d6495STianjia Zhang struct kvm_mem_bank *bank; 230117d6495STianjia Zhang struct vhost_memory *mem; 231117d6495STianjia Zhang u64 features; 232117d6495STianjia Zhang int r, i; 233117d6495STianjia Zhang 234117d6495STianjia Zhang vdev->vhost_fd = open("/dev/vhost-vsock", O_RDWR); 235117d6495STianjia Zhang if (vdev->vhost_fd < 0) 236117d6495STianjia Zhang die_perror("Failed opening vhost-vsock device"); 237117d6495STianjia Zhang 238117d6495STianjia Zhang mem = calloc(1, sizeof(*mem) + sizeof(struct vhost_memory_region)); 239117d6495STianjia Zhang if (mem == NULL) 240117d6495STianjia Zhang die("Failed allocating memory for vhost memory map"); 241117d6495STianjia Zhang 242117d6495STianjia Zhang i = 0; 243117d6495STianjia Zhang list_for_each_entry(bank, &kvm->mem_banks, list) { 244117d6495STianjia Zhang mem->regions[i] = (struct vhost_memory_region) { 245117d6495STianjia Zhang .guest_phys_addr = bank->guest_phys_addr, 246117d6495STianjia Zhang .memory_size = bank->size, 247117d6495STianjia Zhang .userspace_addr = (unsigned long)bank->host_addr, 248117d6495STianjia Zhang }; 249117d6495STianjia Zhang i++; 250117d6495STianjia Zhang } 251117d6495STianjia Zhang mem->nregions = i; 252117d6495STianjia Zhang 253117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_OWNER); 254117d6495STianjia Zhang if (r != 0) 255117d6495STianjia Zhang die_perror("VHOST_SET_OWNER failed"); 256117d6495STianjia Zhang 257117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_MEM_TABLE, mem); 258117d6495STianjia Zhang if (r != 0) 259117d6495STianjia Zhang die_perror("VHOST_SET_MEM_TABLE failed"); 260117d6495STianjia Zhang 261117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_GET_FEATURES, &features); 262117d6495STianjia Zhang if (r != 0) 263117d6495STianjia Zhang die_perror("VHOST_GET_FEATURES failed"); 264117d6495STianjia Zhang 265117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_FEATURES, &features); 266117d6495STianjia Zhang if (r != 0) 267117d6495STianjia Zhang die_perror("VHOST_SET_FEATURES failed"); 268117d6495STianjia Zhang 269*867b15ccSJean-Philippe Brucker r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_GUEST_CID, &vdev->guest_cid); 270117d6495STianjia Zhang if (r != 0) 271117d6495STianjia Zhang die_perror("VHOST_VSOCK_SET_GUEST_CID failed"); 272117d6495STianjia Zhang 273117d6495STianjia Zhang vdev->vdev.use_vhost = true; 274117d6495STianjia Zhang 275117d6495STianjia Zhang free(mem); 276117d6495STianjia Zhang } 277117d6495STianjia Zhang 278117d6495STianjia Zhang static int virtio_vsock_init_one(struct kvm *kvm, u64 guest_cid) 279117d6495STianjia Zhang { 280117d6495STianjia Zhang struct vsock_dev *vdev; 281117d6495STianjia Zhang int r; 282117d6495STianjia Zhang 283117d6495STianjia Zhang vdev = calloc(1, sizeof(struct vsock_dev)); 284117d6495STianjia Zhang if (vdev == NULL) 285117d6495STianjia Zhang return -ENOMEM; 286117d6495STianjia Zhang 287117d6495STianjia Zhang *vdev = (struct vsock_dev) { 288117d6495STianjia Zhang .guest_cid = guest_cid, 289117d6495STianjia Zhang .vhost_fd = -1, 290117d6495STianjia Zhang .kvm = kvm, 291117d6495STianjia Zhang }; 292117d6495STianjia Zhang 293117d6495STianjia Zhang list_add_tail(&vdev->list, &vdevs); 294117d6495STianjia Zhang 295117d6495STianjia Zhang r = virtio_init(kvm, vdev, &vdev->vdev, &vsock_dev_virtio_ops, 296117d6495STianjia Zhang VIRTIO_DEFAULT_TRANS(kvm), PCI_DEVICE_ID_VIRTIO_VSOCK, 297117d6495STianjia Zhang VIRTIO_ID_VSOCK, PCI_CLASS_VSOCK); 298117d6495STianjia Zhang if (r < 0) 299117d6495STianjia Zhang return r; 300117d6495STianjia Zhang 301117d6495STianjia Zhang virtio_vhost_vsock_init(kvm, vdev); 302117d6495STianjia Zhang 303117d6495STianjia Zhang if (compat_id == -1) 304117d6495STianjia Zhang compat_id = virtio_compat_add_message("virtio-vsock", "CONFIG_VIRTIO_VSOCK"); 305117d6495STianjia Zhang 306117d6495STianjia Zhang return 0; 307117d6495STianjia Zhang } 308117d6495STianjia Zhang 309117d6495STianjia Zhang static int virtio_vsock_exit_one(struct kvm *kvm, struct vsock_dev *vdev) 310117d6495STianjia Zhang { 311117d6495STianjia Zhang list_del(&vdev->list); 312117d6495STianjia Zhang free(vdev); 313117d6495STianjia Zhang 314117d6495STianjia Zhang return 0; 315117d6495STianjia Zhang } 316117d6495STianjia Zhang 317117d6495STianjia Zhang int virtio_vsock_init(struct kvm *kvm) 318117d6495STianjia Zhang { 319117d6495STianjia Zhang int r; 320117d6495STianjia Zhang 321117d6495STianjia Zhang if (kvm->cfg.vsock_cid == 0) 322117d6495STianjia Zhang return 0; 323117d6495STianjia Zhang 324117d6495STianjia Zhang r = virtio_vsock_init_one(kvm, kvm->cfg.vsock_cid); 325117d6495STianjia Zhang if (r < 0) 326117d6495STianjia Zhang goto cleanup; 327117d6495STianjia Zhang 328117d6495STianjia Zhang return 0; 329117d6495STianjia Zhang cleanup: 330117d6495STianjia Zhang return virtio_vsock_exit(kvm); 331117d6495STianjia Zhang } 332117d6495STianjia Zhang virtio_dev_init(virtio_vsock_init); 333117d6495STianjia Zhang 334117d6495STianjia Zhang int virtio_vsock_exit(struct kvm *kvm) 335117d6495STianjia Zhang { 336117d6495STianjia Zhang while (!list_empty(&vdevs)) { 337117d6495STianjia Zhang struct vsock_dev *vdev; 338117d6495STianjia Zhang 339117d6495STianjia Zhang vdev = list_first_entry(&vdevs, struct vsock_dev, list); 340117d6495STianjia Zhang virtio_vsock_exit_one(kvm, vdev); 341117d6495STianjia Zhang } 342117d6495STianjia Zhang 343117d6495STianjia Zhang return 0; 344117d6495STianjia Zhang } 345117d6495STianjia Zhang virtio_dev_exit(virtio_vsock_exit); 346