1117d6495STianjia Zhang #include "kvm/virtio-vsock.h" 2117d6495STianjia Zhang #include "kvm/virtio-pci-dev.h" 3117d6495STianjia Zhang #include "kvm/kvm.h" 4117d6495STianjia Zhang #include "kvm/pci.h" 5117d6495STianjia Zhang #include "kvm/ioeventfd.h" 6117d6495STianjia Zhang #include "kvm/guest_compat.h" 7117d6495STianjia Zhang #include "kvm/virtio-pci.h" 8117d6495STianjia Zhang #include "kvm/virtio.h" 9117d6495STianjia Zhang 10117d6495STianjia Zhang #include <linux/kernel.h> 11117d6495STianjia Zhang #include <linux/virtio_vsock.h> 12117d6495STianjia Zhang #include <linux/vhost.h> 13117d6495STianjia Zhang 14117d6495STianjia Zhang #define VIRTIO_VSOCK_QUEUE_SIZE 128 15117d6495STianjia Zhang 16117d6495STianjia Zhang static LIST_HEAD(vdevs); 17117d6495STianjia Zhang static int compat_id = -1; 18117d6495STianjia Zhang 19117d6495STianjia Zhang enum { 20117d6495STianjia Zhang VSOCK_VQ_RX = 0, /* for host to guest data */ 21117d6495STianjia Zhang VSOCK_VQ_TX = 1, /* for guest to host data */ 22117d6495STianjia Zhang VSOCK_VQ_EVENT = 2, 23117d6495STianjia Zhang VSOCK_VQ_MAX = 3, 24117d6495STianjia Zhang }; 25117d6495STianjia Zhang 26117d6495STianjia Zhang struct vsock_dev { 27117d6495STianjia Zhang struct virt_queue vqs[VSOCK_VQ_MAX]; 28117d6495STianjia Zhang struct virtio_vsock_config config; 29117d6495STianjia Zhang u32 features; 30117d6495STianjia Zhang int vhost_fd; 31117d6495STianjia Zhang struct virtio_device vdev; 32117d6495STianjia Zhang struct list_head list; 33117d6495STianjia Zhang struct kvm *kvm; 34117d6495STianjia Zhang }; 35117d6495STianjia Zhang 36117d6495STianjia Zhang static u8 *get_config(struct kvm *kvm, void *dev) 37117d6495STianjia Zhang { 38117d6495STianjia Zhang struct vsock_dev *vdev = dev; 39117d6495STianjia Zhang 40117d6495STianjia Zhang return ((u8 *)(&vdev->config)); 41117d6495STianjia Zhang } 42117d6495STianjia Zhang 43e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev) 44e4730284SMartin Radev { 45e4730284SMartin Radev struct vsock_dev *vdev = dev; 46e4730284SMartin Radev 47e4730284SMartin Radev return sizeof(vdev->config); 48e4730284SMartin Radev } 49e4730284SMartin Radev 50117d6495STianjia Zhang static u32 get_host_features(struct kvm *kvm, void *dev) 51117d6495STianjia Zhang { 52117d6495STianjia Zhang return 1UL << VIRTIO_RING_F_EVENT_IDX 53117d6495STianjia Zhang | 1UL << VIRTIO_RING_F_INDIRECT_DESC; 54117d6495STianjia Zhang } 55117d6495STianjia Zhang 56117d6495STianjia Zhang static void set_guest_features(struct kvm *kvm, void *dev, u32 features) 57117d6495STianjia Zhang { 58117d6495STianjia Zhang struct vsock_dev *vdev = dev; 59117d6495STianjia Zhang 60117d6495STianjia Zhang vdev->features = features; 61117d6495STianjia Zhang } 62117d6495STianjia Zhang 63117d6495STianjia Zhang static bool is_event_vq(u32 vq) 64117d6495STianjia Zhang { 65117d6495STianjia Zhang return vq == VSOCK_VQ_EVENT; 66117d6495STianjia Zhang } 67117d6495STianjia Zhang 68*609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq) 69117d6495STianjia Zhang { 70117d6495STianjia Zhang struct vhost_vring_state state = { .index = vq }; 71117d6495STianjia Zhang struct vhost_vring_addr addr; 72117d6495STianjia Zhang struct vsock_dev *vdev = dev; 73117d6495STianjia Zhang struct virt_queue *queue; 74117d6495STianjia Zhang int r; 75117d6495STianjia Zhang 76117d6495STianjia Zhang compat__remove_message(compat_id); 77117d6495STianjia Zhang 78117d6495STianjia Zhang queue = &vdev->vqs[vq]; 79*609ee906SJean-Philippe Brucker virtio_init_device_vq(kvm, &vdev->vdev, queue, VIRTIO_VSOCK_QUEUE_SIZE); 80117d6495STianjia Zhang 81117d6495STianjia Zhang if (vdev->vhost_fd == -1) 82117d6495STianjia Zhang return 0; 83117d6495STianjia Zhang 84117d6495STianjia Zhang if (is_event_vq(vq)) 85117d6495STianjia Zhang return 0; 86117d6495STianjia Zhang 87117d6495STianjia Zhang state.num = queue->vring.num; 88117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_NUM, &state); 89117d6495STianjia Zhang if (r < 0) 90117d6495STianjia Zhang die_perror("VHOST_SET_VRING_NUM failed"); 91117d6495STianjia Zhang 92117d6495STianjia Zhang state.num = 0; 93117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_BASE, &state); 94117d6495STianjia Zhang if (r < 0) 95117d6495STianjia Zhang die_perror("VHOST_SET_VRING_BASE failed"); 96117d6495STianjia Zhang 97117d6495STianjia Zhang addr = (struct vhost_vring_addr) { 98117d6495STianjia Zhang .index = vq, 99117d6495STianjia Zhang .desc_user_addr = (u64)(unsigned long)queue->vring.desc, 100117d6495STianjia Zhang .avail_user_addr = (u64)(unsigned long)queue->vring.avail, 101117d6495STianjia Zhang .used_user_addr = (u64)(unsigned long)queue->vring.used, 102117d6495STianjia Zhang }; 103117d6495STianjia Zhang 104117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_ADDR, &addr); 105117d6495STianjia Zhang if (r < 0) 106117d6495STianjia Zhang die_perror("VHOST_SET_VRING_ADDR failed"); 107117d6495STianjia Zhang 108117d6495STianjia Zhang return 0; 109117d6495STianjia Zhang } 110117d6495STianjia Zhang 111117d6495STianjia Zhang static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd) 112117d6495STianjia Zhang { 113117d6495STianjia Zhang struct vsock_dev *vdev = dev; 114117d6495STianjia Zhang struct vhost_vring_file file = { 115117d6495STianjia Zhang .index = vq, 116117d6495STianjia Zhang .fd = efd, 117117d6495STianjia Zhang }; 118117d6495STianjia Zhang int r; 119117d6495STianjia Zhang 120117d6495STianjia Zhang if (is_event_vq(vq)) 121117d6495STianjia Zhang return; 122117d6495STianjia Zhang 123117d6495STianjia Zhang if (vdev->vhost_fd == -1) 124117d6495STianjia Zhang return; 125117d6495STianjia Zhang 126117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_KICK, &file); 127117d6495STianjia Zhang if (r < 0) 128117d6495STianjia Zhang die_perror("VHOST_SET_VRING_KICK failed"); 129117d6495STianjia Zhang } 130117d6495STianjia Zhang 131117d6495STianjia Zhang static void notify_status(struct kvm *kvm, void *dev, u32 status) 132117d6495STianjia Zhang { 133117d6495STianjia Zhang struct vsock_dev *vdev = dev; 134117d6495STianjia Zhang int r, start; 135117d6495STianjia Zhang 136a8e397bbSJean-Philippe Brucker if (status & VIRTIO__STATUS_START) 137a8e397bbSJean-Philippe Brucker start = 1; 138a8e397bbSJean-Philippe Brucker else if (status & VIRTIO__STATUS_STOP) 139a8e397bbSJean-Philippe Brucker start = 0; 140a8e397bbSJean-Philippe Brucker else 141117d6495STianjia Zhang return; 142117d6495STianjia Zhang 143117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_RUNNING, &start); 144117d6495STianjia Zhang if (r != 0) 145117d6495STianjia Zhang die("VHOST_VSOCK_SET_RUNNING failed %d", errno); 146117d6495STianjia Zhang } 147117d6495STianjia Zhang 148117d6495STianjia Zhang static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 149117d6495STianjia Zhang { 150117d6495STianjia Zhang return 0; 151117d6495STianjia Zhang } 152117d6495STianjia Zhang 153117d6495STianjia Zhang static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq) 154117d6495STianjia Zhang { 155117d6495STianjia Zhang struct vsock_dev *vdev = dev; 156117d6495STianjia Zhang 157117d6495STianjia Zhang return &vdev->vqs[vq]; 158117d6495STianjia Zhang } 159117d6495STianjia Zhang 160117d6495STianjia Zhang static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 161117d6495STianjia Zhang { 162117d6495STianjia Zhang return VIRTIO_VSOCK_QUEUE_SIZE; 163117d6495STianjia Zhang } 164117d6495STianjia Zhang 165117d6495STianjia Zhang static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size) 166117d6495STianjia Zhang { 167117d6495STianjia Zhang return size; 168117d6495STianjia Zhang } 169117d6495STianjia Zhang 170117d6495STianjia Zhang static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi) 171117d6495STianjia Zhang { 172117d6495STianjia Zhang struct vhost_vring_file file; 173117d6495STianjia Zhang struct vsock_dev *vdev = dev; 174117d6495STianjia Zhang struct kvm_irqfd irq; 175117d6495STianjia Zhang int r; 176117d6495STianjia Zhang 177117d6495STianjia Zhang if (vdev->vhost_fd == -1) 178117d6495STianjia Zhang return; 179117d6495STianjia Zhang 180117d6495STianjia Zhang if (is_event_vq(vq)) 181117d6495STianjia Zhang return; 182117d6495STianjia Zhang 183117d6495STianjia Zhang irq = (struct kvm_irqfd) { 184117d6495STianjia Zhang .gsi = gsi, 185117d6495STianjia Zhang .fd = eventfd(0, 0), 186117d6495STianjia Zhang }; 187117d6495STianjia Zhang file = (struct vhost_vring_file) { 188117d6495STianjia Zhang .index = vq, 189117d6495STianjia Zhang .fd = irq.fd, 190117d6495STianjia Zhang }; 191117d6495STianjia Zhang 192117d6495STianjia Zhang r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq); 193117d6495STianjia Zhang if (r < 0) 194117d6495STianjia Zhang die_perror("KVM_IRQFD failed"); 195117d6495STianjia Zhang 196117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_CALL, &file); 197117d6495STianjia Zhang if (r < 0) 198117d6495STianjia Zhang die_perror("VHOST_SET_VRING_CALL failed"); 199117d6495STianjia Zhang } 200117d6495STianjia Zhang 20131e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev) 202117d6495STianjia Zhang { 203117d6495STianjia Zhang return VSOCK_VQ_MAX; 204117d6495STianjia Zhang } 205117d6495STianjia Zhang 206117d6495STianjia Zhang static struct virtio_ops vsock_dev_virtio_ops = { 207117d6495STianjia Zhang .get_config = get_config, 208e4730284SMartin Radev .get_config_size = get_config_size, 209117d6495STianjia Zhang .get_host_features = get_host_features, 210117d6495STianjia Zhang .set_guest_features = set_guest_features, 211117d6495STianjia Zhang .init_vq = init_vq, 212117d6495STianjia Zhang .get_vq = get_vq, 213117d6495STianjia Zhang .get_size_vq = get_size_vq, 214117d6495STianjia Zhang .set_size_vq = set_size_vq, 215117d6495STianjia Zhang .notify_vq_eventfd = notify_vq_eventfd, 216117d6495STianjia Zhang .notify_status = notify_status, 217117d6495STianjia Zhang .notify_vq_gsi = notify_vq_gsi, 218117d6495STianjia Zhang .notify_vq = notify_vq, 219117d6495STianjia Zhang .get_vq_count = get_vq_count, 220117d6495STianjia Zhang }; 221117d6495STianjia Zhang 222117d6495STianjia Zhang static void virtio_vhost_vsock_init(struct kvm *kvm, struct vsock_dev *vdev) 223117d6495STianjia Zhang { 224117d6495STianjia Zhang struct kvm_mem_bank *bank; 225117d6495STianjia Zhang struct vhost_memory *mem; 226117d6495STianjia Zhang u64 features; 227117d6495STianjia Zhang int r, i; 228117d6495STianjia Zhang 229117d6495STianjia Zhang vdev->vhost_fd = open("/dev/vhost-vsock", O_RDWR); 230117d6495STianjia Zhang if (vdev->vhost_fd < 0) 231117d6495STianjia Zhang die_perror("Failed opening vhost-vsock device"); 232117d6495STianjia Zhang 233117d6495STianjia Zhang mem = calloc(1, sizeof(*mem) + sizeof(struct vhost_memory_region)); 234117d6495STianjia Zhang if (mem == NULL) 235117d6495STianjia Zhang die("Failed allocating memory for vhost memory map"); 236117d6495STianjia Zhang 237117d6495STianjia Zhang i = 0; 238117d6495STianjia Zhang list_for_each_entry(bank, &kvm->mem_banks, list) { 239117d6495STianjia Zhang mem->regions[i] = (struct vhost_memory_region) { 240117d6495STianjia Zhang .guest_phys_addr = bank->guest_phys_addr, 241117d6495STianjia Zhang .memory_size = bank->size, 242117d6495STianjia Zhang .userspace_addr = (unsigned long)bank->host_addr, 243117d6495STianjia Zhang }; 244117d6495STianjia Zhang i++; 245117d6495STianjia Zhang } 246117d6495STianjia Zhang mem->nregions = i; 247117d6495STianjia Zhang 248117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_OWNER); 249117d6495STianjia Zhang if (r != 0) 250117d6495STianjia Zhang die_perror("VHOST_SET_OWNER failed"); 251117d6495STianjia Zhang 252117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_MEM_TABLE, mem); 253117d6495STianjia Zhang if (r != 0) 254117d6495STianjia Zhang die_perror("VHOST_SET_MEM_TABLE failed"); 255117d6495STianjia Zhang 256117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_GET_FEATURES, &features); 257117d6495STianjia Zhang if (r != 0) 258117d6495STianjia Zhang die_perror("VHOST_GET_FEATURES failed"); 259117d6495STianjia Zhang 260117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_SET_FEATURES, &features); 261117d6495STianjia Zhang if (r != 0) 262117d6495STianjia Zhang die_perror("VHOST_SET_FEATURES failed"); 263117d6495STianjia Zhang 264117d6495STianjia Zhang r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_GUEST_CID, &vdev->config.guest_cid); 265117d6495STianjia Zhang if (r != 0) 266117d6495STianjia Zhang die_perror("VHOST_VSOCK_SET_GUEST_CID failed"); 267117d6495STianjia Zhang 268117d6495STianjia Zhang vdev->vdev.use_vhost = true; 269117d6495STianjia Zhang 270117d6495STianjia Zhang free(mem); 271117d6495STianjia Zhang } 272117d6495STianjia Zhang 273117d6495STianjia Zhang static int virtio_vsock_init_one(struct kvm *kvm, u64 guest_cid) 274117d6495STianjia Zhang { 275117d6495STianjia Zhang struct vsock_dev *vdev; 276117d6495STianjia Zhang int r; 277117d6495STianjia Zhang 278117d6495STianjia Zhang vdev = calloc(1, sizeof(struct vsock_dev)); 279117d6495STianjia Zhang if (vdev == NULL) 280117d6495STianjia Zhang return -ENOMEM; 281117d6495STianjia Zhang 282117d6495STianjia Zhang *vdev = (struct vsock_dev) { 283117d6495STianjia Zhang .config = (struct virtio_vsock_config) { 284117d6495STianjia Zhang .guest_cid = guest_cid, 285117d6495STianjia Zhang }, 286117d6495STianjia Zhang .vhost_fd = -1, 287117d6495STianjia Zhang .kvm = kvm, 288117d6495STianjia Zhang }; 289117d6495STianjia Zhang 290117d6495STianjia Zhang list_add_tail(&vdev->list, &vdevs); 291117d6495STianjia Zhang 292117d6495STianjia Zhang r = virtio_init(kvm, vdev, &vdev->vdev, &vsock_dev_virtio_ops, 293117d6495STianjia Zhang VIRTIO_DEFAULT_TRANS(kvm), PCI_DEVICE_ID_VIRTIO_VSOCK, 294117d6495STianjia Zhang VIRTIO_ID_VSOCK, PCI_CLASS_VSOCK); 295117d6495STianjia Zhang if (r < 0) 296117d6495STianjia Zhang return r; 297117d6495STianjia Zhang 298117d6495STianjia Zhang virtio_vhost_vsock_init(kvm, vdev); 299117d6495STianjia Zhang 300117d6495STianjia Zhang if (compat_id == -1) 301117d6495STianjia Zhang compat_id = virtio_compat_add_message("virtio-vsock", "CONFIG_VIRTIO_VSOCK"); 302117d6495STianjia Zhang 303117d6495STianjia Zhang return 0; 304117d6495STianjia Zhang } 305117d6495STianjia Zhang 306117d6495STianjia Zhang static int virtio_vsock_exit_one(struct kvm *kvm, struct vsock_dev *vdev) 307117d6495STianjia Zhang { 308117d6495STianjia Zhang list_del(&vdev->list); 309117d6495STianjia Zhang free(vdev); 310117d6495STianjia Zhang 311117d6495STianjia Zhang return 0; 312117d6495STianjia Zhang } 313117d6495STianjia Zhang 314117d6495STianjia Zhang int virtio_vsock_init(struct kvm *kvm) 315117d6495STianjia Zhang { 316117d6495STianjia Zhang int r; 317117d6495STianjia Zhang 318117d6495STianjia Zhang if (kvm->cfg.vsock_cid == 0) 319117d6495STianjia Zhang return 0; 320117d6495STianjia Zhang 321117d6495STianjia Zhang r = virtio_vsock_init_one(kvm, kvm->cfg.vsock_cid); 322117d6495STianjia Zhang if (r < 0) 323117d6495STianjia Zhang goto cleanup; 324117d6495STianjia Zhang 325117d6495STianjia Zhang return 0; 326117d6495STianjia Zhang cleanup: 327117d6495STianjia Zhang return virtio_vsock_exit(kvm); 328117d6495STianjia Zhang } 329117d6495STianjia Zhang virtio_dev_init(virtio_vsock_init); 330117d6495STianjia Zhang 331117d6495STianjia Zhang int virtio_vsock_exit(struct kvm *kvm) 332117d6495STianjia Zhang { 333117d6495STianjia Zhang while (!list_empty(&vdevs)) { 334117d6495STianjia Zhang struct vsock_dev *vdev; 335117d6495STianjia Zhang 336117d6495STianjia Zhang vdev = list_first_entry(&vdevs, struct vsock_dev, list); 337117d6495STianjia Zhang virtio_vsock_exit_one(kvm, vdev); 338117d6495STianjia Zhang } 339117d6495STianjia Zhang 340117d6495STianjia Zhang return 0; 341117d6495STianjia Zhang } 342117d6495STianjia Zhang virtio_dev_exit(virtio_vsock_exit); 343