1108a6481SCindy Lu /* 2108a6481SCindy Lu * vhost-vdpa 3108a6481SCindy Lu * 4108a6481SCindy Lu * Copyright(c) 2017-2018 Intel Corporation. 5108a6481SCindy Lu * Copyright(c) 2020 Red Hat, Inc. 6108a6481SCindy Lu * 7108a6481SCindy Lu * This work is licensed under the terms of the GNU GPL, version 2 or later. 8108a6481SCindy Lu * See the COPYING file in the top-level directory. 9108a6481SCindy Lu * 10108a6481SCindy Lu */ 11108a6481SCindy Lu 12108a6481SCindy Lu #include "qemu/osdep.h" 13108a6481SCindy Lu #include <linux/vhost.h> 14108a6481SCindy Lu #include <linux/vfio.h> 15108a6481SCindy Lu #include <sys/eventfd.h> 16108a6481SCindy Lu #include <sys/ioctl.h> 17108a6481SCindy Lu #include "hw/virtio/vhost.h" 18108a6481SCindy Lu #include "hw/virtio/vhost-backend.h" 19108a6481SCindy Lu #include "hw/virtio/virtio-net.h" 20108a6481SCindy Lu #include "hw/virtio/vhost-vdpa.h" 21df77d45aSXie Yongji #include "exec/address-spaces.h" 22108a6481SCindy Lu #include "qemu/main-loop.h" 234dc5acc0SCindy Lu #include "cpu.h" 24778e67deSLaurent Vivier #include "trace.h" 25778e67deSLaurent Vivier #include "qemu-common.h" 26108a6481SCindy Lu 27*032e4d68SEugenio Pérez /* 28*032e4d68SEugenio Pérez * Return one past the end of the end of section. Be careful with uint64_t 29*032e4d68SEugenio Pérez * conversions! 30*032e4d68SEugenio Pérez */ 31*032e4d68SEugenio Pérez static Int128 vhost_vdpa_section_end(const MemoryRegionSection *section) 32*032e4d68SEugenio Pérez { 33*032e4d68SEugenio Pérez Int128 llend = int128_make64(section->offset_within_address_space); 34*032e4d68SEugenio Pérez llend = int128_add(llend, section->size); 35*032e4d68SEugenio Pérez llend = int128_and(llend, int128_exts64(TARGET_PAGE_MASK)); 36*032e4d68SEugenio Pérez 37*032e4d68SEugenio Pérez return llend; 38*032e4d68SEugenio Pérez } 39*032e4d68SEugenio Pérez 40108a6481SCindy Lu static bool vhost_vdpa_listener_skipped_section(MemoryRegionSection *section) 41108a6481SCindy Lu { 42108a6481SCindy Lu return (!memory_region_is_ram(section->mr) && 43108a6481SCindy Lu !memory_region_is_iommu(section->mr)) || 44c64038c9SEugenio Pérez memory_region_is_protected(section->mr) || 45d60c75d2SJason Wang /* vhost-vDPA doesn't allow MMIO to be mapped */ 46d60c75d2SJason Wang memory_region_is_ram_device(section->mr) || 47108a6481SCindy Lu /* 48108a6481SCindy Lu * Sizing an enabled 64-bit BAR can cause spurious mappings to 49108a6481SCindy Lu * addresses in the upper part of the 64-bit address space. These 50108a6481SCindy Lu * are never accessed by the CPU and beyond the address width of 51108a6481SCindy Lu * some IOMMU hardware. TODO: VDPA should tell us the IOMMU width. 52108a6481SCindy Lu */ 53108a6481SCindy Lu section->offset_within_address_space & (1ULL << 63); 54108a6481SCindy Lu } 55108a6481SCindy Lu 56108a6481SCindy Lu static int vhost_vdpa_dma_map(struct vhost_vdpa *v, hwaddr iova, hwaddr size, 57108a6481SCindy Lu void *vaddr, bool readonly) 58108a6481SCindy Lu { 59386494f2SCindy Lu struct vhost_msg_v2 msg = {}; 60108a6481SCindy Lu int fd = v->device_fd; 61108a6481SCindy Lu int ret = 0; 62108a6481SCindy Lu 63108a6481SCindy Lu msg.type = v->msg_type; 64108a6481SCindy Lu msg.iotlb.iova = iova; 65108a6481SCindy Lu msg.iotlb.size = size; 66108a6481SCindy Lu msg.iotlb.uaddr = (uint64_t)(uintptr_t)vaddr; 67108a6481SCindy Lu msg.iotlb.perm = readonly ? VHOST_ACCESS_RO : VHOST_ACCESS_RW; 68108a6481SCindy Lu msg.iotlb.type = VHOST_IOTLB_UPDATE; 69108a6481SCindy Lu 70778e67deSLaurent Vivier trace_vhost_vdpa_dma_map(v, fd, msg.type, msg.iotlb.iova, msg.iotlb.size, 71778e67deSLaurent Vivier msg.iotlb.uaddr, msg.iotlb.perm, msg.iotlb.type); 72778e67deSLaurent Vivier 73108a6481SCindy Lu if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 74108a6481SCindy Lu error_report("failed to write, fd=%d, errno=%d (%s)", 75108a6481SCindy Lu fd, errno, strerror(errno)); 76108a6481SCindy Lu return -EIO ; 77108a6481SCindy Lu } 78108a6481SCindy Lu 79108a6481SCindy Lu return ret; 80108a6481SCindy Lu } 81108a6481SCindy Lu 82108a6481SCindy Lu static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, hwaddr iova, 83108a6481SCindy Lu hwaddr size) 84108a6481SCindy Lu { 85386494f2SCindy Lu struct vhost_msg_v2 msg = {}; 86108a6481SCindy Lu int fd = v->device_fd; 87108a6481SCindy Lu int ret = 0; 88108a6481SCindy Lu 89108a6481SCindy Lu msg.type = v->msg_type; 90108a6481SCindy Lu msg.iotlb.iova = iova; 91108a6481SCindy Lu msg.iotlb.size = size; 92108a6481SCindy Lu msg.iotlb.type = VHOST_IOTLB_INVALIDATE; 93108a6481SCindy Lu 94778e67deSLaurent Vivier trace_vhost_vdpa_dma_unmap(v, fd, msg.type, msg.iotlb.iova, 95778e67deSLaurent Vivier msg.iotlb.size, msg.iotlb.type); 96778e67deSLaurent Vivier 97108a6481SCindy Lu if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 98108a6481SCindy Lu error_report("failed to write, fd=%d, errno=%d (%s)", 99108a6481SCindy Lu fd, errno, strerror(errno)); 100108a6481SCindy Lu return -EIO ; 101108a6481SCindy Lu } 102108a6481SCindy Lu 103108a6481SCindy Lu return ret; 104108a6481SCindy Lu } 105108a6481SCindy Lu 106e6db5df7SEugenio Pérez static void vhost_vdpa_listener_begin_batch(struct vhost_vdpa *v) 107a5bd0580SJason Wang { 108a5bd0580SJason Wang int fd = v->device_fd; 109e6db5df7SEugenio Pérez struct vhost_msg_v2 msg = { 110e6db5df7SEugenio Pérez .type = v->msg_type, 111e6db5df7SEugenio Pérez .iotlb.type = VHOST_IOTLB_BATCH_BEGIN, 112e6db5df7SEugenio Pérez }; 113a5bd0580SJason Wang 114a5bd0580SJason Wang if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 115a5bd0580SJason Wang error_report("failed to write, fd=%d, errno=%d (%s)", 116a5bd0580SJason Wang fd, errno, strerror(errno)); 117a5bd0580SJason Wang } 118a5bd0580SJason Wang } 119a5bd0580SJason Wang 120e6db5df7SEugenio Pérez static void vhost_vdpa_iotlb_batch_begin_once(struct vhost_vdpa *v) 121e6db5df7SEugenio Pérez { 122e6db5df7SEugenio Pérez if (v->dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH) && 123e6db5df7SEugenio Pérez !v->iotlb_batch_begin_sent) { 124e6db5df7SEugenio Pérez vhost_vdpa_listener_begin_batch(v); 125e6db5df7SEugenio Pérez } 126e6db5df7SEugenio Pérez 127e6db5df7SEugenio Pérez v->iotlb_batch_begin_sent = true; 128e6db5df7SEugenio Pérez } 129e6db5df7SEugenio Pérez 130a5bd0580SJason Wang static void vhost_vdpa_listener_commit(MemoryListener *listener) 131a5bd0580SJason Wang { 132a5bd0580SJason Wang struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 133a5bd0580SJason Wang struct vhost_dev *dev = v->dev; 1348acb3218SPhilippe Mathieu-Daudé struct vhost_msg_v2 msg = {}; 135a5bd0580SJason Wang int fd = v->device_fd; 136a5bd0580SJason Wang 137a5bd0580SJason Wang if (!(dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH))) { 138a5bd0580SJason Wang return; 139a5bd0580SJason Wang } 140a5bd0580SJason Wang 141e6db5df7SEugenio Pérez if (!v->iotlb_batch_begin_sent) { 142e6db5df7SEugenio Pérez return; 143e6db5df7SEugenio Pérez } 144e6db5df7SEugenio Pérez 145a5bd0580SJason Wang msg.type = v->msg_type; 146a5bd0580SJason Wang msg.iotlb.type = VHOST_IOTLB_BATCH_END; 147a5bd0580SJason Wang 148a5bd0580SJason Wang if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 149a5bd0580SJason Wang error_report("failed to write, fd=%d, errno=%d (%s)", 150a5bd0580SJason Wang fd, errno, strerror(errno)); 151a5bd0580SJason Wang } 152e6db5df7SEugenio Pérez 153e6db5df7SEugenio Pérez v->iotlb_batch_begin_sent = false; 154a5bd0580SJason Wang } 155a5bd0580SJason Wang 156108a6481SCindy Lu static void vhost_vdpa_listener_region_add(MemoryListener *listener, 157108a6481SCindy Lu MemoryRegionSection *section) 158108a6481SCindy Lu { 159108a6481SCindy Lu struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 160108a6481SCindy Lu hwaddr iova; 161108a6481SCindy Lu Int128 llend, llsize; 162108a6481SCindy Lu void *vaddr; 163108a6481SCindy Lu int ret; 164108a6481SCindy Lu 165108a6481SCindy Lu if (vhost_vdpa_listener_skipped_section(section)) { 166108a6481SCindy Lu return; 167108a6481SCindy Lu } 168108a6481SCindy Lu 169108a6481SCindy Lu if (unlikely((section->offset_within_address_space & ~TARGET_PAGE_MASK) != 170108a6481SCindy Lu (section->offset_within_region & ~TARGET_PAGE_MASK))) { 171108a6481SCindy Lu error_report("%s received unaligned region", __func__); 172108a6481SCindy Lu return; 173108a6481SCindy Lu } 174108a6481SCindy Lu 175108a6481SCindy Lu iova = TARGET_PAGE_ALIGN(section->offset_within_address_space); 176*032e4d68SEugenio Pérez llend = vhost_vdpa_section_end(section); 177108a6481SCindy Lu if (int128_ge(int128_make64(iova), llend)) { 178108a6481SCindy Lu return; 179108a6481SCindy Lu } 180108a6481SCindy Lu 181108a6481SCindy Lu memory_region_ref(section->mr); 182108a6481SCindy Lu 183108a6481SCindy Lu /* Here we assume that memory_region_is_ram(section->mr)==true */ 184108a6481SCindy Lu 185108a6481SCindy Lu vaddr = memory_region_get_ram_ptr(section->mr) + 186108a6481SCindy Lu section->offset_within_region + 187108a6481SCindy Lu (iova - section->offset_within_address_space); 188108a6481SCindy Lu 189778e67deSLaurent Vivier trace_vhost_vdpa_listener_region_add(v, iova, int128_get64(llend), 190778e67deSLaurent Vivier vaddr, section->readonly); 191778e67deSLaurent Vivier 192108a6481SCindy Lu llsize = int128_sub(llend, int128_make64(iova)); 193108a6481SCindy Lu 194e6db5df7SEugenio Pérez vhost_vdpa_iotlb_batch_begin_once(v); 195108a6481SCindy Lu ret = vhost_vdpa_dma_map(v, iova, int128_get64(llsize), 196108a6481SCindy Lu vaddr, section->readonly); 197108a6481SCindy Lu if (ret) { 198108a6481SCindy Lu error_report("vhost vdpa map fail!"); 199108a6481SCindy Lu goto fail; 200108a6481SCindy Lu } 201108a6481SCindy Lu 202108a6481SCindy Lu return; 203108a6481SCindy Lu 204108a6481SCindy Lu fail: 205108a6481SCindy Lu /* 206108a6481SCindy Lu * On the initfn path, store the first error in the container so we 207108a6481SCindy Lu * can gracefully fail. Runtime, there's not much we can do other 208108a6481SCindy Lu * than throw a hardware error. 209108a6481SCindy Lu */ 210108a6481SCindy Lu error_report("vhost-vdpa: DMA mapping failed, unable to continue"); 211108a6481SCindy Lu return; 212108a6481SCindy Lu 213108a6481SCindy Lu } 214108a6481SCindy Lu 215108a6481SCindy Lu static void vhost_vdpa_listener_region_del(MemoryListener *listener, 216108a6481SCindy Lu MemoryRegionSection *section) 217108a6481SCindy Lu { 218108a6481SCindy Lu struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 219108a6481SCindy Lu hwaddr iova; 220108a6481SCindy Lu Int128 llend, llsize; 221108a6481SCindy Lu int ret; 222108a6481SCindy Lu 223108a6481SCindy Lu if (vhost_vdpa_listener_skipped_section(section)) { 224108a6481SCindy Lu return; 225108a6481SCindy Lu } 226108a6481SCindy Lu 227108a6481SCindy Lu if (unlikely((section->offset_within_address_space & ~TARGET_PAGE_MASK) != 228108a6481SCindy Lu (section->offset_within_region & ~TARGET_PAGE_MASK))) { 229108a6481SCindy Lu error_report("%s received unaligned region", __func__); 230108a6481SCindy Lu return; 231108a6481SCindy Lu } 232108a6481SCindy Lu 233108a6481SCindy Lu iova = TARGET_PAGE_ALIGN(section->offset_within_address_space); 234*032e4d68SEugenio Pérez llend = vhost_vdpa_section_end(section); 235108a6481SCindy Lu 236778e67deSLaurent Vivier trace_vhost_vdpa_listener_region_del(v, iova, int128_get64(llend)); 237778e67deSLaurent Vivier 238108a6481SCindy Lu if (int128_ge(int128_make64(iova), llend)) { 239108a6481SCindy Lu return; 240108a6481SCindy Lu } 241108a6481SCindy Lu 242108a6481SCindy Lu llsize = int128_sub(llend, int128_make64(iova)); 243108a6481SCindy Lu 244e6db5df7SEugenio Pérez vhost_vdpa_iotlb_batch_begin_once(v); 245108a6481SCindy Lu ret = vhost_vdpa_dma_unmap(v, iova, int128_get64(llsize)); 246108a6481SCindy Lu if (ret) { 247108a6481SCindy Lu error_report("vhost_vdpa dma unmap error!"); 248108a6481SCindy Lu } 249108a6481SCindy Lu 250108a6481SCindy Lu memory_region_unref(section->mr); 251108a6481SCindy Lu } 252108a6481SCindy Lu /* 253108a6481SCindy Lu * IOTLB API is used by vhost-vpda which requires incremental updating 254108a6481SCindy Lu * of the mapping. So we can not use generic vhost memory listener which 255108a6481SCindy Lu * depends on the addnop(). 256108a6481SCindy Lu */ 257108a6481SCindy Lu static const MemoryListener vhost_vdpa_memory_listener = { 258142518bdSPeter Xu .name = "vhost-vdpa", 259a5bd0580SJason Wang .commit = vhost_vdpa_listener_commit, 260108a6481SCindy Lu .region_add = vhost_vdpa_listener_region_add, 261108a6481SCindy Lu .region_del = vhost_vdpa_listener_region_del, 262108a6481SCindy Lu }; 263108a6481SCindy Lu 264108a6481SCindy Lu static int vhost_vdpa_call(struct vhost_dev *dev, unsigned long int request, 265108a6481SCindy Lu void *arg) 266108a6481SCindy Lu { 267108a6481SCindy Lu struct vhost_vdpa *v = dev->opaque; 268108a6481SCindy Lu int fd = v->device_fd; 269f2a6e6c4SKevin Wolf int ret; 270108a6481SCindy Lu 271108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 272108a6481SCindy Lu 273f2a6e6c4SKevin Wolf ret = ioctl(fd, request, arg); 274f2a6e6c4SKevin Wolf return ret < 0 ? -errno : ret; 275108a6481SCindy Lu } 276108a6481SCindy Lu 277108a6481SCindy Lu static void vhost_vdpa_add_status(struct vhost_dev *dev, uint8_t status) 278108a6481SCindy Lu { 279108a6481SCindy Lu uint8_t s; 280108a6481SCindy Lu 281778e67deSLaurent Vivier trace_vhost_vdpa_add_status(dev, status); 282108a6481SCindy Lu if (vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &s)) { 283108a6481SCindy Lu return; 284108a6481SCindy Lu } 285108a6481SCindy Lu 286108a6481SCindy Lu s |= status; 287108a6481SCindy Lu 288108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_SET_STATUS, &s); 289108a6481SCindy Lu } 290108a6481SCindy Lu 29128770ff9SKevin Wolf static int vhost_vdpa_init(struct vhost_dev *dev, void *opaque, Error **errp) 292108a6481SCindy Lu { 293108a6481SCindy Lu struct vhost_vdpa *v; 294108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 295778e67deSLaurent Vivier trace_vhost_vdpa_init(dev, opaque); 296108a6481SCindy Lu 297108a6481SCindy Lu v = opaque; 298a5bd0580SJason Wang v->dev = dev; 299108a6481SCindy Lu dev->opaque = opaque ; 300108a6481SCindy Lu v->listener = vhost_vdpa_memory_listener; 301108a6481SCindy Lu v->msg_type = VHOST_IOTLB_MSG_V2; 302108a6481SCindy Lu 303108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | 304108a6481SCindy Lu VIRTIO_CONFIG_S_DRIVER); 305108a6481SCindy Lu 306108a6481SCindy Lu return 0; 307108a6481SCindy Lu } 308108a6481SCindy Lu 309d0416d48SJason Wang static void vhost_vdpa_host_notifier_uninit(struct vhost_dev *dev, 310d0416d48SJason Wang int queue_index) 311d0416d48SJason Wang { 312d0416d48SJason Wang size_t page_size = qemu_real_host_page_size; 313d0416d48SJason Wang struct vhost_vdpa *v = dev->opaque; 314d0416d48SJason Wang VirtIODevice *vdev = dev->vdev; 315d0416d48SJason Wang VhostVDPAHostNotifier *n; 316d0416d48SJason Wang 317d0416d48SJason Wang n = &v->notifier[queue_index]; 318d0416d48SJason Wang 319d0416d48SJason Wang if (n->addr) { 320d0416d48SJason Wang virtio_queue_set_host_notifier_mr(vdev, queue_index, &n->mr, false); 321d0416d48SJason Wang object_unparent(OBJECT(&n->mr)); 322d0416d48SJason Wang munmap(n->addr, page_size); 323d0416d48SJason Wang n->addr = NULL; 324d0416d48SJason Wang } 325d0416d48SJason Wang } 326d0416d48SJason Wang 327d0416d48SJason Wang static void vhost_vdpa_host_notifiers_uninit(struct vhost_dev *dev, int n) 328d0416d48SJason Wang { 329d0416d48SJason Wang int i; 330d0416d48SJason Wang 331d0416d48SJason Wang for (i = 0; i < n; i++) { 332d0416d48SJason Wang vhost_vdpa_host_notifier_uninit(dev, i); 333d0416d48SJason Wang } 334d0416d48SJason Wang } 335d0416d48SJason Wang 336d0416d48SJason Wang static int vhost_vdpa_host_notifier_init(struct vhost_dev *dev, int queue_index) 337d0416d48SJason Wang { 338d0416d48SJason Wang size_t page_size = qemu_real_host_page_size; 339d0416d48SJason Wang struct vhost_vdpa *v = dev->opaque; 340d0416d48SJason Wang VirtIODevice *vdev = dev->vdev; 341d0416d48SJason Wang VhostVDPAHostNotifier *n; 342d0416d48SJason Wang int fd = v->device_fd; 343d0416d48SJason Wang void *addr; 344d0416d48SJason Wang char *name; 345d0416d48SJason Wang 346d0416d48SJason Wang vhost_vdpa_host_notifier_uninit(dev, queue_index); 347d0416d48SJason Wang 348d0416d48SJason Wang n = &v->notifier[queue_index]; 349d0416d48SJason Wang 350d0416d48SJason Wang addr = mmap(NULL, page_size, PROT_WRITE, MAP_SHARED, fd, 351d0416d48SJason Wang queue_index * page_size); 352d0416d48SJason Wang if (addr == MAP_FAILED) { 353d0416d48SJason Wang goto err; 354d0416d48SJason Wang } 355d0416d48SJason Wang 356d0416d48SJason Wang name = g_strdup_printf("vhost-vdpa/host-notifier@%p mmaps[%d]", 357d0416d48SJason Wang v, queue_index); 358d0416d48SJason Wang memory_region_init_ram_device_ptr(&n->mr, OBJECT(vdev), name, 359d0416d48SJason Wang page_size, addr); 360d0416d48SJason Wang g_free(name); 361d0416d48SJason Wang 362d0416d48SJason Wang if (virtio_queue_set_host_notifier_mr(vdev, queue_index, &n->mr, true)) { 363d0416d48SJason Wang munmap(addr, page_size); 364d0416d48SJason Wang goto err; 365d0416d48SJason Wang } 366d0416d48SJason Wang n->addr = addr; 367d0416d48SJason Wang 368d0416d48SJason Wang return 0; 369d0416d48SJason Wang 370d0416d48SJason Wang err: 371d0416d48SJason Wang return -1; 372d0416d48SJason Wang } 373d0416d48SJason Wang 374d0416d48SJason Wang static void vhost_vdpa_host_notifiers_init(struct vhost_dev *dev) 375d0416d48SJason Wang { 376d0416d48SJason Wang int i; 377d0416d48SJason Wang 378d0416d48SJason Wang for (i = dev->vq_index; i < dev->vq_index + dev->nvqs; i++) { 379d0416d48SJason Wang if (vhost_vdpa_host_notifier_init(dev, i)) { 380d0416d48SJason Wang goto err; 381d0416d48SJason Wang } 382d0416d48SJason Wang } 383d0416d48SJason Wang 384d0416d48SJason Wang return; 385d0416d48SJason Wang 386d0416d48SJason Wang err: 387d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, i); 388d0416d48SJason Wang return; 389d0416d48SJason Wang } 390d0416d48SJason Wang 391108a6481SCindy Lu static int vhost_vdpa_cleanup(struct vhost_dev *dev) 392108a6481SCindy Lu { 393108a6481SCindy Lu struct vhost_vdpa *v; 394108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 395108a6481SCindy Lu v = dev->opaque; 396778e67deSLaurent Vivier trace_vhost_vdpa_cleanup(dev, v); 397d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, dev->nvqs); 398108a6481SCindy Lu memory_listener_unregister(&v->listener); 399108a6481SCindy Lu 400108a6481SCindy Lu dev->opaque = NULL; 401108a6481SCindy Lu return 0; 402108a6481SCindy Lu } 403108a6481SCindy Lu 404108a6481SCindy Lu static int vhost_vdpa_memslots_limit(struct vhost_dev *dev) 405108a6481SCindy Lu { 406778e67deSLaurent Vivier trace_vhost_vdpa_memslots_limit(dev, INT_MAX); 407108a6481SCindy Lu return INT_MAX; 408108a6481SCindy Lu } 409108a6481SCindy Lu 410108a6481SCindy Lu static int vhost_vdpa_set_mem_table(struct vhost_dev *dev, 411108a6481SCindy Lu struct vhost_memory *mem) 412108a6481SCindy Lu { 413778e67deSLaurent Vivier trace_vhost_vdpa_set_mem_table(dev, mem->nregions, mem->padding); 414778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_SET_MEM_TABLE) && 415778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_REGIONS)) { 416778e67deSLaurent Vivier int i; 417778e67deSLaurent Vivier for (i = 0; i < mem->nregions; i++) { 418778e67deSLaurent Vivier trace_vhost_vdpa_dump_regions(dev, i, 419778e67deSLaurent Vivier mem->regions[i].guest_phys_addr, 420778e67deSLaurent Vivier mem->regions[i].memory_size, 421778e67deSLaurent Vivier mem->regions[i].userspace_addr, 422778e67deSLaurent Vivier mem->regions[i].flags_padding); 423778e67deSLaurent Vivier } 424778e67deSLaurent Vivier } 425108a6481SCindy Lu if (mem->padding) { 426108a6481SCindy Lu return -1; 427108a6481SCindy Lu } 428108a6481SCindy Lu 429108a6481SCindy Lu return 0; 430108a6481SCindy Lu } 431108a6481SCindy Lu 432108a6481SCindy Lu static int vhost_vdpa_set_features(struct vhost_dev *dev, 433108a6481SCindy Lu uint64_t features) 434108a6481SCindy Lu { 435108a6481SCindy Lu int ret; 436778e67deSLaurent Vivier trace_vhost_vdpa_set_features(dev, features); 437108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_SET_FEATURES, &features); 438108a6481SCindy Lu uint8_t status = 0; 439108a6481SCindy Lu if (ret) { 440108a6481SCindy Lu return ret; 441108a6481SCindy Lu } 442108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_FEATURES_OK); 443108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &status); 444108a6481SCindy Lu 445108a6481SCindy Lu return !(status & VIRTIO_CONFIG_S_FEATURES_OK); 446108a6481SCindy Lu } 447108a6481SCindy Lu 448a5bd0580SJason Wang static int vhost_vdpa_set_backend_cap(struct vhost_dev *dev) 449a5bd0580SJason Wang { 450a5bd0580SJason Wang uint64_t features; 451a5bd0580SJason Wang uint64_t f = 0x1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2 | 452a5bd0580SJason Wang 0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH; 453a5bd0580SJason Wang int r; 454a5bd0580SJason Wang 455a5bd0580SJason Wang if (vhost_vdpa_call(dev, VHOST_GET_BACKEND_FEATURES, &features)) { 4562a83e97eSJason Wang return -EFAULT; 457a5bd0580SJason Wang } 458a5bd0580SJason Wang 459a5bd0580SJason Wang features &= f; 460a5bd0580SJason Wang r = vhost_vdpa_call(dev, VHOST_SET_BACKEND_FEATURES, &features); 461a5bd0580SJason Wang if (r) { 4622a83e97eSJason Wang return -EFAULT; 463a5bd0580SJason Wang } 464a5bd0580SJason Wang 465a5bd0580SJason Wang dev->backend_cap = features; 466a5bd0580SJason Wang 467a5bd0580SJason Wang return 0; 468a5bd0580SJason Wang } 469a5bd0580SJason Wang 470c232b8f4SZenghui Yu static int vhost_vdpa_get_device_id(struct vhost_dev *dev, 471108a6481SCindy Lu uint32_t *device_id) 472108a6481SCindy Lu { 473778e67deSLaurent Vivier int ret; 474778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_VDPA_GET_DEVICE_ID, device_id); 475778e67deSLaurent Vivier trace_vhost_vdpa_get_device_id(dev, *device_id); 476778e67deSLaurent Vivier return ret; 477108a6481SCindy Lu } 478108a6481SCindy Lu 479108a6481SCindy Lu static int vhost_vdpa_reset_device(struct vhost_dev *dev) 480108a6481SCindy Lu { 481778e67deSLaurent Vivier int ret; 482108a6481SCindy Lu uint8_t status = 0; 483108a6481SCindy Lu 484778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_VDPA_SET_STATUS, &status); 485778e67deSLaurent Vivier trace_vhost_vdpa_reset_device(dev, status); 486778e67deSLaurent Vivier return ret; 487108a6481SCindy Lu } 488108a6481SCindy Lu 489108a6481SCindy Lu static int vhost_vdpa_get_vq_index(struct vhost_dev *dev, int idx) 490108a6481SCindy Lu { 491108a6481SCindy Lu assert(idx >= dev->vq_index && idx < dev->vq_index + dev->nvqs); 492108a6481SCindy Lu 493778e67deSLaurent Vivier trace_vhost_vdpa_get_vq_index(dev, idx, idx - dev->vq_index); 494108a6481SCindy Lu return idx - dev->vq_index; 495108a6481SCindy Lu } 496108a6481SCindy Lu 497108a6481SCindy Lu static int vhost_vdpa_set_vring_ready(struct vhost_dev *dev) 498108a6481SCindy Lu { 499108a6481SCindy Lu int i; 500778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_ready(dev); 501108a6481SCindy Lu for (i = 0; i < dev->nvqs; ++i) { 502108a6481SCindy Lu struct vhost_vring_state state = { 503108a6481SCindy Lu .index = dev->vq_index + i, 504108a6481SCindy Lu .num = 1, 505108a6481SCindy Lu }; 506108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_SET_VRING_ENABLE, &state); 507108a6481SCindy Lu } 508108a6481SCindy Lu return 0; 509108a6481SCindy Lu } 510108a6481SCindy Lu 511778e67deSLaurent Vivier static void vhost_vdpa_dump_config(struct vhost_dev *dev, const uint8_t *config, 512778e67deSLaurent Vivier uint32_t config_len) 513778e67deSLaurent Vivier { 514778e67deSLaurent Vivier int b, len; 515778e67deSLaurent Vivier char line[QEMU_HEXDUMP_LINE_LEN]; 516778e67deSLaurent Vivier 517778e67deSLaurent Vivier for (b = 0; b < config_len; b += 16) { 518778e67deSLaurent Vivier len = config_len - b; 519778e67deSLaurent Vivier qemu_hexdump_line(line, b, config, len, false); 520778e67deSLaurent Vivier trace_vhost_vdpa_dump_config(dev, line); 521778e67deSLaurent Vivier } 522778e67deSLaurent Vivier } 523778e67deSLaurent Vivier 524108a6481SCindy Lu static int vhost_vdpa_set_config(struct vhost_dev *dev, const uint8_t *data, 525108a6481SCindy Lu uint32_t offset, uint32_t size, 526108a6481SCindy Lu uint32_t flags) 527108a6481SCindy Lu { 528108a6481SCindy Lu struct vhost_vdpa_config *config; 529108a6481SCindy Lu int ret; 530108a6481SCindy Lu unsigned long config_size = offsetof(struct vhost_vdpa_config, buf); 531986d4f78SLi Qiang 532778e67deSLaurent Vivier trace_vhost_vdpa_set_config(dev, offset, size, flags); 533108a6481SCindy Lu config = g_malloc(size + config_size); 534108a6481SCindy Lu config->off = offset; 535108a6481SCindy Lu config->len = size; 536108a6481SCindy Lu memcpy(config->buf, data, size); 537778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_SET_CONFIG) && 538778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_CONFIG)) { 539778e67deSLaurent Vivier vhost_vdpa_dump_config(dev, data, size); 540778e67deSLaurent Vivier } 541108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_VDPA_SET_CONFIG, config); 542108a6481SCindy Lu g_free(config); 543108a6481SCindy Lu return ret; 544108a6481SCindy Lu } 545108a6481SCindy Lu 546108a6481SCindy Lu static int vhost_vdpa_get_config(struct vhost_dev *dev, uint8_t *config, 54750de5138SKevin Wolf uint32_t config_len, Error **errp) 548108a6481SCindy Lu { 549108a6481SCindy Lu struct vhost_vdpa_config *v_config; 550108a6481SCindy Lu unsigned long config_size = offsetof(struct vhost_vdpa_config, buf); 551108a6481SCindy Lu int ret; 552108a6481SCindy Lu 553778e67deSLaurent Vivier trace_vhost_vdpa_get_config(dev, config, config_len); 554108a6481SCindy Lu v_config = g_malloc(config_len + config_size); 555108a6481SCindy Lu v_config->len = config_len; 556108a6481SCindy Lu v_config->off = 0; 557108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_VDPA_GET_CONFIG, v_config); 558108a6481SCindy Lu memcpy(config, v_config->buf, config_len); 559108a6481SCindy Lu g_free(v_config); 560778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_GET_CONFIG) && 561778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_CONFIG)) { 562778e67deSLaurent Vivier vhost_vdpa_dump_config(dev, config, config_len); 563778e67deSLaurent Vivier } 564108a6481SCindy Lu return ret; 565108a6481SCindy Lu } 566108a6481SCindy Lu 567108a6481SCindy Lu static int vhost_vdpa_dev_start(struct vhost_dev *dev, bool started) 568108a6481SCindy Lu { 569108a6481SCindy Lu struct vhost_vdpa *v = dev->opaque; 570778e67deSLaurent Vivier trace_vhost_vdpa_dev_start(dev, started); 571108a6481SCindy Lu if (started) { 572108a6481SCindy Lu uint8_t status = 0; 573108a6481SCindy Lu memory_listener_register(&v->listener, &address_space_memory); 574d0416d48SJason Wang vhost_vdpa_host_notifiers_init(dev); 575108a6481SCindy Lu vhost_vdpa_set_vring_ready(dev); 576108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_DRIVER_OK); 577108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &status); 578108a6481SCindy Lu 579108a6481SCindy Lu return !(status & VIRTIO_CONFIG_S_DRIVER_OK); 580108a6481SCindy Lu } else { 581108a6481SCindy Lu vhost_vdpa_reset_device(dev); 582108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | 583108a6481SCindy Lu VIRTIO_CONFIG_S_DRIVER); 584d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, dev->nvqs); 585108a6481SCindy Lu memory_listener_unregister(&v->listener); 586108a6481SCindy Lu 587108a6481SCindy Lu return 0; 588108a6481SCindy Lu } 589108a6481SCindy Lu } 590108a6481SCindy Lu 591108a6481SCindy Lu static int vhost_vdpa_set_log_base(struct vhost_dev *dev, uint64_t base, 592108a6481SCindy Lu struct vhost_log *log) 593108a6481SCindy Lu { 594778e67deSLaurent Vivier trace_vhost_vdpa_set_log_base(dev, base, log->size, log->refcnt, log->fd, 595778e67deSLaurent Vivier log->log); 596108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_LOG_BASE, &base); 597108a6481SCindy Lu } 598108a6481SCindy Lu 599108a6481SCindy Lu static int vhost_vdpa_set_vring_addr(struct vhost_dev *dev, 600108a6481SCindy Lu struct vhost_vring_addr *addr) 601108a6481SCindy Lu { 602778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_addr(dev, addr->index, addr->flags, 603778e67deSLaurent Vivier addr->desc_user_addr, addr->used_user_addr, 604778e67deSLaurent Vivier addr->avail_user_addr, 605778e67deSLaurent Vivier addr->log_guest_addr); 606108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_ADDR, addr); 607108a6481SCindy Lu } 608108a6481SCindy Lu 609108a6481SCindy Lu static int vhost_vdpa_set_vring_num(struct vhost_dev *dev, 610108a6481SCindy Lu struct vhost_vring_state *ring) 611108a6481SCindy Lu { 612778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_num(dev, ring->index, ring->num); 613108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_NUM, ring); 614108a6481SCindy Lu } 615108a6481SCindy Lu 616108a6481SCindy Lu static int vhost_vdpa_set_vring_base(struct vhost_dev *dev, 617108a6481SCindy Lu struct vhost_vring_state *ring) 618108a6481SCindy Lu { 619778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_base(dev, ring->index, ring->num); 620108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_BASE, ring); 621108a6481SCindy Lu } 622108a6481SCindy Lu 623108a6481SCindy Lu static int vhost_vdpa_get_vring_base(struct vhost_dev *dev, 624108a6481SCindy Lu struct vhost_vring_state *ring) 625108a6481SCindy Lu { 626778e67deSLaurent Vivier int ret; 627778e67deSLaurent Vivier 628778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_GET_VRING_BASE, ring); 629778e67deSLaurent Vivier trace_vhost_vdpa_get_vring_base(dev, ring->index, ring->num); 630778e67deSLaurent Vivier return ret; 631108a6481SCindy Lu } 632108a6481SCindy Lu 633108a6481SCindy Lu static int vhost_vdpa_set_vring_kick(struct vhost_dev *dev, 634108a6481SCindy Lu struct vhost_vring_file *file) 635108a6481SCindy Lu { 636778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_kick(dev, file->index, file->fd); 637108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_KICK, file); 638108a6481SCindy Lu } 639108a6481SCindy Lu 640108a6481SCindy Lu static int vhost_vdpa_set_vring_call(struct vhost_dev *dev, 641108a6481SCindy Lu struct vhost_vring_file *file) 642108a6481SCindy Lu { 643778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_call(dev, file->index, file->fd); 644108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_CALL, file); 645108a6481SCindy Lu } 646108a6481SCindy Lu 647108a6481SCindy Lu static int vhost_vdpa_get_features(struct vhost_dev *dev, 648108a6481SCindy Lu uint64_t *features) 649108a6481SCindy Lu { 650778e67deSLaurent Vivier int ret; 651778e67deSLaurent Vivier 652778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_GET_FEATURES, features); 653778e67deSLaurent Vivier trace_vhost_vdpa_get_features(dev, *features); 654778e67deSLaurent Vivier return ret; 655108a6481SCindy Lu } 656108a6481SCindy Lu 657108a6481SCindy Lu static int vhost_vdpa_set_owner(struct vhost_dev *dev) 658108a6481SCindy Lu { 659778e67deSLaurent Vivier trace_vhost_vdpa_set_owner(dev); 660108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_OWNER, NULL); 661108a6481SCindy Lu } 662108a6481SCindy Lu 663108a6481SCindy Lu static int vhost_vdpa_vq_get_addr(struct vhost_dev *dev, 664108a6481SCindy Lu struct vhost_vring_addr *addr, struct vhost_virtqueue *vq) 665108a6481SCindy Lu { 666108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 667108a6481SCindy Lu addr->desc_user_addr = (uint64_t)(unsigned long)vq->desc_phys; 668108a6481SCindy Lu addr->avail_user_addr = (uint64_t)(unsigned long)vq->avail_phys; 669108a6481SCindy Lu addr->used_user_addr = (uint64_t)(unsigned long)vq->used_phys; 670778e67deSLaurent Vivier trace_vhost_vdpa_vq_get_addr(dev, vq, addr->desc_user_addr, 671778e67deSLaurent Vivier addr->avail_user_addr, addr->used_user_addr); 672108a6481SCindy Lu return 0; 673108a6481SCindy Lu } 674108a6481SCindy Lu 675108a6481SCindy Lu static bool vhost_vdpa_force_iommu(struct vhost_dev *dev) 676108a6481SCindy Lu { 677108a6481SCindy Lu return true; 678108a6481SCindy Lu } 679108a6481SCindy Lu 680108a6481SCindy Lu const VhostOps vdpa_ops = { 681108a6481SCindy Lu .backend_type = VHOST_BACKEND_TYPE_VDPA, 682108a6481SCindy Lu .vhost_backend_init = vhost_vdpa_init, 683108a6481SCindy Lu .vhost_backend_cleanup = vhost_vdpa_cleanup, 684108a6481SCindy Lu .vhost_set_log_base = vhost_vdpa_set_log_base, 685108a6481SCindy Lu .vhost_set_vring_addr = vhost_vdpa_set_vring_addr, 686108a6481SCindy Lu .vhost_set_vring_num = vhost_vdpa_set_vring_num, 687108a6481SCindy Lu .vhost_set_vring_base = vhost_vdpa_set_vring_base, 688108a6481SCindy Lu .vhost_get_vring_base = vhost_vdpa_get_vring_base, 689108a6481SCindy Lu .vhost_set_vring_kick = vhost_vdpa_set_vring_kick, 690108a6481SCindy Lu .vhost_set_vring_call = vhost_vdpa_set_vring_call, 691108a6481SCindy Lu .vhost_get_features = vhost_vdpa_get_features, 692a5bd0580SJason Wang .vhost_set_backend_cap = vhost_vdpa_set_backend_cap, 693108a6481SCindy Lu .vhost_set_owner = vhost_vdpa_set_owner, 694108a6481SCindy Lu .vhost_set_vring_endian = NULL, 695108a6481SCindy Lu .vhost_backend_memslots_limit = vhost_vdpa_memslots_limit, 696108a6481SCindy Lu .vhost_set_mem_table = vhost_vdpa_set_mem_table, 697108a6481SCindy Lu .vhost_set_features = vhost_vdpa_set_features, 698108a6481SCindy Lu .vhost_reset_device = vhost_vdpa_reset_device, 699108a6481SCindy Lu .vhost_get_vq_index = vhost_vdpa_get_vq_index, 700108a6481SCindy Lu .vhost_get_config = vhost_vdpa_get_config, 701108a6481SCindy Lu .vhost_set_config = vhost_vdpa_set_config, 702108a6481SCindy Lu .vhost_requires_shm_log = NULL, 703108a6481SCindy Lu .vhost_migration_done = NULL, 704108a6481SCindy Lu .vhost_backend_can_merge = NULL, 705108a6481SCindy Lu .vhost_net_set_mtu = NULL, 706108a6481SCindy Lu .vhost_set_iotlb_callback = NULL, 707108a6481SCindy Lu .vhost_send_device_iotlb_msg = NULL, 708108a6481SCindy Lu .vhost_dev_start = vhost_vdpa_dev_start, 709108a6481SCindy Lu .vhost_get_device_id = vhost_vdpa_get_device_id, 710108a6481SCindy Lu .vhost_vq_get_addr = vhost_vdpa_vq_get_addr, 711108a6481SCindy Lu .vhost_force_iommu = vhost_vdpa_force_iommu, 712108a6481SCindy Lu }; 713