1108a6481SCindy Lu /* 2108a6481SCindy Lu * vhost-vdpa 3108a6481SCindy Lu * 4108a6481SCindy Lu * Copyright(c) 2017-2018 Intel Corporation. 5108a6481SCindy Lu * Copyright(c) 2020 Red Hat, Inc. 6108a6481SCindy Lu * 7108a6481SCindy Lu * This work is licensed under the terms of the GNU GPL, version 2 or later. 8108a6481SCindy Lu * See the COPYING file in the top-level directory. 9108a6481SCindy Lu * 10108a6481SCindy Lu */ 11108a6481SCindy Lu 12108a6481SCindy Lu #include "qemu/osdep.h" 13108a6481SCindy Lu #include <linux/vhost.h> 14108a6481SCindy Lu #include <linux/vfio.h> 15108a6481SCindy Lu #include <sys/eventfd.h> 16108a6481SCindy Lu #include <sys/ioctl.h> 17108a6481SCindy Lu #include "hw/virtio/vhost.h" 18108a6481SCindy Lu #include "hw/virtio/vhost-backend.h" 19108a6481SCindy Lu #include "hw/virtio/virtio-net.h" 20108a6481SCindy Lu #include "hw/virtio/vhost-vdpa.h" 21df77d45aSXie Yongji #include "exec/address-spaces.h" 22108a6481SCindy Lu #include "qemu/main-loop.h" 234dc5acc0SCindy Lu #include "cpu.h" 24778e67deSLaurent Vivier #include "trace.h" 25778e67deSLaurent Vivier #include "qemu-common.h" 26108a6481SCindy Lu 27108a6481SCindy Lu static bool vhost_vdpa_listener_skipped_section(MemoryRegionSection *section) 28108a6481SCindy Lu { 29108a6481SCindy Lu return (!memory_region_is_ram(section->mr) && 30108a6481SCindy Lu !memory_region_is_iommu(section->mr)) || 31d60c75d2SJason Wang /* vhost-vDPA doesn't allow MMIO to be mapped */ 32d60c75d2SJason Wang memory_region_is_ram_device(section->mr) || 33108a6481SCindy Lu /* 34108a6481SCindy Lu * Sizing an enabled 64-bit BAR can cause spurious mappings to 35108a6481SCindy Lu * addresses in the upper part of the 64-bit address space. These 36108a6481SCindy Lu * are never accessed by the CPU and beyond the address width of 37108a6481SCindy Lu * some IOMMU hardware. TODO: VDPA should tell us the IOMMU width. 38108a6481SCindy Lu */ 39108a6481SCindy Lu section->offset_within_address_space & (1ULL << 63); 40108a6481SCindy Lu } 41108a6481SCindy Lu 42108a6481SCindy Lu static int vhost_vdpa_dma_map(struct vhost_vdpa *v, hwaddr iova, hwaddr size, 43108a6481SCindy Lu void *vaddr, bool readonly) 44108a6481SCindy Lu { 45386494f2SCindy Lu struct vhost_msg_v2 msg = {}; 46108a6481SCindy Lu int fd = v->device_fd; 47108a6481SCindy Lu int ret = 0; 48108a6481SCindy Lu 49108a6481SCindy Lu msg.type = v->msg_type; 50108a6481SCindy Lu msg.iotlb.iova = iova; 51108a6481SCindy Lu msg.iotlb.size = size; 52108a6481SCindy Lu msg.iotlb.uaddr = (uint64_t)(uintptr_t)vaddr; 53108a6481SCindy Lu msg.iotlb.perm = readonly ? VHOST_ACCESS_RO : VHOST_ACCESS_RW; 54108a6481SCindy Lu msg.iotlb.type = VHOST_IOTLB_UPDATE; 55108a6481SCindy Lu 56778e67deSLaurent Vivier trace_vhost_vdpa_dma_map(v, fd, msg.type, msg.iotlb.iova, msg.iotlb.size, 57778e67deSLaurent Vivier msg.iotlb.uaddr, msg.iotlb.perm, msg.iotlb.type); 58778e67deSLaurent Vivier 59108a6481SCindy Lu if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 60108a6481SCindy Lu error_report("failed to write, fd=%d, errno=%d (%s)", 61108a6481SCindy Lu fd, errno, strerror(errno)); 62108a6481SCindy Lu return -EIO ; 63108a6481SCindy Lu } 64108a6481SCindy Lu 65108a6481SCindy Lu return ret; 66108a6481SCindy Lu } 67108a6481SCindy Lu 68108a6481SCindy Lu static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, hwaddr iova, 69108a6481SCindy Lu hwaddr size) 70108a6481SCindy Lu { 71386494f2SCindy Lu struct vhost_msg_v2 msg = {}; 72108a6481SCindy Lu int fd = v->device_fd; 73108a6481SCindy Lu int ret = 0; 74108a6481SCindy Lu 75108a6481SCindy Lu msg.type = v->msg_type; 76108a6481SCindy Lu msg.iotlb.iova = iova; 77108a6481SCindy Lu msg.iotlb.size = size; 78108a6481SCindy Lu msg.iotlb.type = VHOST_IOTLB_INVALIDATE; 79108a6481SCindy Lu 80778e67deSLaurent Vivier trace_vhost_vdpa_dma_unmap(v, fd, msg.type, msg.iotlb.iova, 81778e67deSLaurent Vivier msg.iotlb.size, msg.iotlb.type); 82778e67deSLaurent Vivier 83108a6481SCindy Lu if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 84108a6481SCindy Lu error_report("failed to write, fd=%d, errno=%d (%s)", 85108a6481SCindy Lu fd, errno, strerror(errno)); 86108a6481SCindy Lu return -EIO ; 87108a6481SCindy Lu } 88108a6481SCindy Lu 89108a6481SCindy Lu return ret; 90108a6481SCindy Lu } 91108a6481SCindy Lu 92a5bd0580SJason Wang static void vhost_vdpa_listener_begin(MemoryListener *listener) 93a5bd0580SJason Wang { 94a5bd0580SJason Wang struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 95a5bd0580SJason Wang struct vhost_dev *dev = v->dev; 968acb3218SPhilippe Mathieu-Daudé struct vhost_msg_v2 msg = {}; 97a5bd0580SJason Wang int fd = v->device_fd; 98a5bd0580SJason Wang 99a5bd0580SJason Wang if (!(dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH))) { 100a5bd0580SJason Wang return; 101a5bd0580SJason Wang } 102a5bd0580SJason Wang 103a5bd0580SJason Wang msg.type = v->msg_type; 104a5bd0580SJason Wang msg.iotlb.type = VHOST_IOTLB_BATCH_BEGIN; 105a5bd0580SJason Wang 106a5bd0580SJason Wang if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 107a5bd0580SJason Wang error_report("failed to write, fd=%d, errno=%d (%s)", 108a5bd0580SJason Wang fd, errno, strerror(errno)); 109a5bd0580SJason Wang } 110a5bd0580SJason Wang } 111a5bd0580SJason Wang 112a5bd0580SJason Wang static void vhost_vdpa_listener_commit(MemoryListener *listener) 113a5bd0580SJason Wang { 114a5bd0580SJason Wang struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 115a5bd0580SJason Wang struct vhost_dev *dev = v->dev; 1168acb3218SPhilippe Mathieu-Daudé struct vhost_msg_v2 msg = {}; 117a5bd0580SJason Wang int fd = v->device_fd; 118a5bd0580SJason Wang 119a5bd0580SJason Wang if (!(dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH))) { 120a5bd0580SJason Wang return; 121a5bd0580SJason Wang } 122a5bd0580SJason Wang 123a5bd0580SJason Wang msg.type = v->msg_type; 124a5bd0580SJason Wang msg.iotlb.type = VHOST_IOTLB_BATCH_END; 125a5bd0580SJason Wang 126a5bd0580SJason Wang if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 127a5bd0580SJason Wang error_report("failed to write, fd=%d, errno=%d (%s)", 128a5bd0580SJason Wang fd, errno, strerror(errno)); 129a5bd0580SJason Wang } 130a5bd0580SJason Wang } 131a5bd0580SJason Wang 132108a6481SCindy Lu static void vhost_vdpa_listener_region_add(MemoryListener *listener, 133108a6481SCindy Lu MemoryRegionSection *section) 134108a6481SCindy Lu { 135108a6481SCindy Lu struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 136108a6481SCindy Lu hwaddr iova; 137108a6481SCindy Lu Int128 llend, llsize; 138108a6481SCindy Lu void *vaddr; 139108a6481SCindy Lu int ret; 140108a6481SCindy Lu 141108a6481SCindy Lu if (vhost_vdpa_listener_skipped_section(section)) { 142108a6481SCindy Lu return; 143108a6481SCindy Lu } 144108a6481SCindy Lu 145108a6481SCindy Lu if (unlikely((section->offset_within_address_space & ~TARGET_PAGE_MASK) != 146108a6481SCindy Lu (section->offset_within_region & ~TARGET_PAGE_MASK))) { 147108a6481SCindy Lu error_report("%s received unaligned region", __func__); 148108a6481SCindy Lu return; 149108a6481SCindy Lu } 150108a6481SCindy Lu 151108a6481SCindy Lu iova = TARGET_PAGE_ALIGN(section->offset_within_address_space); 152108a6481SCindy Lu llend = int128_make64(section->offset_within_address_space); 153108a6481SCindy Lu llend = int128_add(llend, section->size); 154108a6481SCindy Lu llend = int128_and(llend, int128_exts64(TARGET_PAGE_MASK)); 155108a6481SCindy Lu 156108a6481SCindy Lu if (int128_ge(int128_make64(iova), llend)) { 157108a6481SCindy Lu return; 158108a6481SCindy Lu } 159108a6481SCindy Lu 160108a6481SCindy Lu memory_region_ref(section->mr); 161108a6481SCindy Lu 162108a6481SCindy Lu /* Here we assume that memory_region_is_ram(section->mr)==true */ 163108a6481SCindy Lu 164108a6481SCindy Lu vaddr = memory_region_get_ram_ptr(section->mr) + 165108a6481SCindy Lu section->offset_within_region + 166108a6481SCindy Lu (iova - section->offset_within_address_space); 167108a6481SCindy Lu 168778e67deSLaurent Vivier trace_vhost_vdpa_listener_region_add(v, iova, int128_get64(llend), 169778e67deSLaurent Vivier vaddr, section->readonly); 170778e67deSLaurent Vivier 171108a6481SCindy Lu llsize = int128_sub(llend, int128_make64(iova)); 172108a6481SCindy Lu 173108a6481SCindy Lu ret = vhost_vdpa_dma_map(v, iova, int128_get64(llsize), 174108a6481SCindy Lu vaddr, section->readonly); 175108a6481SCindy Lu if (ret) { 176108a6481SCindy Lu error_report("vhost vdpa map fail!"); 177108a6481SCindy Lu goto fail; 178108a6481SCindy Lu } 179108a6481SCindy Lu 180108a6481SCindy Lu return; 181108a6481SCindy Lu 182108a6481SCindy Lu fail: 183108a6481SCindy Lu /* 184108a6481SCindy Lu * On the initfn path, store the first error in the container so we 185108a6481SCindy Lu * can gracefully fail. Runtime, there's not much we can do other 186108a6481SCindy Lu * than throw a hardware error. 187108a6481SCindy Lu */ 188108a6481SCindy Lu error_report("vhost-vdpa: DMA mapping failed, unable to continue"); 189108a6481SCindy Lu return; 190108a6481SCindy Lu 191108a6481SCindy Lu } 192108a6481SCindy Lu 193108a6481SCindy Lu static void vhost_vdpa_listener_region_del(MemoryListener *listener, 194108a6481SCindy Lu MemoryRegionSection *section) 195108a6481SCindy Lu { 196108a6481SCindy Lu struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 197108a6481SCindy Lu hwaddr iova; 198108a6481SCindy Lu Int128 llend, llsize; 199108a6481SCindy Lu int ret; 200108a6481SCindy Lu 201108a6481SCindy Lu if (vhost_vdpa_listener_skipped_section(section)) { 202108a6481SCindy Lu return; 203108a6481SCindy Lu } 204108a6481SCindy Lu 205108a6481SCindy Lu if (unlikely((section->offset_within_address_space & ~TARGET_PAGE_MASK) != 206108a6481SCindy Lu (section->offset_within_region & ~TARGET_PAGE_MASK))) { 207108a6481SCindy Lu error_report("%s received unaligned region", __func__); 208108a6481SCindy Lu return; 209108a6481SCindy Lu } 210108a6481SCindy Lu 211108a6481SCindy Lu iova = TARGET_PAGE_ALIGN(section->offset_within_address_space); 212108a6481SCindy Lu llend = int128_make64(section->offset_within_address_space); 213108a6481SCindy Lu llend = int128_add(llend, section->size); 214108a6481SCindy Lu llend = int128_and(llend, int128_exts64(TARGET_PAGE_MASK)); 215108a6481SCindy Lu 216778e67deSLaurent Vivier trace_vhost_vdpa_listener_region_del(v, iova, int128_get64(llend)); 217778e67deSLaurent Vivier 218108a6481SCindy Lu if (int128_ge(int128_make64(iova), llend)) { 219108a6481SCindy Lu return; 220108a6481SCindy Lu } 221108a6481SCindy Lu 222108a6481SCindy Lu llsize = int128_sub(llend, int128_make64(iova)); 223108a6481SCindy Lu 224108a6481SCindy Lu ret = vhost_vdpa_dma_unmap(v, iova, int128_get64(llsize)); 225108a6481SCindy Lu if (ret) { 226108a6481SCindy Lu error_report("vhost_vdpa dma unmap error!"); 227108a6481SCindy Lu } 228108a6481SCindy Lu 229108a6481SCindy Lu memory_region_unref(section->mr); 230108a6481SCindy Lu } 231108a6481SCindy Lu /* 232108a6481SCindy Lu * IOTLB API is used by vhost-vpda which requires incremental updating 233108a6481SCindy Lu * of the mapping. So we can not use generic vhost memory listener which 234108a6481SCindy Lu * depends on the addnop(). 235108a6481SCindy Lu */ 236108a6481SCindy Lu static const MemoryListener vhost_vdpa_memory_listener = { 237a5bd0580SJason Wang .begin = vhost_vdpa_listener_begin, 238a5bd0580SJason Wang .commit = vhost_vdpa_listener_commit, 239108a6481SCindy Lu .region_add = vhost_vdpa_listener_region_add, 240108a6481SCindy Lu .region_del = vhost_vdpa_listener_region_del, 241108a6481SCindy Lu }; 242108a6481SCindy Lu 243108a6481SCindy Lu static int vhost_vdpa_call(struct vhost_dev *dev, unsigned long int request, 244108a6481SCindy Lu void *arg) 245108a6481SCindy Lu { 246108a6481SCindy Lu struct vhost_vdpa *v = dev->opaque; 247108a6481SCindy Lu int fd = v->device_fd; 248*f2a6e6c4SKevin Wolf int ret; 249108a6481SCindy Lu 250108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 251108a6481SCindy Lu 252*f2a6e6c4SKevin Wolf ret = ioctl(fd, request, arg); 253*f2a6e6c4SKevin Wolf return ret < 0 ? -errno : ret; 254108a6481SCindy Lu } 255108a6481SCindy Lu 256108a6481SCindy Lu static void vhost_vdpa_add_status(struct vhost_dev *dev, uint8_t status) 257108a6481SCindy Lu { 258108a6481SCindy Lu uint8_t s; 259108a6481SCindy Lu 260778e67deSLaurent Vivier trace_vhost_vdpa_add_status(dev, status); 261108a6481SCindy Lu if (vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &s)) { 262108a6481SCindy Lu return; 263108a6481SCindy Lu } 264108a6481SCindy Lu 265108a6481SCindy Lu s |= status; 266108a6481SCindy Lu 267108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_SET_STATUS, &s); 268108a6481SCindy Lu } 269108a6481SCindy Lu 27028770ff9SKevin Wolf static int vhost_vdpa_init(struct vhost_dev *dev, void *opaque, Error **errp) 271108a6481SCindy Lu { 272108a6481SCindy Lu struct vhost_vdpa *v; 273108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 274778e67deSLaurent Vivier trace_vhost_vdpa_init(dev, opaque); 275108a6481SCindy Lu 276108a6481SCindy Lu v = opaque; 277a5bd0580SJason Wang v->dev = dev; 278108a6481SCindy Lu dev->opaque = opaque ; 279108a6481SCindy Lu v->listener = vhost_vdpa_memory_listener; 280108a6481SCindy Lu v->msg_type = VHOST_IOTLB_MSG_V2; 281108a6481SCindy Lu 282108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | 283108a6481SCindy Lu VIRTIO_CONFIG_S_DRIVER); 284108a6481SCindy Lu 285108a6481SCindy Lu return 0; 286108a6481SCindy Lu } 287108a6481SCindy Lu 288d0416d48SJason Wang static void vhost_vdpa_host_notifier_uninit(struct vhost_dev *dev, 289d0416d48SJason Wang int queue_index) 290d0416d48SJason Wang { 291d0416d48SJason Wang size_t page_size = qemu_real_host_page_size; 292d0416d48SJason Wang struct vhost_vdpa *v = dev->opaque; 293d0416d48SJason Wang VirtIODevice *vdev = dev->vdev; 294d0416d48SJason Wang VhostVDPAHostNotifier *n; 295d0416d48SJason Wang 296d0416d48SJason Wang n = &v->notifier[queue_index]; 297d0416d48SJason Wang 298d0416d48SJason Wang if (n->addr) { 299d0416d48SJason Wang virtio_queue_set_host_notifier_mr(vdev, queue_index, &n->mr, false); 300d0416d48SJason Wang object_unparent(OBJECT(&n->mr)); 301d0416d48SJason Wang munmap(n->addr, page_size); 302d0416d48SJason Wang n->addr = NULL; 303d0416d48SJason Wang } 304d0416d48SJason Wang } 305d0416d48SJason Wang 306d0416d48SJason Wang static void vhost_vdpa_host_notifiers_uninit(struct vhost_dev *dev, int n) 307d0416d48SJason Wang { 308d0416d48SJason Wang int i; 309d0416d48SJason Wang 310d0416d48SJason Wang for (i = 0; i < n; i++) { 311d0416d48SJason Wang vhost_vdpa_host_notifier_uninit(dev, i); 312d0416d48SJason Wang } 313d0416d48SJason Wang } 314d0416d48SJason Wang 315d0416d48SJason Wang static int vhost_vdpa_host_notifier_init(struct vhost_dev *dev, int queue_index) 316d0416d48SJason Wang { 317d0416d48SJason Wang size_t page_size = qemu_real_host_page_size; 318d0416d48SJason Wang struct vhost_vdpa *v = dev->opaque; 319d0416d48SJason Wang VirtIODevice *vdev = dev->vdev; 320d0416d48SJason Wang VhostVDPAHostNotifier *n; 321d0416d48SJason Wang int fd = v->device_fd; 322d0416d48SJason Wang void *addr; 323d0416d48SJason Wang char *name; 324d0416d48SJason Wang 325d0416d48SJason Wang vhost_vdpa_host_notifier_uninit(dev, queue_index); 326d0416d48SJason Wang 327d0416d48SJason Wang n = &v->notifier[queue_index]; 328d0416d48SJason Wang 329d0416d48SJason Wang addr = mmap(NULL, page_size, PROT_WRITE, MAP_SHARED, fd, 330d0416d48SJason Wang queue_index * page_size); 331d0416d48SJason Wang if (addr == MAP_FAILED) { 332d0416d48SJason Wang goto err; 333d0416d48SJason Wang } 334d0416d48SJason Wang 335d0416d48SJason Wang name = g_strdup_printf("vhost-vdpa/host-notifier@%p mmaps[%d]", 336d0416d48SJason Wang v, queue_index); 337d0416d48SJason Wang memory_region_init_ram_device_ptr(&n->mr, OBJECT(vdev), name, 338d0416d48SJason Wang page_size, addr); 339d0416d48SJason Wang g_free(name); 340d0416d48SJason Wang 341d0416d48SJason Wang if (virtio_queue_set_host_notifier_mr(vdev, queue_index, &n->mr, true)) { 342d0416d48SJason Wang munmap(addr, page_size); 343d0416d48SJason Wang goto err; 344d0416d48SJason Wang } 345d0416d48SJason Wang n->addr = addr; 346d0416d48SJason Wang 347d0416d48SJason Wang return 0; 348d0416d48SJason Wang 349d0416d48SJason Wang err: 350d0416d48SJason Wang return -1; 351d0416d48SJason Wang } 352d0416d48SJason Wang 353d0416d48SJason Wang static void vhost_vdpa_host_notifiers_init(struct vhost_dev *dev) 354d0416d48SJason Wang { 355d0416d48SJason Wang int i; 356d0416d48SJason Wang 357d0416d48SJason Wang for (i = dev->vq_index; i < dev->vq_index + dev->nvqs; i++) { 358d0416d48SJason Wang if (vhost_vdpa_host_notifier_init(dev, i)) { 359d0416d48SJason Wang goto err; 360d0416d48SJason Wang } 361d0416d48SJason Wang } 362d0416d48SJason Wang 363d0416d48SJason Wang return; 364d0416d48SJason Wang 365d0416d48SJason Wang err: 366d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, i); 367d0416d48SJason Wang return; 368d0416d48SJason Wang } 369d0416d48SJason Wang 370108a6481SCindy Lu static int vhost_vdpa_cleanup(struct vhost_dev *dev) 371108a6481SCindy Lu { 372108a6481SCindy Lu struct vhost_vdpa *v; 373108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 374108a6481SCindy Lu v = dev->opaque; 375778e67deSLaurent Vivier trace_vhost_vdpa_cleanup(dev, v); 376d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, dev->nvqs); 377108a6481SCindy Lu memory_listener_unregister(&v->listener); 378108a6481SCindy Lu 379108a6481SCindy Lu dev->opaque = NULL; 380108a6481SCindy Lu return 0; 381108a6481SCindy Lu } 382108a6481SCindy Lu 383108a6481SCindy Lu static int vhost_vdpa_memslots_limit(struct vhost_dev *dev) 384108a6481SCindy Lu { 385778e67deSLaurent Vivier trace_vhost_vdpa_memslots_limit(dev, INT_MAX); 386108a6481SCindy Lu return INT_MAX; 387108a6481SCindy Lu } 388108a6481SCindy Lu 389108a6481SCindy Lu static int vhost_vdpa_set_mem_table(struct vhost_dev *dev, 390108a6481SCindy Lu struct vhost_memory *mem) 391108a6481SCindy Lu { 392778e67deSLaurent Vivier trace_vhost_vdpa_set_mem_table(dev, mem->nregions, mem->padding); 393778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_SET_MEM_TABLE) && 394778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_REGIONS)) { 395778e67deSLaurent Vivier int i; 396778e67deSLaurent Vivier for (i = 0; i < mem->nregions; i++) { 397778e67deSLaurent Vivier trace_vhost_vdpa_dump_regions(dev, i, 398778e67deSLaurent Vivier mem->regions[i].guest_phys_addr, 399778e67deSLaurent Vivier mem->regions[i].memory_size, 400778e67deSLaurent Vivier mem->regions[i].userspace_addr, 401778e67deSLaurent Vivier mem->regions[i].flags_padding); 402778e67deSLaurent Vivier } 403778e67deSLaurent Vivier } 404108a6481SCindy Lu if (mem->padding) { 405108a6481SCindy Lu return -1; 406108a6481SCindy Lu } 407108a6481SCindy Lu 408108a6481SCindy Lu return 0; 409108a6481SCindy Lu } 410108a6481SCindy Lu 411108a6481SCindy Lu static int vhost_vdpa_set_features(struct vhost_dev *dev, 412108a6481SCindy Lu uint64_t features) 413108a6481SCindy Lu { 414108a6481SCindy Lu int ret; 415778e67deSLaurent Vivier trace_vhost_vdpa_set_features(dev, features); 416108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_SET_FEATURES, &features); 417108a6481SCindy Lu uint8_t status = 0; 418108a6481SCindy Lu if (ret) { 419108a6481SCindy Lu return ret; 420108a6481SCindy Lu } 421108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_FEATURES_OK); 422108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &status); 423108a6481SCindy Lu 424108a6481SCindy Lu return !(status & VIRTIO_CONFIG_S_FEATURES_OK); 425108a6481SCindy Lu } 426108a6481SCindy Lu 427a5bd0580SJason Wang static int vhost_vdpa_set_backend_cap(struct vhost_dev *dev) 428a5bd0580SJason Wang { 429a5bd0580SJason Wang uint64_t features; 430a5bd0580SJason Wang uint64_t f = 0x1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2 | 431a5bd0580SJason Wang 0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH; 432a5bd0580SJason Wang int r; 433a5bd0580SJason Wang 434a5bd0580SJason Wang if (vhost_vdpa_call(dev, VHOST_GET_BACKEND_FEATURES, &features)) { 435a5bd0580SJason Wang return 0; 436a5bd0580SJason Wang } 437a5bd0580SJason Wang 438a5bd0580SJason Wang features &= f; 439a5bd0580SJason Wang r = vhost_vdpa_call(dev, VHOST_SET_BACKEND_FEATURES, &features); 440a5bd0580SJason Wang if (r) { 441a5bd0580SJason Wang return 0; 442a5bd0580SJason Wang } 443a5bd0580SJason Wang 444a5bd0580SJason Wang dev->backend_cap = features; 445a5bd0580SJason Wang 446a5bd0580SJason Wang return 0; 447a5bd0580SJason Wang } 448a5bd0580SJason Wang 449c232b8f4SZenghui Yu static int vhost_vdpa_get_device_id(struct vhost_dev *dev, 450108a6481SCindy Lu uint32_t *device_id) 451108a6481SCindy Lu { 452778e67deSLaurent Vivier int ret; 453778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_VDPA_GET_DEVICE_ID, device_id); 454778e67deSLaurent Vivier trace_vhost_vdpa_get_device_id(dev, *device_id); 455778e67deSLaurent Vivier return ret; 456108a6481SCindy Lu } 457108a6481SCindy Lu 458108a6481SCindy Lu static int vhost_vdpa_reset_device(struct vhost_dev *dev) 459108a6481SCindy Lu { 460778e67deSLaurent Vivier int ret; 461108a6481SCindy Lu uint8_t status = 0; 462108a6481SCindy Lu 463778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_VDPA_SET_STATUS, &status); 464778e67deSLaurent Vivier trace_vhost_vdpa_reset_device(dev, status); 465778e67deSLaurent Vivier return ret; 466108a6481SCindy Lu } 467108a6481SCindy Lu 468108a6481SCindy Lu static int vhost_vdpa_get_vq_index(struct vhost_dev *dev, int idx) 469108a6481SCindy Lu { 470108a6481SCindy Lu assert(idx >= dev->vq_index && idx < dev->vq_index + dev->nvqs); 471108a6481SCindy Lu 472778e67deSLaurent Vivier trace_vhost_vdpa_get_vq_index(dev, idx, idx - dev->vq_index); 473108a6481SCindy Lu return idx - dev->vq_index; 474108a6481SCindy Lu } 475108a6481SCindy Lu 476108a6481SCindy Lu static int vhost_vdpa_set_vring_ready(struct vhost_dev *dev) 477108a6481SCindy Lu { 478108a6481SCindy Lu int i; 479778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_ready(dev); 480108a6481SCindy Lu for (i = 0; i < dev->nvqs; ++i) { 481108a6481SCindy Lu struct vhost_vring_state state = { 482108a6481SCindy Lu .index = dev->vq_index + i, 483108a6481SCindy Lu .num = 1, 484108a6481SCindy Lu }; 485108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_SET_VRING_ENABLE, &state); 486108a6481SCindy Lu } 487108a6481SCindy Lu return 0; 488108a6481SCindy Lu } 489108a6481SCindy Lu 490778e67deSLaurent Vivier static void vhost_vdpa_dump_config(struct vhost_dev *dev, const uint8_t *config, 491778e67deSLaurent Vivier uint32_t config_len) 492778e67deSLaurent Vivier { 493778e67deSLaurent Vivier int b, len; 494778e67deSLaurent Vivier char line[QEMU_HEXDUMP_LINE_LEN]; 495778e67deSLaurent Vivier 496778e67deSLaurent Vivier for (b = 0; b < config_len; b += 16) { 497778e67deSLaurent Vivier len = config_len - b; 498778e67deSLaurent Vivier qemu_hexdump_line(line, b, config, len, false); 499778e67deSLaurent Vivier trace_vhost_vdpa_dump_config(dev, line); 500778e67deSLaurent Vivier } 501778e67deSLaurent Vivier } 502778e67deSLaurent Vivier 503108a6481SCindy Lu static int vhost_vdpa_set_config(struct vhost_dev *dev, const uint8_t *data, 504108a6481SCindy Lu uint32_t offset, uint32_t size, 505108a6481SCindy Lu uint32_t flags) 506108a6481SCindy Lu { 507108a6481SCindy Lu struct vhost_vdpa_config *config; 508108a6481SCindy Lu int ret; 509108a6481SCindy Lu unsigned long config_size = offsetof(struct vhost_vdpa_config, buf); 510986d4f78SLi Qiang 511778e67deSLaurent Vivier trace_vhost_vdpa_set_config(dev, offset, size, flags); 512108a6481SCindy Lu config = g_malloc(size + config_size); 513108a6481SCindy Lu config->off = offset; 514108a6481SCindy Lu config->len = size; 515108a6481SCindy Lu memcpy(config->buf, data, size); 516778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_SET_CONFIG) && 517778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_CONFIG)) { 518778e67deSLaurent Vivier vhost_vdpa_dump_config(dev, data, size); 519778e67deSLaurent Vivier } 520108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_VDPA_SET_CONFIG, config); 521108a6481SCindy Lu g_free(config); 522108a6481SCindy Lu return ret; 523108a6481SCindy Lu } 524108a6481SCindy Lu 525108a6481SCindy Lu static int vhost_vdpa_get_config(struct vhost_dev *dev, uint8_t *config, 526108a6481SCindy Lu uint32_t config_len) 527108a6481SCindy Lu { 528108a6481SCindy Lu struct vhost_vdpa_config *v_config; 529108a6481SCindy Lu unsigned long config_size = offsetof(struct vhost_vdpa_config, buf); 530108a6481SCindy Lu int ret; 531108a6481SCindy Lu 532778e67deSLaurent Vivier trace_vhost_vdpa_get_config(dev, config, config_len); 533108a6481SCindy Lu v_config = g_malloc(config_len + config_size); 534108a6481SCindy Lu v_config->len = config_len; 535108a6481SCindy Lu v_config->off = 0; 536108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_VDPA_GET_CONFIG, v_config); 537108a6481SCindy Lu memcpy(config, v_config->buf, config_len); 538108a6481SCindy Lu g_free(v_config); 539778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_GET_CONFIG) && 540778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_CONFIG)) { 541778e67deSLaurent Vivier vhost_vdpa_dump_config(dev, config, config_len); 542778e67deSLaurent Vivier } 543108a6481SCindy Lu return ret; 544108a6481SCindy Lu } 545108a6481SCindy Lu 546108a6481SCindy Lu static int vhost_vdpa_dev_start(struct vhost_dev *dev, bool started) 547108a6481SCindy Lu { 548108a6481SCindy Lu struct vhost_vdpa *v = dev->opaque; 549778e67deSLaurent Vivier trace_vhost_vdpa_dev_start(dev, started); 550108a6481SCindy Lu if (started) { 551108a6481SCindy Lu uint8_t status = 0; 552108a6481SCindy Lu memory_listener_register(&v->listener, &address_space_memory); 553d0416d48SJason Wang vhost_vdpa_host_notifiers_init(dev); 554108a6481SCindy Lu vhost_vdpa_set_vring_ready(dev); 555108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_DRIVER_OK); 556108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &status); 557108a6481SCindy Lu 558108a6481SCindy Lu return !(status & VIRTIO_CONFIG_S_DRIVER_OK); 559108a6481SCindy Lu } else { 560108a6481SCindy Lu vhost_vdpa_reset_device(dev); 561108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | 562108a6481SCindy Lu VIRTIO_CONFIG_S_DRIVER); 563d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, dev->nvqs); 564108a6481SCindy Lu memory_listener_unregister(&v->listener); 565108a6481SCindy Lu 566108a6481SCindy Lu return 0; 567108a6481SCindy Lu } 568108a6481SCindy Lu } 569108a6481SCindy Lu 570108a6481SCindy Lu static int vhost_vdpa_set_log_base(struct vhost_dev *dev, uint64_t base, 571108a6481SCindy Lu struct vhost_log *log) 572108a6481SCindy Lu { 573778e67deSLaurent Vivier trace_vhost_vdpa_set_log_base(dev, base, log->size, log->refcnt, log->fd, 574778e67deSLaurent Vivier log->log); 575108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_LOG_BASE, &base); 576108a6481SCindy Lu } 577108a6481SCindy Lu 578108a6481SCindy Lu static int vhost_vdpa_set_vring_addr(struct vhost_dev *dev, 579108a6481SCindy Lu struct vhost_vring_addr *addr) 580108a6481SCindy Lu { 581778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_addr(dev, addr->index, addr->flags, 582778e67deSLaurent Vivier addr->desc_user_addr, addr->used_user_addr, 583778e67deSLaurent Vivier addr->avail_user_addr, 584778e67deSLaurent Vivier addr->log_guest_addr); 585108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_ADDR, addr); 586108a6481SCindy Lu } 587108a6481SCindy Lu 588108a6481SCindy Lu static int vhost_vdpa_set_vring_num(struct vhost_dev *dev, 589108a6481SCindy Lu struct vhost_vring_state *ring) 590108a6481SCindy Lu { 591778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_num(dev, ring->index, ring->num); 592108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_NUM, ring); 593108a6481SCindy Lu } 594108a6481SCindy Lu 595108a6481SCindy Lu static int vhost_vdpa_set_vring_base(struct vhost_dev *dev, 596108a6481SCindy Lu struct vhost_vring_state *ring) 597108a6481SCindy Lu { 598778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_base(dev, ring->index, ring->num); 599108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_BASE, ring); 600108a6481SCindy Lu } 601108a6481SCindy Lu 602108a6481SCindy Lu static int vhost_vdpa_get_vring_base(struct vhost_dev *dev, 603108a6481SCindy Lu struct vhost_vring_state *ring) 604108a6481SCindy Lu { 605778e67deSLaurent Vivier int ret; 606778e67deSLaurent Vivier 607778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_GET_VRING_BASE, ring); 608778e67deSLaurent Vivier trace_vhost_vdpa_get_vring_base(dev, ring->index, ring->num); 609778e67deSLaurent Vivier return ret; 610108a6481SCindy Lu } 611108a6481SCindy Lu 612108a6481SCindy Lu static int vhost_vdpa_set_vring_kick(struct vhost_dev *dev, 613108a6481SCindy Lu struct vhost_vring_file *file) 614108a6481SCindy Lu { 615778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_kick(dev, file->index, file->fd); 616108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_KICK, file); 617108a6481SCindy Lu } 618108a6481SCindy Lu 619108a6481SCindy Lu static int vhost_vdpa_set_vring_call(struct vhost_dev *dev, 620108a6481SCindy Lu struct vhost_vring_file *file) 621108a6481SCindy Lu { 622778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_call(dev, file->index, file->fd); 623108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_CALL, file); 624108a6481SCindy Lu } 625108a6481SCindy Lu 626108a6481SCindy Lu static int vhost_vdpa_get_features(struct vhost_dev *dev, 627108a6481SCindy Lu uint64_t *features) 628108a6481SCindy Lu { 629778e67deSLaurent Vivier int ret; 630778e67deSLaurent Vivier 631778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_GET_FEATURES, features); 632778e67deSLaurent Vivier trace_vhost_vdpa_get_features(dev, *features); 633778e67deSLaurent Vivier return ret; 634108a6481SCindy Lu } 635108a6481SCindy Lu 636108a6481SCindy Lu static int vhost_vdpa_set_owner(struct vhost_dev *dev) 637108a6481SCindy Lu { 638778e67deSLaurent Vivier trace_vhost_vdpa_set_owner(dev); 639108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_OWNER, NULL); 640108a6481SCindy Lu } 641108a6481SCindy Lu 642108a6481SCindy Lu static int vhost_vdpa_vq_get_addr(struct vhost_dev *dev, 643108a6481SCindy Lu struct vhost_vring_addr *addr, struct vhost_virtqueue *vq) 644108a6481SCindy Lu { 645108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 646108a6481SCindy Lu addr->desc_user_addr = (uint64_t)(unsigned long)vq->desc_phys; 647108a6481SCindy Lu addr->avail_user_addr = (uint64_t)(unsigned long)vq->avail_phys; 648108a6481SCindy Lu addr->used_user_addr = (uint64_t)(unsigned long)vq->used_phys; 649778e67deSLaurent Vivier trace_vhost_vdpa_vq_get_addr(dev, vq, addr->desc_user_addr, 650778e67deSLaurent Vivier addr->avail_user_addr, addr->used_user_addr); 651108a6481SCindy Lu return 0; 652108a6481SCindy Lu } 653108a6481SCindy Lu 654108a6481SCindy Lu static bool vhost_vdpa_force_iommu(struct vhost_dev *dev) 655108a6481SCindy Lu { 656108a6481SCindy Lu return true; 657108a6481SCindy Lu } 658108a6481SCindy Lu 659108a6481SCindy Lu const VhostOps vdpa_ops = { 660108a6481SCindy Lu .backend_type = VHOST_BACKEND_TYPE_VDPA, 661108a6481SCindy Lu .vhost_backend_init = vhost_vdpa_init, 662108a6481SCindy Lu .vhost_backend_cleanup = vhost_vdpa_cleanup, 663108a6481SCindy Lu .vhost_set_log_base = vhost_vdpa_set_log_base, 664108a6481SCindy Lu .vhost_set_vring_addr = vhost_vdpa_set_vring_addr, 665108a6481SCindy Lu .vhost_set_vring_num = vhost_vdpa_set_vring_num, 666108a6481SCindy Lu .vhost_set_vring_base = vhost_vdpa_set_vring_base, 667108a6481SCindy Lu .vhost_get_vring_base = vhost_vdpa_get_vring_base, 668108a6481SCindy Lu .vhost_set_vring_kick = vhost_vdpa_set_vring_kick, 669108a6481SCindy Lu .vhost_set_vring_call = vhost_vdpa_set_vring_call, 670108a6481SCindy Lu .vhost_get_features = vhost_vdpa_get_features, 671a5bd0580SJason Wang .vhost_set_backend_cap = vhost_vdpa_set_backend_cap, 672108a6481SCindy Lu .vhost_set_owner = vhost_vdpa_set_owner, 673108a6481SCindy Lu .vhost_set_vring_endian = NULL, 674108a6481SCindy Lu .vhost_backend_memslots_limit = vhost_vdpa_memslots_limit, 675108a6481SCindy Lu .vhost_set_mem_table = vhost_vdpa_set_mem_table, 676108a6481SCindy Lu .vhost_set_features = vhost_vdpa_set_features, 677108a6481SCindy Lu .vhost_reset_device = vhost_vdpa_reset_device, 678108a6481SCindy Lu .vhost_get_vq_index = vhost_vdpa_get_vq_index, 679108a6481SCindy Lu .vhost_get_config = vhost_vdpa_get_config, 680108a6481SCindy Lu .vhost_set_config = vhost_vdpa_set_config, 681108a6481SCindy Lu .vhost_requires_shm_log = NULL, 682108a6481SCindy Lu .vhost_migration_done = NULL, 683108a6481SCindy Lu .vhost_backend_can_merge = NULL, 684108a6481SCindy Lu .vhost_net_set_mtu = NULL, 685108a6481SCindy Lu .vhost_set_iotlb_callback = NULL, 686108a6481SCindy Lu .vhost_send_device_iotlb_msg = NULL, 687108a6481SCindy Lu .vhost_dev_start = vhost_vdpa_dev_start, 688108a6481SCindy Lu .vhost_get_device_id = vhost_vdpa_get_device_id, 689108a6481SCindy Lu .vhost_vq_get_addr = vhost_vdpa_vq_get_addr, 690108a6481SCindy Lu .vhost_force_iommu = vhost_vdpa_force_iommu, 691108a6481SCindy Lu }; 692