1108a6481SCindy Lu /* 2108a6481SCindy Lu * vhost-vdpa 3108a6481SCindy Lu * 4108a6481SCindy Lu * Copyright(c) 2017-2018 Intel Corporation. 5108a6481SCindy Lu * Copyright(c) 2020 Red Hat, Inc. 6108a6481SCindy Lu * 7108a6481SCindy Lu * This work is licensed under the terms of the GNU GPL, version 2 or later. 8108a6481SCindy Lu * See the COPYING file in the top-level directory. 9108a6481SCindy Lu * 10108a6481SCindy Lu */ 11108a6481SCindy Lu 12108a6481SCindy Lu #include "qemu/osdep.h" 13108a6481SCindy Lu #include <linux/vhost.h> 14108a6481SCindy Lu #include <linux/vfio.h> 15108a6481SCindy Lu #include <sys/eventfd.h> 16108a6481SCindy Lu #include <sys/ioctl.h> 17108a6481SCindy Lu #include "hw/virtio/vhost.h" 18108a6481SCindy Lu #include "hw/virtio/vhost-backend.h" 19108a6481SCindy Lu #include "hw/virtio/virtio-net.h" 20108a6481SCindy Lu #include "hw/virtio/vhost-vdpa.h" 21df77d45aSXie Yongji #include "exec/address-spaces.h" 22108a6481SCindy Lu #include "qemu/main-loop.h" 234dc5acc0SCindy Lu #include "cpu.h" 24778e67deSLaurent Vivier #include "trace.h" 25778e67deSLaurent Vivier #include "qemu-common.h" 26108a6481SCindy Lu 27108a6481SCindy Lu static bool vhost_vdpa_listener_skipped_section(MemoryRegionSection *section) 28108a6481SCindy Lu { 29108a6481SCindy Lu return (!memory_region_is_ram(section->mr) && 30108a6481SCindy Lu !memory_region_is_iommu(section->mr)) || 31d60c75d2SJason Wang /* vhost-vDPA doesn't allow MMIO to be mapped */ 32d60c75d2SJason Wang memory_region_is_ram_device(section->mr) || 33108a6481SCindy Lu /* 34108a6481SCindy Lu * Sizing an enabled 64-bit BAR can cause spurious mappings to 35108a6481SCindy Lu * addresses in the upper part of the 64-bit address space. These 36108a6481SCindy Lu * are never accessed by the CPU and beyond the address width of 37108a6481SCindy Lu * some IOMMU hardware. TODO: VDPA should tell us the IOMMU width. 38108a6481SCindy Lu */ 39108a6481SCindy Lu section->offset_within_address_space & (1ULL << 63); 40108a6481SCindy Lu } 41108a6481SCindy Lu 42108a6481SCindy Lu static int vhost_vdpa_dma_map(struct vhost_vdpa *v, hwaddr iova, hwaddr size, 43108a6481SCindy Lu void *vaddr, bool readonly) 44108a6481SCindy Lu { 45386494f2SCindy Lu struct vhost_msg_v2 msg = {}; 46108a6481SCindy Lu int fd = v->device_fd; 47108a6481SCindy Lu int ret = 0; 48108a6481SCindy Lu 49108a6481SCindy Lu msg.type = v->msg_type; 50108a6481SCindy Lu msg.iotlb.iova = iova; 51108a6481SCindy Lu msg.iotlb.size = size; 52108a6481SCindy Lu msg.iotlb.uaddr = (uint64_t)(uintptr_t)vaddr; 53108a6481SCindy Lu msg.iotlb.perm = readonly ? VHOST_ACCESS_RO : VHOST_ACCESS_RW; 54108a6481SCindy Lu msg.iotlb.type = VHOST_IOTLB_UPDATE; 55108a6481SCindy Lu 56778e67deSLaurent Vivier trace_vhost_vdpa_dma_map(v, fd, msg.type, msg.iotlb.iova, msg.iotlb.size, 57778e67deSLaurent Vivier msg.iotlb.uaddr, msg.iotlb.perm, msg.iotlb.type); 58778e67deSLaurent Vivier 59108a6481SCindy Lu if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 60108a6481SCindy Lu error_report("failed to write, fd=%d, errno=%d (%s)", 61108a6481SCindy Lu fd, errno, strerror(errno)); 62108a6481SCindy Lu return -EIO ; 63108a6481SCindy Lu } 64108a6481SCindy Lu 65108a6481SCindy Lu return ret; 66108a6481SCindy Lu } 67108a6481SCindy Lu 68108a6481SCindy Lu static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, hwaddr iova, 69108a6481SCindy Lu hwaddr size) 70108a6481SCindy Lu { 71386494f2SCindy Lu struct vhost_msg_v2 msg = {}; 72108a6481SCindy Lu int fd = v->device_fd; 73108a6481SCindy Lu int ret = 0; 74108a6481SCindy Lu 75108a6481SCindy Lu msg.type = v->msg_type; 76108a6481SCindy Lu msg.iotlb.iova = iova; 77108a6481SCindy Lu msg.iotlb.size = size; 78108a6481SCindy Lu msg.iotlb.type = VHOST_IOTLB_INVALIDATE; 79108a6481SCindy Lu 80778e67deSLaurent Vivier trace_vhost_vdpa_dma_unmap(v, fd, msg.type, msg.iotlb.iova, 81778e67deSLaurent Vivier msg.iotlb.size, msg.iotlb.type); 82778e67deSLaurent Vivier 83108a6481SCindy Lu if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 84108a6481SCindy Lu error_report("failed to write, fd=%d, errno=%d (%s)", 85108a6481SCindy Lu fd, errno, strerror(errno)); 86108a6481SCindy Lu return -EIO ; 87108a6481SCindy Lu } 88108a6481SCindy Lu 89108a6481SCindy Lu return ret; 90108a6481SCindy Lu } 91108a6481SCindy Lu 92e6db5df7SEugenio Pérez static void vhost_vdpa_listener_begin_batch(struct vhost_vdpa *v) 93a5bd0580SJason Wang { 94a5bd0580SJason Wang int fd = v->device_fd; 95e6db5df7SEugenio Pérez struct vhost_msg_v2 msg = { 96e6db5df7SEugenio Pérez .type = v->msg_type, 97e6db5df7SEugenio Pérez .iotlb.type = VHOST_IOTLB_BATCH_BEGIN, 98e6db5df7SEugenio Pérez }; 99a5bd0580SJason Wang 100a5bd0580SJason Wang if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 101a5bd0580SJason Wang error_report("failed to write, fd=%d, errno=%d (%s)", 102a5bd0580SJason Wang fd, errno, strerror(errno)); 103a5bd0580SJason Wang } 104a5bd0580SJason Wang } 105a5bd0580SJason Wang 106e6db5df7SEugenio Pérez static void vhost_vdpa_iotlb_batch_begin_once(struct vhost_vdpa *v) 107e6db5df7SEugenio Pérez { 108e6db5df7SEugenio Pérez if (v->dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH) && 109e6db5df7SEugenio Pérez !v->iotlb_batch_begin_sent) { 110e6db5df7SEugenio Pérez vhost_vdpa_listener_begin_batch(v); 111e6db5df7SEugenio Pérez } 112e6db5df7SEugenio Pérez 113e6db5df7SEugenio Pérez v->iotlb_batch_begin_sent = true; 114e6db5df7SEugenio Pérez } 115e6db5df7SEugenio Pérez 116a5bd0580SJason Wang static void vhost_vdpa_listener_commit(MemoryListener *listener) 117a5bd0580SJason Wang { 118a5bd0580SJason Wang struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 119a5bd0580SJason Wang struct vhost_dev *dev = v->dev; 1208acb3218SPhilippe Mathieu-Daudé struct vhost_msg_v2 msg = {}; 121a5bd0580SJason Wang int fd = v->device_fd; 122a5bd0580SJason Wang 123a5bd0580SJason Wang if (!(dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH))) { 124a5bd0580SJason Wang return; 125a5bd0580SJason Wang } 126a5bd0580SJason Wang 127e6db5df7SEugenio Pérez if (!v->iotlb_batch_begin_sent) { 128e6db5df7SEugenio Pérez return; 129e6db5df7SEugenio Pérez } 130e6db5df7SEugenio Pérez 131a5bd0580SJason Wang msg.type = v->msg_type; 132a5bd0580SJason Wang msg.iotlb.type = VHOST_IOTLB_BATCH_END; 133a5bd0580SJason Wang 134a5bd0580SJason Wang if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 135a5bd0580SJason Wang error_report("failed to write, fd=%d, errno=%d (%s)", 136a5bd0580SJason Wang fd, errno, strerror(errno)); 137a5bd0580SJason Wang } 138e6db5df7SEugenio Pérez 139e6db5df7SEugenio Pérez v->iotlb_batch_begin_sent = false; 140a5bd0580SJason Wang } 141a5bd0580SJason Wang 142108a6481SCindy Lu static void vhost_vdpa_listener_region_add(MemoryListener *listener, 143108a6481SCindy Lu MemoryRegionSection *section) 144108a6481SCindy Lu { 145108a6481SCindy Lu struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 146108a6481SCindy Lu hwaddr iova; 147108a6481SCindy Lu Int128 llend, llsize; 148108a6481SCindy Lu void *vaddr; 149108a6481SCindy Lu int ret; 150108a6481SCindy Lu 151108a6481SCindy Lu if (vhost_vdpa_listener_skipped_section(section)) { 152108a6481SCindy Lu return; 153108a6481SCindy Lu } 154108a6481SCindy Lu 155108a6481SCindy Lu if (unlikely((section->offset_within_address_space & ~TARGET_PAGE_MASK) != 156108a6481SCindy Lu (section->offset_within_region & ~TARGET_PAGE_MASK))) { 157108a6481SCindy Lu error_report("%s received unaligned region", __func__); 158108a6481SCindy Lu return; 159108a6481SCindy Lu } 160108a6481SCindy Lu 161108a6481SCindy Lu iova = TARGET_PAGE_ALIGN(section->offset_within_address_space); 162108a6481SCindy Lu llend = int128_make64(section->offset_within_address_space); 163108a6481SCindy Lu llend = int128_add(llend, section->size); 164108a6481SCindy Lu llend = int128_and(llend, int128_exts64(TARGET_PAGE_MASK)); 165108a6481SCindy Lu 166108a6481SCindy Lu if (int128_ge(int128_make64(iova), llend)) { 167108a6481SCindy Lu return; 168108a6481SCindy Lu } 169108a6481SCindy Lu 170108a6481SCindy Lu memory_region_ref(section->mr); 171108a6481SCindy Lu 172108a6481SCindy Lu /* Here we assume that memory_region_is_ram(section->mr)==true */ 173108a6481SCindy Lu 174108a6481SCindy Lu vaddr = memory_region_get_ram_ptr(section->mr) + 175108a6481SCindy Lu section->offset_within_region + 176108a6481SCindy Lu (iova - section->offset_within_address_space); 177108a6481SCindy Lu 178778e67deSLaurent Vivier trace_vhost_vdpa_listener_region_add(v, iova, int128_get64(llend), 179778e67deSLaurent Vivier vaddr, section->readonly); 180778e67deSLaurent Vivier 181108a6481SCindy Lu llsize = int128_sub(llend, int128_make64(iova)); 182108a6481SCindy Lu 183e6db5df7SEugenio Pérez vhost_vdpa_iotlb_batch_begin_once(v); 184108a6481SCindy Lu ret = vhost_vdpa_dma_map(v, iova, int128_get64(llsize), 185108a6481SCindy Lu vaddr, section->readonly); 186108a6481SCindy Lu if (ret) { 187108a6481SCindy Lu error_report("vhost vdpa map fail!"); 188108a6481SCindy Lu goto fail; 189108a6481SCindy Lu } 190108a6481SCindy Lu 191108a6481SCindy Lu return; 192108a6481SCindy Lu 193108a6481SCindy Lu fail: 194108a6481SCindy Lu /* 195108a6481SCindy Lu * On the initfn path, store the first error in the container so we 196108a6481SCindy Lu * can gracefully fail. Runtime, there's not much we can do other 197108a6481SCindy Lu * than throw a hardware error. 198108a6481SCindy Lu */ 199108a6481SCindy Lu error_report("vhost-vdpa: DMA mapping failed, unable to continue"); 200108a6481SCindy Lu return; 201108a6481SCindy Lu 202108a6481SCindy Lu } 203108a6481SCindy Lu 204108a6481SCindy Lu static void vhost_vdpa_listener_region_del(MemoryListener *listener, 205108a6481SCindy Lu MemoryRegionSection *section) 206108a6481SCindy Lu { 207108a6481SCindy Lu struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 208108a6481SCindy Lu hwaddr iova; 209108a6481SCindy Lu Int128 llend, llsize; 210108a6481SCindy Lu int ret; 211108a6481SCindy Lu 212108a6481SCindy Lu if (vhost_vdpa_listener_skipped_section(section)) { 213108a6481SCindy Lu return; 214108a6481SCindy Lu } 215108a6481SCindy Lu 216108a6481SCindy Lu if (unlikely((section->offset_within_address_space & ~TARGET_PAGE_MASK) != 217108a6481SCindy Lu (section->offset_within_region & ~TARGET_PAGE_MASK))) { 218108a6481SCindy Lu error_report("%s received unaligned region", __func__); 219108a6481SCindy Lu return; 220108a6481SCindy Lu } 221108a6481SCindy Lu 222108a6481SCindy Lu iova = TARGET_PAGE_ALIGN(section->offset_within_address_space); 223108a6481SCindy Lu llend = int128_make64(section->offset_within_address_space); 224108a6481SCindy Lu llend = int128_add(llend, section->size); 225108a6481SCindy Lu llend = int128_and(llend, int128_exts64(TARGET_PAGE_MASK)); 226108a6481SCindy Lu 227778e67deSLaurent Vivier trace_vhost_vdpa_listener_region_del(v, iova, int128_get64(llend)); 228778e67deSLaurent Vivier 229108a6481SCindy Lu if (int128_ge(int128_make64(iova), llend)) { 230108a6481SCindy Lu return; 231108a6481SCindy Lu } 232108a6481SCindy Lu 233108a6481SCindy Lu llsize = int128_sub(llend, int128_make64(iova)); 234108a6481SCindy Lu 235e6db5df7SEugenio Pérez vhost_vdpa_iotlb_batch_begin_once(v); 236108a6481SCindy Lu ret = vhost_vdpa_dma_unmap(v, iova, int128_get64(llsize)); 237108a6481SCindy Lu if (ret) { 238108a6481SCindy Lu error_report("vhost_vdpa dma unmap error!"); 239108a6481SCindy Lu } 240108a6481SCindy Lu 241108a6481SCindy Lu memory_region_unref(section->mr); 242108a6481SCindy Lu } 243108a6481SCindy Lu /* 244108a6481SCindy Lu * IOTLB API is used by vhost-vpda which requires incremental updating 245108a6481SCindy Lu * of the mapping. So we can not use generic vhost memory listener which 246108a6481SCindy Lu * depends on the addnop(). 247108a6481SCindy Lu */ 248108a6481SCindy Lu static const MemoryListener vhost_vdpa_memory_listener = { 249a5bd0580SJason Wang .commit = vhost_vdpa_listener_commit, 250108a6481SCindy Lu .region_add = vhost_vdpa_listener_region_add, 251108a6481SCindy Lu .region_del = vhost_vdpa_listener_region_del, 252108a6481SCindy Lu }; 253108a6481SCindy Lu 254108a6481SCindy Lu static int vhost_vdpa_call(struct vhost_dev *dev, unsigned long int request, 255108a6481SCindy Lu void *arg) 256108a6481SCindy Lu { 257108a6481SCindy Lu struct vhost_vdpa *v = dev->opaque; 258108a6481SCindy Lu int fd = v->device_fd; 259f2a6e6c4SKevin Wolf int ret; 260108a6481SCindy Lu 261108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 262108a6481SCindy Lu 263f2a6e6c4SKevin Wolf ret = ioctl(fd, request, arg); 264f2a6e6c4SKevin Wolf return ret < 0 ? -errno : ret; 265108a6481SCindy Lu } 266108a6481SCindy Lu 267108a6481SCindy Lu static void vhost_vdpa_add_status(struct vhost_dev *dev, uint8_t status) 268108a6481SCindy Lu { 269108a6481SCindy Lu uint8_t s; 270108a6481SCindy Lu 271778e67deSLaurent Vivier trace_vhost_vdpa_add_status(dev, status); 272108a6481SCindy Lu if (vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &s)) { 273108a6481SCindy Lu return; 274108a6481SCindy Lu } 275108a6481SCindy Lu 276108a6481SCindy Lu s |= status; 277108a6481SCindy Lu 278108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_SET_STATUS, &s); 279108a6481SCindy Lu } 280108a6481SCindy Lu 28128770ff9SKevin Wolf static int vhost_vdpa_init(struct vhost_dev *dev, void *opaque, Error **errp) 282108a6481SCindy Lu { 283108a6481SCindy Lu struct vhost_vdpa *v; 284108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 285778e67deSLaurent Vivier trace_vhost_vdpa_init(dev, opaque); 286108a6481SCindy Lu 287108a6481SCindy Lu v = opaque; 288a5bd0580SJason Wang v->dev = dev; 289108a6481SCindy Lu dev->opaque = opaque ; 290108a6481SCindy Lu v->listener = vhost_vdpa_memory_listener; 291108a6481SCindy Lu v->msg_type = VHOST_IOTLB_MSG_V2; 292108a6481SCindy Lu 293108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | 294108a6481SCindy Lu VIRTIO_CONFIG_S_DRIVER); 295108a6481SCindy Lu 296108a6481SCindy Lu return 0; 297108a6481SCindy Lu } 298108a6481SCindy Lu 299d0416d48SJason Wang static void vhost_vdpa_host_notifier_uninit(struct vhost_dev *dev, 300d0416d48SJason Wang int queue_index) 301d0416d48SJason Wang { 302d0416d48SJason Wang size_t page_size = qemu_real_host_page_size; 303d0416d48SJason Wang struct vhost_vdpa *v = dev->opaque; 304d0416d48SJason Wang VirtIODevice *vdev = dev->vdev; 305d0416d48SJason Wang VhostVDPAHostNotifier *n; 306d0416d48SJason Wang 307d0416d48SJason Wang n = &v->notifier[queue_index]; 308d0416d48SJason Wang 309d0416d48SJason Wang if (n->addr) { 310d0416d48SJason Wang virtio_queue_set_host_notifier_mr(vdev, queue_index, &n->mr, false); 311d0416d48SJason Wang object_unparent(OBJECT(&n->mr)); 312d0416d48SJason Wang munmap(n->addr, page_size); 313d0416d48SJason Wang n->addr = NULL; 314d0416d48SJason Wang } 315d0416d48SJason Wang } 316d0416d48SJason Wang 317d0416d48SJason Wang static void vhost_vdpa_host_notifiers_uninit(struct vhost_dev *dev, int n) 318d0416d48SJason Wang { 319d0416d48SJason Wang int i; 320d0416d48SJason Wang 321d0416d48SJason Wang for (i = 0; i < n; i++) { 322d0416d48SJason Wang vhost_vdpa_host_notifier_uninit(dev, i); 323d0416d48SJason Wang } 324d0416d48SJason Wang } 325d0416d48SJason Wang 326d0416d48SJason Wang static int vhost_vdpa_host_notifier_init(struct vhost_dev *dev, int queue_index) 327d0416d48SJason Wang { 328d0416d48SJason Wang size_t page_size = qemu_real_host_page_size; 329d0416d48SJason Wang struct vhost_vdpa *v = dev->opaque; 330d0416d48SJason Wang VirtIODevice *vdev = dev->vdev; 331d0416d48SJason Wang VhostVDPAHostNotifier *n; 332d0416d48SJason Wang int fd = v->device_fd; 333d0416d48SJason Wang void *addr; 334d0416d48SJason Wang char *name; 335d0416d48SJason Wang 336d0416d48SJason Wang vhost_vdpa_host_notifier_uninit(dev, queue_index); 337d0416d48SJason Wang 338d0416d48SJason Wang n = &v->notifier[queue_index]; 339d0416d48SJason Wang 340d0416d48SJason Wang addr = mmap(NULL, page_size, PROT_WRITE, MAP_SHARED, fd, 341d0416d48SJason Wang queue_index * page_size); 342d0416d48SJason Wang if (addr == MAP_FAILED) { 343d0416d48SJason Wang goto err; 344d0416d48SJason Wang } 345d0416d48SJason Wang 346d0416d48SJason Wang name = g_strdup_printf("vhost-vdpa/host-notifier@%p mmaps[%d]", 347d0416d48SJason Wang v, queue_index); 348d0416d48SJason Wang memory_region_init_ram_device_ptr(&n->mr, OBJECT(vdev), name, 349d0416d48SJason Wang page_size, addr); 350d0416d48SJason Wang g_free(name); 351d0416d48SJason Wang 352d0416d48SJason Wang if (virtio_queue_set_host_notifier_mr(vdev, queue_index, &n->mr, true)) { 353d0416d48SJason Wang munmap(addr, page_size); 354d0416d48SJason Wang goto err; 355d0416d48SJason Wang } 356d0416d48SJason Wang n->addr = addr; 357d0416d48SJason Wang 358d0416d48SJason Wang return 0; 359d0416d48SJason Wang 360d0416d48SJason Wang err: 361d0416d48SJason Wang return -1; 362d0416d48SJason Wang } 363d0416d48SJason Wang 364d0416d48SJason Wang static void vhost_vdpa_host_notifiers_init(struct vhost_dev *dev) 365d0416d48SJason Wang { 366d0416d48SJason Wang int i; 367d0416d48SJason Wang 368d0416d48SJason Wang for (i = dev->vq_index; i < dev->vq_index + dev->nvqs; i++) { 369d0416d48SJason Wang if (vhost_vdpa_host_notifier_init(dev, i)) { 370d0416d48SJason Wang goto err; 371d0416d48SJason Wang } 372d0416d48SJason Wang } 373d0416d48SJason Wang 374d0416d48SJason Wang return; 375d0416d48SJason Wang 376d0416d48SJason Wang err: 377d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, i); 378d0416d48SJason Wang return; 379d0416d48SJason Wang } 380d0416d48SJason Wang 381108a6481SCindy Lu static int vhost_vdpa_cleanup(struct vhost_dev *dev) 382108a6481SCindy Lu { 383108a6481SCindy Lu struct vhost_vdpa *v; 384108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 385108a6481SCindy Lu v = dev->opaque; 386778e67deSLaurent Vivier trace_vhost_vdpa_cleanup(dev, v); 387d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, dev->nvqs); 388108a6481SCindy Lu memory_listener_unregister(&v->listener); 389108a6481SCindy Lu 390108a6481SCindy Lu dev->opaque = NULL; 391108a6481SCindy Lu return 0; 392108a6481SCindy Lu } 393108a6481SCindy Lu 394108a6481SCindy Lu static int vhost_vdpa_memslots_limit(struct vhost_dev *dev) 395108a6481SCindy Lu { 396778e67deSLaurent Vivier trace_vhost_vdpa_memslots_limit(dev, INT_MAX); 397108a6481SCindy Lu return INT_MAX; 398108a6481SCindy Lu } 399108a6481SCindy Lu 400108a6481SCindy Lu static int vhost_vdpa_set_mem_table(struct vhost_dev *dev, 401108a6481SCindy Lu struct vhost_memory *mem) 402108a6481SCindy Lu { 403778e67deSLaurent Vivier trace_vhost_vdpa_set_mem_table(dev, mem->nregions, mem->padding); 404778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_SET_MEM_TABLE) && 405778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_REGIONS)) { 406778e67deSLaurent Vivier int i; 407778e67deSLaurent Vivier for (i = 0; i < mem->nregions; i++) { 408778e67deSLaurent Vivier trace_vhost_vdpa_dump_regions(dev, i, 409778e67deSLaurent Vivier mem->regions[i].guest_phys_addr, 410778e67deSLaurent Vivier mem->regions[i].memory_size, 411778e67deSLaurent Vivier mem->regions[i].userspace_addr, 412778e67deSLaurent Vivier mem->regions[i].flags_padding); 413778e67deSLaurent Vivier } 414778e67deSLaurent Vivier } 415108a6481SCindy Lu if (mem->padding) { 416108a6481SCindy Lu return -1; 417108a6481SCindy Lu } 418108a6481SCindy Lu 419108a6481SCindy Lu return 0; 420108a6481SCindy Lu } 421108a6481SCindy Lu 422108a6481SCindy Lu static int vhost_vdpa_set_features(struct vhost_dev *dev, 423108a6481SCindy Lu uint64_t features) 424108a6481SCindy Lu { 425108a6481SCindy Lu int ret; 426778e67deSLaurent Vivier trace_vhost_vdpa_set_features(dev, features); 427108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_SET_FEATURES, &features); 428108a6481SCindy Lu uint8_t status = 0; 429108a6481SCindy Lu if (ret) { 430108a6481SCindy Lu return ret; 431108a6481SCindy Lu } 432108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_FEATURES_OK); 433108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &status); 434108a6481SCindy Lu 435108a6481SCindy Lu return !(status & VIRTIO_CONFIG_S_FEATURES_OK); 436108a6481SCindy Lu } 437108a6481SCindy Lu 438a5bd0580SJason Wang static int vhost_vdpa_set_backend_cap(struct vhost_dev *dev) 439a5bd0580SJason Wang { 440a5bd0580SJason Wang uint64_t features; 441a5bd0580SJason Wang uint64_t f = 0x1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2 | 442a5bd0580SJason Wang 0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH; 443a5bd0580SJason Wang int r; 444a5bd0580SJason Wang 445a5bd0580SJason Wang if (vhost_vdpa_call(dev, VHOST_GET_BACKEND_FEATURES, &features)) { 446*2a83e97eSJason Wang return -EFAULT; 447a5bd0580SJason Wang } 448a5bd0580SJason Wang 449a5bd0580SJason Wang features &= f; 450a5bd0580SJason Wang r = vhost_vdpa_call(dev, VHOST_SET_BACKEND_FEATURES, &features); 451a5bd0580SJason Wang if (r) { 452*2a83e97eSJason Wang return -EFAULT; 453a5bd0580SJason Wang } 454a5bd0580SJason Wang 455a5bd0580SJason Wang dev->backend_cap = features; 456a5bd0580SJason Wang 457a5bd0580SJason Wang return 0; 458a5bd0580SJason Wang } 459a5bd0580SJason Wang 460c232b8f4SZenghui Yu static int vhost_vdpa_get_device_id(struct vhost_dev *dev, 461108a6481SCindy Lu uint32_t *device_id) 462108a6481SCindy Lu { 463778e67deSLaurent Vivier int ret; 464778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_VDPA_GET_DEVICE_ID, device_id); 465778e67deSLaurent Vivier trace_vhost_vdpa_get_device_id(dev, *device_id); 466778e67deSLaurent Vivier return ret; 467108a6481SCindy Lu } 468108a6481SCindy Lu 469108a6481SCindy Lu static int vhost_vdpa_reset_device(struct vhost_dev *dev) 470108a6481SCindy Lu { 471778e67deSLaurent Vivier int ret; 472108a6481SCindy Lu uint8_t status = 0; 473108a6481SCindy Lu 474778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_VDPA_SET_STATUS, &status); 475778e67deSLaurent Vivier trace_vhost_vdpa_reset_device(dev, status); 476778e67deSLaurent Vivier return ret; 477108a6481SCindy Lu } 478108a6481SCindy Lu 479108a6481SCindy Lu static int vhost_vdpa_get_vq_index(struct vhost_dev *dev, int idx) 480108a6481SCindy Lu { 481108a6481SCindy Lu assert(idx >= dev->vq_index && idx < dev->vq_index + dev->nvqs); 482108a6481SCindy Lu 483778e67deSLaurent Vivier trace_vhost_vdpa_get_vq_index(dev, idx, idx - dev->vq_index); 484108a6481SCindy Lu return idx - dev->vq_index; 485108a6481SCindy Lu } 486108a6481SCindy Lu 487108a6481SCindy Lu static int vhost_vdpa_set_vring_ready(struct vhost_dev *dev) 488108a6481SCindy Lu { 489108a6481SCindy Lu int i; 490778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_ready(dev); 491108a6481SCindy Lu for (i = 0; i < dev->nvqs; ++i) { 492108a6481SCindy Lu struct vhost_vring_state state = { 493108a6481SCindy Lu .index = dev->vq_index + i, 494108a6481SCindy Lu .num = 1, 495108a6481SCindy Lu }; 496108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_SET_VRING_ENABLE, &state); 497108a6481SCindy Lu } 498108a6481SCindy Lu return 0; 499108a6481SCindy Lu } 500108a6481SCindy Lu 501778e67deSLaurent Vivier static void vhost_vdpa_dump_config(struct vhost_dev *dev, const uint8_t *config, 502778e67deSLaurent Vivier uint32_t config_len) 503778e67deSLaurent Vivier { 504778e67deSLaurent Vivier int b, len; 505778e67deSLaurent Vivier char line[QEMU_HEXDUMP_LINE_LEN]; 506778e67deSLaurent Vivier 507778e67deSLaurent Vivier for (b = 0; b < config_len; b += 16) { 508778e67deSLaurent Vivier len = config_len - b; 509778e67deSLaurent Vivier qemu_hexdump_line(line, b, config, len, false); 510778e67deSLaurent Vivier trace_vhost_vdpa_dump_config(dev, line); 511778e67deSLaurent Vivier } 512778e67deSLaurent Vivier } 513778e67deSLaurent Vivier 514108a6481SCindy Lu static int vhost_vdpa_set_config(struct vhost_dev *dev, const uint8_t *data, 515108a6481SCindy Lu uint32_t offset, uint32_t size, 516108a6481SCindy Lu uint32_t flags) 517108a6481SCindy Lu { 518108a6481SCindy Lu struct vhost_vdpa_config *config; 519108a6481SCindy Lu int ret; 520108a6481SCindy Lu unsigned long config_size = offsetof(struct vhost_vdpa_config, buf); 521986d4f78SLi Qiang 522778e67deSLaurent Vivier trace_vhost_vdpa_set_config(dev, offset, size, flags); 523108a6481SCindy Lu config = g_malloc(size + config_size); 524108a6481SCindy Lu config->off = offset; 525108a6481SCindy Lu config->len = size; 526108a6481SCindy Lu memcpy(config->buf, data, size); 527778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_SET_CONFIG) && 528778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_CONFIG)) { 529778e67deSLaurent Vivier vhost_vdpa_dump_config(dev, data, size); 530778e67deSLaurent Vivier } 531108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_VDPA_SET_CONFIG, config); 532108a6481SCindy Lu g_free(config); 533108a6481SCindy Lu return ret; 534108a6481SCindy Lu } 535108a6481SCindy Lu 536108a6481SCindy Lu static int vhost_vdpa_get_config(struct vhost_dev *dev, uint8_t *config, 53750de5138SKevin Wolf uint32_t config_len, Error **errp) 538108a6481SCindy Lu { 539108a6481SCindy Lu struct vhost_vdpa_config *v_config; 540108a6481SCindy Lu unsigned long config_size = offsetof(struct vhost_vdpa_config, buf); 541108a6481SCindy Lu int ret; 542108a6481SCindy Lu 543778e67deSLaurent Vivier trace_vhost_vdpa_get_config(dev, config, config_len); 544108a6481SCindy Lu v_config = g_malloc(config_len + config_size); 545108a6481SCindy Lu v_config->len = config_len; 546108a6481SCindy Lu v_config->off = 0; 547108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_VDPA_GET_CONFIG, v_config); 548108a6481SCindy Lu memcpy(config, v_config->buf, config_len); 549108a6481SCindy Lu g_free(v_config); 550778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_GET_CONFIG) && 551778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_CONFIG)) { 552778e67deSLaurent Vivier vhost_vdpa_dump_config(dev, config, config_len); 553778e67deSLaurent Vivier } 554108a6481SCindy Lu return ret; 555108a6481SCindy Lu } 556108a6481SCindy Lu 557108a6481SCindy Lu static int vhost_vdpa_dev_start(struct vhost_dev *dev, bool started) 558108a6481SCindy Lu { 559108a6481SCindy Lu struct vhost_vdpa *v = dev->opaque; 560778e67deSLaurent Vivier trace_vhost_vdpa_dev_start(dev, started); 561108a6481SCindy Lu if (started) { 562108a6481SCindy Lu uint8_t status = 0; 563108a6481SCindy Lu memory_listener_register(&v->listener, &address_space_memory); 564d0416d48SJason Wang vhost_vdpa_host_notifiers_init(dev); 565108a6481SCindy Lu vhost_vdpa_set_vring_ready(dev); 566108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_DRIVER_OK); 567108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &status); 568108a6481SCindy Lu 569108a6481SCindy Lu return !(status & VIRTIO_CONFIG_S_DRIVER_OK); 570108a6481SCindy Lu } else { 571108a6481SCindy Lu vhost_vdpa_reset_device(dev); 572108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | 573108a6481SCindy Lu VIRTIO_CONFIG_S_DRIVER); 574d0416d48SJason Wang vhost_vdpa_host_notifiers_uninit(dev, dev->nvqs); 575108a6481SCindy Lu memory_listener_unregister(&v->listener); 576108a6481SCindy Lu 577108a6481SCindy Lu return 0; 578108a6481SCindy Lu } 579108a6481SCindy Lu } 580108a6481SCindy Lu 581108a6481SCindy Lu static int vhost_vdpa_set_log_base(struct vhost_dev *dev, uint64_t base, 582108a6481SCindy Lu struct vhost_log *log) 583108a6481SCindy Lu { 584778e67deSLaurent Vivier trace_vhost_vdpa_set_log_base(dev, base, log->size, log->refcnt, log->fd, 585778e67deSLaurent Vivier log->log); 586108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_LOG_BASE, &base); 587108a6481SCindy Lu } 588108a6481SCindy Lu 589108a6481SCindy Lu static int vhost_vdpa_set_vring_addr(struct vhost_dev *dev, 590108a6481SCindy Lu struct vhost_vring_addr *addr) 591108a6481SCindy Lu { 592778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_addr(dev, addr->index, addr->flags, 593778e67deSLaurent Vivier addr->desc_user_addr, addr->used_user_addr, 594778e67deSLaurent Vivier addr->avail_user_addr, 595778e67deSLaurent Vivier addr->log_guest_addr); 596108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_ADDR, addr); 597108a6481SCindy Lu } 598108a6481SCindy Lu 599108a6481SCindy Lu static int vhost_vdpa_set_vring_num(struct vhost_dev *dev, 600108a6481SCindy Lu struct vhost_vring_state *ring) 601108a6481SCindy Lu { 602778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_num(dev, ring->index, ring->num); 603108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_NUM, ring); 604108a6481SCindy Lu } 605108a6481SCindy Lu 606108a6481SCindy Lu static int vhost_vdpa_set_vring_base(struct vhost_dev *dev, 607108a6481SCindy Lu struct vhost_vring_state *ring) 608108a6481SCindy Lu { 609778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_base(dev, ring->index, ring->num); 610108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_BASE, ring); 611108a6481SCindy Lu } 612108a6481SCindy Lu 613108a6481SCindy Lu static int vhost_vdpa_get_vring_base(struct vhost_dev *dev, 614108a6481SCindy Lu struct vhost_vring_state *ring) 615108a6481SCindy Lu { 616778e67deSLaurent Vivier int ret; 617778e67deSLaurent Vivier 618778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_GET_VRING_BASE, ring); 619778e67deSLaurent Vivier trace_vhost_vdpa_get_vring_base(dev, ring->index, ring->num); 620778e67deSLaurent Vivier return ret; 621108a6481SCindy Lu } 622108a6481SCindy Lu 623108a6481SCindy Lu static int vhost_vdpa_set_vring_kick(struct vhost_dev *dev, 624108a6481SCindy Lu struct vhost_vring_file *file) 625108a6481SCindy Lu { 626778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_kick(dev, file->index, file->fd); 627108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_KICK, file); 628108a6481SCindy Lu } 629108a6481SCindy Lu 630108a6481SCindy Lu static int vhost_vdpa_set_vring_call(struct vhost_dev *dev, 631108a6481SCindy Lu struct vhost_vring_file *file) 632108a6481SCindy Lu { 633778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_call(dev, file->index, file->fd); 634108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_CALL, file); 635108a6481SCindy Lu } 636108a6481SCindy Lu 637108a6481SCindy Lu static int vhost_vdpa_get_features(struct vhost_dev *dev, 638108a6481SCindy Lu uint64_t *features) 639108a6481SCindy Lu { 640778e67deSLaurent Vivier int ret; 641778e67deSLaurent Vivier 642778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_GET_FEATURES, features); 643778e67deSLaurent Vivier trace_vhost_vdpa_get_features(dev, *features); 644778e67deSLaurent Vivier return ret; 645108a6481SCindy Lu } 646108a6481SCindy Lu 647108a6481SCindy Lu static int vhost_vdpa_set_owner(struct vhost_dev *dev) 648108a6481SCindy Lu { 649778e67deSLaurent Vivier trace_vhost_vdpa_set_owner(dev); 650108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_OWNER, NULL); 651108a6481SCindy Lu } 652108a6481SCindy Lu 653108a6481SCindy Lu static int vhost_vdpa_vq_get_addr(struct vhost_dev *dev, 654108a6481SCindy Lu struct vhost_vring_addr *addr, struct vhost_virtqueue *vq) 655108a6481SCindy Lu { 656108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 657108a6481SCindy Lu addr->desc_user_addr = (uint64_t)(unsigned long)vq->desc_phys; 658108a6481SCindy Lu addr->avail_user_addr = (uint64_t)(unsigned long)vq->avail_phys; 659108a6481SCindy Lu addr->used_user_addr = (uint64_t)(unsigned long)vq->used_phys; 660778e67deSLaurent Vivier trace_vhost_vdpa_vq_get_addr(dev, vq, addr->desc_user_addr, 661778e67deSLaurent Vivier addr->avail_user_addr, addr->used_user_addr); 662108a6481SCindy Lu return 0; 663108a6481SCindy Lu } 664108a6481SCindy Lu 665108a6481SCindy Lu static bool vhost_vdpa_force_iommu(struct vhost_dev *dev) 666108a6481SCindy Lu { 667108a6481SCindy Lu return true; 668108a6481SCindy Lu } 669108a6481SCindy Lu 670108a6481SCindy Lu const VhostOps vdpa_ops = { 671108a6481SCindy Lu .backend_type = VHOST_BACKEND_TYPE_VDPA, 672108a6481SCindy Lu .vhost_backend_init = vhost_vdpa_init, 673108a6481SCindy Lu .vhost_backend_cleanup = vhost_vdpa_cleanup, 674108a6481SCindy Lu .vhost_set_log_base = vhost_vdpa_set_log_base, 675108a6481SCindy Lu .vhost_set_vring_addr = vhost_vdpa_set_vring_addr, 676108a6481SCindy Lu .vhost_set_vring_num = vhost_vdpa_set_vring_num, 677108a6481SCindy Lu .vhost_set_vring_base = vhost_vdpa_set_vring_base, 678108a6481SCindy Lu .vhost_get_vring_base = vhost_vdpa_get_vring_base, 679108a6481SCindy Lu .vhost_set_vring_kick = vhost_vdpa_set_vring_kick, 680108a6481SCindy Lu .vhost_set_vring_call = vhost_vdpa_set_vring_call, 681108a6481SCindy Lu .vhost_get_features = vhost_vdpa_get_features, 682a5bd0580SJason Wang .vhost_set_backend_cap = vhost_vdpa_set_backend_cap, 683108a6481SCindy Lu .vhost_set_owner = vhost_vdpa_set_owner, 684108a6481SCindy Lu .vhost_set_vring_endian = NULL, 685108a6481SCindy Lu .vhost_backend_memslots_limit = vhost_vdpa_memslots_limit, 686108a6481SCindy Lu .vhost_set_mem_table = vhost_vdpa_set_mem_table, 687108a6481SCindy Lu .vhost_set_features = vhost_vdpa_set_features, 688108a6481SCindy Lu .vhost_reset_device = vhost_vdpa_reset_device, 689108a6481SCindy Lu .vhost_get_vq_index = vhost_vdpa_get_vq_index, 690108a6481SCindy Lu .vhost_get_config = vhost_vdpa_get_config, 691108a6481SCindy Lu .vhost_set_config = vhost_vdpa_set_config, 692108a6481SCindy Lu .vhost_requires_shm_log = NULL, 693108a6481SCindy Lu .vhost_migration_done = NULL, 694108a6481SCindy Lu .vhost_backend_can_merge = NULL, 695108a6481SCindy Lu .vhost_net_set_mtu = NULL, 696108a6481SCindy Lu .vhost_set_iotlb_callback = NULL, 697108a6481SCindy Lu .vhost_send_device_iotlb_msg = NULL, 698108a6481SCindy Lu .vhost_dev_start = vhost_vdpa_dev_start, 699108a6481SCindy Lu .vhost_get_device_id = vhost_vdpa_get_device_id, 700108a6481SCindy Lu .vhost_vq_get_addr = vhost_vdpa_vq_get_addr, 701108a6481SCindy Lu .vhost_force_iommu = vhost_vdpa_force_iommu, 702108a6481SCindy Lu }; 703