1108a6481SCindy Lu /* 2108a6481SCindy Lu * vhost-vdpa 3108a6481SCindy Lu * 4108a6481SCindy Lu * Copyright(c) 2017-2018 Intel Corporation. 5108a6481SCindy Lu * Copyright(c) 2020 Red Hat, Inc. 6108a6481SCindy Lu * 7108a6481SCindy Lu * This work is licensed under the terms of the GNU GPL, version 2 or later. 8108a6481SCindy Lu * See the COPYING file in the top-level directory. 9108a6481SCindy Lu * 10108a6481SCindy Lu */ 11108a6481SCindy Lu 12108a6481SCindy Lu #include "qemu/osdep.h" 13108a6481SCindy Lu #include <linux/vhost.h> 14108a6481SCindy Lu #include <linux/vfio.h> 15108a6481SCindy Lu #include <sys/eventfd.h> 16108a6481SCindy Lu #include <sys/ioctl.h> 17108a6481SCindy Lu #include "hw/virtio/vhost.h" 18108a6481SCindy Lu #include "hw/virtio/vhost-backend.h" 19108a6481SCindy Lu #include "hw/virtio/virtio-net.h" 20108a6481SCindy Lu #include "hw/virtio/vhost-vdpa.h" 21*df77d45aSXie Yongji #include "exec/address-spaces.h" 22108a6481SCindy Lu #include "qemu/main-loop.h" 234dc5acc0SCindy Lu #include "cpu.h" 24778e67deSLaurent Vivier #include "trace.h" 25778e67deSLaurent Vivier #include "qemu-common.h" 26108a6481SCindy Lu 27108a6481SCindy Lu static bool vhost_vdpa_listener_skipped_section(MemoryRegionSection *section) 28108a6481SCindy Lu { 29108a6481SCindy Lu return (!memory_region_is_ram(section->mr) && 30108a6481SCindy Lu !memory_region_is_iommu(section->mr)) || 31108a6481SCindy Lu /* 32108a6481SCindy Lu * Sizing an enabled 64-bit BAR can cause spurious mappings to 33108a6481SCindy Lu * addresses in the upper part of the 64-bit address space. These 34108a6481SCindy Lu * are never accessed by the CPU and beyond the address width of 35108a6481SCindy Lu * some IOMMU hardware. TODO: VDPA should tell us the IOMMU width. 36108a6481SCindy Lu */ 37108a6481SCindy Lu section->offset_within_address_space & (1ULL << 63); 38108a6481SCindy Lu } 39108a6481SCindy Lu 40108a6481SCindy Lu static int vhost_vdpa_dma_map(struct vhost_vdpa *v, hwaddr iova, hwaddr size, 41108a6481SCindy Lu void *vaddr, bool readonly) 42108a6481SCindy Lu { 43386494f2SCindy Lu struct vhost_msg_v2 msg = {}; 44108a6481SCindy Lu int fd = v->device_fd; 45108a6481SCindy Lu int ret = 0; 46108a6481SCindy Lu 47108a6481SCindy Lu msg.type = v->msg_type; 48108a6481SCindy Lu msg.iotlb.iova = iova; 49108a6481SCindy Lu msg.iotlb.size = size; 50108a6481SCindy Lu msg.iotlb.uaddr = (uint64_t)(uintptr_t)vaddr; 51108a6481SCindy Lu msg.iotlb.perm = readonly ? VHOST_ACCESS_RO : VHOST_ACCESS_RW; 52108a6481SCindy Lu msg.iotlb.type = VHOST_IOTLB_UPDATE; 53108a6481SCindy Lu 54778e67deSLaurent Vivier trace_vhost_vdpa_dma_map(v, fd, msg.type, msg.iotlb.iova, msg.iotlb.size, 55778e67deSLaurent Vivier msg.iotlb.uaddr, msg.iotlb.perm, msg.iotlb.type); 56778e67deSLaurent Vivier 57108a6481SCindy Lu if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 58108a6481SCindy Lu error_report("failed to write, fd=%d, errno=%d (%s)", 59108a6481SCindy Lu fd, errno, strerror(errno)); 60108a6481SCindy Lu return -EIO ; 61108a6481SCindy Lu } 62108a6481SCindy Lu 63108a6481SCindy Lu return ret; 64108a6481SCindy Lu } 65108a6481SCindy Lu 66108a6481SCindy Lu static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, hwaddr iova, 67108a6481SCindy Lu hwaddr size) 68108a6481SCindy Lu { 69386494f2SCindy Lu struct vhost_msg_v2 msg = {}; 70108a6481SCindy Lu int fd = v->device_fd; 71108a6481SCindy Lu int ret = 0; 72108a6481SCindy Lu 73108a6481SCindy Lu msg.type = v->msg_type; 74108a6481SCindy Lu msg.iotlb.iova = iova; 75108a6481SCindy Lu msg.iotlb.size = size; 76108a6481SCindy Lu msg.iotlb.type = VHOST_IOTLB_INVALIDATE; 77108a6481SCindy Lu 78778e67deSLaurent Vivier trace_vhost_vdpa_dma_unmap(v, fd, msg.type, msg.iotlb.iova, 79778e67deSLaurent Vivier msg.iotlb.size, msg.iotlb.type); 80778e67deSLaurent Vivier 81108a6481SCindy Lu if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 82108a6481SCindy Lu error_report("failed to write, fd=%d, errno=%d (%s)", 83108a6481SCindy Lu fd, errno, strerror(errno)); 84108a6481SCindy Lu return -EIO ; 85108a6481SCindy Lu } 86108a6481SCindy Lu 87108a6481SCindy Lu return ret; 88108a6481SCindy Lu } 89108a6481SCindy Lu 90a5bd0580SJason Wang static void vhost_vdpa_listener_begin(MemoryListener *listener) 91a5bd0580SJason Wang { 92a5bd0580SJason Wang struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 93a5bd0580SJason Wang struct vhost_dev *dev = v->dev; 948acb3218SPhilippe Mathieu-Daudé struct vhost_msg_v2 msg = {}; 95a5bd0580SJason Wang int fd = v->device_fd; 96a5bd0580SJason Wang 97a5bd0580SJason Wang if (!(dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH))) { 98a5bd0580SJason Wang return; 99a5bd0580SJason Wang } 100a5bd0580SJason Wang 101a5bd0580SJason Wang msg.type = v->msg_type; 102a5bd0580SJason Wang msg.iotlb.type = VHOST_IOTLB_BATCH_BEGIN; 103a5bd0580SJason Wang 104a5bd0580SJason Wang if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 105a5bd0580SJason Wang error_report("failed to write, fd=%d, errno=%d (%s)", 106a5bd0580SJason Wang fd, errno, strerror(errno)); 107a5bd0580SJason Wang } 108a5bd0580SJason Wang } 109a5bd0580SJason Wang 110a5bd0580SJason Wang static void vhost_vdpa_listener_commit(MemoryListener *listener) 111a5bd0580SJason Wang { 112a5bd0580SJason Wang struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 113a5bd0580SJason Wang struct vhost_dev *dev = v->dev; 1148acb3218SPhilippe Mathieu-Daudé struct vhost_msg_v2 msg = {}; 115a5bd0580SJason Wang int fd = v->device_fd; 116a5bd0580SJason Wang 117a5bd0580SJason Wang if (!(dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH))) { 118a5bd0580SJason Wang return; 119a5bd0580SJason Wang } 120a5bd0580SJason Wang 121a5bd0580SJason Wang msg.type = v->msg_type; 122a5bd0580SJason Wang msg.iotlb.type = VHOST_IOTLB_BATCH_END; 123a5bd0580SJason Wang 124a5bd0580SJason Wang if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { 125a5bd0580SJason Wang error_report("failed to write, fd=%d, errno=%d (%s)", 126a5bd0580SJason Wang fd, errno, strerror(errno)); 127a5bd0580SJason Wang } 128a5bd0580SJason Wang } 129a5bd0580SJason Wang 130108a6481SCindy Lu static void vhost_vdpa_listener_region_add(MemoryListener *listener, 131108a6481SCindy Lu MemoryRegionSection *section) 132108a6481SCindy Lu { 133108a6481SCindy Lu struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 134108a6481SCindy Lu hwaddr iova; 135108a6481SCindy Lu Int128 llend, llsize; 136108a6481SCindy Lu void *vaddr; 137108a6481SCindy Lu int ret; 138108a6481SCindy Lu 139108a6481SCindy Lu if (vhost_vdpa_listener_skipped_section(section)) { 140108a6481SCindy Lu return; 141108a6481SCindy Lu } 142108a6481SCindy Lu 143108a6481SCindy Lu if (unlikely((section->offset_within_address_space & ~TARGET_PAGE_MASK) != 144108a6481SCindy Lu (section->offset_within_region & ~TARGET_PAGE_MASK))) { 145108a6481SCindy Lu error_report("%s received unaligned region", __func__); 146108a6481SCindy Lu return; 147108a6481SCindy Lu } 148108a6481SCindy Lu 149108a6481SCindy Lu iova = TARGET_PAGE_ALIGN(section->offset_within_address_space); 150108a6481SCindy Lu llend = int128_make64(section->offset_within_address_space); 151108a6481SCindy Lu llend = int128_add(llend, section->size); 152108a6481SCindy Lu llend = int128_and(llend, int128_exts64(TARGET_PAGE_MASK)); 153108a6481SCindy Lu 154108a6481SCindy Lu if (int128_ge(int128_make64(iova), llend)) { 155108a6481SCindy Lu return; 156108a6481SCindy Lu } 157108a6481SCindy Lu 158108a6481SCindy Lu memory_region_ref(section->mr); 159108a6481SCindy Lu 160108a6481SCindy Lu /* Here we assume that memory_region_is_ram(section->mr)==true */ 161108a6481SCindy Lu 162108a6481SCindy Lu vaddr = memory_region_get_ram_ptr(section->mr) + 163108a6481SCindy Lu section->offset_within_region + 164108a6481SCindy Lu (iova - section->offset_within_address_space); 165108a6481SCindy Lu 166778e67deSLaurent Vivier trace_vhost_vdpa_listener_region_add(v, iova, int128_get64(llend), 167778e67deSLaurent Vivier vaddr, section->readonly); 168778e67deSLaurent Vivier 169108a6481SCindy Lu llsize = int128_sub(llend, int128_make64(iova)); 170108a6481SCindy Lu 171108a6481SCindy Lu ret = vhost_vdpa_dma_map(v, iova, int128_get64(llsize), 172108a6481SCindy Lu vaddr, section->readonly); 173108a6481SCindy Lu if (ret) { 174108a6481SCindy Lu error_report("vhost vdpa map fail!"); 175108a6481SCindy Lu if (memory_region_is_ram_device(section->mr)) { 176108a6481SCindy Lu /* Allow unexpected mappings not to be fatal for RAM devices */ 177108a6481SCindy Lu error_report("map ram fail!"); 178108a6481SCindy Lu return ; 179108a6481SCindy Lu } 180108a6481SCindy Lu goto fail; 181108a6481SCindy Lu } 182108a6481SCindy Lu 183108a6481SCindy Lu return; 184108a6481SCindy Lu 185108a6481SCindy Lu fail: 186108a6481SCindy Lu if (memory_region_is_ram_device(section->mr)) { 187108a6481SCindy Lu error_report("failed to vdpa_dma_map. pci p2p may not work"); 188108a6481SCindy Lu return; 189108a6481SCindy Lu 190108a6481SCindy Lu } 191108a6481SCindy Lu /* 192108a6481SCindy Lu * On the initfn path, store the first error in the container so we 193108a6481SCindy Lu * can gracefully fail. Runtime, there's not much we can do other 194108a6481SCindy Lu * than throw a hardware error. 195108a6481SCindy Lu */ 196108a6481SCindy Lu error_report("vhost-vdpa: DMA mapping failed, unable to continue"); 197108a6481SCindy Lu return; 198108a6481SCindy Lu 199108a6481SCindy Lu } 200108a6481SCindy Lu 201108a6481SCindy Lu static void vhost_vdpa_listener_region_del(MemoryListener *listener, 202108a6481SCindy Lu MemoryRegionSection *section) 203108a6481SCindy Lu { 204108a6481SCindy Lu struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener); 205108a6481SCindy Lu hwaddr iova; 206108a6481SCindy Lu Int128 llend, llsize; 207108a6481SCindy Lu int ret; 208108a6481SCindy Lu 209108a6481SCindy Lu if (vhost_vdpa_listener_skipped_section(section)) { 210108a6481SCindy Lu return; 211108a6481SCindy Lu } 212108a6481SCindy Lu 213108a6481SCindy Lu if (unlikely((section->offset_within_address_space & ~TARGET_PAGE_MASK) != 214108a6481SCindy Lu (section->offset_within_region & ~TARGET_PAGE_MASK))) { 215108a6481SCindy Lu error_report("%s received unaligned region", __func__); 216108a6481SCindy Lu return; 217108a6481SCindy Lu } 218108a6481SCindy Lu 219108a6481SCindy Lu iova = TARGET_PAGE_ALIGN(section->offset_within_address_space); 220108a6481SCindy Lu llend = int128_make64(section->offset_within_address_space); 221108a6481SCindy Lu llend = int128_add(llend, section->size); 222108a6481SCindy Lu llend = int128_and(llend, int128_exts64(TARGET_PAGE_MASK)); 223108a6481SCindy Lu 224778e67deSLaurent Vivier trace_vhost_vdpa_listener_region_del(v, iova, int128_get64(llend)); 225778e67deSLaurent Vivier 226108a6481SCindy Lu if (int128_ge(int128_make64(iova), llend)) { 227108a6481SCindy Lu return; 228108a6481SCindy Lu } 229108a6481SCindy Lu 230108a6481SCindy Lu llsize = int128_sub(llend, int128_make64(iova)); 231108a6481SCindy Lu 232108a6481SCindy Lu ret = vhost_vdpa_dma_unmap(v, iova, int128_get64(llsize)); 233108a6481SCindy Lu if (ret) { 234108a6481SCindy Lu error_report("vhost_vdpa dma unmap error!"); 235108a6481SCindy Lu } 236108a6481SCindy Lu 237108a6481SCindy Lu memory_region_unref(section->mr); 238108a6481SCindy Lu } 239108a6481SCindy Lu /* 240108a6481SCindy Lu * IOTLB API is used by vhost-vpda which requires incremental updating 241108a6481SCindy Lu * of the mapping. So we can not use generic vhost memory listener which 242108a6481SCindy Lu * depends on the addnop(). 243108a6481SCindy Lu */ 244108a6481SCindy Lu static const MemoryListener vhost_vdpa_memory_listener = { 245a5bd0580SJason Wang .begin = vhost_vdpa_listener_begin, 246a5bd0580SJason Wang .commit = vhost_vdpa_listener_commit, 247108a6481SCindy Lu .region_add = vhost_vdpa_listener_region_add, 248108a6481SCindy Lu .region_del = vhost_vdpa_listener_region_del, 249108a6481SCindy Lu }; 250108a6481SCindy Lu 251108a6481SCindy Lu static int vhost_vdpa_call(struct vhost_dev *dev, unsigned long int request, 252108a6481SCindy Lu void *arg) 253108a6481SCindy Lu { 254108a6481SCindy Lu struct vhost_vdpa *v = dev->opaque; 255108a6481SCindy Lu int fd = v->device_fd; 256108a6481SCindy Lu 257108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 258108a6481SCindy Lu 259108a6481SCindy Lu return ioctl(fd, request, arg); 260108a6481SCindy Lu } 261108a6481SCindy Lu 262108a6481SCindy Lu static void vhost_vdpa_add_status(struct vhost_dev *dev, uint8_t status) 263108a6481SCindy Lu { 264108a6481SCindy Lu uint8_t s; 265108a6481SCindy Lu 266778e67deSLaurent Vivier trace_vhost_vdpa_add_status(dev, status); 267108a6481SCindy Lu if (vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &s)) { 268108a6481SCindy Lu return; 269108a6481SCindy Lu } 270108a6481SCindy Lu 271108a6481SCindy Lu s |= status; 272108a6481SCindy Lu 273108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_SET_STATUS, &s); 274108a6481SCindy Lu } 275108a6481SCindy Lu 276108a6481SCindy Lu static int vhost_vdpa_init(struct vhost_dev *dev, void *opaque) 277108a6481SCindy Lu { 278108a6481SCindy Lu struct vhost_vdpa *v; 279108a6481SCindy Lu uint64_t features; 280108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 281778e67deSLaurent Vivier trace_vhost_vdpa_init(dev, opaque); 282108a6481SCindy Lu 283108a6481SCindy Lu v = opaque; 284a5bd0580SJason Wang v->dev = dev; 285108a6481SCindy Lu dev->opaque = opaque ; 286108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_GET_FEATURES, &features); 287108a6481SCindy Lu dev->backend_features = features; 288108a6481SCindy Lu v->listener = vhost_vdpa_memory_listener; 289108a6481SCindy Lu v->msg_type = VHOST_IOTLB_MSG_V2; 290108a6481SCindy Lu 291108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | 292108a6481SCindy Lu VIRTIO_CONFIG_S_DRIVER); 293108a6481SCindy Lu 294108a6481SCindy Lu return 0; 295108a6481SCindy Lu } 296108a6481SCindy Lu 297108a6481SCindy Lu static int vhost_vdpa_cleanup(struct vhost_dev *dev) 298108a6481SCindy Lu { 299108a6481SCindy Lu struct vhost_vdpa *v; 300108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 301108a6481SCindy Lu v = dev->opaque; 302778e67deSLaurent Vivier trace_vhost_vdpa_cleanup(dev, v); 303108a6481SCindy Lu memory_listener_unregister(&v->listener); 304108a6481SCindy Lu 305108a6481SCindy Lu dev->opaque = NULL; 306108a6481SCindy Lu return 0; 307108a6481SCindy Lu } 308108a6481SCindy Lu 309108a6481SCindy Lu static int vhost_vdpa_memslots_limit(struct vhost_dev *dev) 310108a6481SCindy Lu { 311778e67deSLaurent Vivier trace_vhost_vdpa_memslots_limit(dev, INT_MAX); 312108a6481SCindy Lu return INT_MAX; 313108a6481SCindy Lu } 314108a6481SCindy Lu 315108a6481SCindy Lu static int vhost_vdpa_set_mem_table(struct vhost_dev *dev, 316108a6481SCindy Lu struct vhost_memory *mem) 317108a6481SCindy Lu { 318778e67deSLaurent Vivier trace_vhost_vdpa_set_mem_table(dev, mem->nregions, mem->padding); 319778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_SET_MEM_TABLE) && 320778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_REGIONS)) { 321778e67deSLaurent Vivier int i; 322778e67deSLaurent Vivier for (i = 0; i < mem->nregions; i++) { 323778e67deSLaurent Vivier trace_vhost_vdpa_dump_regions(dev, i, 324778e67deSLaurent Vivier mem->regions[i].guest_phys_addr, 325778e67deSLaurent Vivier mem->regions[i].memory_size, 326778e67deSLaurent Vivier mem->regions[i].userspace_addr, 327778e67deSLaurent Vivier mem->regions[i].flags_padding); 328778e67deSLaurent Vivier } 329778e67deSLaurent Vivier } 330108a6481SCindy Lu if (mem->padding) { 331108a6481SCindy Lu return -1; 332108a6481SCindy Lu } 333108a6481SCindy Lu 334108a6481SCindy Lu return 0; 335108a6481SCindy Lu } 336108a6481SCindy Lu 337108a6481SCindy Lu static int vhost_vdpa_set_features(struct vhost_dev *dev, 338108a6481SCindy Lu uint64_t features) 339108a6481SCindy Lu { 340108a6481SCindy Lu int ret; 341778e67deSLaurent Vivier trace_vhost_vdpa_set_features(dev, features); 342108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_SET_FEATURES, &features); 343108a6481SCindy Lu uint8_t status = 0; 344108a6481SCindy Lu if (ret) { 345108a6481SCindy Lu return ret; 346108a6481SCindy Lu } 347108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_FEATURES_OK); 348108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &status); 349108a6481SCindy Lu 350108a6481SCindy Lu return !(status & VIRTIO_CONFIG_S_FEATURES_OK); 351108a6481SCindy Lu } 352108a6481SCindy Lu 353a5bd0580SJason Wang static int vhost_vdpa_set_backend_cap(struct vhost_dev *dev) 354a5bd0580SJason Wang { 355a5bd0580SJason Wang uint64_t features; 356a5bd0580SJason Wang uint64_t f = 0x1ULL << VHOST_BACKEND_F_IOTLB_MSG_V2 | 357a5bd0580SJason Wang 0x1ULL << VHOST_BACKEND_F_IOTLB_BATCH; 358a5bd0580SJason Wang int r; 359a5bd0580SJason Wang 360a5bd0580SJason Wang if (vhost_vdpa_call(dev, VHOST_GET_BACKEND_FEATURES, &features)) { 361a5bd0580SJason Wang return 0; 362a5bd0580SJason Wang } 363a5bd0580SJason Wang 364a5bd0580SJason Wang features &= f; 365a5bd0580SJason Wang r = vhost_vdpa_call(dev, VHOST_SET_BACKEND_FEATURES, &features); 366a5bd0580SJason Wang if (r) { 367a5bd0580SJason Wang return 0; 368a5bd0580SJason Wang } 369a5bd0580SJason Wang 370a5bd0580SJason Wang dev->backend_cap = features; 371a5bd0580SJason Wang 372a5bd0580SJason Wang return 0; 373a5bd0580SJason Wang } 374a5bd0580SJason Wang 375c232b8f4SZenghui Yu static int vhost_vdpa_get_device_id(struct vhost_dev *dev, 376108a6481SCindy Lu uint32_t *device_id) 377108a6481SCindy Lu { 378778e67deSLaurent Vivier int ret; 379778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_VDPA_GET_DEVICE_ID, device_id); 380778e67deSLaurent Vivier trace_vhost_vdpa_get_device_id(dev, *device_id); 381778e67deSLaurent Vivier return ret; 382108a6481SCindy Lu } 383108a6481SCindy Lu 384108a6481SCindy Lu static int vhost_vdpa_reset_device(struct vhost_dev *dev) 385108a6481SCindy Lu { 386778e67deSLaurent Vivier int ret; 387108a6481SCindy Lu uint8_t status = 0; 388108a6481SCindy Lu 389778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_VDPA_SET_STATUS, &status); 390778e67deSLaurent Vivier trace_vhost_vdpa_reset_device(dev, status); 391778e67deSLaurent Vivier return ret; 392108a6481SCindy Lu } 393108a6481SCindy Lu 394108a6481SCindy Lu static int vhost_vdpa_get_vq_index(struct vhost_dev *dev, int idx) 395108a6481SCindy Lu { 396108a6481SCindy Lu assert(idx >= dev->vq_index && idx < dev->vq_index + dev->nvqs); 397108a6481SCindy Lu 398778e67deSLaurent Vivier trace_vhost_vdpa_get_vq_index(dev, idx, idx - dev->vq_index); 399108a6481SCindy Lu return idx - dev->vq_index; 400108a6481SCindy Lu } 401108a6481SCindy Lu 402108a6481SCindy Lu static int vhost_vdpa_set_vring_ready(struct vhost_dev *dev) 403108a6481SCindy Lu { 404108a6481SCindy Lu int i; 405778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_ready(dev); 406108a6481SCindy Lu for (i = 0; i < dev->nvqs; ++i) { 407108a6481SCindy Lu struct vhost_vring_state state = { 408108a6481SCindy Lu .index = dev->vq_index + i, 409108a6481SCindy Lu .num = 1, 410108a6481SCindy Lu }; 411108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_SET_VRING_ENABLE, &state); 412108a6481SCindy Lu } 413108a6481SCindy Lu return 0; 414108a6481SCindy Lu } 415108a6481SCindy Lu 416778e67deSLaurent Vivier static void vhost_vdpa_dump_config(struct vhost_dev *dev, const uint8_t *config, 417778e67deSLaurent Vivier uint32_t config_len) 418778e67deSLaurent Vivier { 419778e67deSLaurent Vivier int b, len; 420778e67deSLaurent Vivier char line[QEMU_HEXDUMP_LINE_LEN]; 421778e67deSLaurent Vivier 422778e67deSLaurent Vivier for (b = 0; b < config_len; b += 16) { 423778e67deSLaurent Vivier len = config_len - b; 424778e67deSLaurent Vivier qemu_hexdump_line(line, b, config, len, false); 425778e67deSLaurent Vivier trace_vhost_vdpa_dump_config(dev, line); 426778e67deSLaurent Vivier } 427778e67deSLaurent Vivier } 428778e67deSLaurent Vivier 429108a6481SCindy Lu static int vhost_vdpa_set_config(struct vhost_dev *dev, const uint8_t *data, 430108a6481SCindy Lu uint32_t offset, uint32_t size, 431108a6481SCindy Lu uint32_t flags) 432108a6481SCindy Lu { 433108a6481SCindy Lu struct vhost_vdpa_config *config; 434108a6481SCindy Lu int ret; 435108a6481SCindy Lu unsigned long config_size = offsetof(struct vhost_vdpa_config, buf); 436986d4f78SLi Qiang 437778e67deSLaurent Vivier trace_vhost_vdpa_set_config(dev, offset, size, flags); 438108a6481SCindy Lu config = g_malloc(size + config_size); 439108a6481SCindy Lu config->off = offset; 440108a6481SCindy Lu config->len = size; 441108a6481SCindy Lu memcpy(config->buf, data, size); 442778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_SET_CONFIG) && 443778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_CONFIG)) { 444778e67deSLaurent Vivier vhost_vdpa_dump_config(dev, data, size); 445778e67deSLaurent Vivier } 446108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_VDPA_SET_CONFIG, config); 447108a6481SCindy Lu g_free(config); 448108a6481SCindy Lu return ret; 449108a6481SCindy Lu } 450108a6481SCindy Lu 451108a6481SCindy Lu static int vhost_vdpa_get_config(struct vhost_dev *dev, uint8_t *config, 452108a6481SCindy Lu uint32_t config_len) 453108a6481SCindy Lu { 454108a6481SCindy Lu struct vhost_vdpa_config *v_config; 455108a6481SCindy Lu unsigned long config_size = offsetof(struct vhost_vdpa_config, buf); 456108a6481SCindy Lu int ret; 457108a6481SCindy Lu 458778e67deSLaurent Vivier trace_vhost_vdpa_get_config(dev, config, config_len); 459108a6481SCindy Lu v_config = g_malloc(config_len + config_size); 460108a6481SCindy Lu v_config->len = config_len; 461108a6481SCindy Lu v_config->off = 0; 462108a6481SCindy Lu ret = vhost_vdpa_call(dev, VHOST_VDPA_GET_CONFIG, v_config); 463108a6481SCindy Lu memcpy(config, v_config->buf, config_len); 464108a6481SCindy Lu g_free(v_config); 465778e67deSLaurent Vivier if (trace_event_get_state_backends(TRACE_VHOST_VDPA_GET_CONFIG) && 466778e67deSLaurent Vivier trace_event_get_state_backends(TRACE_VHOST_VDPA_DUMP_CONFIG)) { 467778e67deSLaurent Vivier vhost_vdpa_dump_config(dev, config, config_len); 468778e67deSLaurent Vivier } 469108a6481SCindy Lu return ret; 470108a6481SCindy Lu } 471108a6481SCindy Lu 472108a6481SCindy Lu static int vhost_vdpa_dev_start(struct vhost_dev *dev, bool started) 473108a6481SCindy Lu { 474108a6481SCindy Lu struct vhost_vdpa *v = dev->opaque; 475778e67deSLaurent Vivier trace_vhost_vdpa_dev_start(dev, started); 476108a6481SCindy Lu if (started) { 477108a6481SCindy Lu uint8_t status = 0; 478108a6481SCindy Lu memory_listener_register(&v->listener, &address_space_memory); 479108a6481SCindy Lu vhost_vdpa_set_vring_ready(dev); 480108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_DRIVER_OK); 481108a6481SCindy Lu vhost_vdpa_call(dev, VHOST_VDPA_GET_STATUS, &status); 482108a6481SCindy Lu 483108a6481SCindy Lu return !(status & VIRTIO_CONFIG_S_DRIVER_OK); 484108a6481SCindy Lu } else { 485108a6481SCindy Lu vhost_vdpa_reset_device(dev); 486108a6481SCindy Lu vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | 487108a6481SCindy Lu VIRTIO_CONFIG_S_DRIVER); 488108a6481SCindy Lu memory_listener_unregister(&v->listener); 489108a6481SCindy Lu 490108a6481SCindy Lu return 0; 491108a6481SCindy Lu } 492108a6481SCindy Lu } 493108a6481SCindy Lu 494108a6481SCindy Lu static int vhost_vdpa_set_log_base(struct vhost_dev *dev, uint64_t base, 495108a6481SCindy Lu struct vhost_log *log) 496108a6481SCindy Lu { 497778e67deSLaurent Vivier trace_vhost_vdpa_set_log_base(dev, base, log->size, log->refcnt, log->fd, 498778e67deSLaurent Vivier log->log); 499108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_LOG_BASE, &base); 500108a6481SCindy Lu } 501108a6481SCindy Lu 502108a6481SCindy Lu static int vhost_vdpa_set_vring_addr(struct vhost_dev *dev, 503108a6481SCindy Lu struct vhost_vring_addr *addr) 504108a6481SCindy Lu { 505778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_addr(dev, addr->index, addr->flags, 506778e67deSLaurent Vivier addr->desc_user_addr, addr->used_user_addr, 507778e67deSLaurent Vivier addr->avail_user_addr, 508778e67deSLaurent Vivier addr->log_guest_addr); 509108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_ADDR, addr); 510108a6481SCindy Lu } 511108a6481SCindy Lu 512108a6481SCindy Lu static int vhost_vdpa_set_vring_num(struct vhost_dev *dev, 513108a6481SCindy Lu struct vhost_vring_state *ring) 514108a6481SCindy Lu { 515778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_num(dev, ring->index, ring->num); 516108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_NUM, ring); 517108a6481SCindy Lu } 518108a6481SCindy Lu 519108a6481SCindy Lu static int vhost_vdpa_set_vring_base(struct vhost_dev *dev, 520108a6481SCindy Lu struct vhost_vring_state *ring) 521108a6481SCindy Lu { 522778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_base(dev, ring->index, ring->num); 523108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_BASE, ring); 524108a6481SCindy Lu } 525108a6481SCindy Lu 526108a6481SCindy Lu static int vhost_vdpa_get_vring_base(struct vhost_dev *dev, 527108a6481SCindy Lu struct vhost_vring_state *ring) 528108a6481SCindy Lu { 529778e67deSLaurent Vivier int ret; 530778e67deSLaurent Vivier 531778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_GET_VRING_BASE, ring); 532778e67deSLaurent Vivier trace_vhost_vdpa_get_vring_base(dev, ring->index, ring->num); 533778e67deSLaurent Vivier return ret; 534108a6481SCindy Lu } 535108a6481SCindy Lu 536108a6481SCindy Lu static int vhost_vdpa_set_vring_kick(struct vhost_dev *dev, 537108a6481SCindy Lu struct vhost_vring_file *file) 538108a6481SCindy Lu { 539778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_kick(dev, file->index, file->fd); 540108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_KICK, file); 541108a6481SCindy Lu } 542108a6481SCindy Lu 543108a6481SCindy Lu static int vhost_vdpa_set_vring_call(struct vhost_dev *dev, 544108a6481SCindy Lu struct vhost_vring_file *file) 545108a6481SCindy Lu { 546778e67deSLaurent Vivier trace_vhost_vdpa_set_vring_call(dev, file->index, file->fd); 547108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_VRING_CALL, file); 548108a6481SCindy Lu } 549108a6481SCindy Lu 550108a6481SCindy Lu static int vhost_vdpa_get_features(struct vhost_dev *dev, 551108a6481SCindy Lu uint64_t *features) 552108a6481SCindy Lu { 553778e67deSLaurent Vivier int ret; 554778e67deSLaurent Vivier 555778e67deSLaurent Vivier ret = vhost_vdpa_call(dev, VHOST_GET_FEATURES, features); 556778e67deSLaurent Vivier trace_vhost_vdpa_get_features(dev, *features); 557778e67deSLaurent Vivier return ret; 558108a6481SCindy Lu } 559108a6481SCindy Lu 560108a6481SCindy Lu static int vhost_vdpa_set_owner(struct vhost_dev *dev) 561108a6481SCindy Lu { 562778e67deSLaurent Vivier trace_vhost_vdpa_set_owner(dev); 563108a6481SCindy Lu return vhost_vdpa_call(dev, VHOST_SET_OWNER, NULL); 564108a6481SCindy Lu } 565108a6481SCindy Lu 566108a6481SCindy Lu static int vhost_vdpa_vq_get_addr(struct vhost_dev *dev, 567108a6481SCindy Lu struct vhost_vring_addr *addr, struct vhost_virtqueue *vq) 568108a6481SCindy Lu { 569108a6481SCindy Lu assert(dev->vhost_ops->backend_type == VHOST_BACKEND_TYPE_VDPA); 570108a6481SCindy Lu addr->desc_user_addr = (uint64_t)(unsigned long)vq->desc_phys; 571108a6481SCindy Lu addr->avail_user_addr = (uint64_t)(unsigned long)vq->avail_phys; 572108a6481SCindy Lu addr->used_user_addr = (uint64_t)(unsigned long)vq->used_phys; 573778e67deSLaurent Vivier trace_vhost_vdpa_vq_get_addr(dev, vq, addr->desc_user_addr, 574778e67deSLaurent Vivier addr->avail_user_addr, addr->used_user_addr); 575108a6481SCindy Lu return 0; 576108a6481SCindy Lu } 577108a6481SCindy Lu 578108a6481SCindy Lu static bool vhost_vdpa_force_iommu(struct vhost_dev *dev) 579108a6481SCindy Lu { 580108a6481SCindy Lu return true; 581108a6481SCindy Lu } 582108a6481SCindy Lu 583108a6481SCindy Lu const VhostOps vdpa_ops = { 584108a6481SCindy Lu .backend_type = VHOST_BACKEND_TYPE_VDPA, 585108a6481SCindy Lu .vhost_backend_init = vhost_vdpa_init, 586108a6481SCindy Lu .vhost_backend_cleanup = vhost_vdpa_cleanup, 587108a6481SCindy Lu .vhost_set_log_base = vhost_vdpa_set_log_base, 588108a6481SCindy Lu .vhost_set_vring_addr = vhost_vdpa_set_vring_addr, 589108a6481SCindy Lu .vhost_set_vring_num = vhost_vdpa_set_vring_num, 590108a6481SCindy Lu .vhost_set_vring_base = vhost_vdpa_set_vring_base, 591108a6481SCindy Lu .vhost_get_vring_base = vhost_vdpa_get_vring_base, 592108a6481SCindy Lu .vhost_set_vring_kick = vhost_vdpa_set_vring_kick, 593108a6481SCindy Lu .vhost_set_vring_call = vhost_vdpa_set_vring_call, 594108a6481SCindy Lu .vhost_get_features = vhost_vdpa_get_features, 595a5bd0580SJason Wang .vhost_set_backend_cap = vhost_vdpa_set_backend_cap, 596108a6481SCindy Lu .vhost_set_owner = vhost_vdpa_set_owner, 597108a6481SCindy Lu .vhost_set_vring_endian = NULL, 598108a6481SCindy Lu .vhost_backend_memslots_limit = vhost_vdpa_memslots_limit, 599108a6481SCindy Lu .vhost_set_mem_table = vhost_vdpa_set_mem_table, 600108a6481SCindy Lu .vhost_set_features = vhost_vdpa_set_features, 601108a6481SCindy Lu .vhost_reset_device = vhost_vdpa_reset_device, 602108a6481SCindy Lu .vhost_get_vq_index = vhost_vdpa_get_vq_index, 603108a6481SCindy Lu .vhost_get_config = vhost_vdpa_get_config, 604108a6481SCindy Lu .vhost_set_config = vhost_vdpa_set_config, 605108a6481SCindy Lu .vhost_requires_shm_log = NULL, 606108a6481SCindy Lu .vhost_migration_done = NULL, 607108a6481SCindy Lu .vhost_backend_can_merge = NULL, 608108a6481SCindy Lu .vhost_net_set_mtu = NULL, 609108a6481SCindy Lu .vhost_set_iotlb_callback = NULL, 610108a6481SCindy Lu .vhost_send_device_iotlb_msg = NULL, 611108a6481SCindy Lu .vhost_dev_start = vhost_vdpa_dev_start, 612108a6481SCindy Lu .vhost_get_device_id = vhost_vdpa_get_device_id, 613108a6481SCindy Lu .vhost_vq_get_addr = vhost_vdpa_vq_get_addr, 614108a6481SCindy Lu .vhost_force_iommu = vhost_vdpa_force_iommu, 615108a6481SCindy Lu }; 616