1 /* 2 * VFIO BASE CONTAINER 3 * 4 * Copyright (C) 2023 Intel Corporation. 5 * Copyright Red Hat, Inc. 2023 6 * 7 * Authors: Yi Liu <yi.l.liu@intel.com> 8 * Eric Auger <eric.auger@redhat.com> 9 * 10 * SPDX-License-Identifier: GPL-2.0-or-later 11 */ 12 13 #ifndef HW_VFIO_VFIO_CONTAINER_BASE_H 14 #define HW_VFIO_VFIO_CONTAINER_BASE_H 15 16 #include "system/memory.h" 17 18 typedef struct VFIODevice VFIODevice; 19 typedef struct VFIOIOMMUClass VFIOIOMMUClass; 20 21 typedef struct { 22 unsigned long *bitmap; 23 hwaddr size; 24 hwaddr pages; 25 } VFIOBitmap; 26 27 typedef struct VFIOAddressSpace { 28 AddressSpace *as; 29 QLIST_HEAD(, VFIOContainerBase) containers; 30 QLIST_ENTRY(VFIOAddressSpace) list; 31 } VFIOAddressSpace; 32 33 /* 34 * This is the base object for vfio container backends 35 */ 36 typedef struct VFIOContainerBase { 37 Object parent; 38 VFIOAddressSpace *space; 39 MemoryListener listener; 40 Error *error; 41 bool initialized; 42 uint64_t dirty_pgsizes; 43 uint64_t max_dirty_bitmap_size; 44 unsigned long pgsizes; 45 unsigned int dma_max_mappings; 46 bool dirty_pages_supported; 47 bool dirty_pages_started; /* Protected by BQL */ 48 QLIST_HEAD(, VFIOGuestIOMMU) giommu_list; 49 QLIST_HEAD(, VFIORamDiscardListener) vrdl_list; 50 QLIST_ENTRY(VFIOContainerBase) next; 51 QLIST_HEAD(, VFIODevice) device_list; 52 GList *iova_ranges; 53 NotifierWithReturn cpr_reboot_notifier; 54 } VFIOContainerBase; 55 56 typedef struct VFIOGuestIOMMU { 57 VFIOContainerBase *bcontainer; 58 IOMMUMemoryRegion *iommu_mr; 59 hwaddr iommu_offset; 60 IOMMUNotifier n; 61 QLIST_ENTRY(VFIOGuestIOMMU) giommu_next; 62 } VFIOGuestIOMMU; 63 64 typedef struct VFIORamDiscardListener { 65 VFIOContainerBase *bcontainer; 66 MemoryRegion *mr; 67 hwaddr offset_within_address_space; 68 hwaddr size; 69 uint64_t granularity; 70 RamDiscardListener listener; 71 QLIST_ENTRY(VFIORamDiscardListener) next; 72 } VFIORamDiscardListener; 73 74 VFIOAddressSpace *vfio_address_space_get(AddressSpace *as); 75 void vfio_address_space_put(VFIOAddressSpace *space); 76 void vfio_address_space_insert(VFIOAddressSpace *space, 77 VFIOContainerBase *bcontainer); 78 79 int vfio_container_dma_map(VFIOContainerBase *bcontainer, 80 hwaddr iova, ram_addr_t size, 81 void *vaddr, bool readonly, MemoryRegion *mr); 82 int vfio_container_dma_unmap(VFIOContainerBase *bcontainer, 83 hwaddr iova, ram_addr_t size, 84 IOMMUTLBEntry *iotlb, bool unmap_all); 85 bool vfio_container_add_section_window(VFIOContainerBase *bcontainer, 86 MemoryRegionSection *section, 87 Error **errp); 88 void vfio_container_del_section_window(VFIOContainerBase *bcontainer, 89 MemoryRegionSection *section); 90 int vfio_container_set_dirty_page_tracking(VFIOContainerBase *bcontainer, 91 bool start, Error **errp); 92 bool vfio_container_dirty_tracking_is_started( 93 const VFIOContainerBase *bcontainer); 94 bool vfio_container_devices_dirty_tracking_is_supported( 95 const VFIOContainerBase *bcontainer); 96 int vfio_container_query_dirty_bitmap(const VFIOContainerBase *bcontainer, 97 uint64_t iova, uint64_t size, ram_addr_t ram_addr, Error **errp); 98 99 GList *vfio_container_get_iova_ranges(const VFIOContainerBase *bcontainer); 100 101 static inline uint64_t 102 vfio_container_get_page_size_mask(const VFIOContainerBase *bcontainer) 103 { 104 assert(bcontainer); 105 return bcontainer->pgsizes; 106 } 107 108 #define TYPE_VFIO_IOMMU "vfio-iommu" 109 #define TYPE_VFIO_IOMMU_LEGACY TYPE_VFIO_IOMMU "-legacy" 110 #define TYPE_VFIO_IOMMU_SPAPR TYPE_VFIO_IOMMU "-spapr" 111 #define TYPE_VFIO_IOMMU_IOMMUFD TYPE_VFIO_IOMMU "-iommufd" 112 113 OBJECT_DECLARE_TYPE(VFIOContainerBase, VFIOIOMMUClass, VFIO_IOMMU) 114 115 struct VFIOIOMMUClass { 116 ObjectClass parent_class; 117 118 /** 119 * @setup 120 * 121 * Perform basic setup of the container, including configuring IOMMU 122 * capabilities, IOVA ranges, supported page sizes, etc. 123 * 124 * @bcontainer: #VFIOContainerBase 125 * @errp: pointer to Error*, to store an error if it happens. 126 * 127 * Returns true to indicate success and false for error. 128 */ 129 bool (*setup)(VFIOContainerBase *bcontainer, Error **errp); 130 131 /** 132 * @listener_begin 133 * 134 * Called at the beginning of an address space update transaction. 135 * See #MemoryListener. 136 * 137 * @bcontainer: #VFIOContainerBase 138 */ 139 void (*listener_begin)(VFIOContainerBase *bcontainer); 140 141 /** 142 * @listener_commit 143 * 144 * Called at the end of an address space update transaction, 145 * See #MemoryListener. 146 * 147 * @bcontainer: #VFIOContainerBase 148 */ 149 void (*listener_commit)(VFIOContainerBase *bcontainer); 150 151 /** 152 * @dma_map 153 * 154 * Map an address range into the container. Note that the memory region is 155 * referenced within an RCU read lock region across this call. 156 * 157 * @bcontainer: #VFIOContainerBase to use 158 * @iova: start address to map 159 * @size: size of the range to map 160 * @vaddr: process virtual address of mapping 161 * @readonly: true if mapping should be readonly 162 * @mr: the memory region for this mapping 163 * 164 * Returns 0 to indicate success and -errno otherwise. 165 */ 166 int (*dma_map)(const VFIOContainerBase *bcontainer, 167 hwaddr iova, ram_addr_t size, 168 void *vaddr, bool readonly, MemoryRegion *mr); 169 /** 170 * @dma_unmap 171 * 172 * Unmap an address range from the container. 173 * 174 * @bcontainer: #VFIOContainerBase to use for unmap 175 * @iova: start address to unmap 176 * @size: size of the range to unmap 177 * @iotlb: The IOMMU TLB mapping entry (or NULL) 178 * @unmap_all: if set, unmap the entire address space 179 * 180 * Returns 0 to indicate success and -errno otherwise. 181 */ 182 int (*dma_unmap)(const VFIOContainerBase *bcontainer, 183 hwaddr iova, ram_addr_t size, 184 IOMMUTLBEntry *iotlb, bool unmap_all); 185 186 187 /** 188 * @attach_device 189 * 190 * Associate the given device with a container and do some related 191 * initialization of the device context. 192 * 193 * @name: name of the device 194 * @vbasedev: the device 195 * @as: address space to use 196 * @errp: pointer to Error*, to store an error if it happens. 197 * 198 * Returns true to indicate success and false for error. 199 */ 200 bool (*attach_device)(const char *name, VFIODevice *vbasedev, 201 AddressSpace *as, Error **errp); 202 203 /* 204 * @detach_device 205 * 206 * Detach the given device from its container and clean up any necessary 207 * state. 208 * 209 * @vbasedev: the device to disassociate 210 */ 211 void (*detach_device)(VFIODevice *vbasedev); 212 213 /* migration feature */ 214 215 /** 216 * @set_dirty_page_tracking 217 * 218 * Start or stop dirty pages tracking on VFIO container 219 * 220 * @bcontainer: #VFIOContainerBase on which to de/activate dirty 221 * page tracking 222 * @start: indicates whether to start or stop dirty pages tracking 223 * @errp: pointer to Error*, to store an error if it happens. 224 * 225 * Returns zero to indicate success and negative for error. 226 */ 227 int (*set_dirty_page_tracking)(const VFIOContainerBase *bcontainer, 228 bool start, Error **errp); 229 /** 230 * @query_dirty_bitmap 231 * 232 * Get bitmap of dirty pages from container 233 * 234 * @bcontainer: #VFIOContainerBase from which to get dirty pages 235 * @vbmap: #VFIOBitmap internal bitmap structure 236 * @iova: iova base address 237 * @size: size of iova range 238 * @errp: pointer to Error*, to store an error if it happens. 239 * 240 * Returns zero to indicate success and negative for error. 241 */ 242 int (*query_dirty_bitmap)(const VFIOContainerBase *bcontainer, 243 VFIOBitmap *vbmap, hwaddr iova, hwaddr size, Error **errp); 244 /* PCI specific */ 245 int (*pci_hot_reset)(VFIODevice *vbasedev, bool single); 246 247 /* SPAPR specific */ 248 bool (*add_window)(VFIOContainerBase *bcontainer, 249 MemoryRegionSection *section, 250 Error **errp); 251 void (*del_window)(VFIOContainerBase *bcontainer, 252 MemoryRegionSection *section); 253 void (*release)(VFIOContainerBase *bcontainer); 254 }; 255 256 VFIORamDiscardListener *vfio_find_ram_discard_listener( 257 VFIOContainerBase *bcontainer, MemoryRegionSection *section); 258 259 void vfio_container_region_add(VFIOContainerBase *bcontainer, 260 MemoryRegionSection *section, bool cpr_remap); 261 262 #endif /* HW_VFIO_VFIO_CONTAINER_BASE_H */ 263