xref: /qemu/hw/pci/msix.c (revision c759b24fae08c6c333df03e1db48e13b7f5eda30)
102eb84d0SMichael S. Tsirkin /*
202eb84d0SMichael S. Tsirkin  * MSI-X device support
302eb84d0SMichael S. Tsirkin  *
402eb84d0SMichael S. Tsirkin  * This module includes support for MSI-X in pci devices.
502eb84d0SMichael S. Tsirkin  *
602eb84d0SMichael S. Tsirkin  * Author: Michael S. Tsirkin <mst@redhat.com>
702eb84d0SMichael S. Tsirkin  *
802eb84d0SMichael S. Tsirkin  *  Copyright (c) 2009, Red Hat Inc, Michael S. Tsirkin (mst@redhat.com)
902eb84d0SMichael S. Tsirkin  *
1002eb84d0SMichael S. Tsirkin  * This work is licensed under the terms of the GNU GPL, version 2.  See
1102eb84d0SMichael S. Tsirkin  * the COPYING file in the top-level directory.
126b620ca3SPaolo Bonzini  *
136b620ca3SPaolo Bonzini  * Contributions after 2012-01-13 are licensed under the terms of the
146b620ca3SPaolo Bonzini  * GNU GPL, version 2 or (at your option) any later version.
1502eb84d0SMichael S. Tsirkin  */
1602eb84d0SMichael S. Tsirkin 
17*c759b24fSMichael S. Tsirkin #include "hw/hw.h"
18*c759b24fSMichael S. Tsirkin #include "hw/pci/msi.h"
19*c759b24fSMichael S. Tsirkin #include "hw/pci/msix.h"
20*c759b24fSMichael S. Tsirkin #include "hw/pci/pci.h"
21bf1b0071SBlue Swirl #include "range.h"
2202eb84d0SMichael S. Tsirkin 
2302eb84d0SMichael S. Tsirkin #define MSIX_CAP_LENGTH 12
2402eb84d0SMichael S. Tsirkin 
252760952bSMichael S. Tsirkin /* MSI enable bit and maskall bit are in byte 1 in FLAGS register */
262760952bSMichael S. Tsirkin #define MSIX_CONTROL_OFFSET (PCI_MSIX_FLAGS + 1)
2702eb84d0SMichael S. Tsirkin #define MSIX_ENABLE_MASK (PCI_MSIX_FLAGS_ENABLE >> 8)
285b5cb086SMichael S. Tsirkin #define MSIX_MASKALL_MASK (PCI_MSIX_FLAGS_MASKALL >> 8)
2902eb84d0SMichael S. Tsirkin 
30bc4caf49SJan Kiszka static MSIMessage msix_get_message(PCIDevice *dev, unsigned vector)
31bc4caf49SJan Kiszka {
32d35e428cSAlex Williamson     uint8_t *table_entry = dev->msix_table + vector * PCI_MSIX_ENTRY_SIZE;
33bc4caf49SJan Kiszka     MSIMessage msg;
34bc4caf49SJan Kiszka 
35bc4caf49SJan Kiszka     msg.address = pci_get_quad(table_entry + PCI_MSIX_ENTRY_LOWER_ADDR);
36bc4caf49SJan Kiszka     msg.data = pci_get_long(table_entry + PCI_MSIX_ENTRY_DATA);
37bc4caf49SJan Kiszka     return msg;
38bc4caf49SJan Kiszka }
3902eb84d0SMichael S. Tsirkin 
40932d4a42SAlexey Kardashevskiy /*
41932d4a42SAlexey Kardashevskiy  * Special API for POWER to configure the vectors through
42932d4a42SAlexey Kardashevskiy  * a side channel. Should never be used by devices.
43932d4a42SAlexey Kardashevskiy  */
44932d4a42SAlexey Kardashevskiy void msix_set_message(PCIDevice *dev, int vector, struct MSIMessage msg)
45932d4a42SAlexey Kardashevskiy {
46932d4a42SAlexey Kardashevskiy     uint8_t *table_entry = dev->msix_table + vector * PCI_MSIX_ENTRY_SIZE;
47932d4a42SAlexey Kardashevskiy 
48932d4a42SAlexey Kardashevskiy     pci_set_quad(table_entry + PCI_MSIX_ENTRY_LOWER_ADDR, msg.address);
49932d4a42SAlexey Kardashevskiy     pci_set_long(table_entry + PCI_MSIX_ENTRY_DATA, msg.data);
50932d4a42SAlexey Kardashevskiy     table_entry[PCI_MSIX_ENTRY_VECTOR_CTRL] &= ~PCI_MSIX_ENTRY_CTRL_MASKBIT;
51932d4a42SAlexey Kardashevskiy }
52932d4a42SAlexey Kardashevskiy 
5302eb84d0SMichael S. Tsirkin static uint8_t msix_pending_mask(int vector)
5402eb84d0SMichael S. Tsirkin {
5502eb84d0SMichael S. Tsirkin     return 1 << (vector % 8);
5602eb84d0SMichael S. Tsirkin }
5702eb84d0SMichael S. Tsirkin 
5802eb84d0SMichael S. Tsirkin static uint8_t *msix_pending_byte(PCIDevice *dev, int vector)
5902eb84d0SMichael S. Tsirkin {
60d35e428cSAlex Williamson     return dev->msix_pba + vector / 8;
6102eb84d0SMichael S. Tsirkin }
6202eb84d0SMichael S. Tsirkin 
6302eb84d0SMichael S. Tsirkin static int msix_is_pending(PCIDevice *dev, int vector)
6402eb84d0SMichael S. Tsirkin {
6502eb84d0SMichael S. Tsirkin     return *msix_pending_byte(dev, vector) & msix_pending_mask(vector);
6602eb84d0SMichael S. Tsirkin }
6702eb84d0SMichael S. Tsirkin 
6802eb84d0SMichael S. Tsirkin static void msix_set_pending(PCIDevice *dev, int vector)
6902eb84d0SMichael S. Tsirkin {
7002eb84d0SMichael S. Tsirkin     *msix_pending_byte(dev, vector) |= msix_pending_mask(vector);
7102eb84d0SMichael S. Tsirkin }
7202eb84d0SMichael S. Tsirkin 
7302eb84d0SMichael S. Tsirkin static void msix_clr_pending(PCIDevice *dev, int vector)
7402eb84d0SMichael S. Tsirkin {
7502eb84d0SMichael S. Tsirkin     *msix_pending_byte(dev, vector) &= ~msix_pending_mask(vector);
7602eb84d0SMichael S. Tsirkin }
7702eb84d0SMichael S. Tsirkin 
78ae392c41SMichael S. Tsirkin static bool msix_vector_masked(PCIDevice *dev, int vector, bool fmask)
7902eb84d0SMichael S. Tsirkin {
80ae392c41SMichael S. Tsirkin     unsigned offset = vector * PCI_MSIX_ENTRY_SIZE + PCI_MSIX_ENTRY_VECTOR_CTRL;
81d35e428cSAlex Williamson     return fmask || dev->msix_table[offset] & PCI_MSIX_ENTRY_CTRL_MASKBIT;
825b5cb086SMichael S. Tsirkin }
835b5cb086SMichael S. Tsirkin 
84ae392c41SMichael S. Tsirkin static bool msix_is_masked(PCIDevice *dev, int vector)
855b5cb086SMichael S. Tsirkin {
86ae392c41SMichael S. Tsirkin     return msix_vector_masked(dev, vector, dev->msix_function_masked);
87ae392c41SMichael S. Tsirkin }
88ae392c41SMichael S. Tsirkin 
892cdfe53cSJan Kiszka static void msix_fire_vector_notifier(PCIDevice *dev,
902cdfe53cSJan Kiszka                                       unsigned int vector, bool is_masked)
912cdfe53cSJan Kiszka {
922cdfe53cSJan Kiszka     MSIMessage msg;
932cdfe53cSJan Kiszka     int ret;
942cdfe53cSJan Kiszka 
952cdfe53cSJan Kiszka     if (!dev->msix_vector_use_notifier) {
962cdfe53cSJan Kiszka         return;
972cdfe53cSJan Kiszka     }
982cdfe53cSJan Kiszka     if (is_masked) {
992cdfe53cSJan Kiszka         dev->msix_vector_release_notifier(dev, vector);
1002cdfe53cSJan Kiszka     } else {
1012cdfe53cSJan Kiszka         msg = msix_get_message(dev, vector);
1022cdfe53cSJan Kiszka         ret = dev->msix_vector_use_notifier(dev, vector, msg);
1032cdfe53cSJan Kiszka         assert(ret >= 0);
1042cdfe53cSJan Kiszka     }
1052cdfe53cSJan Kiszka }
1062cdfe53cSJan Kiszka 
107ae392c41SMichael S. Tsirkin static void msix_handle_mask_update(PCIDevice *dev, int vector, bool was_masked)
108ae392c41SMichael S. Tsirkin {
109ae392c41SMichael S. Tsirkin     bool is_masked = msix_is_masked(dev, vector);
1102cdfe53cSJan Kiszka 
111ae392c41SMichael S. Tsirkin     if (is_masked == was_masked) {
112ae392c41SMichael S. Tsirkin         return;
113ae392c41SMichael S. Tsirkin     }
114ae392c41SMichael S. Tsirkin 
1152cdfe53cSJan Kiszka     msix_fire_vector_notifier(dev, vector, is_masked);
1162cdfe53cSJan Kiszka 
117ae392c41SMichael S. Tsirkin     if (!is_masked && msix_is_pending(dev, vector)) {
1185b5cb086SMichael S. Tsirkin         msix_clr_pending(dev, vector);
1195b5cb086SMichael S. Tsirkin         msix_notify(dev, vector);
1205b5cb086SMichael S. Tsirkin     }
1215b5cb086SMichael S. Tsirkin }
1225b5cb086SMichael S. Tsirkin 
12350322249SMichael S. Tsirkin static void msix_update_function_masked(PCIDevice *dev)
12450322249SMichael S. Tsirkin {
12550322249SMichael S. Tsirkin     dev->msix_function_masked = !msix_enabled(dev) ||
12650322249SMichael S. Tsirkin         (dev->config[dev->msix_cap + MSIX_CONTROL_OFFSET] & MSIX_MASKALL_MASK);
12750322249SMichael S. Tsirkin }
12850322249SMichael S. Tsirkin 
1295b5cb086SMichael S. Tsirkin /* Handle MSI-X capability config write. */
1305b5cb086SMichael S. Tsirkin void msix_write_config(PCIDevice *dev, uint32_t addr,
1315b5cb086SMichael S. Tsirkin                        uint32_t val, int len)
1325b5cb086SMichael S. Tsirkin {
1335b5cb086SMichael S. Tsirkin     unsigned enable_pos = dev->msix_cap + MSIX_CONTROL_OFFSET;
1345b5cb086SMichael S. Tsirkin     int vector;
13550322249SMichael S. Tsirkin     bool was_masked;
1365b5cb086SMichael S. Tsirkin 
1377c9958b0SJan Kiszka     if (!msix_present(dev) || !range_covers_byte(addr, len, enable_pos)) {
1385b5cb086SMichael S. Tsirkin         return;
1395b5cb086SMichael S. Tsirkin     }
1405b5cb086SMichael S. Tsirkin 
14150322249SMichael S. Tsirkin     was_masked = dev->msix_function_masked;
14250322249SMichael S. Tsirkin     msix_update_function_masked(dev);
14350322249SMichael S. Tsirkin 
1445b5cb086SMichael S. Tsirkin     if (!msix_enabled(dev)) {
1455b5cb086SMichael S. Tsirkin         return;
1465b5cb086SMichael S. Tsirkin     }
1475b5cb086SMichael S. Tsirkin 
148e407bf13SIsaku Yamahata     pci_device_deassert_intx(dev);
1495b5cb086SMichael S. Tsirkin 
15050322249SMichael S. Tsirkin     if (dev->msix_function_masked == was_masked) {
1515b5cb086SMichael S. Tsirkin         return;
1525b5cb086SMichael S. Tsirkin     }
1535b5cb086SMichael S. Tsirkin 
1545b5cb086SMichael S. Tsirkin     for (vector = 0; vector < dev->msix_entries_nr; ++vector) {
155ae392c41SMichael S. Tsirkin         msix_handle_mask_update(dev, vector,
156ae392c41SMichael S. Tsirkin                                 msix_vector_masked(dev, vector, was_masked));
1575b5cb086SMichael S. Tsirkin     }
15802eb84d0SMichael S. Tsirkin }
15902eb84d0SMichael S. Tsirkin 
160a8170e5eSAvi Kivity static uint64_t msix_table_mmio_read(void *opaque, hwaddr addr,
161eebcb0a7SAlex Williamson                                      unsigned size)
162eebcb0a7SAlex Williamson {
163eebcb0a7SAlex Williamson     PCIDevice *dev = opaque;
164eebcb0a7SAlex Williamson 
165d35e428cSAlex Williamson     return pci_get_long(dev->msix_table + addr);
166eebcb0a7SAlex Williamson }
167eebcb0a7SAlex Williamson 
168a8170e5eSAvi Kivity static void msix_table_mmio_write(void *opaque, hwaddr addr,
16995524ae8SAvi Kivity                                   uint64_t val, unsigned size)
17002eb84d0SMichael S. Tsirkin {
17102eb84d0SMichael S. Tsirkin     PCIDevice *dev = opaque;
172d35e428cSAlex Williamson     int vector = addr / PCI_MSIX_ENTRY_SIZE;
173ae392c41SMichael S. Tsirkin     bool was_masked;
1749a93b617SMichael S. Tsirkin 
175ae392c41SMichael S. Tsirkin     was_masked = msix_is_masked(dev, vector);
176d35e428cSAlex Williamson     pci_set_long(dev->msix_table + addr, val);
177ae392c41SMichael S. Tsirkin     msix_handle_mask_update(dev, vector, was_masked);
17802eb84d0SMichael S. Tsirkin }
17902eb84d0SMichael S. Tsirkin 
180d35e428cSAlex Williamson static const MemoryRegionOps msix_table_mmio_ops = {
181d35e428cSAlex Williamson     .read = msix_table_mmio_read,
182d35e428cSAlex Williamson     .write = msix_table_mmio_write,
183d35e428cSAlex Williamson     /* TODO: MSIX should be LITTLE_ENDIAN. */
184d35e428cSAlex Williamson     .endianness = DEVICE_NATIVE_ENDIAN,
185d35e428cSAlex Williamson     .valid = {
186d35e428cSAlex Williamson         .min_access_size = 4,
187d35e428cSAlex Williamson         .max_access_size = 4,
188d35e428cSAlex Williamson     },
189d35e428cSAlex Williamson };
190d35e428cSAlex Williamson 
191a8170e5eSAvi Kivity static uint64_t msix_pba_mmio_read(void *opaque, hwaddr addr,
192d35e428cSAlex Williamson                                    unsigned size)
193d35e428cSAlex Williamson {
194d35e428cSAlex Williamson     PCIDevice *dev = opaque;
195d35e428cSAlex Williamson 
196d35e428cSAlex Williamson     return pci_get_long(dev->msix_pba + addr);
197d35e428cSAlex Williamson }
198d35e428cSAlex Williamson 
199d35e428cSAlex Williamson static const MemoryRegionOps msix_pba_mmio_ops = {
200d35e428cSAlex Williamson     .read = msix_pba_mmio_read,
2012cf62ad7SAlex Williamson     /* TODO: MSIX should be LITTLE_ENDIAN. */
20295524ae8SAvi Kivity     .endianness = DEVICE_NATIVE_ENDIAN,
20395524ae8SAvi Kivity     .valid = {
20495524ae8SAvi Kivity         .min_access_size = 4,
20595524ae8SAvi Kivity         .max_access_size = 4,
20695524ae8SAvi Kivity     },
20702eb84d0SMichael S. Tsirkin };
20802eb84d0SMichael S. Tsirkin 
209ae1be0bbSMichael S. Tsirkin static void msix_mask_all(struct PCIDevice *dev, unsigned nentries)
210ae1be0bbSMichael S. Tsirkin {
211ae1be0bbSMichael S. Tsirkin     int vector;
2125b5f1330SJan Kiszka 
213ae1be0bbSMichael S. Tsirkin     for (vector = 0; vector < nentries; ++vector) {
21401731cfbSJan Kiszka         unsigned offset =
21501731cfbSJan Kiszka             vector * PCI_MSIX_ENTRY_SIZE + PCI_MSIX_ENTRY_VECTOR_CTRL;
2165b5f1330SJan Kiszka         bool was_masked = msix_is_masked(dev, vector);
2175b5f1330SJan Kiszka 
218d35e428cSAlex Williamson         dev->msix_table[offset] |= PCI_MSIX_ENTRY_CTRL_MASKBIT;
2195b5f1330SJan Kiszka         msix_handle_mask_update(dev, vector, was_masked);
220ae1be0bbSMichael S. Tsirkin     }
221ae1be0bbSMichael S. Tsirkin }
222ae1be0bbSMichael S. Tsirkin 
2235a2c2029SAlex Williamson /* Initialize the MSI-X structures */
22402eb84d0SMichael S. Tsirkin int msix_init(struct PCIDevice *dev, unsigned short nentries,
2255a2c2029SAlex Williamson               MemoryRegion *table_bar, uint8_t table_bar_nr,
2265a2c2029SAlex Williamson               unsigned table_offset, MemoryRegion *pba_bar,
2275a2c2029SAlex Williamson               uint8_t pba_bar_nr, unsigned pba_offset, uint8_t cap_pos)
22802eb84d0SMichael S. Tsirkin {
2295a2c2029SAlex Williamson     int cap;
230d35e428cSAlex Williamson     unsigned table_size, pba_size;
2315a2c2029SAlex Williamson     uint8_t *config;
23202eb84d0SMichael S. Tsirkin 
23360ba3cc2SJan Kiszka     /* Nothing to do if MSI is not supported by interrupt controller */
23460ba3cc2SJan Kiszka     if (!msi_supported) {
23560ba3cc2SJan Kiszka         return -ENOTSUP;
23660ba3cc2SJan Kiszka     }
2375a2c2029SAlex Williamson 
2385a2c2029SAlex Williamson     if (nentries < 1 || nentries > PCI_MSIX_FLAGS_QSIZE + 1) {
23902eb84d0SMichael S. Tsirkin         return -EINVAL;
2405a2c2029SAlex Williamson     }
24102eb84d0SMichael S. Tsirkin 
242d35e428cSAlex Williamson     table_size = nentries * PCI_MSIX_ENTRY_SIZE;
243d35e428cSAlex Williamson     pba_size = QEMU_ALIGN_UP(nentries, 64) / 8;
244d35e428cSAlex Williamson 
2455a2c2029SAlex Williamson     /* Sanity test: table & pba don't overlap, fit within BARs, min aligned */
2465a2c2029SAlex Williamson     if ((table_bar_nr == pba_bar_nr &&
2475a2c2029SAlex Williamson          ranges_overlap(table_offset, table_size, pba_offset, pba_size)) ||
2485a2c2029SAlex Williamson         table_offset + table_size > memory_region_size(table_bar) ||
2495a2c2029SAlex Williamson         pba_offset + pba_size > memory_region_size(pba_bar) ||
2505a2c2029SAlex Williamson         (table_offset | pba_offset) & PCI_MSIX_FLAGS_BIRMASK) {
2515a2c2029SAlex Williamson         return -EINVAL;
2525a2c2029SAlex Williamson     }
2535a2c2029SAlex Williamson 
2545a2c2029SAlex Williamson     cap = pci_add_capability(dev, PCI_CAP_ID_MSIX, cap_pos, MSIX_CAP_LENGTH);
2555a2c2029SAlex Williamson     if (cap < 0) {
2565a2c2029SAlex Williamson         return cap;
2575a2c2029SAlex Williamson     }
2585a2c2029SAlex Williamson 
2595a2c2029SAlex Williamson     dev->msix_cap = cap;
2605a2c2029SAlex Williamson     dev->cap_present |= QEMU_PCI_CAP_MSIX;
2615a2c2029SAlex Williamson     config = dev->config + cap;
2625a2c2029SAlex Williamson 
2635a2c2029SAlex Williamson     pci_set_word(config + PCI_MSIX_FLAGS, nentries - 1);
2645a2c2029SAlex Williamson     dev->msix_entries_nr = nentries;
2655a2c2029SAlex Williamson     dev->msix_function_masked = true;
2665a2c2029SAlex Williamson 
2675a2c2029SAlex Williamson     pci_set_long(config + PCI_MSIX_TABLE, table_offset | table_bar_nr);
2685a2c2029SAlex Williamson     pci_set_long(config + PCI_MSIX_PBA, pba_offset | pba_bar_nr);
2695a2c2029SAlex Williamson 
2705a2c2029SAlex Williamson     /* Make flags bit writable. */
2715a2c2029SAlex Williamson     dev->wmask[cap + MSIX_CONTROL_OFFSET] |= MSIX_ENABLE_MASK |
2725a2c2029SAlex Williamson                                              MSIX_MASKALL_MASK;
27302eb84d0SMichael S. Tsirkin 
274d35e428cSAlex Williamson     dev->msix_table = g_malloc0(table_size);
275d35e428cSAlex Williamson     dev->msix_pba = g_malloc0(pba_size);
2765a2c2029SAlex Williamson     dev->msix_entry_used = g_malloc0(nentries * sizeof *dev->msix_entry_used);
2775a2c2029SAlex Williamson 
278ae1be0bbSMichael S. Tsirkin     msix_mask_all(dev, nentries);
27902eb84d0SMichael S. Tsirkin 
280d35e428cSAlex Williamson     memory_region_init_io(&dev->msix_table_mmio, &msix_table_mmio_ops, dev,
281d35e428cSAlex Williamson                           "msix-table", table_size);
2825a2c2029SAlex Williamson     memory_region_add_subregion(table_bar, table_offset, &dev->msix_table_mmio);
283d35e428cSAlex Williamson     memory_region_init_io(&dev->msix_pba_mmio, &msix_pba_mmio_ops, dev,
284d35e428cSAlex Williamson                           "msix-pba", pba_size);
2855a2c2029SAlex Williamson     memory_region_add_subregion(pba_bar, pba_offset, &dev->msix_pba_mmio);
28602eb84d0SMichael S. Tsirkin 
28702eb84d0SMichael S. Tsirkin     return 0;
28802eb84d0SMichael S. Tsirkin }
28902eb84d0SMichael S. Tsirkin 
29053f94925SAlex Williamson int msix_init_exclusive_bar(PCIDevice *dev, unsigned short nentries,
29153f94925SAlex Williamson                             uint8_t bar_nr)
29253f94925SAlex Williamson {
29353f94925SAlex Williamson     int ret;
29453f94925SAlex Williamson     char *name;
29553f94925SAlex Williamson 
29653f94925SAlex Williamson     /*
29753f94925SAlex Williamson      * Migration compatibility dictates that this remains a 4k
29853f94925SAlex Williamson      * BAR with the vector table in the lower half and PBA in
29953f94925SAlex Williamson      * the upper half.  Do not use these elsewhere!
30053f94925SAlex Williamson      */
30153f94925SAlex Williamson #define MSIX_EXCLUSIVE_BAR_SIZE 4096
3025a2c2029SAlex Williamson #define MSIX_EXCLUSIVE_BAR_TABLE_OFFSET 0
30353f94925SAlex Williamson #define MSIX_EXCLUSIVE_BAR_PBA_OFFSET (MSIX_EXCLUSIVE_BAR_SIZE / 2)
3045a2c2029SAlex Williamson #define MSIX_EXCLUSIVE_CAP_OFFSET 0
30553f94925SAlex Williamson 
30653f94925SAlex Williamson     if (nentries * PCI_MSIX_ENTRY_SIZE > MSIX_EXCLUSIVE_BAR_PBA_OFFSET) {
30753f94925SAlex Williamson         return -EINVAL;
30853f94925SAlex Williamson     }
30953f94925SAlex Williamson 
3105f893b4eSGerd Hoffmann     name = g_strdup_printf("%s-msix", dev->name);
31153f94925SAlex Williamson     memory_region_init(&dev->msix_exclusive_bar, name, MSIX_EXCLUSIVE_BAR_SIZE);
3125f893b4eSGerd Hoffmann     g_free(name);
31353f94925SAlex Williamson 
31453f94925SAlex Williamson     ret = msix_init(dev, nentries, &dev->msix_exclusive_bar, bar_nr,
3155a2c2029SAlex Williamson                     MSIX_EXCLUSIVE_BAR_TABLE_OFFSET, &dev->msix_exclusive_bar,
3165a2c2029SAlex Williamson                     bar_nr, MSIX_EXCLUSIVE_BAR_PBA_OFFSET,
3175a2c2029SAlex Williamson                     MSIX_EXCLUSIVE_CAP_OFFSET);
31853f94925SAlex Williamson     if (ret) {
31953f94925SAlex Williamson         memory_region_destroy(&dev->msix_exclusive_bar);
32053f94925SAlex Williamson         return ret;
32153f94925SAlex Williamson     }
32253f94925SAlex Williamson 
32353f94925SAlex Williamson     pci_register_bar(dev, bar_nr, PCI_BASE_ADDRESS_SPACE_MEMORY,
32453f94925SAlex Williamson                      &dev->msix_exclusive_bar);
32553f94925SAlex Williamson 
32653f94925SAlex Williamson     return 0;
32753f94925SAlex Williamson }
32853f94925SAlex Williamson 
32998304c84SMichael S. Tsirkin static void msix_free_irq_entries(PCIDevice *dev)
33098304c84SMichael S. Tsirkin {
33198304c84SMichael S. Tsirkin     int vector;
33298304c84SMichael S. Tsirkin 
33398304c84SMichael S. Tsirkin     for (vector = 0; vector < dev->msix_entries_nr; ++vector) {
33498304c84SMichael S. Tsirkin         dev->msix_entry_used[vector] = 0;
33598304c84SMichael S. Tsirkin         msix_clr_pending(dev, vector);
33698304c84SMichael S. Tsirkin     }
33798304c84SMichael S. Tsirkin }
33898304c84SMichael S. Tsirkin 
3393cac001eSMichael S. Tsirkin static void msix_clear_all_vectors(PCIDevice *dev)
3403cac001eSMichael S. Tsirkin {
3413cac001eSMichael S. Tsirkin     int vector;
3423cac001eSMichael S. Tsirkin 
3433cac001eSMichael S. Tsirkin     for (vector = 0; vector < dev->msix_entries_nr; ++vector) {
3443cac001eSMichael S. Tsirkin         msix_clr_pending(dev, vector);
3453cac001eSMichael S. Tsirkin     }
3463cac001eSMichael S. Tsirkin }
3473cac001eSMichael S. Tsirkin 
34802eb84d0SMichael S. Tsirkin /* Clean up resources for the device. */
349572992eeSAlex Williamson void msix_uninit(PCIDevice *dev, MemoryRegion *table_bar, MemoryRegion *pba_bar)
35002eb84d0SMichael S. Tsirkin {
35144701ab7SJan Kiszka     if (!msix_present(dev)) {
352572992eeSAlex Williamson         return;
35344701ab7SJan Kiszka     }
35402eb84d0SMichael S. Tsirkin     pci_del_capability(dev, PCI_CAP_ID_MSIX, MSIX_CAP_LENGTH);
35502eb84d0SMichael S. Tsirkin     dev->msix_cap = 0;
35602eb84d0SMichael S. Tsirkin     msix_free_irq_entries(dev);
35702eb84d0SMichael S. Tsirkin     dev->msix_entries_nr = 0;
3585a2c2029SAlex Williamson     memory_region_del_subregion(pba_bar, &dev->msix_pba_mmio);
359d35e428cSAlex Williamson     memory_region_destroy(&dev->msix_pba_mmio);
360d35e428cSAlex Williamson     g_free(dev->msix_pba);
361d35e428cSAlex Williamson     dev->msix_pba = NULL;
3625a2c2029SAlex Williamson     memory_region_del_subregion(table_bar, &dev->msix_table_mmio);
363d35e428cSAlex Williamson     memory_region_destroy(&dev->msix_table_mmio);
364d35e428cSAlex Williamson     g_free(dev->msix_table);
365d35e428cSAlex Williamson     dev->msix_table = NULL;
3667267c094SAnthony Liguori     g_free(dev->msix_entry_used);
36702eb84d0SMichael S. Tsirkin     dev->msix_entry_used = NULL;
36802eb84d0SMichael S. Tsirkin     dev->cap_present &= ~QEMU_PCI_CAP_MSIX;
36902eb84d0SMichael S. Tsirkin }
37002eb84d0SMichael S. Tsirkin 
37153f94925SAlex Williamson void msix_uninit_exclusive_bar(PCIDevice *dev)
37253f94925SAlex Williamson {
37353f94925SAlex Williamson     if (msix_present(dev)) {
3745a2c2029SAlex Williamson         msix_uninit(dev, &dev->msix_exclusive_bar, &dev->msix_exclusive_bar);
37553f94925SAlex Williamson         memory_region_destroy(&dev->msix_exclusive_bar);
37653f94925SAlex Williamson     }
37753f94925SAlex Williamson }
37853f94925SAlex Williamson 
37902eb84d0SMichael S. Tsirkin void msix_save(PCIDevice *dev, QEMUFile *f)
38002eb84d0SMichael S. Tsirkin {
3819a3e12c8SMichael S. Tsirkin     unsigned n = dev->msix_entries_nr;
3829a3e12c8SMichael S. Tsirkin 
38344701ab7SJan Kiszka     if (!msix_present(dev)) {
3849a3e12c8SMichael S. Tsirkin         return;
38572755a70SMichael S. Tsirkin     }
3869a3e12c8SMichael S. Tsirkin 
387d35e428cSAlex Williamson     qemu_put_buffer(f, dev->msix_table, n * PCI_MSIX_ENTRY_SIZE);
388d35e428cSAlex Williamson     qemu_put_buffer(f, dev->msix_pba, (n + 7) / 8);
38902eb84d0SMichael S. Tsirkin }
39002eb84d0SMichael S. Tsirkin 
39102eb84d0SMichael S. Tsirkin /* Should be called after restoring the config space. */
39202eb84d0SMichael S. Tsirkin void msix_load(PCIDevice *dev, QEMUFile *f)
39302eb84d0SMichael S. Tsirkin {
39402eb84d0SMichael S. Tsirkin     unsigned n = dev->msix_entries_nr;
3952cdfe53cSJan Kiszka     unsigned int vector;
39602eb84d0SMichael S. Tsirkin 
39744701ab7SJan Kiszka     if (!msix_present(dev)) {
39802eb84d0SMichael S. Tsirkin         return;
39998846d73SBlue Swirl     }
40002eb84d0SMichael S. Tsirkin 
4013cac001eSMichael S. Tsirkin     msix_clear_all_vectors(dev);
402d35e428cSAlex Williamson     qemu_get_buffer(f, dev->msix_table, n * PCI_MSIX_ENTRY_SIZE);
403d35e428cSAlex Williamson     qemu_get_buffer(f, dev->msix_pba, (n + 7) / 8);
40450322249SMichael S. Tsirkin     msix_update_function_masked(dev);
4052cdfe53cSJan Kiszka 
4062cdfe53cSJan Kiszka     for (vector = 0; vector < n; vector++) {
4072cdfe53cSJan Kiszka         msix_handle_mask_update(dev, vector, true);
4082cdfe53cSJan Kiszka     }
40902eb84d0SMichael S. Tsirkin }
41002eb84d0SMichael S. Tsirkin 
41102eb84d0SMichael S. Tsirkin /* Does device support MSI-X? */
41202eb84d0SMichael S. Tsirkin int msix_present(PCIDevice *dev)
41302eb84d0SMichael S. Tsirkin {
41402eb84d0SMichael S. Tsirkin     return dev->cap_present & QEMU_PCI_CAP_MSIX;
41502eb84d0SMichael S. Tsirkin }
41602eb84d0SMichael S. Tsirkin 
41702eb84d0SMichael S. Tsirkin /* Is MSI-X enabled? */
41802eb84d0SMichael S. Tsirkin int msix_enabled(PCIDevice *dev)
41902eb84d0SMichael S. Tsirkin {
42002eb84d0SMichael S. Tsirkin     return (dev->cap_present & QEMU_PCI_CAP_MSIX) &&
4212760952bSMichael S. Tsirkin         (dev->config[dev->msix_cap + MSIX_CONTROL_OFFSET] &
42202eb84d0SMichael S. Tsirkin          MSIX_ENABLE_MASK);
42302eb84d0SMichael S. Tsirkin }
42402eb84d0SMichael S. Tsirkin 
42502eb84d0SMichael S. Tsirkin /* Send an MSI-X message */
42602eb84d0SMichael S. Tsirkin void msix_notify(PCIDevice *dev, unsigned vector)
42702eb84d0SMichael S. Tsirkin {
428bc4caf49SJan Kiszka     MSIMessage msg;
42902eb84d0SMichael S. Tsirkin 
43002eb84d0SMichael S. Tsirkin     if (vector >= dev->msix_entries_nr || !dev->msix_entry_used[vector])
43102eb84d0SMichael S. Tsirkin         return;
43202eb84d0SMichael S. Tsirkin     if (msix_is_masked(dev, vector)) {
43302eb84d0SMichael S. Tsirkin         msix_set_pending(dev, vector);
43402eb84d0SMichael S. Tsirkin         return;
43502eb84d0SMichael S. Tsirkin     }
43602eb84d0SMichael S. Tsirkin 
437bc4caf49SJan Kiszka     msg = msix_get_message(dev, vector);
438bc4caf49SJan Kiszka 
439bc4caf49SJan Kiszka     stl_le_phys(msg.address, msg.data);
44002eb84d0SMichael S. Tsirkin }
44102eb84d0SMichael S. Tsirkin 
44202eb84d0SMichael S. Tsirkin void msix_reset(PCIDevice *dev)
44302eb84d0SMichael S. Tsirkin {
44444701ab7SJan Kiszka     if (!msix_present(dev)) {
44502eb84d0SMichael S. Tsirkin         return;
44644701ab7SJan Kiszka     }
4473cac001eSMichael S. Tsirkin     msix_clear_all_vectors(dev);
4482760952bSMichael S. Tsirkin     dev->config[dev->msix_cap + MSIX_CONTROL_OFFSET] &=
4492760952bSMichael S. Tsirkin 	    ~dev->wmask[dev->msix_cap + MSIX_CONTROL_OFFSET];
450d35e428cSAlex Williamson     memset(dev->msix_table, 0, dev->msix_entries_nr * PCI_MSIX_ENTRY_SIZE);
451d35e428cSAlex Williamson     memset(dev->msix_pba, 0, QEMU_ALIGN_UP(dev->msix_entries_nr, 64) / 8);
452ae1be0bbSMichael S. Tsirkin     msix_mask_all(dev, dev->msix_entries_nr);
45302eb84d0SMichael S. Tsirkin }
45402eb84d0SMichael S. Tsirkin 
45502eb84d0SMichael S. Tsirkin /* PCI spec suggests that devices make it possible for software to configure
45602eb84d0SMichael S. Tsirkin  * less vectors than supported by the device, but does not specify a standard
45702eb84d0SMichael S. Tsirkin  * mechanism for devices to do so.
45802eb84d0SMichael S. Tsirkin  *
45902eb84d0SMichael S. Tsirkin  * We support this by asking devices to declare vectors software is going to
46002eb84d0SMichael S. Tsirkin  * actually use, and checking this on the notification path. Devices that
46102eb84d0SMichael S. Tsirkin  * don't want to follow the spec suggestion can declare all vectors as used. */
46202eb84d0SMichael S. Tsirkin 
46302eb84d0SMichael S. Tsirkin /* Mark vector as used. */
46402eb84d0SMichael S. Tsirkin int msix_vector_use(PCIDevice *dev, unsigned vector)
46502eb84d0SMichael S. Tsirkin {
46602eb84d0SMichael S. Tsirkin     if (vector >= dev->msix_entries_nr)
46702eb84d0SMichael S. Tsirkin         return -EINVAL;
46802eb84d0SMichael S. Tsirkin     dev->msix_entry_used[vector]++;
46902eb84d0SMichael S. Tsirkin     return 0;
47002eb84d0SMichael S. Tsirkin }
47102eb84d0SMichael S. Tsirkin 
47202eb84d0SMichael S. Tsirkin /* Mark vector as unused. */
47302eb84d0SMichael S. Tsirkin void msix_vector_unuse(PCIDevice *dev, unsigned vector)
47402eb84d0SMichael S. Tsirkin {
47598304c84SMichael S. Tsirkin     if (vector >= dev->msix_entries_nr || !dev->msix_entry_used[vector]) {
47698304c84SMichael S. Tsirkin         return;
47798304c84SMichael S. Tsirkin     }
47898304c84SMichael S. Tsirkin     if (--dev->msix_entry_used[vector]) {
47998304c84SMichael S. Tsirkin         return;
48098304c84SMichael S. Tsirkin     }
48198304c84SMichael S. Tsirkin     msix_clr_pending(dev, vector);
48202eb84d0SMichael S. Tsirkin }
483b5f28bcaSMichael S. Tsirkin 
484b5f28bcaSMichael S. Tsirkin void msix_unuse_all_vectors(PCIDevice *dev)
485b5f28bcaSMichael S. Tsirkin {
48644701ab7SJan Kiszka     if (!msix_present(dev)) {
487b5f28bcaSMichael S. Tsirkin         return;
48844701ab7SJan Kiszka     }
489b5f28bcaSMichael S. Tsirkin     msix_free_irq_entries(dev);
490b5f28bcaSMichael S. Tsirkin }
4912cdfe53cSJan Kiszka 
492cb697aaaSJan Kiszka unsigned int msix_nr_vectors_allocated(const PCIDevice *dev)
493cb697aaaSJan Kiszka {
494cb697aaaSJan Kiszka     return dev->msix_entries_nr;
495cb697aaaSJan Kiszka }
496cb697aaaSJan Kiszka 
4972cdfe53cSJan Kiszka static int msix_set_notifier_for_vector(PCIDevice *dev, unsigned int vector)
4982cdfe53cSJan Kiszka {
4992cdfe53cSJan Kiszka     MSIMessage msg;
5002cdfe53cSJan Kiszka 
5012cdfe53cSJan Kiszka     if (msix_is_masked(dev, vector)) {
5022cdfe53cSJan Kiszka         return 0;
5032cdfe53cSJan Kiszka     }
5042cdfe53cSJan Kiszka     msg = msix_get_message(dev, vector);
5052cdfe53cSJan Kiszka     return dev->msix_vector_use_notifier(dev, vector, msg);
5062cdfe53cSJan Kiszka }
5072cdfe53cSJan Kiszka 
5082cdfe53cSJan Kiszka static void msix_unset_notifier_for_vector(PCIDevice *dev, unsigned int vector)
5092cdfe53cSJan Kiszka {
5102cdfe53cSJan Kiszka     if (msix_is_masked(dev, vector)) {
5112cdfe53cSJan Kiszka         return;
5122cdfe53cSJan Kiszka     }
5132cdfe53cSJan Kiszka     dev->msix_vector_release_notifier(dev, vector);
5142cdfe53cSJan Kiszka }
5152cdfe53cSJan Kiszka 
5162cdfe53cSJan Kiszka int msix_set_vector_notifiers(PCIDevice *dev,
5172cdfe53cSJan Kiszka                               MSIVectorUseNotifier use_notifier,
5182cdfe53cSJan Kiszka                               MSIVectorReleaseNotifier release_notifier)
5192cdfe53cSJan Kiszka {
5202cdfe53cSJan Kiszka     int vector, ret;
5212cdfe53cSJan Kiszka 
5222cdfe53cSJan Kiszka     assert(use_notifier && release_notifier);
5232cdfe53cSJan Kiszka 
5242cdfe53cSJan Kiszka     dev->msix_vector_use_notifier = use_notifier;
5252cdfe53cSJan Kiszka     dev->msix_vector_release_notifier = release_notifier;
5262cdfe53cSJan Kiszka 
5272cdfe53cSJan Kiszka     if ((dev->config[dev->msix_cap + MSIX_CONTROL_OFFSET] &
5282cdfe53cSJan Kiszka         (MSIX_ENABLE_MASK | MSIX_MASKALL_MASK)) == MSIX_ENABLE_MASK) {
5292cdfe53cSJan Kiszka         for (vector = 0; vector < dev->msix_entries_nr; vector++) {
5302cdfe53cSJan Kiszka             ret = msix_set_notifier_for_vector(dev, vector);
5312cdfe53cSJan Kiszka             if (ret < 0) {
5322cdfe53cSJan Kiszka                 goto undo;
5332cdfe53cSJan Kiszka             }
5342cdfe53cSJan Kiszka         }
5352cdfe53cSJan Kiszka     }
5362cdfe53cSJan Kiszka     return 0;
5372cdfe53cSJan Kiszka 
5382cdfe53cSJan Kiszka undo:
5392cdfe53cSJan Kiszka     while (--vector >= 0) {
5402cdfe53cSJan Kiszka         msix_unset_notifier_for_vector(dev, vector);
5412cdfe53cSJan Kiszka     }
5422cdfe53cSJan Kiszka     dev->msix_vector_use_notifier = NULL;
5432cdfe53cSJan Kiszka     dev->msix_vector_release_notifier = NULL;
5442cdfe53cSJan Kiszka     return ret;
5452cdfe53cSJan Kiszka }
5462cdfe53cSJan Kiszka 
5472cdfe53cSJan Kiszka void msix_unset_vector_notifiers(PCIDevice *dev)
5482cdfe53cSJan Kiszka {
5492cdfe53cSJan Kiszka     int vector;
5502cdfe53cSJan Kiszka 
5512cdfe53cSJan Kiszka     assert(dev->msix_vector_use_notifier &&
5522cdfe53cSJan Kiszka            dev->msix_vector_release_notifier);
5532cdfe53cSJan Kiszka 
5542cdfe53cSJan Kiszka     if ((dev->config[dev->msix_cap + MSIX_CONTROL_OFFSET] &
5552cdfe53cSJan Kiszka         (MSIX_ENABLE_MASK | MSIX_MASKALL_MASK)) == MSIX_ENABLE_MASK) {
5562cdfe53cSJan Kiszka         for (vector = 0; vector < dev->msix_entries_nr; vector++) {
5572cdfe53cSJan Kiszka             msix_unset_notifier_for_vector(dev, vector);
5582cdfe53cSJan Kiszka         }
5592cdfe53cSJan Kiszka     }
5602cdfe53cSJan Kiszka     dev->msix_vector_use_notifier = NULL;
5612cdfe53cSJan Kiszka     dev->msix_vector_release_notifier = NULL;
5622cdfe53cSJan Kiszka }
563