xref: /kvmtool/virtio/pci.c (revision e47302846cc538386c6cb62e41da485876f8bed0)
136f5dc91SSasha Levin #include "kvm/virtio-pci.h"
236f5dc91SSasha Levin 
336f5dc91SSasha Levin #include "kvm/ioport.h"
436f5dc91SSasha Levin #include "kvm/kvm.h"
54123ca55SMarc Zyngier #include "kvm/kvm-cpu.h"
636f5dc91SSasha Levin #include "kvm/virtio-pci-dev.h"
736f5dc91SSasha Levin #include "kvm/irq.h"
836f5dc91SSasha Levin #include "kvm/virtio.h"
91599d724SSasha Levin #include "kvm/ioeventfd.h"
102e7380dbSMarc Zyngier #include "kvm/util.h"
1136f5dc91SSasha Levin 
1243c81c74SSasha Levin #include <sys/ioctl.h>
1336f5dc91SSasha Levin #include <linux/virtio_pci.h>
14aa73be70SMatt Evans #include <linux/byteorder.h>
155a8e4f25SAlexandru Elisei #include <assert.h>
1636f5dc91SSasha Levin #include <string.h>
1736f5dc91SSasha Levin 
182e7380dbSMarc Zyngier #define ALIGN_UP(x, s)		ALIGN((x) + (s) - 1, (s))
192e7380dbSMarc Zyngier #define VIRTIO_NR_MSIX		(VIRTIO_PCI_MAX_VQ + VIRTIO_PCI_MAX_CONFIG)
202e7380dbSMarc Zyngier #define VIRTIO_MSIX_TABLE_SIZE	(VIRTIO_NR_MSIX * 16)
212e7380dbSMarc Zyngier #define VIRTIO_MSIX_PBA_SIZE	(ALIGN_UP(VIRTIO_MSIX_TABLE_SIZE, 64) / 8)
222e7380dbSMarc Zyngier #define VIRTIO_MSIX_BAR_SIZE	(1UL << fls_long(VIRTIO_MSIX_TABLE_SIZE + \
232e7380dbSMarc Zyngier 						 VIRTIO_MSIX_PBA_SIZE))
242e7380dbSMarc Zyngier 
25e539f3e4SAlexandru Elisei static u16 virtio_pci__port_addr(struct virtio_pci *vpci)
26e539f3e4SAlexandru Elisei {
27e539f3e4SAlexandru Elisei 	return pci__bar_address(&vpci->pci_hdr, 0);
28e539f3e4SAlexandru Elisei }
29e539f3e4SAlexandru Elisei 
30e539f3e4SAlexandru Elisei static u32 virtio_pci__mmio_addr(struct virtio_pci *vpci)
31e539f3e4SAlexandru Elisei {
32e539f3e4SAlexandru Elisei 	return pci__bar_address(&vpci->pci_hdr, 1);
33e539f3e4SAlexandru Elisei }
34e539f3e4SAlexandru Elisei 
35e539f3e4SAlexandru Elisei static u32 virtio_pci__msix_io_addr(struct virtio_pci *vpci)
36e539f3e4SAlexandru Elisei {
37e539f3e4SAlexandru Elisei 	return pci__bar_address(&vpci->pci_hdr, 2);
38e539f3e4SAlexandru Elisei }
39e539f3e4SAlexandru Elisei 
401599d724SSasha Levin static void virtio_pci__ioevent_callback(struct kvm *kvm, void *param)
411599d724SSasha Levin {
421599d724SSasha Levin 	struct virtio_pci_ioevent_param *ioeventfd = param;
4302eca50cSAsias He 	struct virtio_pci *vpci = ioeventfd->vdev->virtio;
441599d724SSasha Levin 
4502eca50cSAsias He 	ioeventfd->vdev->ops->notify_vq(kvm, vpci->dev, ioeventfd->vq);
461599d724SSasha Levin }
471599d724SSasha Levin 
4802eca50cSAsias He static int virtio_pci__init_ioeventfd(struct kvm *kvm, struct virtio_device *vdev, u32 vq)
491599d724SSasha Levin {
501599d724SSasha Levin 	struct ioevent ioevent;
5102eca50cSAsias He 	struct virtio_pci *vpci = vdev->virtio;
52e539f3e4SAlexandru Elisei 	u32 mmio_addr = virtio_pci__mmio_addr(vpci);
53e539f3e4SAlexandru Elisei 	u16 port_addr = virtio_pci__port_addr(vpci);
540e1882a4SJean-Philippe Brucker 	int r, flags = 0;
550e1882a4SJean-Philippe Brucker 	int fd;
561599d724SSasha Levin 
571599d724SSasha Levin 	vpci->ioeventfds[vq] = (struct virtio_pci_ioevent_param) {
5802eca50cSAsias He 		.vdev		= vdev,
591599d724SSasha Levin 		.vq		= vq,
601599d724SSasha Levin 	};
611599d724SSasha Levin 
621599d724SSasha Levin 	ioevent = (struct ioevent) {
631599d724SSasha Levin 		.fn		= virtio_pci__ioevent_callback,
641599d724SSasha Levin 		.fn_ptr		= &vpci->ioeventfds[vq],
651599d724SSasha Levin 		.datamatch	= vq,
661599d724SSasha Levin 		.fn_kvm		= kvm,
671599d724SSasha Levin 	};
681599d724SSasha Levin 
69627d6874SAsias He 	/*
70a463650cSWill Deacon 	 * Vhost will poll the eventfd in host kernel side, otherwise we
71a463650cSWill Deacon 	 * need to poll in userspace.
72627d6874SAsias He 	 */
73a463650cSWill Deacon 	if (!vdev->use_vhost)
74a463650cSWill Deacon 		flags |= IOEVENTFD_FLAG_USER_POLL;
75a463650cSWill Deacon 
76a463650cSWill Deacon 	/* ioport */
77e539f3e4SAlexandru Elisei 	ioevent.io_addr	= port_addr + VIRTIO_PCI_QUEUE_NOTIFY;
78a463650cSWill Deacon 	ioevent.io_len	= sizeof(u16);
790e1882a4SJean-Philippe Brucker 	ioevent.fd	= fd = eventfd(0, 0);
8071ca0facSAndre Przywara 	r = ioeventfd__add_event(&ioevent, flags | IOEVENTFD_FLAG_PIO);
81ea6eeb1cSSasha Levin 	if (r)
82ea6eeb1cSSasha Levin 		return r;
831599d724SSasha Levin 
84a463650cSWill Deacon 	/* mmio */
85e539f3e4SAlexandru Elisei 	ioevent.io_addr	= mmio_addr + VIRTIO_PCI_QUEUE_NOTIFY;
86fe50bacbSAndreas Herrmann 	ioevent.io_len	= sizeof(u16);
870e1882a4SJean-Philippe Brucker 	ioevent.fd	= eventfd(0, 0);
88a463650cSWill Deacon 	r = ioeventfd__add_event(&ioevent, flags);
89a463650cSWill Deacon 	if (r)
90a463650cSWill Deacon 		goto free_ioport_evt;
91263b80e8SSasha Levin 
92a463650cSWill Deacon 	if (vdev->ops->notify_vq_eventfd)
930e1882a4SJean-Philippe Brucker 		vdev->ops->notify_vq_eventfd(kvm, vpci->dev, vq, fd);
941599d724SSasha Levin 	return 0;
95a463650cSWill Deacon 
96a463650cSWill Deacon free_ioport_evt:
97e539f3e4SAlexandru Elisei 	ioeventfd__del_event(port_addr + VIRTIO_PCI_QUEUE_NOTIFY, vq);
98a463650cSWill Deacon 	return r;
991599d724SSasha Levin }
1001599d724SSasha Levin 
101ad346c2eSJean-Philippe Brucker static void virtio_pci_exit_vq(struct kvm *kvm, struct virtio_device *vdev,
102ad346c2eSJean-Philippe Brucker 			       int vq)
103ad346c2eSJean-Philippe Brucker {
104ad346c2eSJean-Philippe Brucker 	struct virtio_pci *vpci = vdev->virtio;
105e539f3e4SAlexandru Elisei 	u32 mmio_addr = virtio_pci__mmio_addr(vpci);
106e539f3e4SAlexandru Elisei 	u16 port_addr = virtio_pci__port_addr(vpci);
107ad346c2eSJean-Philippe Brucker 
108e539f3e4SAlexandru Elisei 	ioeventfd__del_event(mmio_addr + VIRTIO_PCI_QUEUE_NOTIFY, vq);
109e539f3e4SAlexandru Elisei 	ioeventfd__del_event(port_addr + VIRTIO_PCI_QUEUE_NOTIFY, vq);
110ad346c2eSJean-Philippe Brucker 	virtio_exit_vq(kvm, vdev, vpci->dev, vq);
111ad346c2eSJean-Philippe Brucker }
112ad346c2eSJean-Philippe Brucker 
11306f48103SSasha Levin static inline bool virtio_pci__msix_enabled(struct virtio_pci *vpci)
11406f48103SSasha Levin {
115aa73be70SMatt Evans 	return vpci->pci_hdr.msix.ctrl & cpu_to_le16(PCI_MSIX_FLAGS_ENABLE);
11606f48103SSasha Levin }
11706f48103SSasha Levin 
118e09b599aSJulien Thierry static bool virtio_pci__specific_data_in(struct kvm *kvm, struct virtio_device *vdev,
11906e1e6feSMartin Radev 					 void *data, u32 size, unsigned long offset)
12036f5dc91SSasha Levin {
12136f5dc91SSasha Levin 	u32 config_offset;
12202eca50cSAsias He 	struct virtio_pci *vpci = vdev->virtio;
12306f48103SSasha Levin 	int type = virtio__get_dev_specific_field(offset - 20,
12406f48103SSasha Levin 							virtio_pci__msix_enabled(vpci),
1251382aba0SSasha Levin 							&config_offset);
12636f5dc91SSasha Levin 	if (type == VIRTIO_PCI_O_MSIX) {
12736f5dc91SSasha Levin 		switch (offset) {
12836f5dc91SSasha Levin 		case VIRTIO_MSI_CONFIG_VECTOR:
12936f5dc91SSasha Levin 			ioport__write16(data, vpci->config_vector);
13036f5dc91SSasha Levin 			break;
13136f5dc91SSasha Levin 		case VIRTIO_MSI_QUEUE_VECTOR:
13236f5dc91SSasha Levin 			ioport__write16(data, vpci->vq_vector[vpci->queue_selector]);
13336f5dc91SSasha Levin 			break;
13436f5dc91SSasha Levin 		};
13536f5dc91SSasha Levin 
13636f5dc91SSasha Levin 		return true;
13736f5dc91SSasha Levin 	} else if (type == VIRTIO_PCI_O_CONFIG) {
13836f5dc91SSasha Levin 		u8 cfg;
139*e4730284SMartin Radev 		size_t config_size;
14036f5dc91SSasha Levin 
141*e4730284SMartin Radev 		config_size = vdev->ops->get_config_size(kvm, vpci->dev);
142*e4730284SMartin Radev 		if (config_offset + size > config_size) {
143*e4730284SMartin Radev 			/* Access goes beyond the config size, so return failure. */
144*e4730284SMartin Radev 			WARN_ONCE(1, "Config access offset (%u) is beyond config size (%zu)\n",
145*e4730284SMartin Radev 				config_offset, config_size);
146*e4730284SMartin Radev 			return false;
147*e4730284SMartin Radev 		}
148*e4730284SMartin Radev 
149*e4730284SMartin Radev 		/* TODO: Handle access lengths beyond one byte */
150*e4730284SMartin Radev 		if (size != 1) {
151*e4730284SMartin Radev 			WARN_ONCE(1, "Size (%u) not supported\n", size);
152*e4730284SMartin Radev 			return false;
153*e4730284SMartin Radev 		}
154c5ae742bSSasha Levin 		cfg = vdev->ops->get_config(kvm, vpci->dev)[config_offset];
15536f5dc91SSasha Levin 		ioport__write8(data, cfg);
15636f5dc91SSasha Levin 		return true;
15736f5dc91SSasha Levin 	}
15836f5dc91SSasha Levin 
15936f5dc91SSasha Levin 	return false;
16036f5dc91SSasha Levin }
16136f5dc91SSasha Levin 
162e09b599aSJulien Thierry static bool virtio_pci__data_in(struct kvm_cpu *vcpu, struct virtio_device *vdev,
16306e1e6feSMartin Radev 				unsigned long offset, void *data, u32 size)
16436f5dc91SSasha Levin {
16536f5dc91SSasha Levin 	bool ret = true;
16636f5dc91SSasha Levin 	struct virtio_pci *vpci;
16753fbb17bSJean-Philippe Brucker 	struct virt_queue *vq;
1684123ca55SMarc Zyngier 	struct kvm *kvm;
16936f5dc91SSasha Levin 	u32 val;
17036f5dc91SSasha Levin 
1714123ca55SMarc Zyngier 	kvm = vcpu->kvm;
17202eca50cSAsias He 	vpci = vdev->virtio;
17336f5dc91SSasha Levin 
17436f5dc91SSasha Levin 	switch (offset) {
17536f5dc91SSasha Levin 	case VIRTIO_PCI_HOST_FEATURES:
17602eca50cSAsias He 		val = vdev->ops->get_host_features(kvm, vpci->dev);
17736f5dc91SSasha Levin 		ioport__write32(data, val);
17836f5dc91SSasha Levin 		break;
17936f5dc91SSasha Levin 	case VIRTIO_PCI_QUEUE_PFN:
18053fbb17bSJean-Philippe Brucker 		vq = vdev->ops->get_vq(kvm, vpci->dev, vpci->queue_selector);
18153fbb17bSJean-Philippe Brucker 		ioport__write32(data, vq->pfn);
18236f5dc91SSasha Levin 		break;
18336f5dc91SSasha Levin 	case VIRTIO_PCI_QUEUE_NUM:
18402eca50cSAsias He 		val = vdev->ops->get_size_vq(kvm, vpci->dev, vpci->queue_selector);
185657ee18bSMatt Evans 		ioport__write16(data, val);
18636f5dc91SSasha Levin 		break;
18736f5dc91SSasha Levin 	case VIRTIO_PCI_STATUS:
18836f5dc91SSasha Levin 		ioport__write8(data, vpci->status);
18936f5dc91SSasha Levin 		break;
19036f5dc91SSasha Levin 	case VIRTIO_PCI_ISR:
19136f5dc91SSasha Levin 		ioport__write8(data, vpci->isr);
192e9922aafSAndre Przywara 		kvm__irq_line(kvm, vpci->legacy_irq_line, VIRTIO_IRQ_LOW);
19336f5dc91SSasha Levin 		vpci->isr = VIRTIO_IRQ_LOW;
19436f5dc91SSasha Levin 		break;
19536f5dc91SSasha Levin 	default:
196e09b599aSJulien Thierry 		ret = virtio_pci__specific_data_in(kvm, vdev, data, size, offset);
19736f5dc91SSasha Levin 		break;
19836f5dc91SSasha Levin 	};
19936f5dc91SSasha Levin 
20036f5dc91SSasha Levin 	return ret;
20136f5dc91SSasha Levin }
20236f5dc91SSasha Levin 
2036518065aSAndre Przywara static void update_msix_map(struct virtio_pci *vpci,
2046518065aSAndre Przywara 			    struct msix_table *msix_entry, u32 vecnum)
2056518065aSAndre Przywara {
2066518065aSAndre Przywara 	u32 gsi, i;
2076518065aSAndre Przywara 
2086518065aSAndre Przywara 	/* Find the GSI number used for that vector */
2096518065aSAndre Przywara 	if (vecnum == vpci->config_vector) {
2106518065aSAndre Przywara 		gsi = vpci->config_gsi;
2116518065aSAndre Przywara 	} else {
2126518065aSAndre Przywara 		for (i = 0; i < VIRTIO_PCI_MAX_VQ; i++)
2136518065aSAndre Przywara 			if (vpci->vq_vector[i] == vecnum)
2146518065aSAndre Przywara 				break;
2156518065aSAndre Przywara 		if (i == VIRTIO_PCI_MAX_VQ)
2166518065aSAndre Przywara 			return;
2176518065aSAndre Przywara 		gsi = vpci->gsis[i];
2186518065aSAndre Przywara 	}
2196518065aSAndre Przywara 
2206518065aSAndre Przywara 	if (gsi == 0)
2216518065aSAndre Przywara 		return;
2226518065aSAndre Przywara 
2236518065aSAndre Przywara 	msix_entry = &msix_entry[vecnum];
2246518065aSAndre Przywara 	irq__update_msix_route(vpci->kvm, gsi, &msix_entry->msg);
2256518065aSAndre Przywara }
2266518065aSAndre Przywara 
227e09b599aSJulien Thierry static bool virtio_pci__specific_data_out(struct kvm *kvm, struct virtio_device *vdev,
22806e1e6feSMartin Radev 					  void *data, u32 size, unsigned long offset)
22936f5dc91SSasha Levin {
23002eca50cSAsias He 	struct virtio_pci *vpci = vdev->virtio;
2318ccc8549SAndre Przywara 	u32 config_offset, vec;
2328ccc8549SAndre Przywara 	int gsi;
23306f48103SSasha Levin 	int type = virtio__get_dev_specific_field(offset - 20, virtio_pci__msix_enabled(vpci),
2341382aba0SSasha Levin 							&config_offset);
23536f5dc91SSasha Levin 	if (type == VIRTIO_PCI_O_MSIX) {
23636f5dc91SSasha Levin 		switch (offset) {
23736f5dc91SSasha Levin 		case VIRTIO_MSI_CONFIG_VECTOR:
23836f5dc91SSasha Levin 			vec = vpci->config_vector = ioport__read16(data);
239f8327b05SSasha Levin 			if (vec == VIRTIO_MSI_NO_VECTOR)
240f8327b05SSasha Levin 				break;
24136f5dc91SSasha Levin 
2428ccc8549SAndre Przywara 			gsi = irq__add_msix_route(kvm,
243f9ef46f2SAndre Przywara 						  &vpci->msix_table[vec].msg,
244f9ef46f2SAndre Przywara 						  vpci->dev_hdr.dev_num << 3);
245928ab7acSAndre Przywara 			/*
246928ab7acSAndre Przywara 			 * We don't need IRQ routing if we can use
247928ab7acSAndre Przywara 			 * MSI injection via the KVM_SIGNAL_MSI ioctl.
248928ab7acSAndre Przywara 			 */
249928ab7acSAndre Przywara 			if (gsi == -ENXIO &&
250928ab7acSAndre Przywara 			    vpci->features & VIRTIO_PCI_F_SIGNAL_MSI)
251928ab7acSAndre Przywara 				break;
252928ab7acSAndre Przywara 
253928ab7acSAndre Przywara 			if (gsi < 0) {
254928ab7acSAndre Przywara 				die("failed to configure MSIs");
255928ab7acSAndre Przywara 				break;
256928ab7acSAndre Przywara 			}
257928ab7acSAndre Przywara 
25836f5dc91SSasha Levin 			vpci->config_gsi = gsi;
25936f5dc91SSasha Levin 			break;
2603a60be06SSasha Levin 		case VIRTIO_MSI_QUEUE_VECTOR:
2618ccc8549SAndre Przywara 			vec = ioport__read16(data);
2628ccc8549SAndre Przywara 			vpci->vq_vector[vpci->queue_selector] = vec;
26336f5dc91SSasha Levin 
264f8327b05SSasha Levin 			if (vec == VIRTIO_MSI_NO_VECTOR)
265f8327b05SSasha Levin 				break;
266f8327b05SSasha Levin 
2678ccc8549SAndre Przywara 			gsi = irq__add_msix_route(kvm,
268f9ef46f2SAndre Przywara 						  &vpci->msix_table[vec].msg,
269f9ef46f2SAndre Przywara 						  vpci->dev_hdr.dev_num << 3);
270928ab7acSAndre Przywara 			/*
271928ab7acSAndre Przywara 			 * We don't need IRQ routing if we can use
272928ab7acSAndre Przywara 			 * MSI injection via the KVM_SIGNAL_MSI ioctl.
273928ab7acSAndre Przywara 			 */
274928ab7acSAndre Przywara 			if (gsi == -ENXIO &&
275928ab7acSAndre Przywara 			    vpci->features & VIRTIO_PCI_F_SIGNAL_MSI)
2768ccc8549SAndre Przywara 				break;
277928ab7acSAndre Przywara 
278928ab7acSAndre Przywara 			if (gsi < 0) {
279928ab7acSAndre Przywara 				die("failed to configure MSIs");
280928ab7acSAndre Przywara 				break;
281928ab7acSAndre Przywara 			}
282928ab7acSAndre Przywara 
28336f5dc91SSasha Levin 			vpci->gsis[vpci->queue_selector] = gsi;
28402eca50cSAsias He 			if (vdev->ops->notify_vq_gsi)
28502eca50cSAsias He 				vdev->ops->notify_vq_gsi(kvm, vpci->dev,
2868ccc8549SAndre Przywara 							 vpci->queue_selector,
2878ccc8549SAndre Przywara 							 gsi);
28836f5dc91SSasha Levin 			break;
28936f5dc91SSasha Levin 		};
29036f5dc91SSasha Levin 
29136f5dc91SSasha Levin 		return true;
29236f5dc91SSasha Levin 	} else if (type == VIRTIO_PCI_O_CONFIG) {
293*e4730284SMartin Radev 		size_t config_size;
294*e4730284SMartin Radev 
295*e4730284SMartin Radev 		config_size = vdev->ops->get_config_size(kvm, vpci->dev);
296*e4730284SMartin Radev 		if (config_offset + size > config_size) {
297*e4730284SMartin Radev 			/* Access goes beyond the config size, so return failure. */
298*e4730284SMartin Radev 			WARN_ONCE(1, "Config access offset (%u) is beyond config size (%zu)\n",
299*e4730284SMartin Radev 				config_offset, config_size);
300*e4730284SMartin Radev 			return false;
301*e4730284SMartin Radev 		}
302*e4730284SMartin Radev 
303*e4730284SMartin Radev 		/* TODO: Handle access lengths beyond one byte */
304*e4730284SMartin Radev 		if (size != 1) {
305*e4730284SMartin Radev 			WARN_ONCE(1, "Size (%u) not supported\n", size);
306*e4730284SMartin Radev 			return false;
307*e4730284SMartin Radev 		}
308c5ae742bSSasha Levin 		vdev->ops->get_config(kvm, vpci->dev)[config_offset] = *(u8 *)data;
30936f5dc91SSasha Levin 
31036f5dc91SSasha Levin 		return true;
31136f5dc91SSasha Levin 	}
31236f5dc91SSasha Levin 
31336f5dc91SSasha Levin 	return false;
31436f5dc91SSasha Levin }
31536f5dc91SSasha Levin 
316e09b599aSJulien Thierry static bool virtio_pci__data_out(struct kvm_cpu *vcpu, struct virtio_device *vdev,
31706e1e6feSMartin Radev 				 unsigned long offset, void *data, u32 size)
31836f5dc91SSasha Levin {
31936f5dc91SSasha Levin 	bool ret = true;
32036f5dc91SSasha Levin 	struct virtio_pci *vpci;
3214123ca55SMarc Zyngier 	struct kvm *kvm;
32236f5dc91SSasha Levin 	u32 val;
32336f5dc91SSasha Levin 
3244123ca55SMarc Zyngier 	kvm = vcpu->kvm;
32502eca50cSAsias He 	vpci = vdev->virtio;
32636f5dc91SSasha Levin 
32736f5dc91SSasha Levin 	switch (offset) {
32836f5dc91SSasha Levin 	case VIRTIO_PCI_GUEST_FEATURES:
32936f5dc91SSasha Levin 		val = ioport__read32(data);
33056a16c90SJean-Philippe Brucker 		virtio_set_guest_features(kvm, vdev, vpci->dev, val);
33136f5dc91SSasha Levin 		break;
33236f5dc91SSasha Levin 	case VIRTIO_PCI_QUEUE_PFN:
33336f5dc91SSasha Levin 		val = ioport__read32(data);
334ad346c2eSJean-Philippe Brucker 		if (val) {
335ad346c2eSJean-Philippe Brucker 			virtio_pci__init_ioeventfd(kvm, vdev,
336ad346c2eSJean-Philippe Brucker 						   vpci->queue_selector);
337c59ba304SWill Deacon 			vdev->ops->init_vq(kvm, vpci->dev, vpci->queue_selector,
338c59ba304SWill Deacon 					   1 << VIRTIO_PCI_QUEUE_ADDR_SHIFT,
339c59ba304SWill Deacon 					   VIRTIO_PCI_VRING_ALIGN, val);
340ad346c2eSJean-Philippe Brucker 		} else {
341ad346c2eSJean-Philippe Brucker 			virtio_pci_exit_vq(kvm, vdev, vpci->queue_selector);
342ad346c2eSJean-Philippe Brucker 		}
34336f5dc91SSasha Levin 		break;
34436f5dc91SSasha Levin 	case VIRTIO_PCI_QUEUE_SEL:
34536f5dc91SSasha Levin 		vpci->queue_selector = ioport__read16(data);
34636f5dc91SSasha Levin 		break;
34736f5dc91SSasha Levin 	case VIRTIO_PCI_QUEUE_NOTIFY:
34836f5dc91SSasha Levin 		val = ioport__read16(data);
34902eca50cSAsias He 		vdev->ops->notify_vq(kvm, vpci->dev, val);
35036f5dc91SSasha Levin 		break;
35136f5dc91SSasha Levin 	case VIRTIO_PCI_STATUS:
35236f5dc91SSasha Levin 		vpci->status = ioport__read8(data);
3534123ca55SMarc Zyngier 		if (!vpci->status) /* Sample endianness on reset */
3544123ca55SMarc Zyngier 			vdev->endian = kvm_cpu__get_endianness(vcpu);
35595242e44SJean-Philippe Brucker 		virtio_notify_status(kvm, vdev, vpci->dev, vpci->status);
35636f5dc91SSasha Levin 		break;
35736f5dc91SSasha Levin 	default:
358e09b599aSJulien Thierry 		ret = virtio_pci__specific_data_out(kvm, vdev, data, size, offset);
35936f5dc91SSasha Levin 		break;
36036f5dc91SSasha Levin 	};
36136f5dc91SSasha Levin 
36236f5dc91SSasha Levin 	return ret;
36336f5dc91SSasha Levin }
36436f5dc91SSasha Levin 
3659b735910SMarc Zyngier static void virtio_pci__msix_mmio_callback(struct kvm_cpu *vcpu,
3669b735910SMarc Zyngier 					   u64 addr, u8 *data, u32 len,
367a463650cSWill Deacon 					   u8 is_write, void *ptr)
36836f5dc91SSasha Levin {
369e09b599aSJulien Thierry 	struct virtio_device *vdev = ptr;
370e09b599aSJulien Thierry 	struct virtio_pci *vpci = vdev->virtio;
3716518065aSAndre Przywara 	struct msix_table *table;
372e539f3e4SAlexandru Elisei 	u32 msix_io_addr = virtio_pci__msix_io_addr(vpci);
3732e7380dbSMarc Zyngier 	u32 pba_offset;
3746518065aSAndre Przywara 	int vecnum;
3756518065aSAndre Przywara 	size_t offset;
37636f5dc91SSasha Levin 
3772e7380dbSMarc Zyngier 	BUILD_BUG_ON(VIRTIO_NR_MSIX > (sizeof(vpci->msix_pba) * 8));
3782e7380dbSMarc Zyngier 
3792e7380dbSMarc Zyngier 	pba_offset = vpci->pci_hdr.msix.pba_offset & ~PCI_MSIX_TABLE_BIR;
3802e7380dbSMarc Zyngier 	if (addr >= msix_io_addr + pba_offset) {
3812e7380dbSMarc Zyngier 		/* Read access to PBA */
3826518065aSAndre Przywara 		if (is_write)
3836518065aSAndre Przywara 			return;
3842e7380dbSMarc Zyngier 		offset = addr - (msix_io_addr + pba_offset);
3852e7380dbSMarc Zyngier 		if ((offset + len) > sizeof (vpci->msix_pba))
3862e7380dbSMarc Zyngier 			return;
3872e7380dbSMarc Zyngier 		memcpy(data, (void *)&vpci->msix_pba + offset, len);
3882e7380dbSMarc Zyngier 		return;
3892e7380dbSMarc Zyngier 	}
3902e7380dbSMarc Zyngier 
3916518065aSAndre Przywara 	table  = vpci->msix_table;
392e539f3e4SAlexandru Elisei 	offset = addr - msix_io_addr;
3932e7380dbSMarc Zyngier 
3946518065aSAndre Przywara 	vecnum = offset / sizeof(struct msix_table);
3956518065aSAndre Przywara 	offset = offset % sizeof(struct msix_table);
3966518065aSAndre Przywara 
3976518065aSAndre Przywara 	if (!is_write) {
3986518065aSAndre Przywara 		memcpy(data, (void *)&table[vecnum] + offset, len);
3996518065aSAndre Przywara 		return;
40036f5dc91SSasha Levin 	}
40136f5dc91SSasha Levin 
4026518065aSAndre Przywara 	memcpy((void *)&table[vecnum] + offset, data, len);
4036518065aSAndre Przywara 
4046518065aSAndre Przywara 	/* Did we just update the address or payload? */
4056518065aSAndre Przywara 	if (offset < offsetof(struct msix_table, ctrl))
4066518065aSAndre Przywara 		update_msix_map(vpci, table, vecnum);
40706f48103SSasha Levin }
40806f48103SSasha Levin 
409714ab9e6SAndre Przywara static void virtio_pci__signal_msi(struct kvm *kvm, struct virtio_pci *vpci,
410714ab9e6SAndre Przywara 				   int vec)
41143c81c74SSasha Levin {
41243c81c74SSasha Levin 	struct kvm_msi msi = {
41343c81c74SSasha Levin 		.address_lo = vpci->msix_table[vec].msg.address_lo,
41443c81c74SSasha Levin 		.address_hi = vpci->msix_table[vec].msg.address_hi,
41543c81c74SSasha Levin 		.data = vpci->msix_table[vec].msg.data,
41643c81c74SSasha Levin 	};
41743c81c74SSasha Levin 
418714ab9e6SAndre Przywara 	if (kvm->msix_needs_devid) {
419714ab9e6SAndre Przywara 		msi.flags = KVM_MSI_VALID_DEVID;
420714ab9e6SAndre Przywara 		msi.devid = vpci->dev_hdr.dev_num << 3;
421714ab9e6SAndre Przywara 	}
422714ab9e6SAndre Przywara 
423f6108d72SJean-Philippe Brucker 	irq__signal_msi(kvm, &msi);
42443c81c74SSasha Levin }
42543c81c74SSasha Levin 
42602eca50cSAsias He int virtio_pci__signal_vq(struct kvm *kvm, struct virtio_device *vdev, u32 vq)
42736f5dc91SSasha Levin {
42802eca50cSAsias He 	struct virtio_pci *vpci = vdev->virtio;
42906f48103SSasha Levin 	int tbl = vpci->vq_vector[vq];
43036f5dc91SSasha Levin 
431f8327b05SSasha Levin 	if (virtio_pci__msix_enabled(vpci) && tbl != VIRTIO_MSI_NO_VECTOR) {
432aa73be70SMatt Evans 		if (vpci->pci_hdr.msix.ctrl & cpu_to_le16(PCI_MSIX_FLAGS_MASKALL) ||
433aa73be70SMatt Evans 		    vpci->msix_table[tbl].ctrl & cpu_to_le16(PCI_MSIX_ENTRY_CTRL_MASKBIT)) {
43406f48103SSasha Levin 
43506f48103SSasha Levin 			vpci->msix_pba |= 1 << tbl;
43606f48103SSasha Levin 			return 0;
43706f48103SSasha Levin 		}
43806f48103SSasha Levin 
43943c81c74SSasha Levin 		if (vpci->features & VIRTIO_PCI_F_SIGNAL_MSI)
44043c81c74SSasha Levin 			virtio_pci__signal_msi(kvm, vpci, vpci->vq_vector[vq]);
44143c81c74SSasha Levin 		else
44206f48103SSasha Levin 			kvm__irq_trigger(kvm, vpci->gsis[vq]);
44306f48103SSasha Levin 	} else {
444a36eca7bSSasha Levin 		vpci->isr = VIRTIO_IRQ_HIGH;
4452108c86dSMarc Zyngier 		kvm__irq_line(kvm, vpci->legacy_irq_line, VIRTIO_IRQ_HIGH);
44606f48103SSasha Levin 	}
44736f5dc91SSasha Levin 	return 0;
44836f5dc91SSasha Levin }
44936f5dc91SSasha Levin 
45002eca50cSAsias He int virtio_pci__signal_config(struct kvm *kvm, struct virtio_device *vdev)
45136f5dc91SSasha Levin {
45202eca50cSAsias He 	struct virtio_pci *vpci = vdev->virtio;
45306f48103SSasha Levin 	int tbl = vpci->config_vector;
45406f48103SSasha Levin 
455f8327b05SSasha Levin 	if (virtio_pci__msix_enabled(vpci) && tbl != VIRTIO_MSI_NO_VECTOR) {
456aa73be70SMatt Evans 		if (vpci->pci_hdr.msix.ctrl & cpu_to_le16(PCI_MSIX_FLAGS_MASKALL) ||
457aa73be70SMatt Evans 		    vpci->msix_table[tbl].ctrl & cpu_to_le16(PCI_MSIX_ENTRY_CTRL_MASKBIT)) {
45806f48103SSasha Levin 
45906f48103SSasha Levin 			vpci->msix_pba |= 1 << tbl;
46006f48103SSasha Levin 			return 0;
46106f48103SSasha Levin 		}
46206f48103SSasha Levin 
46343c81c74SSasha Levin 		if (vpci->features & VIRTIO_PCI_F_SIGNAL_MSI)
464f8327b05SSasha Levin 			virtio_pci__signal_msi(kvm, vpci, tbl);
46543c81c74SSasha Levin 		else
46606f48103SSasha Levin 			kvm__irq_trigger(kvm, vpci->config_gsi);
46706f48103SSasha Levin 	} else {
46806f48103SSasha Levin 		vpci->isr = VIRTIO_PCI_ISR_CONFIG;
469e9922aafSAndre Przywara 		kvm__irq_trigger(kvm, vpci->legacy_irq_line);
47006f48103SSasha Levin 	}
47136f5dc91SSasha Levin 
47236f5dc91SSasha Levin 	return 0;
47336f5dc91SSasha Levin }
47436f5dc91SSasha Levin 
4759b735910SMarc Zyngier static void virtio_pci__io_mmio_callback(struct kvm_cpu *vcpu,
4769b735910SMarc Zyngier 					 u64 addr, u8 *data, u32 len,
477a463650cSWill Deacon 					 u8 is_write, void *ptr)
478a463650cSWill Deacon {
479e09b599aSJulien Thierry 	struct virtio_device *vdev = ptr;
480e09b599aSJulien Thierry 	struct virtio_pci *vpci = vdev->virtio;
481205eaa79SAndre Przywara 	u32 ioport_addr = virtio_pci__port_addr(vpci);
482205eaa79SAndre Przywara 	u32 base_addr;
483205eaa79SAndre Przywara 
484205eaa79SAndre Przywara 	if (addr >= ioport_addr &&
485205eaa79SAndre Przywara 	    addr < ioport_addr + pci__bar_size(&vpci->pci_hdr, 0))
486205eaa79SAndre Przywara 		base_addr = ioport_addr;
487205eaa79SAndre Przywara 	else
488205eaa79SAndre Przywara 		base_addr = virtio_pci__mmio_addr(vpci);
489a463650cSWill Deacon 
490e09b599aSJulien Thierry 	if (!is_write)
491205eaa79SAndre Przywara 		virtio_pci__data_in(vcpu, vdev, addr - base_addr, data, len);
492e09b599aSJulien Thierry 	else
493205eaa79SAndre Przywara 		virtio_pci__data_out(vcpu, vdev, addr - base_addr, data, len);
494a463650cSWill Deacon }
495a463650cSWill Deacon 
4965a8e4f25SAlexandru Elisei static int virtio_pci__bar_activate(struct kvm *kvm,
4975a8e4f25SAlexandru Elisei 				    struct pci_device_header *pci_hdr,
4985a8e4f25SAlexandru Elisei 				    int bar_num, void *data)
4995a8e4f25SAlexandru Elisei {
5005a8e4f25SAlexandru Elisei 	struct virtio_device *vdev = data;
5015a8e4f25SAlexandru Elisei 	u32 bar_addr, bar_size;
5025a8e4f25SAlexandru Elisei 	int r = -EINVAL;
5035a8e4f25SAlexandru Elisei 
5045a8e4f25SAlexandru Elisei 	assert(bar_num <= 2);
5055a8e4f25SAlexandru Elisei 
5065a8e4f25SAlexandru Elisei 	bar_addr = pci__bar_address(pci_hdr, bar_num);
5075a8e4f25SAlexandru Elisei 	bar_size = pci__bar_size(pci_hdr, bar_num);
5085a8e4f25SAlexandru Elisei 
5095a8e4f25SAlexandru Elisei 	switch (bar_num) {
5105a8e4f25SAlexandru Elisei 	case 0:
511205eaa79SAndre Przywara 		r = kvm__register_pio(kvm, bar_addr, bar_size,
512205eaa79SAndre Przywara 				      virtio_pci__io_mmio_callback, vdev);
5135a8e4f25SAlexandru Elisei 		break;
5145a8e4f25SAlexandru Elisei 	case 1:
5155a8e4f25SAlexandru Elisei 		r =  kvm__register_mmio(kvm, bar_addr, bar_size, false,
5165a8e4f25SAlexandru Elisei 					virtio_pci__io_mmio_callback, vdev);
5175a8e4f25SAlexandru Elisei 		break;
5185a8e4f25SAlexandru Elisei 	case 2:
5195a8e4f25SAlexandru Elisei 		r =  kvm__register_mmio(kvm, bar_addr, bar_size, false,
5205a8e4f25SAlexandru Elisei 					virtio_pci__msix_mmio_callback, vdev);
5215a8e4f25SAlexandru Elisei 		break;
5225a8e4f25SAlexandru Elisei 	}
5235a8e4f25SAlexandru Elisei 
5245a8e4f25SAlexandru Elisei 	return r;
5255a8e4f25SAlexandru Elisei }
5265a8e4f25SAlexandru Elisei 
5275a8e4f25SAlexandru Elisei static int virtio_pci__bar_deactivate(struct kvm *kvm,
5285a8e4f25SAlexandru Elisei 				      struct pci_device_header *pci_hdr,
5295a8e4f25SAlexandru Elisei 				      int bar_num, void *data)
5305a8e4f25SAlexandru Elisei {
5315a8e4f25SAlexandru Elisei 	u32 bar_addr;
5325a8e4f25SAlexandru Elisei 	bool success;
5335a8e4f25SAlexandru Elisei 	int r = -EINVAL;
5345a8e4f25SAlexandru Elisei 
5355a8e4f25SAlexandru Elisei 	assert(bar_num <= 2);
5365a8e4f25SAlexandru Elisei 
5375a8e4f25SAlexandru Elisei 	bar_addr = pci__bar_address(pci_hdr, bar_num);
5385a8e4f25SAlexandru Elisei 
5395a8e4f25SAlexandru Elisei 	switch (bar_num) {
5405a8e4f25SAlexandru Elisei 	case 0:
541205eaa79SAndre Przywara 		r = kvm__deregister_pio(kvm, bar_addr);
5425a8e4f25SAlexandru Elisei 		break;
5435a8e4f25SAlexandru Elisei 	case 1:
5445a8e4f25SAlexandru Elisei 	case 2:
5455a8e4f25SAlexandru Elisei 		success = kvm__deregister_mmio(kvm, bar_addr);
5465a8e4f25SAlexandru Elisei 		/* kvm__deregister_mmio fails when the region is not found. */
5475a8e4f25SAlexandru Elisei 		r = (success ? 0 : -ENOENT);
5485a8e4f25SAlexandru Elisei 		break;
5495a8e4f25SAlexandru Elisei 	}
5505a8e4f25SAlexandru Elisei 
5515a8e4f25SAlexandru Elisei 	return r;
5525a8e4f25SAlexandru Elisei }
5535a8e4f25SAlexandru Elisei 
55402eca50cSAsias He int virtio_pci__init(struct kvm *kvm, void *dev, struct virtio_device *vdev,
555507e02d8SAsias He 		     int device_id, int subsys_id, int class)
55636f5dc91SSasha Levin {
55702eca50cSAsias He 	struct virtio_pci *vpci = vdev->virtio;
558e539f3e4SAlexandru Elisei 	u32 mmio_addr, msix_io_block;
559e539f3e4SAlexandru Elisei 	u16 port_addr;
5607af40b91SSasha Levin 	int r;
56136f5dc91SSasha Levin 
562a463650cSWill Deacon 	vpci->kvm = kvm;
56336f5dc91SSasha Levin 	vpci->dev = dev;
56436f5dc91SSasha Levin 
565ce2fc8f5SAlexandru Elisei 	BUILD_BUG_ON(!is_power_of_two(PCI_IO_SIZE));
566ce2fc8f5SAlexandru Elisei 
567e539f3e4SAlexandru Elisei 	port_addr = pci_get_io_port_block(PCI_IO_SIZE);
568e539f3e4SAlexandru Elisei 	mmio_addr = pci_get_mmio_block(PCI_IO_SIZE);
5692e7380dbSMarc Zyngier 	msix_io_block = pci_get_mmio_block(VIRTIO_MSIX_BAR_SIZE);
570a463650cSWill Deacon 
57136f5dc91SSasha Levin 	vpci->pci_hdr = (struct pci_device_header) {
572aa73be70SMatt Evans 		.vendor_id		= cpu_to_le16(PCI_VENDOR_ID_REDHAT_QUMRANET),
573aa73be70SMatt Evans 		.device_id		= cpu_to_le16(device_id),
574ec7dd52fSSasha Levin 		.command		= PCI_COMMAND_IO | PCI_COMMAND_MEMORY,
57536f5dc91SSasha Levin 		.header_type		= PCI_HEADER_TYPE_NORMAL,
57636f5dc91SSasha Levin 		.revision_id		= 0,
577aa73be70SMatt Evans 		.class[0]		= class & 0xff,
578aa73be70SMatt Evans 		.class[1]		= (class >> 8) & 0xff,
579aa73be70SMatt Evans 		.class[2]		= (class >> 16) & 0xff,
580aa73be70SMatt Evans 		.subsys_vendor_id	= cpu_to_le16(PCI_SUBSYSTEM_VENDOR_ID_REDHAT_QUMRANET),
581aa73be70SMatt Evans 		.subsys_id		= cpu_to_le16(subsys_id),
582e539f3e4SAlexandru Elisei 		.bar[0]			= cpu_to_le32(port_addr
5839c26dab4SSasha Levin 							| PCI_BASE_ADDRESS_SPACE_IO),
584e539f3e4SAlexandru Elisei 		.bar[1]			= cpu_to_le32(mmio_addr
585a508ea95SJean-Philippe Brucker 							| PCI_BASE_ADDRESS_SPACE_MEMORY),
586e539f3e4SAlexandru Elisei 		.bar[2]			= cpu_to_le32(msix_io_block
587b4dab816SSasha Levin 							| PCI_BASE_ADDRESS_SPACE_MEMORY),
588aa73be70SMatt Evans 		.status			= cpu_to_le16(PCI_STATUS_CAP_LIST),
58936f5dc91SSasha Levin 		.capabilities		= (void *)&vpci->pci_hdr.msix - (void *)&vpci->pci_hdr,
59048843d10SJulien Thierry 		.bar_size[0]		= cpu_to_le32(PCI_IO_SIZE),
59148843d10SJulien Thierry 		.bar_size[1]		= cpu_to_le32(PCI_IO_SIZE),
5922e7380dbSMarc Zyngier 		.bar_size[2]		= cpu_to_le32(VIRTIO_MSIX_BAR_SIZE),
59336f5dc91SSasha Levin 	};
59436f5dc91SSasha Levin 
5955a8e4f25SAlexandru Elisei 	r = pci__register_bar_regions(kvm, &vpci->pci_hdr,
5965a8e4f25SAlexandru Elisei 				      virtio_pci__bar_activate,
5975a8e4f25SAlexandru Elisei 				      virtio_pci__bar_deactivate, vdev);
5985a8e4f25SAlexandru Elisei 	if (r < 0)
5995a8e4f25SAlexandru Elisei 		return r;
6005a8e4f25SAlexandru Elisei 
60121ff329dSWill Deacon 	vpci->dev_hdr = (struct device_header) {
60221ff329dSWill Deacon 		.bus_type		= DEVICE_BUS_PCI,
60321ff329dSWill Deacon 		.data			= &vpci->pci_hdr,
60421ff329dSWill Deacon 	};
60521ff329dSWill Deacon 
60636f5dc91SSasha Levin 	vpci->pci_hdr.msix.cap = PCI_CAP_ID_MSIX;
60736f5dc91SSasha Levin 	vpci->pci_hdr.msix.next = 0;
60814bba8a0SAsias He 	/*
6092e7380dbSMarc Zyngier 	 * We at most have VIRTIO_NR_MSIX entries (VIRTIO_PCI_MAX_VQ
6102e7380dbSMarc Zyngier 	 * entries for virt queue, VIRTIO_PCI_MAX_CONFIG entries for
6112e7380dbSMarc Zyngier 	 * config).
61214bba8a0SAsias He 	 *
61314bba8a0SAsias He 	 * To quote the PCI spec:
61414bba8a0SAsias He 	 *
61514bba8a0SAsias He 	 * System software reads this field to determine the
61614bba8a0SAsias He 	 * MSI-X Table Size N, which is encoded as N-1.
61714bba8a0SAsias He 	 * For example, a returned value of "00000000011"
61814bba8a0SAsias He 	 * indicates a table size of 4.
61914bba8a0SAsias He 	 */
6202e7380dbSMarc Zyngier 	vpci->pci_hdr.msix.ctrl = cpu_to_le16(VIRTIO_NR_MSIX - 1);
62106f48103SSasha Levin 
622a463650cSWill Deacon 	/* Both table and PBA are mapped to the same BAR (2) */
623a463650cSWill Deacon 	vpci->pci_hdr.msix.table_offset = cpu_to_le32(2);
6242e7380dbSMarc Zyngier 	vpci->pci_hdr.msix.pba_offset = cpu_to_le32(2 | VIRTIO_MSIX_TABLE_SIZE);
62536f5dc91SSasha Levin 	vpci->config_vector = 0;
62636f5dc91SSasha Levin 
627f6108d72SJean-Philippe Brucker 	if (irq__can_signal_msi(kvm))
62843c81c74SSasha Levin 		vpci->features |= VIRTIO_PCI_F_SIGNAL_MSI;
62943c81c74SSasha Levin 
630c0c45eedSAndre Przywara 	vpci->legacy_irq_line = pci__assign_irq(&vpci->pci_hdr);
631c0c45eedSAndre Przywara 
63221ff329dSWill Deacon 	r = device__register(&vpci->dev_hdr);
633495fbd4eSSasha Levin 	if (r < 0)
6345a8e4f25SAlexandru Elisei 		return r;
635495fbd4eSSasha Levin 
636495fbd4eSSasha Levin 	return 0;
637495fbd4eSSasha Levin }
638495fbd4eSSasha Levin 
639eb34a8c2SJean-Philippe Brucker int virtio_pci__reset(struct kvm *kvm, struct virtio_device *vdev)
640eb34a8c2SJean-Philippe Brucker {
641eb34a8c2SJean-Philippe Brucker 	int vq;
642eb34a8c2SJean-Philippe Brucker 	struct virtio_pci *vpci = vdev->virtio;
643eb34a8c2SJean-Philippe Brucker 
644eb34a8c2SJean-Philippe Brucker 	for (vq = 0; vq < vdev->ops->get_vq_count(kvm, vpci->dev); vq++)
645eb34a8c2SJean-Philippe Brucker 		virtio_pci_exit_vq(kvm, vdev, vq);
646eb34a8c2SJean-Philippe Brucker 
647eb34a8c2SJean-Philippe Brucker 	return 0;
648eb34a8c2SJean-Philippe Brucker }
649eb34a8c2SJean-Philippe Brucker 
65002eca50cSAsias He int virtio_pci__exit(struct kvm *kvm, struct virtio_device *vdev)
651495fbd4eSSasha Levin {
65202eca50cSAsias He 	struct virtio_pci *vpci = vdev->virtio;
653495fbd4eSSasha Levin 
654eb34a8c2SJean-Philippe Brucker 	virtio_pci__reset(kvm, vdev);
655e539f3e4SAlexandru Elisei 	kvm__deregister_mmio(kvm, virtio_pci__mmio_addr(vpci));
656e539f3e4SAlexandru Elisei 	kvm__deregister_mmio(kvm, virtio_pci__msix_io_addr(vpci));
657205eaa79SAndre Przywara 	kvm__deregister_pio(kvm, virtio_pci__port_addr(vpci));
658495fbd4eSSasha Levin 
65936f5dc91SSasha Levin 	return 0;
66036f5dc91SSasha Levin }
661