xref: /kvmtool/pci.c (revision 5a8e4f25dd7b32228ff214b5d5a68a27d96c9a6c)
121ff329dSWill Deacon #include "kvm/devices.h"
260742802SPekka Enberg #include "kvm/pci.h"
360742802SPekka Enberg #include "kvm/ioport.h"
4b5981636SWill Deacon #include "kvm/irq.h"
576f9c841SCyrill Gorcunov #include "kvm/util.h"
69575e724SSasha Levin #include "kvm/kvm.h"
760742802SPekka Enberg 
86d987703SSasha Levin #include <linux/err.h>
96d987703SSasha Levin #include <assert.h>
106d987703SSasha Levin 
11a0a7d66fSDavid Daney static u32 pci_config_address_bits;
1260742802SPekka Enberg 
1340f2fd06SMatt Evans /* This is within our PCI gap - in an unused area.
1440f2fd06SMatt Evans  * Note this is a PCI *bus address*, is used to assign BARs etc.!
1540f2fd06SMatt Evans  * (That's why it can still 32bit even with 64bit guests-- 64bit
1640f2fd06SMatt Evans  * PCI isn't currently supported.)
1740f2fd06SMatt Evans  */
18854aa2efSJulien Thierry static u32 mmio_blocks			= KVM_PCI_MMIO_AREA;
19854aa2efSJulien Thierry static u16 io_port_blocks		= PCI_IOPORT_START;
20854aa2efSJulien Thierry 
21854aa2efSJulien Thierry u16 pci_get_io_port_block(u32 size)
22854aa2efSJulien Thierry {
2348843d10SJulien Thierry 	u16 port = ALIGN(io_port_blocks, PCI_IO_SIZE);
24854aa2efSJulien Thierry 
25854aa2efSJulien Thierry 	io_port_blocks = port + size;
26854aa2efSJulien Thierry 	return port;
27854aa2efSJulien Thierry }
289575e724SSasha Levin 
29c7575d17SWill Deacon /*
30c7575d17SWill Deacon  * BARs must be naturally aligned, so enforce this in the allocator.
31c7575d17SWill Deacon  */
32854aa2efSJulien Thierry u32 pci_get_mmio_block(u32 size)
339575e724SSasha Levin {
34854aa2efSJulien Thierry 	u32 block = ALIGN(mmio_blocks, size);
35854aa2efSJulien Thierry 	mmio_blocks = block + size;
369575e724SSasha Levin 	return block;
379575e724SSasha Levin }
389575e724SSasha Levin 
391a51c93dSJean-Philippe Brucker void *pci_find_cap(struct pci_device_header *hdr, u8 cap_type)
401a51c93dSJean-Philippe Brucker {
411a51c93dSJean-Philippe Brucker 	u8 pos;
421a51c93dSJean-Philippe Brucker 	struct pci_cap_hdr *cap;
431a51c93dSJean-Philippe Brucker 
441a51c93dSJean-Philippe Brucker 	pci_for_each_cap(pos, cap, hdr) {
451a51c93dSJean-Philippe Brucker 		if (cap->type == cap_type)
461a51c93dSJean-Philippe Brucker 			return cap;
471a51c93dSJean-Philippe Brucker 	}
481a51c93dSJean-Philippe Brucker 
491a51c93dSJean-Philippe Brucker 	return NULL;
501a51c93dSJean-Philippe Brucker }
511a51c93dSJean-Philippe Brucker 
52c0c45eedSAndre Przywara int pci__assign_irq(struct pci_device_header *pci_hdr)
53b5981636SWill Deacon {
54b5981636SWill Deacon 	/*
55b5981636SWill Deacon 	 * PCI supports only INTA#,B#,C#,D# per device.
56b5981636SWill Deacon 	 *
57b5981636SWill Deacon 	 * A#,B#,C#,D# are allowed for multifunctional devices so stick
58b5981636SWill Deacon 	 * with A# for our single function devices.
59b5981636SWill Deacon 	 */
60b5981636SWill Deacon 	pci_hdr->irq_pin	= 1;
61b5981636SWill Deacon 	pci_hdr->irq_line	= irq__alloc_line();
62ff01b5dbSJean-Philippe Brucker 
63ff01b5dbSJean-Philippe Brucker 	if (!pci_hdr->irq_type)
64ff01b5dbSJean-Philippe Brucker 		pci_hdr->irq_type = IRQ_TYPE_EDGE_RISING;
65c0c45eedSAndre Przywara 
66c0c45eedSAndre Przywara 	return pci_hdr->irq_line;
67b5981636SWill Deacon }
68b5981636SWill Deacon 
69*5a8e4f25SAlexandru Elisei static bool pci_bar_is_implemented(struct pci_device_header *pci_hdr, int bar_num)
70*5a8e4f25SAlexandru Elisei {
71*5a8e4f25SAlexandru Elisei 	return pci__bar_size(pci_hdr, bar_num);
72*5a8e4f25SAlexandru Elisei }
73*5a8e4f25SAlexandru Elisei 
743fdf659dSSasha Levin static void *pci_config_address_ptr(u16 port)
75ba824677SPekka Enberg {
76ba824677SPekka Enberg 	unsigned long offset;
77ba824677SPekka Enberg 	void *base;
78ba824677SPekka Enberg 
79ba824677SPekka Enberg 	offset	= port - PCI_CONFIG_ADDRESS;
80a0a7d66fSDavid Daney 	base	= &pci_config_address_bits;
81ba824677SPekka Enberg 
82ba824677SPekka Enberg 	return base + offset;
83ba824677SPekka Enberg }
84ba824677SPekka Enberg 
854123ca55SMarc Zyngier static bool pci_config_address_out(struct ioport *ioport, struct kvm_cpu *vcpu, u16 port, void *data, int size)
8660742802SPekka Enberg {
87ba824677SPekka Enberg 	void *p = pci_config_address_ptr(port);
8860742802SPekka Enberg 
89ba824677SPekka Enberg 	memcpy(p, data, size);
9060742802SPekka Enberg 
9160742802SPekka Enberg 	return true;
9260742802SPekka Enberg }
9360742802SPekka Enberg 
944123ca55SMarc Zyngier static bool pci_config_address_in(struct ioport *ioport, struct kvm_cpu *vcpu, u16 port, void *data, int size)
9560742802SPekka Enberg {
96ba824677SPekka Enberg 	void *p = pci_config_address_ptr(port);
9760742802SPekka Enberg 
98ba824677SPekka Enberg 	memcpy(data, p, size);
9960742802SPekka Enberg 
10060742802SPekka Enberg 	return true;
10160742802SPekka Enberg }
10260742802SPekka Enberg 
103305b72ceSCyrill Gorcunov static struct ioport_operations pci_config_address_ops = {
104305b72ceSCyrill Gorcunov 	.io_in	= pci_config_address_in,
105305b72ceSCyrill Gorcunov 	.io_out	= pci_config_address_out,
10660742802SPekka Enberg };
10760742802SPekka Enberg 
1083fdf659dSSasha Levin static bool pci_device_exists(u8 bus_number, u8 device_number, u8 function_number)
10976f9c841SCyrill Gorcunov {
110a0a7d66fSDavid Daney 	union pci_config_address pci_config_address;
111a0a7d66fSDavid Daney 
112a0a7d66fSDavid Daney 	pci_config_address.w = ioport__read32(&pci_config_address_bits);
113a0a7d66fSDavid Daney 
11476f9c841SCyrill Gorcunov 	if (pci_config_address.bus_number != bus_number)
11576f9c841SCyrill Gorcunov 		return false;
11676f9c841SCyrill Gorcunov 
117b30d05adSPekka Enberg 	if (pci_config_address.function_number != function_number)
11876f9c841SCyrill Gorcunov 		return false;
11976f9c841SCyrill Gorcunov 
12021ff329dSWill Deacon 	return !IS_ERR_OR_NULL(device__find_dev(DEVICE_BUS_PCI, device_number));
12176f9c841SCyrill Gorcunov }
12276f9c841SCyrill Gorcunov 
1234123ca55SMarc Zyngier static bool pci_config_data_out(struct ioport *ioport, struct kvm_cpu *vcpu, u16 port, void *data, int size)
1249575e724SSasha Levin {
125a0a7d66fSDavid Daney 	union pci_config_address pci_config_address;
126a0a7d66fSDavid Daney 
1276ea32ebdSAlexandru Elisei 	if (size > 4)
1286ea32ebdSAlexandru Elisei 		size = 4;
1296ea32ebdSAlexandru Elisei 
130a0a7d66fSDavid Daney 	pci_config_address.w = ioport__read32(&pci_config_address_bits);
1319575e724SSasha Levin 	/*
1329575e724SSasha Levin 	 * If someone accesses PCI configuration space offsets that are not
1339575e724SSasha Levin 	 * aligned to 4 bytes, it uses ioports to signify that.
1349575e724SSasha Levin 	 */
135d0297a59SMatt Evans 	pci_config_address.reg_offset = port - PCI_CONFIG_DATA;
1369575e724SSasha Levin 
1374123ca55SMarc Zyngier 	pci__config_wr(vcpu->kvm, pci_config_address, data, size);
138d0297a59SMatt Evans 
139d0297a59SMatt Evans 	return true;
140d0297a59SMatt Evans }
141d0297a59SMatt Evans 
1424123ca55SMarc Zyngier static bool pci_config_data_in(struct ioport *ioport, struct kvm_cpu *vcpu, u16 port, void *data, int size)
143d0297a59SMatt Evans {
144a0a7d66fSDavid Daney 	union pci_config_address pci_config_address;
145a0a7d66fSDavid Daney 
1466ea32ebdSAlexandru Elisei 	if (size > 4)
1476ea32ebdSAlexandru Elisei 		size = 4;
1486ea32ebdSAlexandru Elisei 
149a0a7d66fSDavid Daney 	pci_config_address.w = ioport__read32(&pci_config_address_bits);
150d0297a59SMatt Evans 	/*
151d0297a59SMatt Evans 	 * If someone accesses PCI configuration space offsets that are not
152d0297a59SMatt Evans 	 * aligned to 4 bytes, it uses ioports to signify that.
153d0297a59SMatt Evans 	 */
154d0297a59SMatt Evans 	pci_config_address.reg_offset = port - PCI_CONFIG_DATA;
155d0297a59SMatt Evans 
1564123ca55SMarc Zyngier 	pci__config_rd(vcpu->kvm, pci_config_address, data, size);
157d0297a59SMatt Evans 
158d0297a59SMatt Evans 	return true;
159d0297a59SMatt Evans }
160d0297a59SMatt Evans 
161d0297a59SMatt Evans static struct ioport_operations pci_config_data_ops = {
162d0297a59SMatt Evans 	.io_in	= pci_config_data_in,
163d0297a59SMatt Evans 	.io_out	= pci_config_data_out,
164d0297a59SMatt Evans };
165d0297a59SMatt Evans 
166d0297a59SMatt Evans void pci__config_wr(struct kvm *kvm, union pci_config_address addr, void *data, int size)
167d0297a59SMatt Evans {
168023fdaaeSJean-Philippe Brucker 	void *base;
169023fdaaeSJean-Philippe Brucker 	u8 bar, offset;
170023fdaaeSJean-Philippe Brucker 	struct pci_device_header *pci_hdr;
171023fdaaeSJean-Philippe Brucker 	u8 dev_num = addr.device_number;
172bb0d509bSSami Mujawar 	u32 value = 0;
173bb0d509bSSami Mujawar 	u32 mask;
174d0297a59SMatt Evans 
175023fdaaeSJean-Philippe Brucker 	if (!pci_device_exists(addr.bus_number, dev_num, 0))
176023fdaaeSJean-Philippe Brucker 		return;
1779575e724SSasha Levin 
178023fdaaeSJean-Philippe Brucker 	offset = addr.w & PCI_DEV_CFG_MASK;
179023fdaaeSJean-Philippe Brucker 	base = pci_hdr = device__find_dev(DEVICE_BUS_PCI, dev_num)->data;
1809575e724SSasha Levin 
181023fdaaeSJean-Philippe Brucker 	if (pci_hdr->cfg_ops.write)
182023fdaaeSJean-Philippe Brucker 		pci_hdr->cfg_ops.write(kvm, pci_hdr, offset, data, size);
183c64f7ff0SSasha Levin 
1849575e724SSasha Levin 	/*
185023fdaaeSJean-Philippe Brucker 	 * legacy hack: ignore writes to uninitialized regions (e.g. ROM BAR).
186023fdaaeSJean-Philippe Brucker 	 * Not very nice but has been working so far.
1879575e724SSasha Levin 	 */
188023fdaaeSJean-Philippe Brucker 	if (*(u32 *)(base + offset) == 0)
189023fdaaeSJean-Philippe Brucker 		return;
190023fdaaeSJean-Philippe Brucker 
191023fdaaeSJean-Philippe Brucker 	bar = (offset - PCI_BAR_OFFSET(0)) / sizeof(u32);
192023fdaaeSJean-Philippe Brucker 
193023fdaaeSJean-Philippe Brucker 	/*
194bb0d509bSSami Mujawar 	 * If the kernel masks the BAR, it will expect to find the size of the
195bb0d509bSSami Mujawar 	 * BAR there next time it reads from it. After the kernel reads the
196bb0d509bSSami Mujawar 	 * size, it will write the address back.
197023fdaaeSJean-Philippe Brucker 	 */
198bb0d509bSSami Mujawar 	if (bar < 6) {
1992f6384f9SAlexandru Elisei 		if (pci__bar_is_io(pci_hdr, bar))
200bb0d509bSSami Mujawar 			mask = (u32)PCI_BASE_ADDRESS_IO_MASK;
201bb0d509bSSami Mujawar 		else
202bb0d509bSSami Mujawar 			mask = (u32)PCI_BASE_ADDRESS_MEM_MASK;
203bb0d509bSSami Mujawar 		/*
204bb0d509bSSami Mujawar 		 * According to the PCI local bus specification REV 3.0:
205bb0d509bSSami Mujawar 		 * The number of upper bits that a device actually implements
206bb0d509bSSami Mujawar 		 * depends on how much of the address space the device will
207bb0d509bSSami Mujawar 		 * respond to. A device that wants a 1 MB memory address space
208bb0d509bSSami Mujawar 		 * (using a 32-bit base address register) would build the top
209bb0d509bSSami Mujawar 		 * 12 bits of the address register, hardwiring the other bits
210bb0d509bSSami Mujawar 		 * to 0.
211bb0d509bSSami Mujawar 		 *
212bb0d509bSSami Mujawar 		 * Furthermore, software can determine how much address space
213bb0d509bSSami Mujawar 		 * the device requires by writing a value of all 1's to the
214bb0d509bSSami Mujawar 		 * register and then reading the value back. The device will
215bb0d509bSSami Mujawar 		 * return 0's in all don't-care address bits, effectively
216bb0d509bSSami Mujawar 		 * specifying the address space required.
217bb0d509bSSami Mujawar 		 *
218bb0d509bSSami Mujawar 		 * Software computes the size of the address space with the
219bb0d509bSSami Mujawar 		 * formula S = ~B + 1, where S is the memory size and B is the
220bb0d509bSSami Mujawar 		 * value read from the BAR. This means that the BAR value that
221bb0d509bSSami Mujawar 		 * kvmtool should return is B = ~(S - 1).
222bb0d509bSSami Mujawar 		 */
223bb0d509bSSami Mujawar 		memcpy(&value, data, size);
224bb0d509bSSami Mujawar 		if (value == 0xffffffff)
2252f6384f9SAlexandru Elisei 			value = ~(pci__bar_size(pci_hdr, bar) - 1);
226bb0d509bSSami Mujawar 		/* Preserve the special bits. */
227bb0d509bSSami Mujawar 		value = (value & mask) | (pci_hdr->bar[bar] & ~mask);
228bb0d509bSSami Mujawar 		memcpy(base + offset, &value, size);
229023fdaaeSJean-Philippe Brucker 	} else {
230023fdaaeSJean-Philippe Brucker 		memcpy(base + offset, data, size);
2319575e724SSasha Levin 	}
2329575e724SSasha Levin }
2339575e724SSasha Levin 
234d0297a59SMatt Evans void pci__config_rd(struct kvm *kvm, union pci_config_address addr, void *data, int size)
23560742802SPekka Enberg {
236023fdaaeSJean-Philippe Brucker 	u8 offset;
237023fdaaeSJean-Philippe Brucker 	struct pci_device_header *pci_hdr;
238023fdaaeSJean-Philippe Brucker 	u8 dev_num = addr.device_number;
239e4d2cea2SPekka Enberg 
240023fdaaeSJean-Philippe Brucker 	if (pci_device_exists(addr.bus_number, dev_num, 0)) {
241023fdaaeSJean-Philippe Brucker 		pci_hdr = device__find_dev(DEVICE_BUS_PCI, dev_num)->data;
242023fdaaeSJean-Philippe Brucker 		offset = addr.w & PCI_DEV_CFG_MASK;
243b30d05adSPekka Enberg 
244023fdaaeSJean-Philippe Brucker 		if (pci_hdr->cfg_ops.read)
245023fdaaeSJean-Philippe Brucker 			pci_hdr->cfg_ops.read(kvm, pci_hdr, offset, data, size);
246598419d5SPekka Enberg 
247023fdaaeSJean-Philippe Brucker 		memcpy(data, (void *)pci_hdr + offset, size);
2483a60be06SSasha Levin 	} else {
249e498ea08SPekka Enberg 		memset(data, 0xff, size);
25060742802SPekka Enberg 	}
2513a60be06SSasha Levin }
25260742802SPekka Enberg 
2539b735910SMarc Zyngier static void pci_config_mmio_access(struct kvm_cpu *vcpu, u64 addr, u8 *data,
2549b735910SMarc Zyngier 				   u32 len, u8 is_write, void *kvm)
255b403f2f7SWill Deacon {
256b403f2f7SWill Deacon 	union pci_config_address cfg_addr;
257b403f2f7SWill Deacon 
258b403f2f7SWill Deacon 	addr			-= KVM_PCI_CFG_AREA;
259b403f2f7SWill Deacon 	cfg_addr.w		= (u32)addr;
260b403f2f7SWill Deacon 	cfg_addr.enable_bit	= 1;
261b403f2f7SWill Deacon 
2626ea32ebdSAlexandru Elisei 	if (len > 4)
2636ea32ebdSAlexandru Elisei 		len = 4;
2646ea32ebdSAlexandru Elisei 
265b403f2f7SWill Deacon 	if (is_write)
266b403f2f7SWill Deacon 		pci__config_wr(kvm, cfg_addr, data, len);
267b403f2f7SWill Deacon 	else
268b403f2f7SWill Deacon 		pci__config_rd(kvm, cfg_addr, data, len);
269b403f2f7SWill Deacon }
270b403f2f7SWill Deacon 
271d0297a59SMatt Evans struct pci_device_header *pci__find_dev(u8 dev_num)
272d0297a59SMatt Evans {
27321ff329dSWill Deacon 	struct device_header *hdr = device__find_dev(DEVICE_BUS_PCI, dev_num);
2746d987703SSasha Levin 
27521ff329dSWill Deacon 	if (IS_ERR_OR_NULL(hdr))
27621ff329dSWill Deacon 		return NULL;
27721ff329dSWill Deacon 
27821ff329dSWill Deacon 	return hdr->data;
279d0297a59SMatt Evans }
280d0297a59SMatt Evans 
281*5a8e4f25SAlexandru Elisei int pci__register_bar_regions(struct kvm *kvm, struct pci_device_header *pci_hdr,
282*5a8e4f25SAlexandru Elisei 			      bar_activate_fn_t bar_activate_fn,
283*5a8e4f25SAlexandru Elisei 			      bar_deactivate_fn_t bar_deactivate_fn, void *data)
284*5a8e4f25SAlexandru Elisei {
285*5a8e4f25SAlexandru Elisei 	int i, r;
286*5a8e4f25SAlexandru Elisei 
287*5a8e4f25SAlexandru Elisei 	assert(bar_activate_fn && bar_deactivate_fn);
288*5a8e4f25SAlexandru Elisei 
289*5a8e4f25SAlexandru Elisei 	pci_hdr->bar_activate_fn = bar_activate_fn;
290*5a8e4f25SAlexandru Elisei 	pci_hdr->bar_deactivate_fn = bar_deactivate_fn;
291*5a8e4f25SAlexandru Elisei 	pci_hdr->data = data;
292*5a8e4f25SAlexandru Elisei 
293*5a8e4f25SAlexandru Elisei 	for (i = 0; i < 6; i++) {
294*5a8e4f25SAlexandru Elisei 		if (!pci_bar_is_implemented(pci_hdr, i))
295*5a8e4f25SAlexandru Elisei 			continue;
296*5a8e4f25SAlexandru Elisei 
297*5a8e4f25SAlexandru Elisei 		if (pci__bar_is_io(pci_hdr, i) &&
298*5a8e4f25SAlexandru Elisei 		    pci__io_space_enabled(pci_hdr)) {
299*5a8e4f25SAlexandru Elisei 			r = bar_activate_fn(kvm, pci_hdr, i, data);
300*5a8e4f25SAlexandru Elisei 			if (r < 0)
301*5a8e4f25SAlexandru Elisei 				return r;
302*5a8e4f25SAlexandru Elisei 		}
303*5a8e4f25SAlexandru Elisei 
304*5a8e4f25SAlexandru Elisei 		if (pci__bar_is_memory(pci_hdr, i) &&
305*5a8e4f25SAlexandru Elisei 		    pci__memory_space_enabled(pci_hdr)) {
306*5a8e4f25SAlexandru Elisei 			r = bar_activate_fn(kvm, pci_hdr, i, data);
307*5a8e4f25SAlexandru Elisei 			if (r < 0)
308*5a8e4f25SAlexandru Elisei 				return r;
309*5a8e4f25SAlexandru Elisei 		}
310*5a8e4f25SAlexandru Elisei 	}
311*5a8e4f25SAlexandru Elisei 
312*5a8e4f25SAlexandru Elisei 	return 0;
313*5a8e4f25SAlexandru Elisei }
314*5a8e4f25SAlexandru Elisei 
3156d987703SSasha Levin int pci__init(struct kvm *kvm)
31660742802SPekka Enberg {
3176d987703SSasha Levin 	int r;
3186d987703SSasha Levin 
3194346fd8fSSasha Levin 	r = ioport__register(kvm, PCI_CONFIG_DATA + 0, &pci_config_data_ops, 4, NULL);
3206d987703SSasha Levin 	if (r < 0)
3216d987703SSasha Levin 		return r;
3226d987703SSasha Levin 
3234346fd8fSSasha Levin 	r = ioport__register(kvm, PCI_CONFIG_ADDRESS + 0, &pci_config_address_ops, 4, NULL);
324b403f2f7SWill Deacon 	if (r < 0)
325b403f2f7SWill Deacon 		goto err_unregister_data;
326b403f2f7SWill Deacon 
327b403f2f7SWill Deacon 	r = kvm__register_mmio(kvm, KVM_PCI_CFG_AREA, PCI_CFG_SIZE, false,
328b403f2f7SWill Deacon 			       pci_config_mmio_access, kvm);
329b403f2f7SWill Deacon 	if (r < 0)
330b403f2f7SWill Deacon 		goto err_unregister_addr;
3316d987703SSasha Levin 
3326d987703SSasha Levin 	return 0;
333b403f2f7SWill Deacon 
334b403f2f7SWill Deacon err_unregister_addr:
335b403f2f7SWill Deacon 	ioport__unregister(kvm, PCI_CONFIG_ADDRESS);
336b403f2f7SWill Deacon err_unregister_data:
337b403f2f7SWill Deacon 	ioport__unregister(kvm, PCI_CONFIG_DATA);
338b403f2f7SWill Deacon 	return r;
3396d987703SSasha Levin }
340bca12bf6SSasha Levin dev_base_init(pci__init);
3416d987703SSasha Levin 
3426d987703SSasha Levin int pci__exit(struct kvm *kvm)
3436d987703SSasha Levin {
3444346fd8fSSasha Levin 	ioport__unregister(kvm, PCI_CONFIG_DATA);
3454346fd8fSSasha Levin 	ioport__unregister(kvm, PCI_CONFIG_ADDRESS);
3466d987703SSasha Levin 
3476d987703SSasha Levin 	return 0;
34860742802SPekka Enberg }
349bca12bf6SSasha Levin dev_base_exit(pci__exit);
350