xref: /kvmtool/kvm.c (revision 55e19624b74ae889611a249b4c78d7cd248951d1)
1ae1fae34SPekka Enberg #include "kvm/kvm.h"
2ae1fae34SPekka Enberg 
3eda03319SPekka Enberg #include "kvm/interrupt.h"
4f3150089SPekka Enberg #include "kvm/util.h"
5eda03319SPekka Enberg 
66c7d8514SPekka Enberg #include <linux/kvm.h>
7f5ab5f67SPekka Enberg 
8f5ab5f67SPekka Enberg #include <asm/bootparam.h>
9f5ab5f67SPekka Enberg 
10ae1fae34SPekka Enberg #include <sys/ioctl.h>
111f9cff23SPekka Enberg #include <inttypes.h>
121f9cff23SPekka Enberg #include <sys/mman.h>
132da26a59SPekka Enberg #include <stdbool.h>
146e5e8b8dSPekka Enberg #include <assert.h>
1506e41eeaSPekka Enberg #include <limits.h>
16f5ab5f67SPekka Enberg #include <stdarg.h>
17b8f6afcdSPekka Enberg #include <stdlib.h>
18f5ab5f67SPekka Enberg #include <string.h>
190d1f17ecSPekka Enberg #include <unistd.h>
201f9cff23SPekka Enberg #include <stdio.h>
21b8f6afcdSPekka Enberg #include <fcntl.h>
22b8f6afcdSPekka Enberg 
231f9cff23SPekka Enberg /*
241f9cff23SPekka Enberg  * Compatibility code. Remove this when we move to tools/kvm.
251f9cff23SPekka Enberg  */
261f9cff23SPekka Enberg #ifndef KVM_EXIT_INTERNAL_ERROR
271f9cff23SPekka Enberg # define KVM_EXIT_INTERNAL_ERROR		17
281f9cff23SPekka Enberg #endif
291f9cff23SPekka Enberg 
30ae1fae34SPekka Enberg #define DEFINE_KVM_EXIT_REASON(reason) [reason] = #reason
310d1f17ecSPekka Enberg 
32ae1fae34SPekka Enberg const char *kvm_exit_reasons[] = {
33ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_UNKNOWN),
34ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_EXCEPTION),
35ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_IO),
36ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_HYPERCALL),
37ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_DEBUG),
38ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_HLT),
39ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_MMIO),
40ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_IRQ_WINDOW_OPEN),
41ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_SHUTDOWN),
42ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_FAIL_ENTRY),
43ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTR),
44ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_SET_TPR),
45ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_TPR_ACCESS),
46ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_SIEIC),
47ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_RESET),
48ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_DCR),
49ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_NMI),
50ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTERNAL_ERROR),
519b1fb1c3SPekka Enberg };
529b1fb1c3SPekka Enberg 
53*55e19624SCyrill Gorcunov #define DEFINE_KVM_EXT(ext)		\
54*55e19624SCyrill Gorcunov 	.name = #ext,			\
55*55e19624SCyrill Gorcunov 	.code = ext
56*55e19624SCyrill Gorcunov 
57*55e19624SCyrill Gorcunov struct {
58*55e19624SCyrill Gorcunov 	const char *name;
59*55e19624SCyrill Gorcunov 	int code;
60*55e19624SCyrill Gorcunov } kvm_req_ext[] = {
61*55e19624SCyrill Gorcunov 	{ DEFINE_KVM_EXT(KVM_CAP_COALESCED_MMIO) },
62*55e19624SCyrill Gorcunov 	{ DEFINE_KVM_EXT(KVM_CAP_SET_TSS_ADDR) },
63*55e19624SCyrill Gorcunov 	{ DEFINE_KVM_EXT(KVM_CAP_PIT2) },
64*55e19624SCyrill Gorcunov 	{ DEFINE_KVM_EXT(KVM_CAP_USER_MEMORY) },
65*55e19624SCyrill Gorcunov 	{ DEFINE_KVM_EXT(KVM_CAP_IRQ_ROUTING) },
66*55e19624SCyrill Gorcunov 	{ DEFINE_KVM_EXT(KVM_CAP_IRQCHIP) },
67*55e19624SCyrill Gorcunov 	{ DEFINE_KVM_EXT(KVM_CAP_IRQ_INJECT_STATUS) },
68*55e19624SCyrill Gorcunov };
69*55e19624SCyrill Gorcunov 
7048cf3877SPekka Enberg static inline bool host_ptr_in_ram(struct kvm *self, void *p)
7148cf3877SPekka Enberg {
7248cf3877SPekka Enberg 	return self->ram_start <= p && p < (self->ram_start + self->ram_size);
7348cf3877SPekka Enberg }
7448cf3877SPekka Enberg 
/*
 * Convert a real-mode selector:offset pair into a flat address:
 * selector * 16 + offset.
 */
static inline uint32_t segment_to_flat(uint16_t selector, uint16_t offset)
{
	uint32_t base = (uint32_t)selector * 16;

	return base + (uint32_t)offset;
}
796753ed2fSPekka Enberg 
806753ed2fSPekka Enberg static inline void *guest_flat_to_host(struct kvm *self, unsigned long offset)
81ae1fae34SPekka Enberg {
82ae1fae34SPekka Enberg 	return self->ram_start + offset;
83ae1fae34SPekka Enberg }
84ae1fae34SPekka Enberg 
/*
 * Translate a real-mode selector:offset pair into a host pointer: flatten the
 * pair first, then map the flat address into the guest RAM buffer.
 */
static inline void *guest_real_to_host(struct kvm *self, uint16_t selector, uint16_t offset)
{
	return guest_flat_to_host(self, segment_to_flat(selector, offset));
}
916753ed2fSPekka Enberg 
92ae1fae34SPekka Enberg static bool kvm__supports_extension(struct kvm *self, unsigned int extension)
93b8f6afcdSPekka Enberg {
9428fa19c0SPekka Enberg 	int ret;
95b8f6afcdSPekka Enberg 
9673ac60e6SPekka Enberg 	ret = ioctl(self->sys_fd, KVM_CHECK_EXTENSION, extension);
974076b041SPekka Enberg 	if (ret < 0)
984076b041SPekka Enberg 		return false;
994076b041SPekka Enberg 
1004076b041SPekka Enberg 	return ret;
1014076b041SPekka Enberg }
1024076b041SPekka Enberg 
103*55e19624SCyrill Gorcunov static int kvm__check_extensions(struct kvm *self)
104*55e19624SCyrill Gorcunov {
105*55e19624SCyrill Gorcunov 	unsigned int i;
106*55e19624SCyrill Gorcunov 
107*55e19624SCyrill Gorcunov 	for (i = 0; i < ARRAY_SIZE(kvm_req_ext); i++) {
108*55e19624SCyrill Gorcunov 		if (!kvm__supports_extension(self, kvm_req_ext[i].code)) {
109*55e19624SCyrill Gorcunov 			error("Unsuppored KVM extension detected: %s",
110*55e19624SCyrill Gorcunov 				kvm_req_ext[i].name);
111*55e19624SCyrill Gorcunov 			return (int)-i;
112*55e19624SCyrill Gorcunov 		}
113*55e19624SCyrill Gorcunov 	}
114*55e19624SCyrill Gorcunov 
115*55e19624SCyrill Gorcunov 	return 0;
116*55e19624SCyrill Gorcunov }
117*55e19624SCyrill Gorcunov 
1184076b041SPekka Enberg static struct kvm *kvm__new(void)
1194076b041SPekka Enberg {
1204076b041SPekka Enberg 	struct kvm *self = calloc(1, sizeof *self);
1214076b041SPekka Enberg 
1224076b041SPekka Enberg 	if (!self)
1234076b041SPekka Enberg 		die("out of memory");
1244076b041SPekka Enberg 
1254076b041SPekka Enberg 	return self;
1264076b041SPekka Enberg }
1274076b041SPekka Enberg 
1289ef4c68eSPekka Enberg void kvm__delete(struct kvm *self)
1299ef4c68eSPekka Enberg {
1309ef4c68eSPekka Enberg 	free(self->ram_start);
1319ef4c68eSPekka Enberg 	free(self);
1329ef4c68eSPekka Enberg }
1339ef4c68eSPekka Enberg 
134ae1fae34SPekka Enberg struct kvm *kvm__init(void)
1354076b041SPekka Enberg {
1362b0e3342SPekka Enberg 	struct kvm_userspace_memory_region mem;
1379687927dSAsias He 	struct kvm_pit_config pit_config = { .flags = 0, };
1384076b041SPekka Enberg 	struct kvm *self;
1390d1f17ecSPekka Enberg 	long page_size;
1401f9cff23SPekka Enberg 	int mmap_size;
1414076b041SPekka Enberg 	int ret;
1424076b041SPekka Enberg 
1434076b041SPekka Enberg 	self = kvm__new();
1444076b041SPekka Enberg 
14573ac60e6SPekka Enberg 	self->sys_fd = open("/dev/kvm", O_RDWR);
14673ac60e6SPekka Enberg 	if (self->sys_fd < 0)
147f5ab5f67SPekka Enberg 		die_perror("open");
148b8f6afcdSPekka Enberg 
14973ac60e6SPekka Enberg 	ret = ioctl(self->sys_fd, KVM_GET_API_VERSION, 0);
1506c7d8514SPekka Enberg 	if (ret != KVM_API_VERSION)
151f5ab5f67SPekka Enberg 		die_perror("KVM_API_VERSION ioctl");
1526c7d8514SPekka Enberg 
15373ac60e6SPekka Enberg 	self->vm_fd = ioctl(self->sys_fd, KVM_CREATE_VM, 0);
15473ac60e6SPekka Enberg 	if (self->vm_fd < 0)
155f5ab5f67SPekka Enberg 		die_perror("KVM_CREATE_VM ioctl");
15628fa19c0SPekka Enberg 
157*55e19624SCyrill Gorcunov 	if (kvm__check_extensions(self))
158*55e19624SCyrill Gorcunov 		die("A required KVM extention is not supported by OS");
1599687927dSAsias He 
1609687927dSAsias He 	ret = ioctl(self->vm_fd, KVM_SET_TSS_ADDR, 0xfffbd000);
1619687927dSAsias He 	if (ret < 0)
1629687927dSAsias He 		die_perror("KVM_SET_TSS_ADDR ioctl");
1639687927dSAsias He 
1649687927dSAsias He 	ret = ioctl(self->vm_fd, KVM_CREATE_PIT2, &pit_config);
1659687927dSAsias He 	if (ret < 0)
1669687927dSAsias He 		die_perror("KVM_CREATE_PIT2 ioctl");
1679687927dSAsias He 
1680d1f17ecSPekka Enberg 	self->ram_size		= 64UL * 1024UL * 1024UL;
1690d1f17ecSPekka Enberg 
1700d1f17ecSPekka Enberg 	page_size	= sysconf(_SC_PAGESIZE);
1710d1f17ecSPekka Enberg 	if (posix_memalign(&self->ram_start, page_size, self->ram_size) != 0)
1720d1f17ecSPekka Enberg 		die("out of memory");
1730d1f17ecSPekka Enberg 
1742b0e3342SPekka Enberg 	mem = (struct kvm_userspace_memory_region) {
1752b0e3342SPekka Enberg 		.slot			= 0,
1762b0e3342SPekka Enberg 		.guest_phys_addr	= 0x0UL,
1770d1f17ecSPekka Enberg 		.memory_size		= self->ram_size,
1780d1f17ecSPekka Enberg 		.userspace_addr		= (unsigned long) self->ram_start,
1792b0e3342SPekka Enberg 	};
1802b0e3342SPekka Enberg 
181b6e68186SAsias He 	ret = ioctl(self->vm_fd, KVM_SET_USER_MEMORY_REGION, &mem);
1822b0e3342SPekka Enberg 	if (ret < 0)
183f5ab5f67SPekka Enberg 		die_perror("KVM_SET_USER_MEMORY_REGION ioctl");
1842b0e3342SPekka Enberg 
1859687927dSAsias He 	ret = ioctl(self->vm_fd, KVM_CREATE_IRQCHIP);
186895c2fefSPekka Enberg 	if (ret < 0)
1879687927dSAsias He 		die_perror("KVM_CREATE_IRQCHIP ioctl");
1889687927dSAsias He 
18973ac60e6SPekka Enberg 	self->vcpu_fd = ioctl(self->vm_fd, KVM_CREATE_VCPU, 0);
1902b0e3342SPekka Enberg 	if (self->vcpu_fd < 0)
191f5ab5f67SPekka Enberg 		die_perror("KVM_CREATE_VCPU ioctl");
1922b0e3342SPekka Enberg 
1931f9cff23SPekka Enberg 	mmap_size = ioctl(self->sys_fd, KVM_GET_VCPU_MMAP_SIZE, 0);
1941f9cff23SPekka Enberg 	if (mmap_size < 0)
195f5ab5f67SPekka Enberg 		die_perror("KVM_GET_VCPU_MMAP_SIZE ioctl");
1961f9cff23SPekka Enberg 
1971f9cff23SPekka Enberg 	self->kvm_run = mmap(NULL, mmap_size, PROT_READ|PROT_WRITE, MAP_SHARED, self->vcpu_fd, 0);
1981f9cff23SPekka Enberg 	if (self->kvm_run == MAP_FAILED)
1991f9cff23SPekka Enberg 		die("unable to mmap vcpu fd");
2001f9cff23SPekka Enberg 
2014076b041SPekka Enberg 	return self;
2024076b041SPekka Enberg }
2034076b041SPekka Enberg 
204ae1fae34SPekka Enberg void kvm__enable_singlestep(struct kvm *self)
205aee6632eSPekka Enberg {
206aee6632eSPekka Enberg 	struct kvm_guest_debug debug = {
207aee6632eSPekka Enberg 		.control	= KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP,
208aee6632eSPekka Enberg 	};
209aee6632eSPekka Enberg 
210aee6632eSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_GUEST_DEBUG, &debug) < 0)
211b625d4b6SCyrill Gorcunov 		warning("KVM_SET_GUEST_DEBUG failed");
212aee6632eSPekka Enberg }
213aee6632eSPekka Enberg 
2145f6772b8SCyrill Gorcunov #define BOOT_LOADER_SELECTOR	0x1000
215b08e9ec4SPekka Enberg #define BOOT_LOADER_IP		0x0000
216dbdb74c2SPekka Enberg #define BOOT_LOADER_SP		0x8000
2172dd4a4edSCyrill Gorcunov #define BOOT_CMDLINE_OFFSET	0x20000
2182dd4a4edSCyrill Gorcunov 
2192dd4a4edSCyrill Gorcunov #define BOOT_PROTOCOL_REQUIRED	0x202
220a43f6460SCyrill Gorcunov #define LOAD_HIGH		0x01
221009b0758SPekka Enberg 
222edc8a14dSPekka Enberg static int load_flat_binary(struct kvm *self, int fd)
223009b0758SPekka Enberg {
224009b0758SPekka Enberg 	void *p;
225009b0758SPekka Enberg 	int nr;
226009b0758SPekka Enberg 
227009b0758SPekka Enberg 	if (lseek(fd, 0, SEEK_SET) < 0)
228009b0758SPekka Enberg 		die_perror("lseek");
229009b0758SPekka Enberg 
2306753ed2fSPekka Enberg 	p = guest_real_to_host(self, BOOT_LOADER_SELECTOR, BOOT_LOADER_IP);
231009b0758SPekka Enberg 
232009b0758SPekka Enberg 	while ((nr = read(fd, p, 65536)) > 0)
233009b0758SPekka Enberg 		p += nr;
234009b0758SPekka Enberg 
235dbdb74c2SPekka Enberg 	self->boot_selector	= BOOT_LOADER_SELECTOR;
236edc8a14dSPekka Enberg 	self->boot_ip		= BOOT_LOADER_IP;
237dbdb74c2SPekka Enberg 	self->boot_sp		= BOOT_LOADER_SP;
238edc8a14dSPekka Enberg 
2397fb218bdSPekka Enberg 	return true;
240009b0758SPekka Enberg }
241009b0758SPekka Enberg 
2427fb218bdSPekka Enberg /*
2437fb218bdSPekka Enberg  * The protected mode kernel part of a modern bzImage is loaded at 1 MB by
2447fb218bdSPekka Enberg  * default.
2457fb218bdSPekka Enberg  */
2467fb218bdSPekka Enberg #define BZ_KERNEL_START			0x100000UL
247ae1fae34SPekka Enberg 
248ae1fae34SPekka Enberg static const char *BZIMAGE_MAGIC	= "HdrS";
249ae1fae34SPekka Enberg 
25010943d14SPekka Enberg #define BZ_DEFAULT_SETUP_SECTS		4
25110943d14SPekka Enberg 
2526d1f350dSCyrill Gorcunov static bool load_bzimage(struct kvm *self, int fd, const char *kernel_cmdline)
253ae1fae34SPekka Enberg {
254bc75b0aeSCyrill Gorcunov 	struct real_intr_desc intr;
25522489bb0SCyrill Gorcunov 	struct boot_params boot;
2564b62331fSPekka Enberg 	unsigned long setup_sects;
257305d9054SCyrill Gorcunov 	unsigned int intr_addr;
2582dd4a4edSCyrill Gorcunov 	size_t cmdline_size;
2597fb218bdSPekka Enberg 	ssize_t setup_size;
26022489bb0SCyrill Gorcunov 	void *p;
261ae1fae34SPekka Enberg 	int nr;
262ae1fae34SPekka Enberg 
2635d67eaf6SPekka Enberg 	/*
2645d67eaf6SPekka Enberg 	 * See Documentation/x86/boot.txt for details no bzImage on-disk and
2655d67eaf6SPekka Enberg 	 * memory layout.
2665d67eaf6SPekka Enberg 	 */
2675d67eaf6SPekka Enberg 
268009b0758SPekka Enberg 	if (lseek(fd, 0, SEEK_SET) < 0)
269009b0758SPekka Enberg 		die_perror("lseek");
270009b0758SPekka Enberg 
271ae1fae34SPekka Enberg 	read(fd, &boot, sizeof(boot));
272ae1fae34SPekka Enberg 
273ae1fae34SPekka Enberg         if (memcmp(&boot.hdr.header, BZIMAGE_MAGIC, strlen(BZIMAGE_MAGIC)) != 0)
2747fb218bdSPekka Enberg 		return false;
275ae1fae34SPekka Enberg 
2762dd4a4edSCyrill Gorcunov 	if (boot.hdr.version < BOOT_PROTOCOL_REQUIRED) {
277ad681038SCyrill Gorcunov 		warning("Too old kernel");
278ad681038SCyrill Gorcunov 		return false;
279ad681038SCyrill Gorcunov 	}
280ad681038SCyrill Gorcunov 
281e93ab78aSPekka Enberg 	if (lseek(fd, 0, SEEK_SET) < 0)
282e93ab78aSPekka Enberg 		die_perror("lseek");
283e93ab78aSPekka Enberg 
2844cf542bbSCyrill Gorcunov 	if (!boot.hdr.setup_sects)
2854cf542bbSCyrill Gorcunov 		boot.hdr.setup_sects = BZ_DEFAULT_SETUP_SECTS;
28610943d14SPekka Enberg 	setup_sects = boot.hdr.setup_sects + 1;
28710943d14SPekka Enberg 
28854d4a626SPekka Enberg 	setup_size = setup_sects << 9;
2896753ed2fSPekka Enberg 	p = guest_real_to_host(self, BOOT_LOADER_SELECTOR, BOOT_LOADER_IP);
290ae1fae34SPekka Enberg 
2917fb218bdSPekka Enberg 	if (read(fd, p, setup_size) != setup_size)
2927fb218bdSPekka Enberg 		die_perror("read");
2937fb218bdSPekka Enberg 
2946753ed2fSPekka Enberg 	p = guest_flat_to_host(self, BZ_KERNEL_START);
295ae1fae34SPekka Enberg 
296ae1fae34SPekka Enberg 	while ((nr = read(fd, p, 65536)) > 0)
297ae1fae34SPekka Enberg 		p += nr;
298ae1fae34SPekka Enberg 
299a43f6460SCyrill Gorcunov 	p = guest_flat_to_host(self, BOOT_CMDLINE_OFFSET);
300debcfac0SCyrill Gorcunov 	if (kernel_cmdline) {
301debcfac0SCyrill Gorcunov 		cmdline_size = strlen(kernel_cmdline) + 1;
302debcfac0SCyrill Gorcunov 		if (cmdline_size > boot.hdr.cmdline_size)
303debcfac0SCyrill Gorcunov 			cmdline_size = boot.hdr.cmdline_size;
304ad681038SCyrill Gorcunov 
3052dd4a4edSCyrill Gorcunov 		memset(p, 0, boot.hdr.cmdline_size);
3062dd4a4edSCyrill Gorcunov 		memcpy(p, kernel_cmdline, cmdline_size - 1);
307debcfac0SCyrill Gorcunov 	}
308debcfac0SCyrill Gorcunov 
309a43f6460SCyrill Gorcunov #define hdr_offset(member)			\
310a43f6460SCyrill Gorcunov 	offsetof(struct boot_params, hdr) +	\
311a43f6460SCyrill Gorcunov 	offsetof(struct setup_header, member)
312a43f6460SCyrill Gorcunov #define guest_hdr(kvm, member)			\
313a43f6460SCyrill Gorcunov 	guest_real_to_host(kvm,			\
314a43f6460SCyrill Gorcunov 		BOOT_LOADER_SELECTOR,		\
315a43f6460SCyrill Gorcunov 		hdr_offset(member))
316a43f6460SCyrill Gorcunov 
317a43f6460SCyrill Gorcunov 	/* some fields in guest header have to be updated */
318a43f6460SCyrill Gorcunov 	p = guest_hdr(self, cmd_line_ptr);
319a43f6460SCyrill Gorcunov 	*(uint32_t *)p = BOOT_CMDLINE_OFFSET;
320a43f6460SCyrill Gorcunov 
321a43f6460SCyrill Gorcunov 	p = guest_hdr(self, type_of_loader);
322a43f6460SCyrill Gorcunov 	*(uint8_t *)p = 0xff;
323a43f6460SCyrill Gorcunov 
324a43f6460SCyrill Gorcunov 	p = guest_hdr(self, heap_end_ptr);
325a43f6460SCyrill Gorcunov 	*(uint16_t *)p = 0xfe00;
326a43f6460SCyrill Gorcunov 
327a43f6460SCyrill Gorcunov 	p = guest_hdr(self, loadflags);
328a43f6460SCyrill Gorcunov 	*(uint8_t *)p |= CAN_USE_HEAP;
329a43f6460SCyrill Gorcunov 
330dbdb74c2SPekka Enberg 	self->boot_selector	= BOOT_LOADER_SELECTOR;
331edc8a14dSPekka Enberg 	/*
332edc8a14dSPekka Enberg 	 * The real-mode setup code starts at offset 0x200 of a bzImage. See
333edc8a14dSPekka Enberg 	 * Documentation/x86/boot.txt for details.
334edc8a14dSPekka Enberg 	 */
335edc8a14dSPekka Enberg 	self->boot_ip		= BOOT_LOADER_IP + 0x200;
336dbdb74c2SPekka Enberg 	self->boot_sp		= BOOT_LOADER_SP;
337edc8a14dSPekka Enberg 
338ea684828SCyrill Gorcunov 	/*
33922489bb0SCyrill Gorcunov 	 * Setup a *fake* real mode vector table, it has only
34022489bb0SCyrill Gorcunov 	 * one real hadler which does just iret
34122489bb0SCyrill Gorcunov 	 *
342305d9054SCyrill Gorcunov 	 * This is where the BIOS lives -- BDA area
343ea684828SCyrill Gorcunov 	 */
344305d9054SCyrill Gorcunov 	intr_addr = BIOS_INTR_NEXT(BDA_START + 0, 16);
345305d9054SCyrill Gorcunov 	p = guest_flat_to_host(self, intr_addr);
3468b8fb6c7SCyrill Gorcunov 	memcpy(p, intfake, intfake_end - intfake);
347bc75b0aeSCyrill Gorcunov 	intr = (struct real_intr_desc) {
348305d9054SCyrill Gorcunov 		.segment	= REAL_SEGMENT(intr_addr),
34922489bb0SCyrill Gorcunov 		.offset		= 0,
350ea684828SCyrill Gorcunov 	};
351bc75b0aeSCyrill Gorcunov 	interrupt_table__setup(&self->interrupt_table, &intr);
352305d9054SCyrill Gorcunov 
3538b8fb6c7SCyrill Gorcunov 	intr_addr = BIOS_INTR_NEXT(BDA_START + (intfake_end - intfake), 16);
354305d9054SCyrill Gorcunov 	p = guest_flat_to_host(self, intr_addr);
3558b8fb6c7SCyrill Gorcunov 	memcpy(p, int10, int10_end - int10);
356305d9054SCyrill Gorcunov 	intr = (struct real_intr_desc) {
357305d9054SCyrill Gorcunov 		.segment	= REAL_SEGMENT(intr_addr),
358305d9054SCyrill Gorcunov 		.offset		= 0,
359305d9054SCyrill Gorcunov 	};
360305d9054SCyrill Gorcunov 	interrupt_table__set(&self->interrupt_table, &intr, 0x10);
361305d9054SCyrill Gorcunov 
362305d9054SCyrill Gorcunov 	p = guest_flat_to_host(self, 0);
363bc75b0aeSCyrill Gorcunov 	interrupt_table__copy(&self->interrupt_table, p, REAL_INTR_SIZE);
364ea684828SCyrill Gorcunov 
3657fb218bdSPekka Enberg 	return true;
366ae1fae34SPekka Enberg }
367ae1fae34SPekka Enberg 
/*
 * Load the kernel image @kernel_filename into guest memory, trying the
 * bzImage loader first and the flat binary loader second.
 * @kernel_cmdline is handed to the bzImage loader.
 *
 * The file is closed again once loading has finished. A file that cannot be
 * opened, or that neither loader accepts, is reported through die().
 *
 * Returns true once a loader has accepted the image.
 */
bool kvm__load_kernel(struct kvm *kvm, const char *kernel_filename,
			const char *kernel_cmdline)
{
	bool ret;
	int fd;

	fd = open(kernel_filename, O_RDONLY);
	if (fd < 0)
		die("unable to open kernel");

	ret = load_bzimage(kvm, fd, kernel_cmdline);
	if (!ret)
		ret = load_flat_binary(kvm, fd);

	/* The image now lives in guest RAM; don't leak the descriptor */
	close(fd);

	if (!ret)
		die("%s is not a valid bzImage or flat binary", kernel_filename);

	return ret;
}
391ae1fae34SPekka Enberg 
39206e41eeaSPekka Enberg static inline uint64_t ip_flat_to_real(struct kvm *self, uint64_t ip)
39306e41eeaSPekka Enberg {
39406e41eeaSPekka Enberg 	uint64_t cs = self->sregs.cs.selector;
39506e41eeaSPekka Enberg 
39606e41eeaSPekka Enberg 	return ip - (cs << 4);
39706e41eeaSPekka Enberg }
39806e41eeaSPekka Enberg 
399f01944c8SPekka Enberg static inline bool is_in_protected_mode(struct kvm *self)
400f01944c8SPekka Enberg {
401f01944c8SPekka Enberg 	return self->sregs.cr0 & 0x01;
402f01944c8SPekka Enberg }
403f01944c8SPekka Enberg 
404f326512aSPekka Enberg static inline uint64_t ip_to_flat(struct kvm *self, uint64_t ip)
40506e41eeaSPekka Enberg {
406f326512aSPekka Enberg 	uint64_t cs;
407f326512aSPekka Enberg 
408f326512aSPekka Enberg 	/*
409f326512aSPekka Enberg 	 * NOTE! We should take code segment base address into account here.
410f326512aSPekka Enberg 	 * Luckily it's usually zero because Linux uses flat memory model.
411f326512aSPekka Enberg 	 */
412f01944c8SPekka Enberg 	if (is_in_protected_mode(self))
413f326512aSPekka Enberg 		return ip;
414f326512aSPekka Enberg 
415f326512aSPekka Enberg 	cs = self->sregs.cs.selector;
41606e41eeaSPekka Enberg 
41706e41eeaSPekka Enberg 	return ip + (cs << 4);
41806e41eeaSPekka Enberg }
41906e41eeaSPekka Enberg 
/*
 * Compute the real-mode segment base for @selector.
 *
 * KVM on Intel requires 'base' to be 'selector * 16' in real mode.
 */
static inline uint32_t selector_to_base(uint16_t selector)
{
	uint32_t base = selector;

	return base << 4;
}
427dbdb74c2SPekka Enberg 
42853d48714SPekka Enberg static struct kvm_msrs *kvm_msrs__new(size_t nmsrs)
42953d48714SPekka Enberg {
43053d48714SPekka Enberg 	struct kvm_msrs *self = calloc(1, sizeof(*self) + (sizeof(struct kvm_msr_entry) * nmsrs));
43153d48714SPekka Enberg 
43253d48714SPekka Enberg 	if (!self)
43353d48714SPekka Enberg 		die("out of memory");
43453d48714SPekka Enberg 
43553d48714SPekka Enberg 	return self;
43653d48714SPekka Enberg }
43753d48714SPekka Enberg 
43853d48714SPekka Enberg #define MSR_IA32_TIME_STAMP_COUNTER	0x10
43953d48714SPekka Enberg 
44053d48714SPekka Enberg #define MSR_IA32_SYSENTER_CS		0x174
44153d48714SPekka Enberg #define MSR_IA32_SYSENTER_ESP		0x175
44253d48714SPekka Enberg #define MSR_IA32_SYSENTER_EIP		0x176
44353d48714SPekka Enberg 
44453d48714SPekka Enberg #define MSR_IA32_STAR			0xc0000081
44553d48714SPekka Enberg #define MSR_IA32_LSTAR			0xc0000082
44653d48714SPekka Enberg #define MSR_IA32_CSTAR			0xc0000083
44753d48714SPekka Enberg #define MSR_IA32_FMASK			0xc0000084
44853d48714SPekka Enberg #define MSR_IA32_KERNEL_GS_BASE		0xc0000102
44953d48714SPekka Enberg 
45053d48714SPekka Enberg #define KVM_MSR_ENTRY(_index, _data)	\
45153d48714SPekka Enberg 	(struct kvm_msr_entry) { .index = _index, .data = _data }
45253d48714SPekka Enberg 
45353d48714SPekka Enberg static void kvm__setup_msrs(struct kvm *self)
45453d48714SPekka Enberg {
45553d48714SPekka Enberg 	unsigned long ndx = 0;
45653d48714SPekka Enberg 
45753d48714SPekka Enberg 	self->msrs = kvm_msrs__new(100);
45853d48714SPekka Enberg 
45953d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_SYSENTER_CS,	0x0);
46053d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_SYSENTER_ESP,	0x0);
46153d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_SYSENTER_EIP,	0x0);
4628b334abcSCyrill Gorcunov #ifdef CONFIG_X86_64
46353d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_STAR,		0x0);
46453d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_CSTAR,		0x0);
46553d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_KERNEL_GS_BASE,	0x0);
46653d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_FMASK,		0x0);
46753d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_LSTAR,		0x0);
46844069a9dSCyrill Gorcunov #endif
46953d48714SPekka Enberg 	self->msrs->entries[ndx++] = KVM_MSR_ENTRY(MSR_IA32_TIME_STAMP_COUNTER,	0x0);
47053d48714SPekka Enberg 
47153d48714SPekka Enberg 	self->msrs->nmsrs	= ndx;
47253d48714SPekka Enberg 
47353d48714SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_MSRS, self->msrs) < 0)
47453d48714SPekka Enberg 		die_perror("KVM_SET_MSRS failed");
47553d48714SPekka Enberg }
47653d48714SPekka Enberg 
4773d78d3a5SPekka Enberg static void kvm__setup_fpu(struct kvm *self)
4783d78d3a5SPekka Enberg {
4793d78d3a5SPekka Enberg 	self->fpu = (struct kvm_fpu) {
4803d78d3a5SPekka Enberg 		.fcw		= 0x37f,
4813d78d3a5SPekka Enberg 		.mxcsr		= 0x1f80,
4823d78d3a5SPekka Enberg 	};
4833d78d3a5SPekka Enberg 
4843d78d3a5SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_FPU, &self->fpu) < 0)
4853d78d3a5SPekka Enberg 		die_perror("KVM_SET_FPU failed");
4863d78d3a5SPekka Enberg }
4873d78d3a5SPekka Enberg 
4883d78d3a5SPekka Enberg static void kvm__setup_regs(struct kvm *self)
4893d78d3a5SPekka Enberg {
4903d78d3a5SPekka Enberg 	self->regs = (struct kvm_regs) {
4913d78d3a5SPekka Enberg 		/* We start the guest in 16-bit real mode  */
4923d78d3a5SPekka Enberg 		.rflags		= 0x0000000000000002ULL,
4933d78d3a5SPekka Enberg 
4943d78d3a5SPekka Enberg 		.rip		= self->boot_ip,
4953d78d3a5SPekka Enberg 		.rsp		= self->boot_sp,
4963d78d3a5SPekka Enberg 		.rbp		= self->boot_sp,
4973d78d3a5SPekka Enberg 	};
4983d78d3a5SPekka Enberg 
4993d78d3a5SPekka Enberg 	if (self->regs.rip > USHRT_MAX)
5003d78d3a5SPekka Enberg 		die("ip 0x%" PRIx64 " is too high for real mode", (uint64_t) self->regs.rip);
5013d78d3a5SPekka Enberg 
5023d78d3a5SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_REGS, &self->regs) < 0)
5033d78d3a5SPekka Enberg 		die_perror("KVM_SET_REGS failed");
5043d78d3a5SPekka Enberg }
5053d78d3a5SPekka Enberg 
5063d78d3a5SPekka Enberg static void kvm__setup_sregs(struct kvm *self)
507ae1fae34SPekka Enberg {
50853602077SPekka Enberg 
5090ed849e6SAsias He 	if (ioctl(self->vcpu_fd, KVM_GET_SREGS, &self->sregs) < 0)
5100ed849e6SAsias He 		die_perror("KVM_GET_SREGS failed");
5110ed849e6SAsias He 	self->sregs.cs.selector = self->boot_selector;
5120ed849e6SAsias He 	self->sregs.cs.base = selector_to_base(self->boot_selector);
5134e42cf94SAsias He 	self->sregs.ss.selector = self->boot_selector;
5144e42cf94SAsias He 	self->sregs.ss.base = selector_to_base(self->boot_selector);
5154e42cf94SAsias He 	self->sregs.ds.selector = self->boot_selector;
5164e42cf94SAsias He 	self->sregs.ds.base = selector_to_base(self->boot_selector);
5174e42cf94SAsias He 	self->sregs.es.selector = self->boot_selector;
5184e42cf94SAsias He 	self->sregs.es.base = selector_to_base(self->boot_selector);
5194e42cf94SAsias He 	self->sregs.fs.selector = self->boot_selector;
5204e42cf94SAsias He 	self->sregs.fs.base = selector_to_base(self->boot_selector);
5214e42cf94SAsias He 	self->sregs.gs.selector = self->boot_selector;
5224e42cf94SAsias He 	self->sregs.gs.base = selector_to_base(self->boot_selector);
52353602077SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_SREGS, &self->sregs) < 0)
52453602077SPekka Enberg 		die_perror("KVM_SET_SREGS failed");
5253d78d3a5SPekka Enberg }
52606e41eeaSPekka Enberg 
/*
 * Put the VCPU into its boot state. The state is programmed in this order:
 * segment registers, general purpose registers, FPU, MSRs.
 */
void kvm__reset_vcpu(struct kvm *self)
{
	kvm__setup_sregs(self);
	kvm__setup_regs(self);
	kvm__setup_fpu(self);
	kvm__setup_msrs(self);
}
537ae1fae34SPekka Enberg 
538ae1fae34SPekka Enberg void kvm__run(struct kvm *self)
539ae1fae34SPekka Enberg {
540ae1fae34SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_RUN, 0) < 0)
541ae1fae34SPekka Enberg 		die_perror("KVM_RUN failed");
542ae1fae34SPekka Enberg }
543ae1fae34SPekka Enberg 
5448351aaddSPekka Enberg static void print_dtable(const char *name, struct kvm_dtable *dtable)
5458351aaddSPekka Enberg {
5468351aaddSPekka Enberg 	printf(" %s                 %016" PRIx64 "  %08" PRIx16 "\n",
5478351aaddSPekka Enberg 		name, (uint64_t) dtable->base, (uint16_t) dtable->limit);
5488351aaddSPekka Enberg }
5498351aaddSPekka Enberg 
55053602077SPekka Enberg static void print_segment(const char *name, struct kvm_segment *seg)
55153602077SPekka Enberg {
552ce556636SPekka Enberg 	printf(" %s       %04" PRIx16 "      %016" PRIx64 "  %08" PRIx32 "  %02" PRIx8 "    %x %x   %x  %x %x %x %x\n",
55353602077SPekka Enberg 		name, (uint16_t) seg->selector, (uint64_t) seg->base, (uint32_t) seg->limit,
554ce556636SPekka Enberg 		(uint8_t) seg->type, seg->present, seg->dpl, seg->db, seg->s, seg->l, seg->g, seg->avl);
55553602077SPekka Enberg }
55653602077SPekka Enberg 
557ae1fae34SPekka Enberg void kvm__show_registers(struct kvm *self)
5587118d2caSPekka Enberg {
55953602077SPekka Enberg 	unsigned long cr0, cr2, cr3;
56053602077SPekka Enberg 	unsigned long cr4, cr8;
5617118d2caSPekka Enberg 	unsigned long rax, rbx, rcx;
5627118d2caSPekka Enberg 	unsigned long rdx, rsi, rdi;
5637118d2caSPekka Enberg 	unsigned long rbp,  r8,  r9;
5647118d2caSPekka Enberg 	unsigned long r10, r11, r12;
5657118d2caSPekka Enberg 	unsigned long r13, r14, r15;
5667118d2caSPekka Enberg 	unsigned long rip, rsp;
56753602077SPekka Enberg 	struct kvm_sregs sregs;
568a2fe6199SPekka Enberg 	unsigned long rflags;
5697118d2caSPekka Enberg 	struct kvm_regs regs;
570ce5e0ecbSPekka Enberg 	int i;
5717118d2caSPekka Enberg 
5727118d2caSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_REGS, &regs) < 0)
5737118d2caSPekka Enberg 		die("KVM_GET_REGS failed");
5747118d2caSPekka Enberg 
575a2fe6199SPekka Enberg 	rflags = regs.rflags;
576a2fe6199SPekka Enberg 
5777118d2caSPekka Enberg 	rip = regs.rip; rsp = regs.rsp;
5787118d2caSPekka Enberg 	rax = regs.rax; rbx = regs.rbx; rcx = regs.rcx;
5797118d2caSPekka Enberg 	rdx = regs.rdx; rsi = regs.rsi; rdi = regs.rdi;
5807118d2caSPekka Enberg 	rbp = regs.rbp; r8  = regs.r8;  r9  = regs.r9;
5817118d2caSPekka Enberg 	r10 = regs.r10; r11 = regs.r11; r12 = regs.r12;
5827118d2caSPekka Enberg 	r13 = regs.r13; r14 = regs.r14; r15 = regs.r15;
5837118d2caSPekka Enberg 
5847118d2caSPekka Enberg 	printf("Registers:\n");
5852177ec43SPekka Enberg 	printf(" rip: %016lx   rsp: %016lx flags: %016lx\n", rip, rsp, rflags);
586ea2e4ea0SCyrill Gorcunov 	printf(" rax: %016lx   rbx: %016lx   rcx: %016lx\n", rax, rbx, rcx);
5877118d2caSPekka Enberg 	printf(" rdx: %016lx   rsi: %016lx   rdi: %016lx\n", rdx, rsi, rdi);
5887118d2caSPekka Enberg 	printf(" rbp: %016lx   r8:  %016lx   r9:  %016lx\n", rbp, r8,  r9);
5897118d2caSPekka Enberg 	printf(" r10: %016lx   r11: %016lx   r12: %016lx\n", r10, r11, r12);
5907118d2caSPekka Enberg 	printf(" r13: %016lx   r14: %016lx   r15: %016lx\n", r13, r14, r15);
59153602077SPekka Enberg 
59253602077SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_SREGS, &sregs) < 0)
59353602077SPekka Enberg 		die("KVM_GET_REGS failed");
59453602077SPekka Enberg 
59553602077SPekka Enberg 	cr0 = sregs.cr0; cr2 = sregs.cr2; cr3 = sregs.cr3;
59653602077SPekka Enberg 	cr4 = sregs.cr4; cr8 = sregs.cr8;
59753602077SPekka Enberg 
59853602077SPekka Enberg 	printf(" cr0: %016lx   cr2: %016lx   cr3: %016lx\n", cr0, cr2, cr3);
59953602077SPekka Enberg 	printf(" cr4: %016lx   cr8: %016lx\n", cr4, cr8);
600ce5e0ecbSPekka Enberg 	printf("Segment registers:\n");
601ce556636SPekka Enberg 	printf(" register  selector  base              limit     type  p dpl db s l g avl\n");
60253602077SPekka Enberg 	print_segment("cs ", &sregs.cs);
60353602077SPekka Enberg 	print_segment("ss ", &sregs.ss);
60453602077SPekka Enberg 	print_segment("ds ", &sregs.ds);
60553602077SPekka Enberg 	print_segment("es ", &sregs.es);
60653602077SPekka Enberg 	print_segment("fs ", &sregs.fs);
60753602077SPekka Enberg 	print_segment("gs ", &sregs.gs);
608ce5e0ecbSPekka Enberg 	print_segment("tr ", &sregs.tr);
609ce5e0ecbSPekka Enberg 	print_segment("ldt", &sregs.ldt);
6108351aaddSPekka Enberg 	print_dtable("gdt", &sregs.gdt);
6118351aaddSPekka Enberg 	print_dtable("idt", &sregs.idt);
6120f9983b2SCyrill Gorcunov 	printf(" [ efer: %016" PRIx64 "  apic base: %016" PRIx64 "  nmi: %s ]\n",
6130f9983b2SCyrill Gorcunov 		(uint64_t) sregs.efer, (uint64_t) sregs.apic_base,
6142049569dSPekka Enberg 		(self->nmi_disabled ? "disabled" : "enabled"));
615ce5e0ecbSPekka Enberg 	printf("Interrupt bitmap:\n");
616ce5e0ecbSPekka Enberg 	printf(" ");
617ce5e0ecbSPekka Enberg 	for (i = 0; i < (KVM_NR_INTERRUPTS + 63) / 64; i++)
6180f9983b2SCyrill Gorcunov 		printf("%016" PRIx64 " ", (uint64_t) sregs.interrupt_bitmap[i]);
619ce5e0ecbSPekka Enberg 	printf("\n");
6207118d2caSPekka Enberg }
6217118d2caSPekka Enberg 
622ae1fae34SPekka Enberg void kvm__show_code(struct kvm *self)
6236f10be05SPekka Enberg {
6246f10be05SPekka Enberg 	unsigned int code_bytes = 64;
6256f10be05SPekka Enberg 	unsigned int code_prologue = code_bytes * 43 / 64;
6266f10be05SPekka Enberg 	unsigned int code_len = code_bytes;
6276f10be05SPekka Enberg 	unsigned char c;
628ae1fae34SPekka Enberg 	unsigned int i;
6296f10be05SPekka Enberg 	uint8_t *ip;
6306f10be05SPekka Enberg 
6312a601aafSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_REGS, &self->regs) < 0)
6322a601aafSPekka Enberg 		die("KVM_GET_REGS failed");
6332a601aafSPekka Enberg 
6342a601aafSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_SREGS, &self->sregs) < 0)
6352a601aafSPekka Enberg 		die("KVM_GET_SREGS failed");
6362a601aafSPekka Enberg 
637f326512aSPekka Enberg 	ip = guest_flat_to_host(self, ip_to_flat(self, self->regs.rip) - code_prologue);
6386f10be05SPekka Enberg 
6396f10be05SPekka Enberg 	printf("Code: ");
6406f10be05SPekka Enberg 
6416f10be05SPekka Enberg 	for (i = 0; i < code_len; i++, ip++) {
64248cf3877SPekka Enberg 		if (!host_ptr_in_ram(self, ip))
64348cf3877SPekka Enberg 			break;
64448cf3877SPekka Enberg 
6456e8abc38SPekka Enberg 		c = *ip;
6466e8abc38SPekka Enberg 
647f326512aSPekka Enberg 		if (ip == guest_flat_to_host(self, ip_to_flat(self, self->regs.rip)))
6486f10be05SPekka Enberg 			printf("<%02x> ", c);
6496f10be05SPekka Enberg 		else
6506f10be05SPekka Enberg 			printf("%02x ", c);
6516f10be05SPekka Enberg 	}
6526f10be05SPekka Enberg 
6536f10be05SPekka Enberg 	printf("\n");
6542a7d39a4SPekka Enberg 
6552a7d39a4SPekka Enberg 	printf("Stack:\n");
6562a7d39a4SPekka Enberg 	kvm__dump_mem(self, self->regs.rsp, 32);
6576f10be05SPekka Enberg }
658090f898eSCyrill Gorcunov 
659f01944c8SPekka Enberg void kvm__show_page_tables(struct kvm *self)
660f01944c8SPekka Enberg {
661f01944c8SPekka Enberg 	uint64_t *pte1;
662f01944c8SPekka Enberg 	uint64_t *pte2;
663f01944c8SPekka Enberg 	uint64_t *pte3;
664f01944c8SPekka Enberg 	uint64_t *pte4;
665f01944c8SPekka Enberg 
666f01944c8SPekka Enberg 	if (!is_in_protected_mode(self))
667f01944c8SPekka Enberg 		return;
668f01944c8SPekka Enberg 
669f01944c8SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_SREGS, &self->sregs) < 0)
670f01944c8SPekka Enberg 		die("KVM_GET_SREGS failed");
671f01944c8SPekka Enberg 
672f01944c8SPekka Enberg 	pte4	= guest_flat_to_host(self, self->sregs.cr3);
67348cf3877SPekka Enberg 	if (!host_ptr_in_ram(self, pte4))
67448cf3877SPekka Enberg 		return;
67548cf3877SPekka Enberg 
676f01944c8SPekka Enberg 	pte3	= guest_flat_to_host(self, (*pte4 & ~0xfff));
67748cf3877SPekka Enberg 	if (!host_ptr_in_ram(self, pte3))
67848cf3877SPekka Enberg 		return;
67948cf3877SPekka Enberg 
680f01944c8SPekka Enberg 	pte2	= guest_flat_to_host(self, (*pte3 & ~0xfff));
68148cf3877SPekka Enberg 	if (!host_ptr_in_ram(self, pte2))
68248cf3877SPekka Enberg 		return;
68348cf3877SPekka Enberg 
684f01944c8SPekka Enberg 	pte1	= guest_flat_to_host(self, (*pte2 & ~0xfff));
68548cf3877SPekka Enberg 	if (!host_ptr_in_ram(self, pte1))
68648cf3877SPekka Enberg 		return;
687f01944c8SPekka Enberg 
688f01944c8SPekka Enberg 	printf("Page Tables:\n");
689f01944c8SPekka Enberg 	if (*pte2 & (1 << 7))
6900f9983b2SCyrill Gorcunov 		printf(" pte4: %016" PRIx64 "   pte3: %016" PRIx64
6910f9983b2SCyrill Gorcunov 			"   pte2: %016" PRIx64 "\n",
6920f9983b2SCyrill Gorcunov 			*pte4, *pte3, *pte2);
693f01944c8SPekka Enberg 	else
6940f9983b2SCyrill Gorcunov 		printf(" pte4: %016" PRIx64 "   pte3: %016" PRIx64 "   pte2: %016"
6950f9983b2SCyrill Gorcunov 			PRIx64 "   pte1: %016" PRIx64 "\n",
6960f9983b2SCyrill Gorcunov 			*pte4, *pte3, *pte2, *pte1);
697f01944c8SPekka Enberg }
698f01944c8SPekka Enberg 
699090f898eSCyrill Gorcunov void kvm__dump_mem(struct kvm *self, unsigned long addr, unsigned long size)
700090f898eSCyrill Gorcunov {
701090f898eSCyrill Gorcunov 	unsigned char *p;
702090f898eSCyrill Gorcunov 	unsigned long n;
703090f898eSCyrill Gorcunov 
704090f898eSCyrill Gorcunov 	size &= ~7; /* mod 8 */
705090f898eSCyrill Gorcunov 	if (!size)
706090f898eSCyrill Gorcunov 		return;
707090f898eSCyrill Gorcunov 
7082a7d39a4SPekka Enberg 	p = guest_flat_to_host(self, addr);
709090f898eSCyrill Gorcunov 
71048cf3877SPekka Enberg 	for (n = 0; n < size; n+=8) {
71148cf3877SPekka Enberg 		if (!host_ptr_in_ram(self, p + n))
71248cf3877SPekka Enberg 			break;
71348cf3877SPekka Enberg 
714090f898eSCyrill Gorcunov 		printf("  0x%08lx: %02x %02x %02x %02x  %02x %02x %02x %02x\n",
715090f898eSCyrill Gorcunov 			addr + n, p[n + 0], p[n + 1], p[n + 2], p[n + 3],
716090f898eSCyrill Gorcunov 				  p[n + 4], p[n + 5], p[n + 6], p[n + 7]);
717090f898eSCyrill Gorcunov 	}
71848cf3877SPekka Enberg }
719