/* xref: /kvmtool/kvm.c (revision f326512a4b8669814fba9e23ed430fcdfdf30443) */
1ae1fae34SPekka Enberg #include "kvm/kvm.h"
2ae1fae34SPekka Enberg 
3eda03319SPekka Enberg #include "kvm/interrupt.h"
4f3150089SPekka Enberg #include "kvm/util.h"
5eda03319SPekka Enberg 
66c7d8514SPekka Enberg #include <linux/kvm.h>
7f5ab5f67SPekka Enberg 
8f5ab5f67SPekka Enberg #include <asm/bootparam.h>
9f5ab5f67SPekka Enberg 
10ae1fae34SPekka Enberg #include <sys/ioctl.h>
111f9cff23SPekka Enberg #include <inttypes.h>
121f9cff23SPekka Enberg #include <sys/mman.h>
132da26a59SPekka Enberg #include <stdbool.h>
146e5e8b8dSPekka Enberg #include <assert.h>
1506e41eeaSPekka Enberg #include <limits.h>
16f5ab5f67SPekka Enberg #include <stdarg.h>
17b8f6afcdSPekka Enberg #include <stdlib.h>
18f5ab5f67SPekka Enberg #include <string.h>
190d1f17ecSPekka Enberg #include <unistd.h>
201f9cff23SPekka Enberg #include <stdio.h>
21b8f6afcdSPekka Enberg #include <fcntl.h>
22b8f6afcdSPekka Enberg 
/*
 * Compatibility shim: provide KVM_EXIT_INTERNAL_ERROR when the included
 * headers do not define it. Remove this when we move to tools/kvm.
 */
#if !defined(KVM_EXIT_INTERNAL_ERROR)
#define KVM_EXIT_INTERNAL_ERROR 17
#endif
291f9cff23SPekka Enberg 
30ae1fae34SPekka Enberg #define DEFINE_KVM_EXIT_REASON(reason) [reason] = #reason
310d1f17ecSPekka Enberg 
32ae1fae34SPekka Enberg const char *kvm_exit_reasons[] = {
33ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_UNKNOWN),
34ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_EXCEPTION),
35ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_IO),
36ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_HYPERCALL),
37ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_DEBUG),
38ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_HLT),
39ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_MMIO),
40ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_IRQ_WINDOW_OPEN),
41ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_SHUTDOWN),
42ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_FAIL_ENTRY),
43ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTR),
44ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_SET_TPR),
45ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_TPR_ACCESS),
46ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_SIEIC),
47ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_RESET),
48ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_DCR),
49ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_NMI),
50ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTERNAL_ERROR),
519b1fb1c3SPekka Enberg };
529b1fb1c3SPekka Enberg 
/*
 * Convert a real-mode selector:offset pair into a flat address, i.e.
 * selector * 16 + offset.
 */
static inline uint32_t segment_to_flat(uint16_t selector, uint16_t offset)
{
	uint32_t segment_start = (uint32_t)selector * 16;

	return segment_start + offset;
}
576753ed2fSPekka Enberg 
586753ed2fSPekka Enberg static inline void *guest_flat_to_host(struct kvm *self, unsigned long offset)
59ae1fae34SPekka Enberg {
60ae1fae34SPekka Enberg 	return self->ram_start + offset;
61ae1fae34SPekka Enberg }
62ae1fae34SPekka Enberg 
/*
 * Return the host pointer for a real-mode selector:offset address by first
 * flattening it and then offsetting into guest RAM.
 */
static inline void *guest_real_to_host(struct kvm *self, uint16_t selector, uint16_t offset)
{
	return guest_flat_to_host(self, segment_to_flat(selector, offset));
}
696753ed2fSPekka Enberg 
70ae1fae34SPekka Enberg static bool kvm__supports_extension(struct kvm *self, unsigned int extension)
71b8f6afcdSPekka Enberg {
7228fa19c0SPekka Enberg 	int ret;
73b8f6afcdSPekka Enberg 
7473ac60e6SPekka Enberg 	ret = ioctl(self->sys_fd, KVM_CHECK_EXTENSION, extension);
754076b041SPekka Enberg 	if (ret < 0)
764076b041SPekka Enberg 		return false;
774076b041SPekka Enberg 
784076b041SPekka Enberg 	return ret;
794076b041SPekka Enberg }
804076b041SPekka Enberg 
814076b041SPekka Enberg static struct kvm *kvm__new(void)
824076b041SPekka Enberg {
834076b041SPekka Enberg 	struct kvm *self = calloc(1, sizeof *self);
844076b041SPekka Enberg 
854076b041SPekka Enberg 	if (!self)
864076b041SPekka Enberg 		die("out of memory");
874076b041SPekka Enberg 
884076b041SPekka Enberg 	return self;
894076b041SPekka Enberg }
904076b041SPekka Enberg 
91ae1fae34SPekka Enberg struct kvm *kvm__init(void)
924076b041SPekka Enberg {
932b0e3342SPekka Enberg 	struct kvm_userspace_memory_region mem;
944076b041SPekka Enberg 	struct kvm *self;
950d1f17ecSPekka Enberg 	long page_size;
961f9cff23SPekka Enberg 	int mmap_size;
974076b041SPekka Enberg 	int ret;
984076b041SPekka Enberg 
994076b041SPekka Enberg 	self = kvm__new();
1004076b041SPekka Enberg 
10173ac60e6SPekka Enberg 	self->sys_fd = open("/dev/kvm", O_RDWR);
10273ac60e6SPekka Enberg 	if (self->sys_fd < 0)
103f5ab5f67SPekka Enberg 		die_perror("open");
104b8f6afcdSPekka Enberg 
10573ac60e6SPekka Enberg 	ret = ioctl(self->sys_fd, KVM_GET_API_VERSION, 0);
1066c7d8514SPekka Enberg 	if (ret != KVM_API_VERSION)
107f5ab5f67SPekka Enberg 		die_perror("KVM_API_VERSION ioctl");
1086c7d8514SPekka Enberg 
10973ac60e6SPekka Enberg 	self->vm_fd = ioctl(self->sys_fd, KVM_CREATE_VM, 0);
11073ac60e6SPekka Enberg 	if (self->vm_fd < 0)
111f5ab5f67SPekka Enberg 		die_perror("KVM_CREATE_VM ioctl");
11228fa19c0SPekka Enberg 
1134076b041SPekka Enberg 	if (!kvm__supports_extension(self, KVM_CAP_USER_MEMORY))
114f5ab5f67SPekka Enberg 		die("KVM_CAP_USER_MEMORY is not supported");
1152da26a59SPekka Enberg 
1160d1f17ecSPekka Enberg 	self->ram_size		= 64UL * 1024UL * 1024UL;
1170d1f17ecSPekka Enberg 
1180d1f17ecSPekka Enberg 	page_size	= sysconf(_SC_PAGESIZE);
1190d1f17ecSPekka Enberg 	if (posix_memalign(&self->ram_start, page_size, self->ram_size) != 0)
1200d1f17ecSPekka Enberg 		die("out of memory");
1210d1f17ecSPekka Enberg 
1222b0e3342SPekka Enberg 	mem = (struct kvm_userspace_memory_region) {
1232b0e3342SPekka Enberg 		.slot			= 0,
1242b0e3342SPekka Enberg 		.guest_phys_addr	= 0x0UL,
1250d1f17ecSPekka Enberg 		.memory_size		= self->ram_size,
1260d1f17ecSPekka Enberg 		.userspace_addr		= (unsigned long) self->ram_start,
1272b0e3342SPekka Enberg 	};
1282b0e3342SPekka Enberg 
12973ac60e6SPekka Enberg 	ret = ioctl(self->vm_fd, KVM_SET_USER_MEMORY_REGION, &mem, 1);
1302b0e3342SPekka Enberg 	if (ret < 0)
131f5ab5f67SPekka Enberg 		die_perror("KVM_SET_USER_MEMORY_REGION ioctl");
1322b0e3342SPekka Enberg 
133895c2fefSPekka Enberg 	if (!kvm__supports_extension(self, KVM_CAP_SET_TSS_ADDR))
134f5ab5f67SPekka Enberg 		die("KVM_CAP_SET_TSS_ADDR is not supported");
135895c2fefSPekka Enberg 
13673ac60e6SPekka Enberg 	ret = ioctl(self->vm_fd, KVM_SET_TSS_ADDR, 0xfffbd000);
137895c2fefSPekka Enberg 	if (ret < 0)
138f5ab5f67SPekka Enberg 		die_perror("KVM_SET_TSS_ADDR ioctl");
139895c2fefSPekka Enberg 
14073ac60e6SPekka Enberg 	self->vcpu_fd = ioctl(self->vm_fd, KVM_CREATE_VCPU, 0);
1412b0e3342SPekka Enberg 	if (self->vcpu_fd < 0)
142f5ab5f67SPekka Enberg 		die_perror("KVM_CREATE_VCPU ioctl");
1432b0e3342SPekka Enberg 
1441f9cff23SPekka Enberg 	mmap_size = ioctl(self->sys_fd, KVM_GET_VCPU_MMAP_SIZE, 0);
1451f9cff23SPekka Enberg 	if (mmap_size < 0)
146f5ab5f67SPekka Enberg 		die_perror("KVM_GET_VCPU_MMAP_SIZE ioctl");
1471f9cff23SPekka Enberg 
1481f9cff23SPekka Enberg 	self->kvm_run = mmap(NULL, mmap_size, PROT_READ|PROT_WRITE, MAP_SHARED, self->vcpu_fd, 0);
1491f9cff23SPekka Enberg 	if (self->kvm_run == MAP_FAILED)
1501f9cff23SPekka Enberg 		die("unable to mmap vcpu fd");
1511f9cff23SPekka Enberg 
1524076b041SPekka Enberg 	return self;
1534076b041SPekka Enberg }
1544076b041SPekka Enberg 
155ae1fae34SPekka Enberg void kvm__enable_singlestep(struct kvm *self)
156aee6632eSPekka Enberg {
157aee6632eSPekka Enberg 	struct kvm_guest_debug debug = {
158aee6632eSPekka Enberg 		.control	= KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP,
159aee6632eSPekka Enberg 	};
160aee6632eSPekka Enberg 
161aee6632eSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_GUEST_DEBUG, &debug) < 0)
162b625d4b6SCyrill Gorcunov 		warning("KVM_SET_GUEST_DEBUG failed");
163aee6632eSPekka Enberg }
164aee6632eSPekka Enberg 
/*
 * Real-mode selector and offset at which the boot image is placed in guest
 * memory, and the initial stack pointer handed to the guest.
 */
#define BOOT_LOADER_SELECTOR 0x1000
#define BOOT_LOADER_IP 0x0000
#define BOOT_LOADER_SP 0x8000
168009b0758SPekka Enberg 
169edc8a14dSPekka Enberg static int load_flat_binary(struct kvm *self, int fd)
170009b0758SPekka Enberg {
171009b0758SPekka Enberg 	void *p;
172009b0758SPekka Enberg 	int nr;
173009b0758SPekka Enberg 
174009b0758SPekka Enberg 	if (lseek(fd, 0, SEEK_SET) < 0)
175009b0758SPekka Enberg 		die_perror("lseek");
176009b0758SPekka Enberg 
1776753ed2fSPekka Enberg 	p = guest_real_to_host(self, BOOT_LOADER_SELECTOR, BOOT_LOADER_IP);
178009b0758SPekka Enberg 
179009b0758SPekka Enberg 	while ((nr = read(fd, p, 65536)) > 0)
180009b0758SPekka Enberg 		p += nr;
181009b0758SPekka Enberg 
182dbdb74c2SPekka Enberg 	self->boot_selector	= BOOT_LOADER_SELECTOR;
183edc8a14dSPekka Enberg 	self->boot_ip		= BOOT_LOADER_IP;
184dbdb74c2SPekka Enberg 	self->boot_sp		= BOOT_LOADER_SP;
185edc8a14dSPekka Enberg 
1867fb218bdSPekka Enberg 	return true;
187009b0758SPekka Enberg }
188009b0758SPekka Enberg 
/*
 * The protected mode kernel part of a modern bzImage is loaded at 1 MB by
 * default.
 */
#define BZ_KERNEL_START			0x100000UL

/* Signature compared against the bzImage setup header. */
static const char *BZIMAGE_MAGIC	= "HdrS";

/*
 * Body of the fake interrupt handler installed by the bzImage loader: a
 * single 0xcf (iret) byte. Stored as unsigned char because 0xcf does not fit
 * in a signed char.
 */
static const unsigned char fakebios_vector[]	= { 0xcf };

/* Number of setup sectors assumed when the header field is zero. */
#define BZ_DEFAULT_SETUP_SECTS		4
19910943d14SPekka Enberg 
2006d1f350dSCyrill Gorcunov static bool load_bzimage(struct kvm *self, int fd, const char *kernel_cmdline)
201ae1fae34SPekka Enberg {
202bc75b0aeSCyrill Gorcunov 	struct real_intr_desc intr;
20322489bb0SCyrill Gorcunov 	struct boot_params boot;
2044b62331fSPekka Enberg 	unsigned long setup_sects;
2057fb218bdSPekka Enberg 	ssize_t setup_size;
20622489bb0SCyrill Gorcunov 	void *p;
207ae1fae34SPekka Enberg 	int nr;
208ae1fae34SPekka Enberg 
2095d67eaf6SPekka Enberg 	/*
2105d67eaf6SPekka Enberg 	 * See Documentation/x86/boot.txt for details no bzImage on-disk and
2115d67eaf6SPekka Enberg 	 * memory layout.
2125d67eaf6SPekka Enberg 	 */
2135d67eaf6SPekka Enberg 
214009b0758SPekka Enberg 	if (lseek(fd, 0, SEEK_SET) < 0)
215009b0758SPekka Enberg 		die_perror("lseek");
216009b0758SPekka Enberg 
217ae1fae34SPekka Enberg 	read(fd, &boot, sizeof(boot));
218ae1fae34SPekka Enberg 
219ae1fae34SPekka Enberg         if (memcmp(&boot.hdr.header, BZIMAGE_MAGIC, strlen(BZIMAGE_MAGIC)) != 0)
2207fb218bdSPekka Enberg 		return false;
221ae1fae34SPekka Enberg 
222e93ab78aSPekka Enberg 	if (lseek(fd, 0, SEEK_SET) < 0)
223e93ab78aSPekka Enberg 		die_perror("lseek");
224e93ab78aSPekka Enberg 
2254cf542bbSCyrill Gorcunov 	if (!boot.hdr.setup_sects)
2264cf542bbSCyrill Gorcunov 		boot.hdr.setup_sects = BZ_DEFAULT_SETUP_SECTS;
22710943d14SPekka Enberg 	setup_sects = boot.hdr.setup_sects + 1;
22810943d14SPekka Enberg 
22954d4a626SPekka Enberg 	setup_size = setup_sects << 9;
2306753ed2fSPekka Enberg 	p = guest_real_to_host(self, BOOT_LOADER_SELECTOR, BOOT_LOADER_IP);
231ae1fae34SPekka Enberg 
2327fb218bdSPekka Enberg 	if (read(fd, p, setup_size) != setup_size)
2337fb218bdSPekka Enberg 		die_perror("read");
2347fb218bdSPekka Enberg 
2356753ed2fSPekka Enberg 	p = guest_flat_to_host(self, BZ_KERNEL_START);
236ae1fae34SPekka Enberg 
237ae1fae34SPekka Enberg 	while ((nr = read(fd, p, 65536)) > 0)
238ae1fae34SPekka Enberg 		p += nr;
239ae1fae34SPekka Enberg 
240dbdb74c2SPekka Enberg 	self->boot_selector	= BOOT_LOADER_SELECTOR;
241edc8a14dSPekka Enberg 	/*
242edc8a14dSPekka Enberg 	 * The real-mode setup code starts at offset 0x200 of a bzImage. See
243edc8a14dSPekka Enberg 	 * Documentation/x86/boot.txt for details.
244edc8a14dSPekka Enberg 	 */
245edc8a14dSPekka Enberg 	self->boot_ip		= BOOT_LOADER_IP + 0x200;
246dbdb74c2SPekka Enberg 	self->boot_sp		= BOOT_LOADER_SP;
247edc8a14dSPekka Enberg 
248ea684828SCyrill Gorcunov 	/*
24922489bb0SCyrill Gorcunov 	 * Setup a *fake* real mode vector table, it has only
25022489bb0SCyrill Gorcunov 	 * one real hadler which does just iret
25122489bb0SCyrill Gorcunov 	 *
25222489bb0SCyrill Gorcunov 	 * we need a place for 1 byte so lets put
25322489bb0SCyrill Gorcunov 	 * it where the BIOS lives -- BDA area
254ea684828SCyrill Gorcunov 	 */
25522489bb0SCyrill Gorcunov 	p = guest_flat_to_host(self, BDA_START);
25622489bb0SCyrill Gorcunov 	memcpy(p, fakebios_vector, sizeof(fakebios_vector));
257bc75b0aeSCyrill Gorcunov 	intr = (struct real_intr_desc) {
25822489bb0SCyrill Gorcunov 		.segment	= BDA_START >> 4,
25922489bb0SCyrill Gorcunov 		.offset		= 0,
260ea684828SCyrill Gorcunov 	};
261ea684828SCyrill Gorcunov 	p = guest_flat_to_host(self, 0);
262bc75b0aeSCyrill Gorcunov 	interrupt_table__setup(&self->interrupt_table, &intr);
263bc75b0aeSCyrill Gorcunov 	interrupt_table__copy(&self->interrupt_table, p, REAL_INTR_SIZE);
264ea684828SCyrill Gorcunov 
2657fb218bdSPekka Enberg 	return true;
266ae1fae34SPekka Enberg }
267ae1fae34SPekka Enberg 
/*
 * Load the kernel image @kernel_filename into guest memory.
 *
 * The file is first tried as a bzImage and, if that is rejected, as a flat
 * binary. The file descriptor is closed once loading is finished. Failing to
 * open the file, or a file accepted by neither loader, is fatal.
 *
 * Returns true on success.
 */
bool kvm__load_kernel(struct kvm *kvm, const char *kernel_filename,
			const char *kernel_cmdline)
{
	bool ret;
	int fd;

	fd = open(kernel_filename, O_RDONLY);
	if (fd < 0)
		die("unable to open kernel");

	ret = load_bzimage(kvm, fd, kernel_cmdline);
	if (!ret)
		ret = load_flat_binary(kvm, fd);

	/* The image has been copied into guest RAM; the fd is no longer needed. */
	close(fd);

	if (!ret)
		die("%s is not a valid bzImage or flat binary", kernel_filename);

	return ret;
}
291ae1fae34SPekka Enberg 
29206e41eeaSPekka Enberg static inline uint64_t ip_flat_to_real(struct kvm *self, uint64_t ip)
29306e41eeaSPekka Enberg {
29406e41eeaSPekka Enberg 	uint64_t cs = self->sregs.cs.selector;
29506e41eeaSPekka Enberg 
29606e41eeaSPekka Enberg 	return ip - (cs << 4);
29706e41eeaSPekka Enberg }
29806e41eeaSPekka Enberg 
299*f326512aSPekka Enberg static inline uint64_t ip_to_flat(struct kvm *self, uint64_t ip)
30006e41eeaSPekka Enberg {
301*f326512aSPekka Enberg 	uint64_t cs;
302*f326512aSPekka Enberg 
303*f326512aSPekka Enberg 	/*
304*f326512aSPekka Enberg 	 * NOTE! We should take code segment base address into account here.
305*f326512aSPekka Enberg 	 * Luckily it's usually zero because Linux uses flat memory model.
306*f326512aSPekka Enberg 	 */
307*f326512aSPekka Enberg 	if (self->sregs.cr0 & 0x01)
308*f326512aSPekka Enberg 		return ip;
309*f326512aSPekka Enberg 
310*f326512aSPekka Enberg 	cs = self->sregs.cs.selector;
31106e41eeaSPekka Enberg 
31206e41eeaSPekka Enberg 	return ip + (cs << 4);
31306e41eeaSPekka Enberg }
31406e41eeaSPekka Enberg 
/*
 * Compute the segment base that goes with @selector in real mode.
 *
 * KVM on Intel requires 'base' to be 'selector * 16' in real mode.
 */
static inline uint32_t selector_to_base(uint16_t selector)
{
	uint32_t base = selector;

	return base << 4;
}
322dbdb74c2SPekka Enberg 
3237fb218bdSPekka Enberg void kvm__reset_vcpu(struct kvm *self)
324ae1fae34SPekka Enberg {
32553602077SPekka Enberg 	self->sregs = (struct kvm_sregs) {
32653602077SPekka Enberg 		.cr0		= 0x60000010ULL,
32753602077SPekka Enberg 		.cs		= (struct kvm_segment) {
328dbdb74c2SPekka Enberg 			.selector	= self->boot_selector,
329dbdb74c2SPekka Enberg 			.base		= selector_to_base(self->boot_selector),
33053602077SPekka Enberg 			.limit		= 0xffffU,
33153602077SPekka Enberg 			.type		= 0x0bU,
33253602077SPekka Enberg 			.present	= 1,
33353602077SPekka Enberg 			.dpl		= 0x03,
33453602077SPekka Enberg 			.s		= 1,
33553602077SPekka Enberg 		},
33653602077SPekka Enberg 		.ss		= (struct kvm_segment) {
337dbdb74c2SPekka Enberg 			.selector	= self->boot_selector,
338dbdb74c2SPekka Enberg 			.base		= selector_to_base(self->boot_selector),
33953602077SPekka Enberg 			.limit		= 0xffffU,
34053602077SPekka Enberg 			.type		= 0x03U,
34153602077SPekka Enberg 			.present	= 1,
34253602077SPekka Enberg 			.dpl		= 0x03,
34353602077SPekka Enberg 			.s		= 1,
34453602077SPekka Enberg 		},
34553602077SPekka Enberg 		.ds		= (struct kvm_segment) {
346dbdb74c2SPekka Enberg 			.selector	= self->boot_selector,
347dbdb74c2SPekka Enberg 			.base		= selector_to_base(self->boot_selector),
34853602077SPekka Enberg 			.limit		= 0xffffU,
34953602077SPekka Enberg 			.type		= 0x03U,
35053602077SPekka Enberg 			.present	= 1,
35153602077SPekka Enberg 			.dpl		= 0x03,
35253602077SPekka Enberg 			.s		= 1,
35353602077SPekka Enberg 		},
35453602077SPekka Enberg 		.es		= (struct kvm_segment) {
355dbdb74c2SPekka Enberg 			.selector	= self->boot_selector,
356dbdb74c2SPekka Enberg 			.base		= selector_to_base(self->boot_selector),
35753602077SPekka Enberg 			.limit		= 0xffffU,
35853602077SPekka Enberg 			.type		= 0x03U,
35953602077SPekka Enberg 			.present	= 1,
36053602077SPekka Enberg 			.dpl		= 0x03,
36153602077SPekka Enberg 			.s		= 1,
36253602077SPekka Enberg 		},
36353602077SPekka Enberg 		.fs		= (struct kvm_segment) {
364dbdb74c2SPekka Enberg 			.selector	= self->boot_selector,
365dbdb74c2SPekka Enberg 			.base		= selector_to_base(self->boot_selector),
36653602077SPekka Enberg 			.limit		= 0xffffU,
36753602077SPekka Enberg 			.type		= 0x03U,
36853602077SPekka Enberg 			.present	= 1,
36953602077SPekka Enberg 			.dpl		= 0x03,
37053602077SPekka Enberg 			.s		= 1,
37153602077SPekka Enberg 		},
37253602077SPekka Enberg 		.gs		= (struct kvm_segment) {
373dbdb74c2SPekka Enberg 			.selector	= self->boot_selector,
374dbdb74c2SPekka Enberg 			.base		= selector_to_base(self->boot_selector),
37553602077SPekka Enberg 			.limit		= 0xffffU,
37653602077SPekka Enberg 			.type		= 0x03U,
37753602077SPekka Enberg 			.present	= 1,
37853602077SPekka Enberg 			.dpl		= 0x03,
37953602077SPekka Enberg 			.s		= 1,
38053602077SPekka Enberg 		},
38153602077SPekka Enberg 		.tr		= (struct kvm_segment) {
38253602077SPekka Enberg 			.limit		= 0xffffU,
38353602077SPekka Enberg 			.present	= 1,
38453602077SPekka Enberg 			.type		= 0x03U,
38553602077SPekka Enberg 		},
38653602077SPekka Enberg 		.ldt		= (struct kvm_segment) {
38753602077SPekka Enberg 			.limit		= 0xffffU,
38853602077SPekka Enberg 			.present	= 1,
3897085d935SPekka Enberg 			.type		= 0x02U,
39053602077SPekka Enberg 		},
39153602077SPekka Enberg 		.gdt		= (struct kvm_dtable) {
39253602077SPekka Enberg 			.limit		= 0xffffU,
39353602077SPekka Enberg 		},
39453602077SPekka Enberg 		.idt		= (struct kvm_dtable) {
39553602077SPekka Enberg 			.limit		= 0xffffU,
39653602077SPekka Enberg 		},
39753602077SPekka Enberg 	};
39853602077SPekka Enberg 
39953602077SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_SREGS, &self->sregs) < 0)
40053602077SPekka Enberg 		die_perror("KVM_SET_SREGS failed");
40106e41eeaSPekka Enberg 
40206e41eeaSPekka Enberg 	self->regs = (struct kvm_regs) {
40306e41eeaSPekka Enberg 		/* We start the guest in 16-bit real mode  */
40406e41eeaSPekka Enberg 		.rflags		= 0x0000000000000002ULL,
405dbdb74c2SPekka Enberg 
406dbdb74c2SPekka Enberg 		.rip		= self->boot_ip,
407dbdb74c2SPekka Enberg 		.rsp		= self->boot_sp,
408dbdb74c2SPekka Enberg 		.rbp		= self->boot_sp,
40906e41eeaSPekka Enberg 	};
41006e41eeaSPekka Enberg 
41106e41eeaSPekka Enberg 	if (self->regs.rip > USHRT_MAX)
41206e41eeaSPekka Enberg 		die("ip 0x%" PRIx64 " is too high for real mode", (uint64_t) self->regs.rip);
41306e41eeaSPekka Enberg 
41406e41eeaSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_REGS, &self->regs) < 0)
41506e41eeaSPekka Enberg 		die_perror("KVM_SET_REGS failed");
41606e41eeaSPekka Enberg 
417ce4d0766SPekka Enberg 	self->fpu = (struct kvm_fpu) {
418ce4d0766SPekka Enberg 		.fcw		= 0x37f,
419ce4d0766SPekka Enberg 		.mxcsr		= 0x1f80,
420ce4d0766SPekka Enberg 	};
421ce4d0766SPekka Enberg 
422ce4d0766SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_FPU, &self->fpu) < 0)
423ce4d0766SPekka Enberg 		die_perror("KVM_SET_FPU failed");
424ce4d0766SPekka Enberg 
425ae1fae34SPekka Enberg }
426ae1fae34SPekka Enberg 
427ae1fae34SPekka Enberg void kvm__run(struct kvm *self)
428ae1fae34SPekka Enberg {
429ae1fae34SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_RUN, 0) < 0)
430ae1fae34SPekka Enberg 		die_perror("KVM_RUN failed");
431ae1fae34SPekka Enberg }
432ae1fae34SPekka Enberg 
43353602077SPekka Enberg static void print_segment(const char *name, struct kvm_segment *seg)
43453602077SPekka Enberg {
435ce556636SPekka Enberg 	printf(" %s       %04" PRIx16 "      %016" PRIx64 "  %08" PRIx32 "  %02" PRIx8 "    %x %x   %x  %x %x %x %x\n",
43653602077SPekka Enberg 		name, (uint16_t) seg->selector, (uint64_t) seg->base, (uint32_t) seg->limit,
437ce556636SPekka Enberg 		(uint8_t) seg->type, seg->present, seg->dpl, seg->db, seg->s, seg->l, seg->g, seg->avl);
43853602077SPekka Enberg }
43953602077SPekka Enberg 
440ae1fae34SPekka Enberg void kvm__show_registers(struct kvm *self)
4417118d2caSPekka Enberg {
44253602077SPekka Enberg 	unsigned long cr0, cr2, cr3;
44353602077SPekka Enberg 	unsigned long cr4, cr8;
4447118d2caSPekka Enberg 	unsigned long rax, rbx, rcx;
4457118d2caSPekka Enberg 	unsigned long rdx, rsi, rdi;
4467118d2caSPekka Enberg 	unsigned long rbp,  r8,  r9;
4477118d2caSPekka Enberg 	unsigned long r10, r11, r12;
4487118d2caSPekka Enberg 	unsigned long r13, r14, r15;
4497118d2caSPekka Enberg 	unsigned long rip, rsp;
45053602077SPekka Enberg 	struct kvm_sregs sregs;
451a2fe6199SPekka Enberg 	unsigned long rflags;
4527118d2caSPekka Enberg 	struct kvm_regs regs;
453ce5e0ecbSPekka Enberg 	int i;
4547118d2caSPekka Enberg 
4557118d2caSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_REGS, &regs) < 0)
4567118d2caSPekka Enberg 		die("KVM_GET_REGS failed");
4577118d2caSPekka Enberg 
458a2fe6199SPekka Enberg 	rflags = regs.rflags;
459a2fe6199SPekka Enberg 
4607118d2caSPekka Enberg 	rip = regs.rip; rsp = regs.rsp;
4617118d2caSPekka Enberg 	rax = regs.rax; rbx = regs.rbx; rcx = regs.rcx;
4627118d2caSPekka Enberg 	rdx = regs.rdx; rsi = regs.rsi; rdi = regs.rdi;
4637118d2caSPekka Enberg 	rbp = regs.rbp; r8  = regs.r8;  r9  = regs.r9;
4647118d2caSPekka Enberg 	r10 = regs.r10; r11 = regs.r11; r12 = regs.r12;
4657118d2caSPekka Enberg 	r13 = regs.r13; r14 = regs.r14; r15 = regs.r15;
4667118d2caSPekka Enberg 
4677118d2caSPekka Enberg 	printf("Registers:\n");
4682177ec43SPekka Enberg 	printf(" rip: %016lx   rsp: %016lx flags: %016lx\n", rip, rsp, rflags);
469ea2e4ea0SCyrill Gorcunov 	printf(" rax: %016lx   rbx: %016lx   rcx: %016lx\n", rax, rbx, rcx);
4707118d2caSPekka Enberg 	printf(" rdx: %016lx   rsi: %016lx   rdi: %016lx\n", rdx, rsi, rdi);
4717118d2caSPekka Enberg 	printf(" rbp: %016lx   r8:  %016lx   r9:  %016lx\n", rbp, r8,  r9);
4727118d2caSPekka Enberg 	printf(" r10: %016lx   r11: %016lx   r12: %016lx\n", r10, r11, r12);
4737118d2caSPekka Enberg 	printf(" r13: %016lx   r14: %016lx   r15: %016lx\n", r13, r14, r15);
47453602077SPekka Enberg 
47553602077SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_SREGS, &sregs) < 0)
47653602077SPekka Enberg 		die("KVM_GET_REGS failed");
47753602077SPekka Enberg 
47853602077SPekka Enberg 	cr0 = sregs.cr0; cr2 = sregs.cr2; cr3 = sregs.cr3;
47953602077SPekka Enberg 	cr4 = sregs.cr4; cr8 = sregs.cr8;
48053602077SPekka Enberg 
48153602077SPekka Enberg 	printf(" cr0: %016lx   cr2: %016lx   cr3: %016lx\n", cr0, cr2, cr3);
48253602077SPekka Enberg 	printf(" cr4: %016lx   cr8: %016lx\n", cr4, cr8);
483ce5e0ecbSPekka Enberg 	printf("Segment registers:\n");
484ce556636SPekka Enberg 	printf(" register  selector  base              limit     type  p dpl db s l g avl\n");
48553602077SPekka Enberg 	print_segment("cs ", &sregs.cs);
48653602077SPekka Enberg 	print_segment("ss ", &sregs.ss);
48753602077SPekka Enberg 	print_segment("ds ", &sregs.ds);
48853602077SPekka Enberg 	print_segment("es ", &sregs.es);
48953602077SPekka Enberg 	print_segment("fs ", &sregs.fs);
49053602077SPekka Enberg 	print_segment("gs ", &sregs.gs);
491ce5e0ecbSPekka Enberg 	print_segment("tr ", &sregs.tr);
492ce5e0ecbSPekka Enberg 	print_segment("ldt", &sregs.ldt);
4932049569dSPekka Enberg 	printf(" [ efer: %016lx  apic base: %016lx  nmi: %s ]\n", (uint64_t) sregs.efer, (uint64_t) sregs.apic_base,
4942049569dSPekka Enberg 		(self->nmi_disabled ? "disabled" : "enabled"));
495ce5e0ecbSPekka Enberg 	printf("Interrupt bitmap:\n");
496ce5e0ecbSPekka Enberg 	printf(" ");
497ce5e0ecbSPekka Enberg 	for (i = 0; i < (KVM_NR_INTERRUPTS + 63) / 64; i++)
498ce5e0ecbSPekka Enberg 		printf("%016lx ", (uint64_t) sregs.interrupt_bitmap[i]);
499ce5e0ecbSPekka Enberg 	printf("\n");
5007118d2caSPekka Enberg }
5017118d2caSPekka Enberg 
502ae1fae34SPekka Enberg void kvm__show_code(struct kvm *self)
5036f10be05SPekka Enberg {
5046f10be05SPekka Enberg 	unsigned int code_bytes = 64;
5056f10be05SPekka Enberg 	unsigned int code_prologue = code_bytes * 43 / 64;
5066f10be05SPekka Enberg 	unsigned int code_len = code_bytes;
5076f10be05SPekka Enberg 	unsigned char c;
508ae1fae34SPekka Enberg 	unsigned int i;
5096f10be05SPekka Enberg 	uint8_t *ip;
5106f10be05SPekka Enberg 
5112a601aafSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_REGS, &self->regs) < 0)
5122a601aafSPekka Enberg 		die("KVM_GET_REGS failed");
5132a601aafSPekka Enberg 
5142a601aafSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_SREGS, &self->sregs) < 0)
5152a601aafSPekka Enberg 		die("KVM_GET_SREGS failed");
5162a601aafSPekka Enberg 
517*f326512aSPekka Enberg 	ip = guest_flat_to_host(self, ip_to_flat(self, self->regs.rip) - code_prologue);
5186f10be05SPekka Enberg 
5196f10be05SPekka Enberg 	printf("Code: ");
5206f10be05SPekka Enberg 
5216f10be05SPekka Enberg 	for (i = 0; i < code_len; i++, ip++) {
5226e8abc38SPekka Enberg 		c = *ip;
5236e8abc38SPekka Enberg 
524*f326512aSPekka Enberg 		if (ip == guest_flat_to_host(self, ip_to_flat(self, self->regs.rip)))
5256f10be05SPekka Enberg 			printf("<%02x> ", c);
5266f10be05SPekka Enberg 		else
5276f10be05SPekka Enberg 			printf("%02x ", c);
5286f10be05SPekka Enberg 	}
5296f10be05SPekka Enberg 
5306f10be05SPekka Enberg 	printf("\n");
5316f10be05SPekka Enberg }
532