xref: /kvmtool/kvm.c (revision ae1fae34a8e9b97d1e999fb0b82813d282376e11)
1*ae1fae34SPekka Enberg #include "kvm/kvm.h"
2*ae1fae34SPekka Enberg 
36c7d8514SPekka Enberg #include <linux/kvm.h>
4f5ab5f67SPekka Enberg 
5f5ab5f67SPekka Enberg #include <asm/bootparam.h>
6f5ab5f67SPekka Enberg 
7*ae1fae34SPekka Enberg #include <sys/ioctl.h>
81f9cff23SPekka Enberg #include <inttypes.h>
91f9cff23SPekka Enberg #include <sys/mman.h>
102da26a59SPekka Enberg #include <stdbool.h>
11f5ab5f67SPekka Enberg #include <stdarg.h>
12b8f6afcdSPekka Enberg #include <stdlib.h>
13f5ab5f67SPekka Enberg #include <string.h>
140d1f17ecSPekka Enberg #include <unistd.h>
151f9cff23SPekka Enberg #include <stdio.h>
16b8f6afcdSPekka Enberg #include <fcntl.h>
17b8f6afcdSPekka Enberg 
18ad054a21SCyrill Gorcunov #include "util.h"
19ad054a21SCyrill Gorcunov 
/*
 * Compatibility fallback: supply KVM_EXIT_INTERNAL_ERROR when the headers
 * included above do not define it.  Remove this when we move to tools/kvm.
 */
#if !defined(KVM_EXIT_INTERNAL_ERROR)
# define KVM_EXIT_INTERNAL_ERROR		17
#endif
261f9cff23SPekka Enberg 
27*ae1fae34SPekka Enberg #define DEFINE_KVM_EXIT_REASON(reason) [reason] = #reason
280d1f17ecSPekka Enberg 
29*ae1fae34SPekka Enberg const char *kvm_exit_reasons[] = {
30*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_UNKNOWN),
31*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_EXCEPTION),
32*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_IO),
33*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_HYPERCALL),
34*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_DEBUG),
35*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_HLT),
36*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_MMIO),
37*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_IRQ_WINDOW_OPEN),
38*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_SHUTDOWN),
39*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_FAIL_ENTRY),
40*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTR),
41*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_SET_TPR),
42*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_TPR_ACCESS),
43*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_SIEIC),
44*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_RESET),
45*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_DCR),
46*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_NMI),
47*ae1fae34SPekka Enberg 	DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTERNAL_ERROR),
489b1fb1c3SPekka Enberg };
499b1fb1c3SPekka Enberg 
50*ae1fae34SPekka Enberg static inline void *guest_addr_to_host(struct kvm *self, unsigned long offset)
51*ae1fae34SPekka Enberg {
52*ae1fae34SPekka Enberg 	return self->ram_start + offset;
53*ae1fae34SPekka Enberg }
54*ae1fae34SPekka Enberg 
55*ae1fae34SPekka Enberg static bool kvm__supports_extension(struct kvm *self, unsigned int extension)
56b8f6afcdSPekka Enberg {
5728fa19c0SPekka Enberg 	int ret;
58b8f6afcdSPekka Enberg 
5973ac60e6SPekka Enberg 	ret = ioctl(self->sys_fd, KVM_CHECK_EXTENSION, extension);
604076b041SPekka Enberg 	if (ret < 0)
614076b041SPekka Enberg 		return false;
624076b041SPekka Enberg 
634076b041SPekka Enberg 	return ret;
644076b041SPekka Enberg }
654076b041SPekka Enberg 
664076b041SPekka Enberg static struct kvm *kvm__new(void)
674076b041SPekka Enberg {
684076b041SPekka Enberg 	struct kvm *self = calloc(1, sizeof *self);
694076b041SPekka Enberg 
704076b041SPekka Enberg 	if (!self)
714076b041SPekka Enberg 		die("out of memory");
724076b041SPekka Enberg 
734076b041SPekka Enberg 	return self;
744076b041SPekka Enberg }
754076b041SPekka Enberg 
76*ae1fae34SPekka Enberg struct kvm *kvm__init(void)
774076b041SPekka Enberg {
782b0e3342SPekka Enberg 	struct kvm_userspace_memory_region mem;
794076b041SPekka Enberg 	struct kvm *self;
800d1f17ecSPekka Enberg 	long page_size;
811f9cff23SPekka Enberg 	int mmap_size;
824076b041SPekka Enberg 	int ret;
834076b041SPekka Enberg 
844076b041SPekka Enberg 	self = kvm__new();
854076b041SPekka Enberg 
8673ac60e6SPekka Enberg 	self->sys_fd = open("/dev/kvm", O_RDWR);
8773ac60e6SPekka Enberg 	if (self->sys_fd < 0)
88f5ab5f67SPekka Enberg 		die_perror("open");
89b8f6afcdSPekka Enberg 
9073ac60e6SPekka Enberg 	ret = ioctl(self->sys_fd, KVM_GET_API_VERSION, 0);
916c7d8514SPekka Enberg 	if (ret != KVM_API_VERSION)
92f5ab5f67SPekka Enberg 		die_perror("KVM_API_VERSION ioctl");
936c7d8514SPekka Enberg 
9473ac60e6SPekka Enberg 	self->vm_fd = ioctl(self->sys_fd, KVM_CREATE_VM, 0);
9573ac60e6SPekka Enberg 	if (self->vm_fd < 0)
96f5ab5f67SPekka Enberg 		die_perror("KVM_CREATE_VM ioctl");
9728fa19c0SPekka Enberg 
984076b041SPekka Enberg 	if (!kvm__supports_extension(self, KVM_CAP_USER_MEMORY))
99f5ab5f67SPekka Enberg 		die("KVM_CAP_USER_MEMORY is not supported");
1002da26a59SPekka Enberg 
1010d1f17ecSPekka Enberg 	self->ram_size		= 64UL * 1024UL * 1024UL;
1020d1f17ecSPekka Enberg 
1030d1f17ecSPekka Enberg 	page_size	= sysconf(_SC_PAGESIZE);
1040d1f17ecSPekka Enberg 	if (posix_memalign(&self->ram_start, page_size, self->ram_size) != 0)
1050d1f17ecSPekka Enberg 		die("out of memory");
1060d1f17ecSPekka Enberg 
1072b0e3342SPekka Enberg 	mem = (struct kvm_userspace_memory_region) {
1082b0e3342SPekka Enberg 		.slot			= 0,
1092b0e3342SPekka Enberg 		.guest_phys_addr	= 0x0UL,
1100d1f17ecSPekka Enberg 		.memory_size		= self->ram_size,
1110d1f17ecSPekka Enberg 		.userspace_addr		= (unsigned long) self->ram_start,
1122b0e3342SPekka Enberg 	};
1132b0e3342SPekka Enberg 
11473ac60e6SPekka Enberg 	ret = ioctl(self->vm_fd, KVM_SET_USER_MEMORY_REGION, &mem, 1);
1152b0e3342SPekka Enberg 	if (ret < 0)
116f5ab5f67SPekka Enberg 		die_perror("KVM_SET_USER_MEMORY_REGION ioctl");
1172b0e3342SPekka Enberg 
118895c2fefSPekka Enberg 	if (!kvm__supports_extension(self, KVM_CAP_SET_TSS_ADDR))
119f5ab5f67SPekka Enberg 		die("KVM_CAP_SET_TSS_ADDR is not supported");
120895c2fefSPekka Enberg 
12173ac60e6SPekka Enberg 	ret = ioctl(self->vm_fd, KVM_SET_TSS_ADDR, 0xfffbd000);
122895c2fefSPekka Enberg 	if (ret < 0)
123f5ab5f67SPekka Enberg 		die_perror("KVM_SET_TSS_ADDR ioctl");
124895c2fefSPekka Enberg 
12573ac60e6SPekka Enberg 	self->vcpu_fd = ioctl(self->vm_fd, KVM_CREATE_VCPU, 0);
1262b0e3342SPekka Enberg 	if (self->vcpu_fd < 0)
127f5ab5f67SPekka Enberg 		die_perror("KVM_CREATE_VCPU ioctl");
1282b0e3342SPekka Enberg 
1291f9cff23SPekka Enberg 	mmap_size = ioctl(self->sys_fd, KVM_GET_VCPU_MMAP_SIZE, 0);
1301f9cff23SPekka Enberg 	if (mmap_size < 0)
131f5ab5f67SPekka Enberg 		die_perror("KVM_GET_VCPU_MMAP_SIZE ioctl");
1321f9cff23SPekka Enberg 
1331f9cff23SPekka Enberg 	self->kvm_run = mmap(NULL, mmap_size, PROT_READ|PROT_WRITE, MAP_SHARED, self->vcpu_fd, 0);
1341f9cff23SPekka Enberg 	if (self->kvm_run == MAP_FAILED)
1351f9cff23SPekka Enberg 		die("unable to mmap vcpu fd");
1361f9cff23SPekka Enberg 
1374076b041SPekka Enberg 	return self;
1384076b041SPekka Enberg }
1394076b041SPekka Enberg 
140*ae1fae34SPekka Enberg void kvm__enable_singlestep(struct kvm *self)
141aee6632eSPekka Enberg {
142aee6632eSPekka Enberg 	struct kvm_guest_debug debug = {
143aee6632eSPekka Enberg 		.control	= KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP,
144aee6632eSPekka Enberg 	};
145aee6632eSPekka Enberg 
146aee6632eSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_GUEST_DEBUG, &debug) < 0)
147b625d4b6SCyrill Gorcunov 		warning("KVM_SET_GUEST_DEBUG failed");
148aee6632eSPekka Enberg }
149aee6632eSPekka Enberg 
150*ae1fae34SPekka Enberg /* bzImages are loaded at 1 MB by default.  */
151*ae1fae34SPekka Enberg #define KERNEL_START_ADDR	(1024ULL * 1024ULL)
152*ae1fae34SPekka Enberg 
153*ae1fae34SPekka Enberg static const char *BZIMAGE_MAGIC	= "HdrS";
154*ae1fae34SPekka Enberg 
155*ae1fae34SPekka Enberg static uint32_t load_bzimage(struct kvm *kvm, int fd)
156*ae1fae34SPekka Enberg {
157*ae1fae34SPekka Enberg 	struct boot_params boot;
158*ae1fae34SPekka Enberg 	void *p;
159*ae1fae34SPekka Enberg 	int nr;
160*ae1fae34SPekka Enberg 
161*ae1fae34SPekka Enberg 	read(fd, &boot, sizeof(boot));
162*ae1fae34SPekka Enberg 
163*ae1fae34SPekka Enberg         if (memcmp(&boot.hdr.header, BZIMAGE_MAGIC, strlen(BZIMAGE_MAGIC)) != 0)
164*ae1fae34SPekka Enberg 		return 0;
165*ae1fae34SPekka Enberg 
166*ae1fae34SPekka Enberg 	lseek(fd, (boot.hdr.setup_sects+1) * 512, SEEK_SET);
167*ae1fae34SPekka Enberg 
168*ae1fae34SPekka Enberg 	p = guest_addr_to_host(kvm, KERNEL_START_ADDR);
169*ae1fae34SPekka Enberg 
170*ae1fae34SPekka Enberg 	while ((nr = read(fd, p, 65536)) > 0)
171*ae1fae34SPekka Enberg 		p += nr;
172*ae1fae34SPekka Enberg 
173*ae1fae34SPekka Enberg 	return boot.hdr.code32_start;
174*ae1fae34SPekka Enberg }
175*ae1fae34SPekka Enberg 
/*
 * Load the kernel image @kernel_filename into the guest RAM of @kvm.
 *
 * Returns the value produced by load_bzimage() (the image's code32_start
 * field).  The program is terminated when the file cannot be opened or is
 * not accepted as a bzImage.
 */
uint32_t kvm__load_kernel(struct kvm *kvm, const char *kernel_filename)
{
	uint32_t ret;
	int fd;

	fd = open(kernel_filename, O_RDONLY);
	if (fd < 0)
		die_perror(kernel_filename);

	ret = load_bzimage(kvm, fd);

	/* The image has been copied into guest RAM; the file is no longer needed. */
	close(fd);

	if (!ret)
		die("%s is not a valid bzImage", kernel_filename);

	return ret;
}
191*ae1fae34SPekka Enberg 
192*ae1fae34SPekka Enberg void kvm__reset_vcpu(struct kvm *self, uint64_t rip)
193*ae1fae34SPekka Enberg {
194*ae1fae34SPekka Enberg 	self->regs.rip		= rip;
195*ae1fae34SPekka Enberg 	self->regs.rflags	= 0x0000000000000002ULL;
196*ae1fae34SPekka Enberg 
197*ae1fae34SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_SET_REGS, &self->regs) < 0)
198*ae1fae34SPekka Enberg 		die_perror("KVM_SET_REGS failed");
199*ae1fae34SPekka Enberg }
200*ae1fae34SPekka Enberg 
201*ae1fae34SPekka Enberg void kvm__run(struct kvm *self)
202*ae1fae34SPekka Enberg {
203*ae1fae34SPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_RUN, 0) < 0)
204*ae1fae34SPekka Enberg 		die_perror("KVM_RUN failed");
205*ae1fae34SPekka Enberg }
206*ae1fae34SPekka Enberg 
/*
 * Handler for guest port writes.  It performs no emulation: it only logs
 * the port, access size and repeat count to stderr.  @self and @data are
 * currently unused.
 */
static void kvm__emulate_io_out(struct kvm *self, uint16_t port, void *data, int size, uint32_t count)
{
	(void) self;
	(void) data;

	fprintf(stderr, "%s port=%x, size=%d, count=%" PRIu32 "\n",
		__func__, port, size, count);
}
211*ae1fae34SPekka Enberg 
/*
 * Handler for guest port reads.  It performs no emulation and stores
 * nothing in @data: it only logs the port, access size and repeat count to
 * stderr.  @self and @data are currently unused.
 */
static void kvm__emulate_io_in(struct kvm *self, uint16_t port, void *data, int size, uint32_t count)
{
	(void) self;
	(void) data;

	fprintf(stderr, "%s port=%x, size=%d, count=%" PRIu32 "\n",
		__func__, port, size, count);
}
216*ae1fae34SPekka Enberg 
217*ae1fae34SPekka Enberg void kvm__emulate_io(struct kvm *self, uint16_t port, void *data, int direction, int size, uint32_t count)
218*ae1fae34SPekka Enberg {
219*ae1fae34SPekka Enberg 	if (direction == KVM_EXIT_IO_IN)
220*ae1fae34SPekka Enberg 		kvm__emulate_io_in(self, port, data, size, count);
221*ae1fae34SPekka Enberg 	else
222*ae1fae34SPekka Enberg 		kvm__emulate_io_out(self, port, data, size, count);
223*ae1fae34SPekka Enberg }
224*ae1fae34SPekka Enberg 
225*ae1fae34SPekka Enberg void kvm__show_registers(struct kvm *self)
2267118d2caSPekka Enberg {
2277118d2caSPekka Enberg 	unsigned long rax, rbx, rcx;
2287118d2caSPekka Enberg 	unsigned long rdx, rsi, rdi;
2297118d2caSPekka Enberg 	unsigned long rbp,  r8,  r9;
2307118d2caSPekka Enberg 	unsigned long r10, r11, r12;
2317118d2caSPekka Enberg 	unsigned long r13, r14, r15;
2327118d2caSPekka Enberg 	unsigned long rip, rsp;
233a2fe6199SPekka Enberg 	unsigned long rflags;
2347118d2caSPekka Enberg 	struct kvm_regs regs;
2357118d2caSPekka Enberg 
2367118d2caSPekka Enberg 	if (ioctl(self->vcpu_fd, KVM_GET_REGS, &regs) < 0)
2377118d2caSPekka Enberg 		die("KVM_GET_REGS failed");
2387118d2caSPekka Enberg 
239a2fe6199SPekka Enberg 	rflags = regs.rflags;
240a2fe6199SPekka Enberg 
2417118d2caSPekka Enberg 	rip = regs.rip; rsp = regs.rsp;
2427118d2caSPekka Enberg 	rax = regs.rax; rbx = regs.rbx; rcx = regs.rcx;
2437118d2caSPekka Enberg 	rdx = regs.rdx; rsi = regs.rsi; rdi = regs.rdi;
2447118d2caSPekka Enberg 	rbp = regs.rbp; r8  = regs.r8;  r9  = regs.r9;
2457118d2caSPekka Enberg 	r10 = regs.r10; r11 = regs.r11; r12 = regs.r12;
2467118d2caSPekka Enberg 	r13 = regs.r13; r14 = regs.r14; r15 = regs.r15;
2477118d2caSPekka Enberg 
2487118d2caSPekka Enberg 	printf("Registers:\n");
2492177ec43SPekka Enberg 	printf(" rip: %016lx   rsp: %016lx flags: %016lx\n", rip, rsp, rflags);
2507118d2caSPekka Enberg 	printf(" rax: %016lx   ebx: %016lx   ecx: %016lx\n", rax, rbx, rcx);
2517118d2caSPekka Enberg 	printf(" rdx: %016lx   rsi: %016lx   rdi: %016lx\n", rdx, rsi, rdi);
2527118d2caSPekka Enberg 	printf(" rbp: %016lx   r8:  %016lx   r9:  %016lx\n", rbp, r8,  r9);
2537118d2caSPekka Enberg 	printf(" r10: %016lx   r11: %016lx   r12: %016lx\n", r10, r11, r12);
2547118d2caSPekka Enberg 	printf(" r13: %016lx   r14: %016lx   r15: %016lx\n", r13, r14, r15);
2557118d2caSPekka Enberg }
2567118d2caSPekka Enberg 
257*ae1fae34SPekka Enberg void kvm__show_code(struct kvm *self)
2586f10be05SPekka Enberg {
2596f10be05SPekka Enberg 	unsigned int code_bytes = 64;
2606f10be05SPekka Enberg 	unsigned int code_prologue = code_bytes * 43 / 64;
2616f10be05SPekka Enberg 	unsigned int code_len = code_bytes;
2626f10be05SPekka Enberg 	unsigned char c;
263*ae1fae34SPekka Enberg 	unsigned int i;
2646f10be05SPekka Enberg 	uint8_t *ip;
2656f10be05SPekka Enberg 
2666f10be05SPekka Enberg 	ip = guest_addr_to_host(self, self->regs.rip - code_prologue);
2676f10be05SPekka Enberg 
2686f10be05SPekka Enberg 	printf("Code: ");
2696f10be05SPekka Enberg 
2706f10be05SPekka Enberg 	for (i = 0; i < code_len; i++, ip++) {
2716e8abc38SPekka Enberg 		c = *ip;
2726e8abc38SPekka Enberg 
2736f10be05SPekka Enberg 		if (ip == guest_addr_to_host(self, self->regs.rip))
2746f10be05SPekka Enberg 			printf("<%02x> ", c);
2756f10be05SPekka Enberg 		else
2766f10be05SPekka Enberg 			printf("%02x ", c);
2776f10be05SPekka Enberg 	}
2786f10be05SPekka Enberg 
2796f10be05SPekka Enberg 	printf("\n");
2806f10be05SPekka Enberg }
281