1*ae1fae34SPekka Enberg #include "kvm/kvm.h" 2*ae1fae34SPekka Enberg 36c7d8514SPekka Enberg #include <linux/kvm.h> 4f5ab5f67SPekka Enberg 5f5ab5f67SPekka Enberg #include <asm/bootparam.h> 6f5ab5f67SPekka Enberg 7*ae1fae34SPekka Enberg #include <sys/ioctl.h> 81f9cff23SPekka Enberg #include <inttypes.h> 91f9cff23SPekka Enberg #include <sys/mman.h> 102da26a59SPekka Enberg #include <stdbool.h> 11f5ab5f67SPekka Enberg #include <stdarg.h> 12b8f6afcdSPekka Enberg #include <stdlib.h> 13f5ab5f67SPekka Enberg #include <string.h> 140d1f17ecSPekka Enberg #include <unistd.h> 151f9cff23SPekka Enberg #include <stdio.h> 16b8f6afcdSPekka Enberg #include <fcntl.h> 17b8f6afcdSPekka Enberg 18ad054a21SCyrill Gorcunov #include "util.h" 19ad054a21SCyrill Gorcunov 201f9cff23SPekka Enberg /* 211f9cff23SPekka Enberg * Compatibility code. Remove this when we move to tools/kvm. 221f9cff23SPekka Enberg */ 231f9cff23SPekka Enberg #ifndef KVM_EXIT_INTERNAL_ERROR 241f9cff23SPekka Enberg # define KVM_EXIT_INTERNAL_ERROR 17 251f9cff23SPekka Enberg #endif 261f9cff23SPekka Enberg 27*ae1fae34SPekka Enberg #define DEFINE_KVM_EXIT_REASON(reason) [reason] = #reason 280d1f17ecSPekka Enberg 29*ae1fae34SPekka Enberg const char *kvm_exit_reasons[] = { 30*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_UNKNOWN), 31*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_EXCEPTION), 32*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_IO), 33*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_HYPERCALL), 34*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_DEBUG), 35*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_HLT), 36*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_MMIO), 37*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_IRQ_WINDOW_OPEN), 38*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_SHUTDOWN), 39*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_FAIL_ENTRY), 40*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTR), 41*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_SET_TPR), 42*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_TPR_ACCESS), 43*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_SIEIC), 44*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_RESET), 45*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_DCR), 46*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_NMI), 47*ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTERNAL_ERROR), 489b1fb1c3SPekka Enberg }; 499b1fb1c3SPekka Enberg 50*ae1fae34SPekka Enberg static inline void *guest_addr_to_host(struct kvm *self, unsigned long offset) 51*ae1fae34SPekka Enberg { 52*ae1fae34SPekka Enberg return self->ram_start + offset; 53*ae1fae34SPekka Enberg } 54*ae1fae34SPekka Enberg 55*ae1fae34SPekka Enberg static bool kvm__supports_extension(struct kvm *self, unsigned int extension) 56b8f6afcdSPekka Enberg { 5728fa19c0SPekka Enberg int ret; 58b8f6afcdSPekka Enberg 5973ac60e6SPekka Enberg ret = ioctl(self->sys_fd, KVM_CHECK_EXTENSION, extension); 604076b041SPekka Enberg if (ret < 0) 614076b041SPekka Enberg return false; 624076b041SPekka Enberg 634076b041SPekka Enberg return ret; 644076b041SPekka Enberg } 654076b041SPekka Enberg 664076b041SPekka Enberg static struct kvm *kvm__new(void) 674076b041SPekka Enberg { 684076b041SPekka Enberg struct kvm *self = calloc(1, sizeof *self); 694076b041SPekka Enberg 704076b041SPekka Enberg if (!self) 714076b041SPekka Enberg die("out of memory"); 724076b041SPekka Enberg 734076b041SPekka Enberg return self; 744076b041SPekka Enberg } 754076b041SPekka Enberg 76*ae1fae34SPekka Enberg struct kvm *kvm__init(void) 774076b041SPekka Enberg { 782b0e3342SPekka Enberg struct kvm_userspace_memory_region mem; 794076b041SPekka Enberg struct kvm *self; 800d1f17ecSPekka Enberg long page_size; 811f9cff23SPekka Enberg int mmap_size; 824076b041SPekka Enberg int ret; 834076b041SPekka Enberg 844076b041SPekka Enberg self = kvm__new(); 854076b041SPekka Enberg 8673ac60e6SPekka Enberg self->sys_fd = open("/dev/kvm", O_RDWR); 8773ac60e6SPekka Enberg if (self->sys_fd < 0) 88f5ab5f67SPekka Enberg die_perror("open"); 89b8f6afcdSPekka Enberg 9073ac60e6SPekka Enberg ret = ioctl(self->sys_fd, KVM_GET_API_VERSION, 0); 916c7d8514SPekka Enberg if (ret != KVM_API_VERSION) 92f5ab5f67SPekka Enberg die_perror("KVM_API_VERSION ioctl"); 936c7d8514SPekka Enberg 9473ac60e6SPekka Enberg self->vm_fd = ioctl(self->sys_fd, KVM_CREATE_VM, 0); 9573ac60e6SPekka Enberg if (self->vm_fd < 0) 96f5ab5f67SPekka Enberg die_perror("KVM_CREATE_VM ioctl"); 9728fa19c0SPekka Enberg 984076b041SPekka Enberg if (!kvm__supports_extension(self, KVM_CAP_USER_MEMORY)) 99f5ab5f67SPekka Enberg die("KVM_CAP_USER_MEMORY is not supported"); 1002da26a59SPekka Enberg 1010d1f17ecSPekka Enberg self->ram_size = 64UL * 1024UL * 1024UL; 1020d1f17ecSPekka Enberg 1030d1f17ecSPekka Enberg page_size = sysconf(_SC_PAGESIZE); 1040d1f17ecSPekka Enberg if (posix_memalign(&self->ram_start, page_size, self->ram_size) != 0) 1050d1f17ecSPekka Enberg die("out of memory"); 1060d1f17ecSPekka Enberg 1072b0e3342SPekka Enberg mem = (struct kvm_userspace_memory_region) { 1082b0e3342SPekka Enberg .slot = 0, 1092b0e3342SPekka Enberg .guest_phys_addr = 0x0UL, 1100d1f17ecSPekka Enberg .memory_size = self->ram_size, 1110d1f17ecSPekka Enberg .userspace_addr = (unsigned long) self->ram_start, 1122b0e3342SPekka Enberg }; 1132b0e3342SPekka Enberg 11473ac60e6SPekka Enberg ret = ioctl(self->vm_fd, KVM_SET_USER_MEMORY_REGION, &mem, 1); 1152b0e3342SPekka Enberg if (ret < 0) 116f5ab5f67SPekka Enberg die_perror("KVM_SET_USER_MEMORY_REGION ioctl"); 1172b0e3342SPekka Enberg 118895c2fefSPekka Enberg if (!kvm__supports_extension(self, KVM_CAP_SET_TSS_ADDR)) 119f5ab5f67SPekka Enberg die("KVM_CAP_SET_TSS_ADDR is not supported"); 120895c2fefSPekka Enberg 12173ac60e6SPekka Enberg ret = ioctl(self->vm_fd, KVM_SET_TSS_ADDR, 0xfffbd000); 122895c2fefSPekka Enberg if (ret < 0) 123f5ab5f67SPekka Enberg die_perror("KVM_SET_TSS_ADDR ioctl"); 124895c2fefSPekka Enberg 12573ac60e6SPekka Enberg self->vcpu_fd = ioctl(self->vm_fd, KVM_CREATE_VCPU, 0); 1262b0e3342SPekka Enberg if (self->vcpu_fd < 0) 127f5ab5f67SPekka Enberg die_perror("KVM_CREATE_VCPU ioctl"); 1282b0e3342SPekka Enberg 1291f9cff23SPekka Enberg mmap_size = ioctl(self->sys_fd, KVM_GET_VCPU_MMAP_SIZE, 0); 1301f9cff23SPekka Enberg if (mmap_size < 0) 131f5ab5f67SPekka Enberg die_perror("KVM_GET_VCPU_MMAP_SIZE ioctl"); 1321f9cff23SPekka Enberg 1331f9cff23SPekka Enberg self->kvm_run = mmap(NULL, mmap_size, PROT_READ|PROT_WRITE, MAP_SHARED, self->vcpu_fd, 0); 1341f9cff23SPekka Enberg if (self->kvm_run == MAP_FAILED) 1351f9cff23SPekka Enberg die("unable to mmap vcpu fd"); 1361f9cff23SPekka Enberg 1374076b041SPekka Enberg return self; 1384076b041SPekka Enberg } 1394076b041SPekka Enberg 140*ae1fae34SPekka Enberg void kvm__enable_singlestep(struct kvm *self) 141aee6632eSPekka Enberg { 142aee6632eSPekka Enberg struct kvm_guest_debug debug = { 143aee6632eSPekka Enberg .control = KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP, 144aee6632eSPekka Enberg }; 145aee6632eSPekka Enberg 146aee6632eSPekka Enberg if (ioctl(self->vcpu_fd, KVM_SET_GUEST_DEBUG, &debug) < 0) 147b625d4b6SCyrill Gorcunov warning("KVM_SET_GUEST_DEBUG failed"); 148aee6632eSPekka Enberg } 149aee6632eSPekka Enberg 150*ae1fae34SPekka Enberg /* bzImages are loaded at 1 MB by default. */ 151*ae1fae34SPekka Enberg #define KERNEL_START_ADDR (1024ULL * 1024ULL) 152*ae1fae34SPekka Enberg 153*ae1fae34SPekka Enberg static const char *BZIMAGE_MAGIC = "HdrS"; 154*ae1fae34SPekka Enberg 155*ae1fae34SPekka Enberg static uint32_t load_bzimage(struct kvm *kvm, int fd) 156*ae1fae34SPekka Enberg { 157*ae1fae34SPekka Enberg struct boot_params boot; 158*ae1fae34SPekka Enberg void *p; 159*ae1fae34SPekka Enberg int nr; 160*ae1fae34SPekka Enberg 161*ae1fae34SPekka Enberg read(fd, &boot, sizeof(boot)); 162*ae1fae34SPekka Enberg 163*ae1fae34SPekka Enberg if (memcmp(&boot.hdr.header, BZIMAGE_MAGIC, strlen(BZIMAGE_MAGIC)) != 0) 164*ae1fae34SPekka Enberg return 0; 165*ae1fae34SPekka Enberg 166*ae1fae34SPekka Enberg lseek(fd, (boot.hdr.setup_sects+1) * 512, SEEK_SET); 167*ae1fae34SPekka Enberg 168*ae1fae34SPekka Enberg p = guest_addr_to_host(kvm, KERNEL_START_ADDR); 169*ae1fae34SPekka Enberg 170*ae1fae34SPekka Enberg while ((nr = read(fd, p, 65536)) > 0) 171*ae1fae34SPekka Enberg p += nr; 172*ae1fae34SPekka Enberg 173*ae1fae34SPekka Enberg return boot.hdr.code32_start; 174*ae1fae34SPekka Enberg } 175*ae1fae34SPekka Enberg 176*ae1fae34SPekka Enberg uint32_t kvm__load_kernel(struct kvm *kvm, const char *kernel_filename) 177*ae1fae34SPekka Enberg { 178*ae1fae34SPekka Enberg uint32_t ret; 179*ae1fae34SPekka Enberg int fd; 180*ae1fae34SPekka Enberg 181*ae1fae34SPekka Enberg fd = open(kernel_filename, O_RDONLY); 182*ae1fae34SPekka Enberg if (fd < 0) 183*ae1fae34SPekka Enberg die("unable to open kernel"); 184*ae1fae34SPekka Enberg 185*ae1fae34SPekka Enberg ret = load_bzimage(kvm, fd); 186*ae1fae34SPekka Enberg if (!ret) 187*ae1fae34SPekka Enberg die("%s is not a valid bzImage", kernel_filename); 188*ae1fae34SPekka Enberg 189*ae1fae34SPekka Enberg return ret; 190*ae1fae34SPekka Enberg } 191*ae1fae34SPekka Enberg 192*ae1fae34SPekka Enberg void kvm__reset_vcpu(struct kvm *self, uint64_t rip) 193*ae1fae34SPekka Enberg { 194*ae1fae34SPekka Enberg self->regs.rip = rip; 195*ae1fae34SPekka Enberg self->regs.rflags = 0x0000000000000002ULL; 196*ae1fae34SPekka Enberg 197*ae1fae34SPekka Enberg if (ioctl(self->vcpu_fd, KVM_SET_REGS, &self->regs) < 0) 198*ae1fae34SPekka Enberg die_perror("KVM_SET_REGS failed"); 199*ae1fae34SPekka Enberg } 200*ae1fae34SPekka Enberg 201*ae1fae34SPekka Enberg void kvm__run(struct kvm *self) 202*ae1fae34SPekka Enberg { 203*ae1fae34SPekka Enberg if (ioctl(self->vcpu_fd, KVM_RUN, 0) < 0) 204*ae1fae34SPekka Enberg die_perror("KVM_RUN failed"); 205*ae1fae34SPekka Enberg } 206*ae1fae34SPekka Enberg 207*ae1fae34SPekka Enberg static void kvm__emulate_io_out(struct kvm *self, uint16_t port, void *data, int size, uint32_t count) 208*ae1fae34SPekka Enberg { 209*ae1fae34SPekka Enberg fprintf(stderr, "%s port=%x, size=%d, count=%" PRIu32 "\n", __func__, port, size, count); 210*ae1fae34SPekka Enberg } 211*ae1fae34SPekka Enberg 212*ae1fae34SPekka Enberg static void kvm__emulate_io_in(struct kvm *self, uint16_t port, void *data, int size, uint32_t count) 213*ae1fae34SPekka Enberg { 214*ae1fae34SPekka Enberg fprintf(stderr, "%s port=%x, size=%d, count=%" PRIu32 "\n", __func__, port, size, count); 215*ae1fae34SPekka Enberg } 216*ae1fae34SPekka Enberg 217*ae1fae34SPekka Enberg void kvm__emulate_io(struct kvm *self, uint16_t port, void *data, int direction, int size, uint32_t count) 218*ae1fae34SPekka Enberg { 219*ae1fae34SPekka Enberg if (direction == KVM_EXIT_IO_IN) 220*ae1fae34SPekka Enberg kvm__emulate_io_in(self, port, data, size, count); 221*ae1fae34SPekka Enberg else 222*ae1fae34SPekka Enberg kvm__emulate_io_out(self, port, data, size, count); 223*ae1fae34SPekka Enberg } 224*ae1fae34SPekka Enberg 225*ae1fae34SPekka Enberg void kvm__show_registers(struct kvm *self) 2267118d2caSPekka Enberg { 2277118d2caSPekka Enberg unsigned long rax, rbx, rcx; 2287118d2caSPekka Enberg unsigned long rdx, rsi, rdi; 2297118d2caSPekka Enberg unsigned long rbp, r8, r9; 2307118d2caSPekka Enberg unsigned long r10, r11, r12; 2317118d2caSPekka Enberg unsigned long r13, r14, r15; 2327118d2caSPekka Enberg unsigned long rip, rsp; 233a2fe6199SPekka Enberg unsigned long rflags; 2347118d2caSPekka Enberg struct kvm_regs regs; 2357118d2caSPekka Enberg 2367118d2caSPekka Enberg if (ioctl(self->vcpu_fd, KVM_GET_REGS, ®s) < 0) 2377118d2caSPekka Enberg die("KVM_GET_REGS failed"); 2387118d2caSPekka Enberg 239a2fe6199SPekka Enberg rflags = regs.rflags; 240a2fe6199SPekka Enberg 2417118d2caSPekka Enberg rip = regs.rip; rsp = regs.rsp; 2427118d2caSPekka Enberg rax = regs.rax; rbx = regs.rbx; rcx = regs.rcx; 2437118d2caSPekka Enberg rdx = regs.rdx; rsi = regs.rsi; rdi = regs.rdi; 2447118d2caSPekka Enberg rbp = regs.rbp; r8 = regs.r8; r9 = regs.r9; 2457118d2caSPekka Enberg r10 = regs.r10; r11 = regs.r11; r12 = regs.r12; 2467118d2caSPekka Enberg r13 = regs.r13; r14 = regs.r14; r15 = regs.r15; 2477118d2caSPekka Enberg 2487118d2caSPekka Enberg printf("Registers:\n"); 2492177ec43SPekka Enberg printf(" rip: %016lx rsp: %016lx flags: %016lx\n", rip, rsp, rflags); 2507118d2caSPekka Enberg printf(" rax: %016lx ebx: %016lx ecx: %016lx\n", rax, rbx, rcx); 2517118d2caSPekka Enberg printf(" rdx: %016lx rsi: %016lx rdi: %016lx\n", rdx, rsi, rdi); 2527118d2caSPekka Enberg printf(" rbp: %016lx r8: %016lx r9: %016lx\n", rbp, r8, r9); 2537118d2caSPekka Enberg printf(" r10: %016lx r11: %016lx r12: %016lx\n", r10, r11, r12); 2547118d2caSPekka Enberg printf(" r13: %016lx r14: %016lx r15: %016lx\n", r13, r14, r15); 2557118d2caSPekka Enberg } 2567118d2caSPekka Enberg 257*ae1fae34SPekka Enberg void kvm__show_code(struct kvm *self) 2586f10be05SPekka Enberg { 2596f10be05SPekka Enberg unsigned int code_bytes = 64; 2606f10be05SPekka Enberg unsigned int code_prologue = code_bytes * 43 / 64; 2616f10be05SPekka Enberg unsigned int code_len = code_bytes; 2626f10be05SPekka Enberg unsigned char c; 263*ae1fae34SPekka Enberg unsigned int i; 2646f10be05SPekka Enberg uint8_t *ip; 2656f10be05SPekka Enberg 2666f10be05SPekka Enberg ip = guest_addr_to_host(self, self->regs.rip - code_prologue); 2676f10be05SPekka Enberg 2686f10be05SPekka Enberg printf("Code: "); 2696f10be05SPekka Enberg 2706f10be05SPekka Enberg for (i = 0; i < code_len; i++, ip++) { 2716e8abc38SPekka Enberg c = *ip; 2726e8abc38SPekka Enberg 2736f10be05SPekka Enberg if (ip == guest_addr_to_host(self, self->regs.rip)) 2746f10be05SPekka Enberg printf("<%02x> ", c); 2756f10be05SPekka Enberg else 2766f10be05SPekka Enberg printf("%02x ", c); 2776f10be05SPekka Enberg } 2786f10be05SPekka Enberg 2796f10be05SPekka Enberg printf("\n"); 2806f10be05SPekka Enberg } 281