1ae1fae34SPekka Enberg #include "kvm/kvm.h" 2ae1fae34SPekka Enberg 3b3594ec7SCyrill Gorcunov #include "kvm/boot-protocol.h" 472811558SPekka Enberg #include "kvm/cpufeature.h" 572811558SPekka Enberg #include "kvm/read-write.h" 672811558SPekka Enberg #include "kvm/interrupt.h" 70c7c14a7SCyrill Gorcunov #include "kvm/mptable.h" 872811558SPekka Enberg #include "kvm/util.h" 9eda03319SPekka Enberg 106c7d8514SPekka Enberg #include <linux/kvm.h> 11f5ab5f67SPekka Enberg 12f5ab5f67SPekka Enberg #include <asm/bootparam.h> 13f5ab5f67SPekka Enberg 14ae1fae34SPekka Enberg #include <sys/ioctl.h> 151f9cff23SPekka Enberg #include <sys/mman.h> 16ce79f1caSPekka Enberg #include <sys/stat.h> 172da26a59SPekka Enberg #include <stdbool.h> 186e5e8b8dSPekka Enberg #include <assert.h> 1906e41eeaSPekka Enberg #include <limits.h> 20ce79f1caSPekka Enberg #include <signal.h> 21f5ab5f67SPekka Enberg #include <stdarg.h> 22b8f6afcdSPekka Enberg #include <stdlib.h> 23f5ab5f67SPekka Enberg #include <string.h> 240d1f17ecSPekka Enberg #include <unistd.h> 251f9cff23SPekka Enberg #include <stdio.h> 26b8f6afcdSPekka Enberg #include <fcntl.h> 27ce79f1caSPekka Enberg #include <time.h> 28b8f6afcdSPekka Enberg 29ae1fae34SPekka Enberg #define DEFINE_KVM_EXIT_REASON(reason) [reason] = #reason 300d1f17ecSPekka Enberg 31ae1fae34SPekka Enberg const char *kvm_exit_reasons[] = { 32ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_UNKNOWN), 33ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_EXCEPTION), 34ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_IO), 35ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_HYPERCALL), 36ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_DEBUG), 37ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_HLT), 38ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_MMIO), 39ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_IRQ_WINDOW_OPEN), 40ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_SHUTDOWN), 41ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_FAIL_ENTRY), 42ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTR), 43ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_SET_TPR), 44ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_TPR_ACCESS), 45ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_SIEIC), 46ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_S390_RESET), 47ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_DCR), 48ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_NMI), 49ae1fae34SPekka Enberg DEFINE_KVM_EXIT_REASON(KVM_EXIT_INTERNAL_ERROR), 509b1fb1c3SPekka Enberg }; 519b1fb1c3SPekka Enberg 5255e19624SCyrill Gorcunov #define DEFINE_KVM_EXT(ext) \ 5355e19624SCyrill Gorcunov .name = #ext, \ 5455e19624SCyrill Gorcunov .code = ext 5555e19624SCyrill Gorcunov 5655e19624SCyrill Gorcunov struct { 5755e19624SCyrill Gorcunov const char *name; 5855e19624SCyrill Gorcunov int code; 5955e19624SCyrill Gorcunov } kvm_req_ext[] = { 6055e19624SCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_COALESCED_MMIO) }, 6155e19624SCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_SET_TSS_ADDR) }, 6255e19624SCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_PIT2) }, 6355e19624SCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_USER_MEMORY) }, 6455e19624SCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_IRQ_ROUTING) }, 6555e19624SCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_IRQCHIP) }, 667c0ec28fSCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_HLT) }, 6755e19624SCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_IRQ_INJECT_STATUS) }, 68d38ad31aSCyrill Gorcunov { DEFINE_KVM_EXT(KVM_CAP_EXT_CPUID) }, 6955e19624SCyrill Gorcunov }; 7055e19624SCyrill Gorcunov 7143835ac9SSasha Levin static bool kvm__supports_extension(struct kvm *kvm, unsigned int extension) 72b8f6afcdSPekka Enberg { 7328fa19c0SPekka Enberg int ret; 74b8f6afcdSPekka Enberg 7543835ac9SSasha Levin ret = ioctl(kvm->sys_fd, KVM_CHECK_EXTENSION, extension); 764076b041SPekka Enberg if (ret < 0) 774076b041SPekka Enberg return false; 784076b041SPekka Enberg 794076b041SPekka Enberg return ret; 804076b041SPekka Enberg } 814076b041SPekka Enberg 8243835ac9SSasha Levin static int kvm__check_extensions(struct kvm *kvm) 8355e19624SCyrill Gorcunov { 8455e19624SCyrill Gorcunov unsigned int i; 8555e19624SCyrill Gorcunov 8655e19624SCyrill Gorcunov for (i = 0; i < ARRAY_SIZE(kvm_req_ext); i++) { 8743835ac9SSasha Levin if (!kvm__supports_extension(kvm, kvm_req_ext[i].code)) { 884542f276SCyrill Gorcunov pr_error("Unsuppored KVM extension detected: %s", 8955e19624SCyrill Gorcunov kvm_req_ext[i].name); 9055e19624SCyrill Gorcunov return (int)-i; 9155e19624SCyrill Gorcunov } 9255e19624SCyrill Gorcunov } 9355e19624SCyrill Gorcunov 9455e19624SCyrill Gorcunov return 0; 9555e19624SCyrill Gorcunov } 9655e19624SCyrill Gorcunov 974076b041SPekka Enberg static struct kvm *kvm__new(void) 984076b041SPekka Enberg { 9943835ac9SSasha Levin struct kvm *kvm = calloc(1, sizeof *kvm); 1004076b041SPekka Enberg 10143835ac9SSasha Levin if (!kvm) 1024076b041SPekka Enberg die("out of memory"); 1034076b041SPekka Enberg 10443835ac9SSasha Levin return kvm; 1054076b041SPekka Enberg } 1064076b041SPekka Enberg 10743835ac9SSasha Levin void kvm__delete(struct kvm *kvm) 1089ef4c68eSPekka Enberg { 10943835ac9SSasha Levin kvm__stop_timer(kvm); 110fbfe68b7SSasha Levin 11143835ac9SSasha Levin munmap(kvm->ram_start, kvm->ram_size); 11243835ac9SSasha Levin free(kvm); 1139ef4c68eSPekka Enberg } 1149ef4c68eSPekka Enberg 115c78b8713SAsias He static bool kvm__cpu_supports_vm(void) 116c78b8713SAsias He { 117c78b8713SAsias He struct cpuid_regs regs; 1183fdf659dSSasha Levin u32 eax_base; 119831fbf23SPekka Enberg int feature; 120c78b8713SAsias He 121c78b8713SAsias He regs = (struct cpuid_regs) { 122831fbf23SPekka Enberg .eax = 0x00, 123c78b8713SAsias He }; 124c78b8713SAsias He host_cpuid(®s); 125c78b8713SAsias He 126ae87afbfSCyrill Gorcunov switch (regs.ebx) { 127ae87afbfSCyrill Gorcunov case CPUID_VENDOR_INTEL_1: 128831fbf23SPekka Enberg eax_base = 0x00; 129831fbf23SPekka Enberg feature = KVM__X86_FEATURE_VMX; 130ae87afbfSCyrill Gorcunov break; 13134649df9SPekka Enberg 132ae87afbfSCyrill Gorcunov case CPUID_VENDOR_AMD_1: 133831fbf23SPekka Enberg eax_base = 0x80000000; 134831fbf23SPekka Enberg feature = KVM__X86_FEATURE_SVM; 135ae87afbfSCyrill Gorcunov break; 13634649df9SPekka Enberg 13734649df9SPekka Enberg default: 13834649df9SPekka Enberg return false; 139ae87afbfSCyrill Gorcunov } 140ae87afbfSCyrill Gorcunov 141831fbf23SPekka Enberg regs = (struct cpuid_regs) { 142831fbf23SPekka Enberg .eax = eax_base, 143831fbf23SPekka Enberg }; 144831fbf23SPekka Enberg host_cpuid(®s); 145831fbf23SPekka Enberg 146831fbf23SPekka Enberg if (regs.eax < eax_base + 0x01) 147831fbf23SPekka Enberg return false; 148831fbf23SPekka Enberg 149831fbf23SPekka Enberg regs = (struct cpuid_regs) { 150831fbf23SPekka Enberg .eax = eax_base + 0x01 151831fbf23SPekka Enberg }; 152831fbf23SPekka Enberg host_cpuid(®s); 153831fbf23SPekka Enberg 154831fbf23SPekka Enberg return regs.ecx & (1 << feature); 155c78b8713SAsias He } 156c78b8713SAsias He 157874467f8SSasha Levin static void kvm_register_mem_slot(struct kvm *kvm, u32 slot, u64 guest_phys, u64 size, void *userspace_addr) 1584076b041SPekka Enberg { 1592b0e3342SPekka Enberg struct kvm_userspace_memory_region mem; 160839051d9SSasha Levin int ret; 161839051d9SSasha Levin 162839051d9SSasha Levin mem = (struct kvm_userspace_memory_region) { 163874467f8SSasha Levin .slot = slot, 164874467f8SSasha Levin .guest_phys_addr = guest_phys, 165874467f8SSasha Levin .memory_size = size, 166c4acb611SIngo Molnar .userspace_addr = (unsigned long)userspace_addr, 167839051d9SSasha Levin }; 168839051d9SSasha Levin 169874467f8SSasha Levin ret = ioctl(kvm->vm_fd, KVM_SET_USER_MEMORY_REGION, &mem); 170839051d9SSasha Levin if (ret < 0) 171839051d9SSasha Levin die_perror("KVM_SET_USER_MEMORY_REGION ioctl"); 172839051d9SSasha Levin } 173839051d9SSasha Levin 174874467f8SSasha Levin /* 175874467f8SSasha Levin * Allocating RAM size bigger than 4GB requires us to leave a gap 176874467f8SSasha Levin * in the RAM which is used for PCI MMIO, hotplug, and unconfigured 177874467f8SSasha Levin * devices (see documentation of e820_setup_gap() for details). 178874467f8SSasha Levin * 179874467f8SSasha Levin * If we're required to initialize RAM bigger than 4GB, we will create 180874467f8SSasha Levin * a gap between 0xe0000000 and 0x100000000 in the guest virtual mem space. 181874467f8SSasha Levin */ 182874467f8SSasha Levin 18343835ac9SSasha Levin void kvm__init_ram(struct kvm *kvm) 184874467f8SSasha Levin { 185874467f8SSasha Levin u64 phys_start, phys_size; 186874467f8SSasha Levin void *host_mem; 187874467f8SSasha Levin 18843835ac9SSasha Levin if (kvm->ram_size < KVM_32BIT_GAP_START) { 189874467f8SSasha Levin /* Use a single block of RAM for 32bit RAM */ 190874467f8SSasha Levin 191874467f8SSasha Levin phys_start = 0; 19243835ac9SSasha Levin phys_size = kvm->ram_size; 19343835ac9SSasha Levin host_mem = kvm->ram_start; 194874467f8SSasha Levin 195*f234697eSSasha Levin kvm_register_mem_slot(kvm, 0, phys_start, phys_size, host_mem); 196874467f8SSasha Levin } else { 197874467f8SSasha Levin /* First RAM range from zero to the PCI gap: */ 198874467f8SSasha Levin 199874467f8SSasha Levin phys_start = 0; 200874467f8SSasha Levin phys_size = KVM_32BIT_GAP_START; 20143835ac9SSasha Levin host_mem = kvm->ram_start; 202874467f8SSasha Levin 20343835ac9SSasha Levin kvm_register_mem_slot(kvm, 0, phys_start, phys_size, host_mem); 204874467f8SSasha Levin 205874467f8SSasha Levin /* Second RAM range from 4GB to the end of RAM: */ 206874467f8SSasha Levin 207874467f8SSasha Levin phys_start = 0x100000000ULL; 20843835ac9SSasha Levin phys_size = kvm->ram_size - phys_size; 20943835ac9SSasha Levin host_mem = kvm->ram_start + phys_start; 210874467f8SSasha Levin 21143835ac9SSasha Levin kvm_register_mem_slot(kvm, 1, phys_start, phys_size, host_mem); 212874467f8SSasha Levin } 213874467f8SSasha Levin } 214874467f8SSasha Levin 21543835ac9SSasha Levin int kvm__max_cpus(struct kvm *kvm) 216384922b3SPekka Enberg { 217384922b3SPekka Enberg int ret; 218384922b3SPekka Enberg 21943835ac9SSasha Levin ret = ioctl(kvm->sys_fd, KVM_CHECK_EXTENSION, KVM_CAP_NR_VCPUS); 220384922b3SPekka Enberg if (ret < 0) 221384922b3SPekka Enberg die_perror("KVM_CAP_NR_VCPUS"); 222384922b3SPekka Enberg 223384922b3SPekka Enberg return ret; 224384922b3SPekka Enberg } 225384922b3SPekka Enberg 226839051d9SSasha Levin struct kvm *kvm__init(const char *kvm_dev, unsigned long ram_size) 227839051d9SSasha Levin { 2289687927dSAsias He struct kvm_pit_config pit_config = { .flags = 0, }; 22943835ac9SSasha Levin struct kvm *kvm; 2304076b041SPekka Enberg int ret; 2314076b041SPekka Enberg 232c78b8713SAsias He if (!kvm__cpu_supports_vm()) 233c78b8713SAsias He die("Your CPU does not support hardware virtualization"); 234c78b8713SAsias He 23543835ac9SSasha Levin kvm = kvm__new(); 2364076b041SPekka Enberg 23743835ac9SSasha Levin kvm->sys_fd = open(kvm_dev, O_RDWR); 23843835ac9SSasha Levin if (kvm->sys_fd < 0) { 2396d7c36ceSPekka Enberg if (errno == ENOENT) 240e907b83fSPekka Enberg die("'%s' not found. Please make sure your kernel has CONFIG_KVM enabled and that the KVM modules are loaded.", kvm_dev); 241f8334800SIngo Molnar if (errno == ENODEV) 242f8334800SIngo Molnar die("'%s' KVM driver not available.\n # (If the KVM module is loaded then 'dmesg' may offer further clues about the failure.)", kvm_dev); 2436d7c36ceSPekka Enberg 244f8334800SIngo Molnar fprintf(stderr, " Fatal, could not open %s: ", kvm_dev); 245f8334800SIngo Molnar perror(NULL); 246f8334800SIngo Molnar exit(1); 2476d7c36ceSPekka Enberg } 248b8f6afcdSPekka Enberg 24943835ac9SSasha Levin ret = ioctl(kvm->sys_fd, KVM_GET_API_VERSION, 0); 2506c7d8514SPekka Enberg if (ret != KVM_API_VERSION) 251f5ab5f67SPekka Enberg die_perror("KVM_API_VERSION ioctl"); 2526c7d8514SPekka Enberg 25343835ac9SSasha Levin kvm->vm_fd = ioctl(kvm->sys_fd, KVM_CREATE_VM, 0); 25443835ac9SSasha Levin if (kvm->vm_fd < 0) 255f5ab5f67SPekka Enberg die_perror("KVM_CREATE_VM ioctl"); 25628fa19c0SPekka Enberg 25743835ac9SSasha Levin if (kvm__check_extensions(kvm)) 25855e19624SCyrill Gorcunov die("A required KVM extention is not supported by OS"); 2599687927dSAsias He 26043835ac9SSasha Levin ret = ioctl(kvm->vm_fd, KVM_SET_TSS_ADDR, 0xfffbd000); 2619687927dSAsias He if (ret < 0) 2629687927dSAsias He die_perror("KVM_SET_TSS_ADDR ioctl"); 2639687927dSAsias He 26443835ac9SSasha Levin ret = ioctl(kvm->vm_fd, KVM_CREATE_PIT2, &pit_config); 2659687927dSAsias He if (ret < 0) 2669687927dSAsias He die_perror("KVM_CREATE_PIT2 ioctl"); 2679687927dSAsias He 26843835ac9SSasha Levin kvm->ram_size = ram_size; 2690d1f17ecSPekka Enberg 27043835ac9SSasha Levin if (kvm->ram_size < KVM_32BIT_GAP_START) { 27137c34ca8SSasha Levin kvm->ram_start = mmap(NULL, ram_size, PROT_RW, MAP_ANON_NORESERVE, -1, 0); 272874467f8SSasha Levin } else { 27337c34ca8SSasha Levin kvm->ram_start = mmap(NULL, ram_size + KVM_32BIT_GAP_SIZE, PROT_RW, MAP_ANON_NORESERVE, -1, 0); 27443835ac9SSasha Levin if (kvm->ram_start != MAP_FAILED) { 275874467f8SSasha Levin /* 276874467f8SSasha Levin * We mprotect the gap (see kvm__init_ram() for details) PROT_NONE so that 277874467f8SSasha Levin * if we accidently write to it, we will know. 278874467f8SSasha Levin */ 27943835ac9SSasha Levin mprotect(kvm->ram_start + KVM_32BIT_GAP_START, KVM_32BIT_GAP_SIZE, PROT_NONE); 280874467f8SSasha Levin } 281874467f8SSasha Levin } 28243835ac9SSasha Levin if (kvm->ram_start == MAP_FAILED) 2830d1f17ecSPekka Enberg die("out of memory"); 2840d1f17ecSPekka Enberg 28543835ac9SSasha Levin ret = ioctl(kvm->vm_fd, KVM_CREATE_IRQCHIP); 286895c2fefSPekka Enberg if (ret < 0) 2879687927dSAsias He die_perror("KVM_CREATE_IRQCHIP ioctl"); 2889687927dSAsias He 28943835ac9SSasha Levin return kvm; 2904076b041SPekka Enberg } 2914076b041SPekka Enberg 2925f6772b8SCyrill Gorcunov #define BOOT_LOADER_SELECTOR 0x1000 293b08e9ec4SPekka Enberg #define BOOT_LOADER_IP 0x0000 294dbdb74c2SPekka Enberg #define BOOT_LOADER_SP 0x8000 2952dd4a4edSCyrill Gorcunov #define BOOT_CMDLINE_OFFSET 0x20000 2962dd4a4edSCyrill Gorcunov 2979a4ecdc5SPekka Enberg #define BOOT_PROTOCOL_REQUIRED 0x206 298a43f6460SCyrill Gorcunov #define LOAD_HIGH 0x01 299009b0758SPekka Enberg 30043835ac9SSasha Levin static int load_flat_binary(struct kvm *kvm, int fd) 301009b0758SPekka Enberg { 302009b0758SPekka Enberg void *p; 303009b0758SPekka Enberg int nr; 304009b0758SPekka Enberg 305009b0758SPekka Enberg if (lseek(fd, 0, SEEK_SET) < 0) 306009b0758SPekka Enberg die_perror("lseek"); 307009b0758SPekka Enberg 30843835ac9SSasha Levin p = guest_real_to_host(kvm, BOOT_LOADER_SELECTOR, BOOT_LOADER_IP); 309009b0758SPekka Enberg 310009b0758SPekka Enberg while ((nr = read(fd, p, 65536)) > 0) 311009b0758SPekka Enberg p += nr; 312009b0758SPekka Enberg 31343835ac9SSasha Levin kvm->boot_selector = BOOT_LOADER_SELECTOR; 31443835ac9SSasha Levin kvm->boot_ip = BOOT_LOADER_IP; 31543835ac9SSasha Levin kvm->boot_sp = BOOT_LOADER_SP; 316edc8a14dSPekka Enberg 3177fb218bdSPekka Enberg return true; 318009b0758SPekka Enberg } 319009b0758SPekka Enberg 320ae1fae34SPekka Enberg static const char *BZIMAGE_MAGIC = "HdrS"; 321ae1fae34SPekka Enberg 32243835ac9SSasha Levin static bool load_bzimage(struct kvm *kvm, int fd_kernel, 32353861c74SJohn Floren int fd_initrd, const char *kernel_cmdline, u16 vidmode) 324ae1fae34SPekka Enberg { 325b9271160SPekka Enberg struct boot_params *kern_boot; 3264b62331fSPekka Enberg unsigned long setup_sects; 327b9271160SPekka Enberg struct boot_params boot; 3282dd4a4edSCyrill Gorcunov size_t cmdline_size; 3297fb218bdSPekka Enberg ssize_t setup_size; 33022489bb0SCyrill Gorcunov void *p; 331ae1fae34SPekka Enberg int nr; 332ae1fae34SPekka Enberg 3335d67eaf6SPekka Enberg /* 3345d67eaf6SPekka Enberg * See Documentation/x86/boot.txt for details no bzImage on-disk and 3355d67eaf6SPekka Enberg * memory layout. 3365d67eaf6SPekka Enberg */ 3375d67eaf6SPekka Enberg 3382065a6f7SCyrill Gorcunov if (lseek(fd_kernel, 0, SEEK_SET) < 0) 339009b0758SPekka Enberg die_perror("lseek"); 340009b0758SPekka Enberg 3410b62d2bbSPekka Enberg if (read(fd_kernel, &boot, sizeof(boot)) != sizeof(boot)) 3422346d461SPekka Enberg return false; 343ae1fae34SPekka Enberg 3440b62d2bbSPekka Enberg if (memcmp(&boot.hdr.header, BZIMAGE_MAGIC, strlen(BZIMAGE_MAGIC))) 3457fb218bdSPekka Enberg return false; 346ae1fae34SPekka Enberg 3470ea58e5bSPekka Enberg if (boot.hdr.version < BOOT_PROTOCOL_REQUIRED) 3480b62d2bbSPekka Enberg die("Too old kernel"); 349ad681038SCyrill Gorcunov 3502065a6f7SCyrill Gorcunov if (lseek(fd_kernel, 0, SEEK_SET) < 0) 351e93ab78aSPekka Enberg die_perror("lseek"); 352e93ab78aSPekka Enberg 3534cf542bbSCyrill Gorcunov if (!boot.hdr.setup_sects) 3544cf542bbSCyrill Gorcunov boot.hdr.setup_sects = BZ_DEFAULT_SETUP_SECTS; 35510943d14SPekka Enberg setup_sects = boot.hdr.setup_sects + 1; 35610943d14SPekka Enberg 35754d4a626SPekka Enberg setup_size = setup_sects << 9; 35843835ac9SSasha Levin p = guest_real_to_host(kvm, BOOT_LOADER_SELECTOR, BOOT_LOADER_IP); 359ae1fae34SPekka Enberg 3602065a6f7SCyrill Gorcunov /* copy setup.bin to mem*/ 3612065a6f7SCyrill Gorcunov if (read(fd_kernel, p, setup_size) != setup_size) 3627fb218bdSPekka Enberg die_perror("read"); 3637fb218bdSPekka Enberg 3642065a6f7SCyrill Gorcunov /* copy vmlinux.bin to BZ_KERNEL_START*/ 36543835ac9SSasha Levin p = guest_flat_to_host(kvm, BZ_KERNEL_START); 366ae1fae34SPekka Enberg 3672065a6f7SCyrill Gorcunov while ((nr = read(fd_kernel, p, 65536)) > 0) 368ae1fae34SPekka Enberg p += nr; 369ae1fae34SPekka Enberg 37043835ac9SSasha Levin p = guest_flat_to_host(kvm, BOOT_CMDLINE_OFFSET); 371debcfac0SCyrill Gorcunov if (kernel_cmdline) { 372debcfac0SCyrill Gorcunov cmdline_size = strlen(kernel_cmdline) + 1; 373debcfac0SCyrill Gorcunov if (cmdline_size > boot.hdr.cmdline_size) 374debcfac0SCyrill Gorcunov cmdline_size = boot.hdr.cmdline_size; 375ad681038SCyrill Gorcunov 3762dd4a4edSCyrill Gorcunov memset(p, 0, boot.hdr.cmdline_size); 3772dd4a4edSCyrill Gorcunov memcpy(p, kernel_cmdline, cmdline_size - 1); 378debcfac0SCyrill Gorcunov } 379debcfac0SCyrill Gorcunov 38043835ac9SSasha Levin kern_boot = guest_real_to_host(kvm, BOOT_LOADER_SELECTOR, 0x00); 381a43f6460SCyrill Gorcunov 382b9271160SPekka Enberg kern_boot->hdr.cmd_line_ptr = BOOT_CMDLINE_OFFSET; 383b9271160SPekka Enberg kern_boot->hdr.type_of_loader = 0xff; 384b9271160SPekka Enberg kern_boot->hdr.heap_end_ptr = 0xfe00; 385b9271160SPekka Enberg kern_boot->hdr.loadflags |= CAN_USE_HEAP; 38653861c74SJohn Floren kern_boot->hdr.vid_mode = vidmode; 387a43f6460SCyrill Gorcunov 3882065a6f7SCyrill Gorcunov /* 3892065a6f7SCyrill Gorcunov * Read initrd image into guest memory 3902065a6f7SCyrill Gorcunov */ 3912065a6f7SCyrill Gorcunov if (fd_initrd >= 0) { 3922065a6f7SCyrill Gorcunov struct stat initrd_stat; 3932065a6f7SCyrill Gorcunov unsigned long addr; 3942065a6f7SCyrill Gorcunov 3952065a6f7SCyrill Gorcunov if (fstat(fd_initrd, &initrd_stat)) 3962065a6f7SCyrill Gorcunov die_perror("fstat"); 3972065a6f7SCyrill Gorcunov 3982065a6f7SCyrill Gorcunov addr = boot.hdr.initrd_addr_max & ~0xfffff; 3992065a6f7SCyrill Gorcunov for (;;) { 4002065a6f7SCyrill Gorcunov if (addr < BZ_KERNEL_START) 4012065a6f7SCyrill Gorcunov die("Not enough memory for initrd"); 40243835ac9SSasha Levin else if (addr < (kvm->ram_size - initrd_stat.st_size)) 4032065a6f7SCyrill Gorcunov break; 4042065a6f7SCyrill Gorcunov addr -= 0x100000; 4052065a6f7SCyrill Gorcunov } 4062065a6f7SCyrill Gorcunov 40743835ac9SSasha Levin p = guest_flat_to_host(kvm, addr); 4082065a6f7SCyrill Gorcunov nr = read(fd_initrd, p, initrd_stat.st_size); 4092065a6f7SCyrill Gorcunov if (nr != initrd_stat.st_size) 4102065a6f7SCyrill Gorcunov die("Failed to read initrd"); 4112065a6f7SCyrill Gorcunov 4122065a6f7SCyrill Gorcunov kern_boot->hdr.ramdisk_image = addr; 4132065a6f7SCyrill Gorcunov kern_boot->hdr.ramdisk_size = initrd_stat.st_size; 4142065a6f7SCyrill Gorcunov } 4152065a6f7SCyrill Gorcunov 41643835ac9SSasha Levin kvm->boot_selector = BOOT_LOADER_SELECTOR; 417edc8a14dSPekka Enberg /* 418edc8a14dSPekka Enberg * The real-mode setup code starts at offset 0x200 of a bzImage. See 419edc8a14dSPekka Enberg * Documentation/x86/boot.txt for details. 420edc8a14dSPekka Enberg */ 42143835ac9SSasha Levin kvm->boot_ip = BOOT_LOADER_IP + 0x200; 42243835ac9SSasha Levin kvm->boot_sp = BOOT_LOADER_SP; 423edc8a14dSPekka Enberg 4247fb218bdSPekka Enberg return true; 425ae1fae34SPekka Enberg } 426ae1fae34SPekka Enberg 42772811558SPekka Enberg /* RFC 1952 */ 42872811558SPekka Enberg #define GZIP_ID1 0x1f 42972811558SPekka Enberg #define GZIP_ID2 0x8b 43072811558SPekka Enberg 43172811558SPekka Enberg static bool initrd_check(int fd) 43272811558SPekka Enberg { 43372811558SPekka Enberg unsigned char id[2]; 43472811558SPekka Enberg 43572811558SPekka Enberg if (read_in_full(fd, id, ARRAY_SIZE(id)) < 0) 43672811558SPekka Enberg return false; 43772811558SPekka Enberg 43872811558SPekka Enberg if (lseek(fd, 0, SEEK_SET) < 0) 43972811558SPekka Enberg die_perror("lseek"); 44072811558SPekka Enberg 44172811558SPekka Enberg return id[0] == GZIP_ID1 && id[1] == GZIP_ID2; 44272811558SPekka Enberg } 44372811558SPekka Enberg 4446d1f350dSCyrill Gorcunov bool kvm__load_kernel(struct kvm *kvm, const char *kernel_filename, 44553861c74SJohn Floren const char *initrd_filename, const char *kernel_cmdline, u16 vidmode) 446ae1fae34SPekka Enberg { 4477fb218bdSPekka Enberg bool ret; 4482065a6f7SCyrill Gorcunov int fd_kernel = -1, fd_initrd = -1; 449ae1fae34SPekka Enberg 4502065a6f7SCyrill Gorcunov fd_kernel = open(kernel_filename, O_RDONLY); 4512065a6f7SCyrill Gorcunov if (fd_kernel < 0) 4520b62d2bbSPekka Enberg die("Unable to open kernel %s", kernel_filename); 453ae1fae34SPekka Enberg 4542065a6f7SCyrill Gorcunov if (initrd_filename) { 4552065a6f7SCyrill Gorcunov fd_initrd = open(initrd_filename, O_RDONLY); 4562065a6f7SCyrill Gorcunov if (fd_initrd < 0) 4570b62d2bbSPekka Enberg die("Unable to open initrd %s", initrd_filename); 45872811558SPekka Enberg 45972811558SPekka Enberg if (!initrd_check(fd_initrd)) 46072811558SPekka Enberg die("%s is not an initrd", initrd_filename); 4612065a6f7SCyrill Gorcunov } 4622065a6f7SCyrill Gorcunov 46353861c74SJohn Floren ret = load_bzimage(kvm, fd_kernel, fd_initrd, kernel_cmdline, vidmode); 46428972750SCyrill Gorcunov 46528972750SCyrill Gorcunov if (initrd_filename) 46628972750SCyrill Gorcunov close(fd_initrd); 46728972750SCyrill Gorcunov 468009b0758SPekka Enberg if (ret) 469009b0758SPekka Enberg goto found_kernel; 470ae1fae34SPekka Enberg 4714542f276SCyrill Gorcunov pr_warning("%s is not a bzImage. Trying to load it as a flat binary...", kernel_filename); 4720b62d2bbSPekka Enberg 4732065a6f7SCyrill Gorcunov ret = load_flat_binary(kvm, fd_kernel); 474009b0758SPekka Enberg if (ret) 475009b0758SPekka Enberg goto found_kernel; 476009b0758SPekka Enberg 4775a6ac675SSasha Levin close(fd_kernel); 4785a6ac675SSasha Levin 479009b0758SPekka Enberg die("%s is not a valid bzImage or flat binary", kernel_filename); 480009b0758SPekka Enberg 481009b0758SPekka Enberg found_kernel: 4825a6ac675SSasha Levin close(fd_kernel); 4835a6ac675SSasha Levin 484ae1fae34SPekka Enberg return ret; 485ae1fae34SPekka Enberg } 486ae1fae34SPekka Enberg 487b3594ec7SCyrill Gorcunov /** 488b3594ec7SCyrill Gorcunov * kvm__setup_bios - inject BIOS into guest system memory 48943835ac9SSasha Levin * @kvm - guest system descriptor 490b3594ec7SCyrill Gorcunov * 491b3594ec7SCyrill Gorcunov * This function is a main routine where we poke guest memory 492b3594ec7SCyrill Gorcunov * and install BIOS there. 493b3594ec7SCyrill Gorcunov */ 49443835ac9SSasha Levin void kvm__setup_bios(struct kvm *kvm) 4952f3976eeSPekka Enberg { 496b3594ec7SCyrill Gorcunov /* standart minimal configuration */ 49743835ac9SSasha Levin setup_bios(kvm); 4982f3976eeSPekka Enberg 499b3594ec7SCyrill Gorcunov /* FIXME: SMP, ACPI and friends here */ 5000c7c14a7SCyrill Gorcunov 5010c7c14a7SCyrill Gorcunov /* MP table */ 50243835ac9SSasha Levin mptable_setup(kvm, kvm->nrcpus); 5032f3976eeSPekka Enberg } 5042f3976eeSPekka Enberg 505ce79f1caSPekka Enberg #define TIMER_INTERVAL_NS 1000000 /* 1 msec */ 506ce79f1caSPekka Enberg 507ce79f1caSPekka Enberg /* 508ce79f1caSPekka Enberg * This function sets up a timer that's used to inject interrupts from the 509ce79f1caSPekka Enberg * userspace hypervisor into the guest at periodical intervals. Please note 510ce79f1caSPekka Enberg * that clock interrupt, for example, is not handled here. 511ce79f1caSPekka Enberg */ 51243835ac9SSasha Levin void kvm__start_timer(struct kvm *kvm) 513ce79f1caSPekka Enberg { 514ce79f1caSPekka Enberg struct itimerspec its; 515ce79f1caSPekka Enberg struct sigevent sev; 516ce79f1caSPekka Enberg 517ce79f1caSPekka Enberg memset(&sev, 0, sizeof(struct sigevent)); 518ce79f1caSPekka Enberg sev.sigev_value.sival_int = 0; 519ce79f1caSPekka Enberg sev.sigev_notify = SIGEV_SIGNAL; 520ce79f1caSPekka Enberg sev.sigev_signo = SIGALRM; 521ce79f1caSPekka Enberg 52243835ac9SSasha Levin if (timer_create(CLOCK_REALTIME, &sev, &kvm->timerid) < 0) 523ce79f1caSPekka Enberg die("timer_create()"); 524ce79f1caSPekka Enberg 525ce79f1caSPekka Enberg its.it_value.tv_sec = TIMER_INTERVAL_NS / 1000000000; 526ce79f1caSPekka Enberg its.it_value.tv_nsec = TIMER_INTERVAL_NS % 1000000000; 527ce79f1caSPekka Enberg its.it_interval.tv_sec = its.it_value.tv_sec; 528ce79f1caSPekka Enberg its.it_interval.tv_nsec = its.it_value.tv_nsec; 529ce79f1caSPekka Enberg 53043835ac9SSasha Levin if (timer_settime(kvm->timerid, 0, &its, NULL) < 0) 531ce79f1caSPekka Enberg die("timer_settime()"); 532ce79f1caSPekka Enberg } 533ce79f1caSPekka Enberg 53443835ac9SSasha Levin void kvm__stop_timer(struct kvm *kvm) 535fbfe68b7SSasha Levin { 53643835ac9SSasha Levin if (kvm->timerid) 53743835ac9SSasha Levin if (timer_delete(kvm->timerid) < 0) 538fbfe68b7SSasha Levin die("timer_delete()"); 539fbfe68b7SSasha Levin 54043835ac9SSasha Levin kvm->timerid = 0; 541fbfe68b7SSasha Levin } 542fbfe68b7SSasha Levin 54343835ac9SSasha Levin void kvm__irq_line(struct kvm *kvm, int irq, int level) 5448b1ff07eSPekka Enberg { 5458b1ff07eSPekka Enberg struct kvm_irq_level irq_level; 5468b1ff07eSPekka Enberg 5478b1ff07eSPekka Enberg irq_level = (struct kvm_irq_level) { 5488b1ff07eSPekka Enberg { 5498b1ff07eSPekka Enberg .irq = irq, 5508b1ff07eSPekka Enberg }, 5518b1ff07eSPekka Enberg .level = level, 5528b1ff07eSPekka Enberg }; 5538b1ff07eSPekka Enberg 55443835ac9SSasha Levin if (ioctl(kvm->vm_fd, KVM_IRQ_LINE, &irq_level) < 0) 5558b1ff07eSPekka Enberg die_perror("KVM_IRQ_LINE failed"); 5568b1ff07eSPekka Enberg } 5578b1ff07eSPekka Enberg 55843835ac9SSasha Levin void kvm__dump_mem(struct kvm *kvm, unsigned long addr, unsigned long size) 559090f898eSCyrill Gorcunov { 560090f898eSCyrill Gorcunov unsigned char *p; 561090f898eSCyrill Gorcunov unsigned long n; 562090f898eSCyrill Gorcunov 563090f898eSCyrill Gorcunov size &= ~7; /* mod 8 */ 564090f898eSCyrill Gorcunov if (!size) 565090f898eSCyrill Gorcunov return; 566090f898eSCyrill Gorcunov 56743835ac9SSasha Levin p = guest_flat_to_host(kvm, addr); 568090f898eSCyrill Gorcunov 56948cf3877SPekka Enberg for (n = 0; n < size; n += 8) { 57043835ac9SSasha Levin if (!host_ptr_in_ram(kvm, p + n)) 57148cf3877SPekka Enberg break; 57248cf3877SPekka Enberg 573090f898eSCyrill Gorcunov printf(" 0x%08lx: %02x %02x %02x %02x %02x %02x %02x %02x\n", 574090f898eSCyrill Gorcunov addr + n, p[n + 0], p[n + 1], p[n + 2], p[n + 3], 575090f898eSCyrill Gorcunov p[n + 4], p[n + 5], p[n + 6], p[n + 7]); 576090f898eSCyrill Gorcunov } 57748cf3877SPekka Enberg } 578