/*
 * x86/vmx.c : Framework for testing nested virtualization
 *	This is a framework to test nested VMX for KVM, which
 *	started as a project of GSoC 2013. All test cases should
 *	be located in x86/vmx_tests.c and framework-related
 *	functions should be in this file.
 *
 * How to write test cases?
 *	Add the callbacks of a test suite to the variable "vmx_tests".
 *	You can write:
 *		1. an init function used for initializing the test suite
 *		2. a main function for the code running in the L2 guest
 *		3. an exit_handler to handle vmexits from L2 to L1
 *		4. a syscall handler to handle L2 syscall vmexits
 *		5. a vmenter fail handler to handle direct failure of vmenter
 *		6. guest_regs is loaded on vmenter and saved on vmexit;
 *			you can read and set it in exit_handler
 *	If no special function is needed for a test suite, use the
 *	corresponding basic_* functions as callbacks. More handlers
 *	can be added to "vmx_tests"; see "struct vmx_test" and the
 *	function test_run() for details.
 *
 * Currently, the vmx test framework only sets up one VCPU and one
 * concurrent guest test environment, with the same paging for L2 and
 * L1. For usage of EPT, only 1:1 mapped paging is used from VFN
 * to PFN.
277ada359dSArthur Chunqi Li * 287ada359dSArthur Chunqi Li * Author : Arthur Chunqi Li <yzt356@gmail.com> 297ada359dSArthur Chunqi Li */ 307ada359dSArthur Chunqi Li 319d7eaa29SArthur Chunqi Li #include "libcflat.h" 329d7eaa29SArthur Chunqi Li #include "processor.h" 339d7eaa29SArthur Chunqi Li #include "vm.h" 349d7eaa29SArthur Chunqi Li #include "desc.h" 359d7eaa29SArthur Chunqi Li #include "vmx.h" 369d7eaa29SArthur Chunqi Li #include "msr.h" 379d7eaa29SArthur Chunqi Li #include "smp.h" 389d7eaa29SArthur Chunqi Li 39ce21d809SBandan Das u64 *vmxon_region; 409d7eaa29SArthur Chunqi Li struct vmcs *vmcs_root; 419d7eaa29SArthur Chunqi Li u32 vpid_cnt; 429d7eaa29SArthur Chunqi Li void *guest_stack, *guest_syscall_stack; 439d7eaa29SArthur Chunqi Li u32 ctrl_pin, ctrl_enter, ctrl_exit, ctrl_cpu[2]; 449d7eaa29SArthur Chunqi Li struct regs regs; 459d7eaa29SArthur Chunqi Li struct vmx_test *current; 463ee34093SArthur Chunqi Li u64 hypercall_field; 479d7eaa29SArthur Chunqi Li bool launched; 489d7eaa29SArthur Chunqi Li 493ee34093SArthur Chunqi Li union vmx_basic basic; 505f18e779SJan Kiszka union vmx_ctrl_msr ctrl_pin_rev; 515f18e779SJan Kiszka union vmx_ctrl_msr ctrl_cpu_rev[2]; 525f18e779SJan Kiszka union vmx_ctrl_msr ctrl_exit_rev; 535f18e779SJan Kiszka union vmx_ctrl_msr ctrl_enter_rev; 543ee34093SArthur Chunqi Li union vmx_ept_vpid ept_vpid; 553ee34093SArthur Chunqi Li 56337166aaSJan Kiszka extern struct descriptor_table_ptr gdt64_desc; 57337166aaSJan Kiszka extern struct descriptor_table_ptr idt_descr; 58337166aaSJan Kiszka extern struct descriptor_table_ptr tss_descr; 599d7eaa29SArthur Chunqi Li extern void *vmx_return; 609d7eaa29SArthur Chunqi Li extern void *entry_sysenter; 619d7eaa29SArthur Chunqi Li extern void *guest_entry; 629d7eaa29SArthur Chunqi Li 63ffb1a9e0SJan Kiszka static volatile u32 stage; 64ffb1a9e0SJan Kiszka 65ffb1a9e0SJan Kiszka void vmx_set_test_stage(u32 s) 66ffb1a9e0SJan Kiszka { 67ffb1a9e0SJan Kiszka barrier(); 68ffb1a9e0SJan Kiszka stage = s; 
69ffb1a9e0SJan Kiszka barrier(); 70ffb1a9e0SJan Kiszka } 71ffb1a9e0SJan Kiszka 72ffb1a9e0SJan Kiszka u32 vmx_get_test_stage(void) 73ffb1a9e0SJan Kiszka { 74ffb1a9e0SJan Kiszka u32 s; 75ffb1a9e0SJan Kiszka 76ffb1a9e0SJan Kiszka barrier(); 77ffb1a9e0SJan Kiszka s = stage; 78ffb1a9e0SJan Kiszka barrier(); 79ffb1a9e0SJan Kiszka return s; 80ffb1a9e0SJan Kiszka } 81ffb1a9e0SJan Kiszka 82ffb1a9e0SJan Kiszka void vmx_inc_test_stage(void) 83ffb1a9e0SJan Kiszka { 84ffb1a9e0SJan Kiszka barrier(); 85ffb1a9e0SJan Kiszka stage++; 86ffb1a9e0SJan Kiszka barrier(); 87ffb1a9e0SJan Kiszka } 88ffb1a9e0SJan Kiszka 899d7eaa29SArthur Chunqi Li static int make_vmcs_current(struct vmcs *vmcs) 909d7eaa29SArthur Chunqi Li { 919d7eaa29SArthur Chunqi Li bool ret; 92a739f560SBandan Das u64 rflags = read_rflags() | X86_EFLAGS_CF | X86_EFLAGS_ZF; 939d7eaa29SArthur Chunqi Li 94a739f560SBandan Das asm volatile ("push %1; popf; vmptrld %2; setbe %0" 95a739f560SBandan Das : "=q" (ret) : "q" (rflags), "m" (vmcs) : "cc"); 969d7eaa29SArthur Chunqi Li return ret; 979d7eaa29SArthur Chunqi Li } 989d7eaa29SArthur Chunqi Li 999d7eaa29SArthur Chunqi Li /* entry_sysenter */ 1009d7eaa29SArthur Chunqi Li asm( 1019d7eaa29SArthur Chunqi Li ".align 4, 0x90\n\t" 1029d7eaa29SArthur Chunqi Li ".globl entry_sysenter\n\t" 1039d7eaa29SArthur Chunqi Li "entry_sysenter:\n\t" 1049d7eaa29SArthur Chunqi Li SAVE_GPR 1059d7eaa29SArthur Chunqi Li " and $0xf, %rax\n\t" 1069d7eaa29SArthur Chunqi Li " mov %rax, %rdi\n\t" 1079d7eaa29SArthur Chunqi Li " call syscall_handler\n\t" 1089d7eaa29SArthur Chunqi Li LOAD_GPR 1099d7eaa29SArthur Chunqi Li " vmresume\n\t" 1109d7eaa29SArthur Chunqi Li ); 1119d7eaa29SArthur Chunqi Li 1129d7eaa29SArthur Chunqi Li static void __attribute__((__used__)) syscall_handler(u64 syscall_no) 1139d7eaa29SArthur Chunqi Li { 114d5315e3dSJan Kiszka if (current->syscall_handler) 1159d7eaa29SArthur Chunqi Li current->syscall_handler(syscall_no); 1169d7eaa29SArthur Chunqi Li } 1179d7eaa29SArthur Chunqi Li 
1189d7eaa29SArthur Chunqi Li static inline int vmx_on() 1199d7eaa29SArthur Chunqi Li { 1209d7eaa29SArthur Chunqi Li bool ret; 121a739f560SBandan Das u64 rflags = read_rflags() | X86_EFLAGS_CF | X86_EFLAGS_ZF; 122a739f560SBandan Das asm volatile ("push %1; popf; vmxon %2; setbe %0\n\t" 123a739f560SBandan Das : "=q" (ret) : "q" (rflags), "m" (vmxon_region) : "cc"); 1249d7eaa29SArthur Chunqi Li return ret; 1259d7eaa29SArthur Chunqi Li } 1269d7eaa29SArthur Chunqi Li 1279d7eaa29SArthur Chunqi Li static inline int vmx_off() 1289d7eaa29SArthur Chunqi Li { 1299d7eaa29SArthur Chunqi Li bool ret; 130a739f560SBandan Das u64 rflags = read_rflags() | X86_EFLAGS_CF | X86_EFLAGS_ZF; 131a739f560SBandan Das 132a739f560SBandan Das asm volatile("push %1; popf; vmxoff; setbe %0\n\t" 133a739f560SBandan Das : "=q"(ret) : "q" (rflags) : "cc"); 1349d7eaa29SArthur Chunqi Li return ret; 1359d7eaa29SArthur Chunqi Li } 1369d7eaa29SArthur Chunqi Li 1373ee34093SArthur Chunqi Li void print_vmexit_info() 1389d7eaa29SArthur Chunqi Li { 1399d7eaa29SArthur Chunqi Li u64 guest_rip, guest_rsp; 1409d7eaa29SArthur Chunqi Li ulong reason = vmcs_read(EXI_REASON) & 0xff; 1419d7eaa29SArthur Chunqi Li ulong exit_qual = vmcs_read(EXI_QUALIFICATION); 1429d7eaa29SArthur Chunqi Li guest_rip = vmcs_read(GUEST_RIP); 1439d7eaa29SArthur Chunqi Li guest_rsp = vmcs_read(GUEST_RSP); 1449d7eaa29SArthur Chunqi Li printf("VMEXIT info:\n"); 145b006d7ebSAndrew Jones printf("\tvmexit reason = %ld\n", reason); 146b006d7ebSAndrew Jones printf("\texit qualification = 0x%lx\n", exit_qual); 147b006d7ebSAndrew Jones printf("\tBit 31 of reason = %lx\n", (vmcs_read(EXI_REASON) >> 31) & 1); 148b006d7ebSAndrew Jones printf("\tguest_rip = 0x%lx\n", guest_rip); 149b006d7ebSAndrew Jones printf("\tRAX=0x%lx RBX=0x%lx RCX=0x%lx RDX=0x%lx\n", 1509d7eaa29SArthur Chunqi Li regs.rax, regs.rbx, regs.rcx, regs.rdx); 151b006d7ebSAndrew Jones printf("\tRSP=0x%lx RBP=0x%lx RSI=0x%lx RDI=0x%lx\n", 1529d7eaa29SArthur Chunqi Li guest_rsp, regs.rbp, 
regs.rsi, regs.rdi); 153b006d7ebSAndrew Jones printf("\tR8 =0x%lx R9 =0x%lx R10=0x%lx R11=0x%lx\n", 1549d7eaa29SArthur Chunqi Li regs.r8, regs.r9, regs.r10, regs.r11); 155b006d7ebSAndrew Jones printf("\tR12=0x%lx R13=0x%lx R14=0x%lx R15=0x%lx\n", 1569d7eaa29SArthur Chunqi Li regs.r12, regs.r13, regs.r14, regs.r15); 1579d7eaa29SArthur Chunqi Li } 1589d7eaa29SArthur Chunqi Li 1593b50efe3SPeter Feiner void 1603b50efe3SPeter Feiner print_vmentry_failure_info(struct vmentry_failure *failure) { 1613b50efe3SPeter Feiner if (failure->early) { 1623b50efe3SPeter Feiner printf("Early %s failure: ", failure->instr); 1633b50efe3SPeter Feiner switch (failure->flags & VMX_ENTRY_FLAGS) { 164ce154ba8SPaolo Bonzini case X86_EFLAGS_CF: 1653b50efe3SPeter Feiner printf("current-VMCS pointer is not valid.\n"); 1663b50efe3SPeter Feiner break; 167ce154ba8SPaolo Bonzini case X86_EFLAGS_ZF: 1683b50efe3SPeter Feiner printf("error number is %ld. See Intel 30.4.\n", 1693b50efe3SPeter Feiner vmcs_read(VMX_INST_ERROR)); 1703b50efe3SPeter Feiner break; 1713b50efe3SPeter Feiner default: 1723b50efe3SPeter Feiner printf("unexpected flags %lx!\n", failure->flags); 1733b50efe3SPeter Feiner } 1743b50efe3SPeter Feiner } else { 1753b50efe3SPeter Feiner u64 reason = vmcs_read(EXI_REASON); 1763b50efe3SPeter Feiner u64 qual = vmcs_read(EXI_QUALIFICATION); 1773b50efe3SPeter Feiner 1783b50efe3SPeter Feiner printf("Non-early %s failure (reason=0x%lx, qual=0x%lx): ", 1793b50efe3SPeter Feiner failure->instr, reason, qual); 1803b50efe3SPeter Feiner 1813b50efe3SPeter Feiner switch (reason & 0xff) { 1823b50efe3SPeter Feiner case VMX_FAIL_STATE: 1833b50efe3SPeter Feiner printf("invalid guest state\n"); 1843b50efe3SPeter Feiner break; 1853b50efe3SPeter Feiner case VMX_FAIL_MSR: 1863b50efe3SPeter Feiner printf("MSR loading\n"); 1873b50efe3SPeter Feiner break; 1883b50efe3SPeter Feiner case VMX_FAIL_MCHECK: 1893b50efe3SPeter Feiner printf("machine-check event\n"); 1903b50efe3SPeter Feiner break; 1913b50efe3SPeter Feiner 
default: 1923b50efe3SPeter Feiner printf("unexpected basic exit reason %ld\n", 1933b50efe3SPeter Feiner reason & 0xff); 1943b50efe3SPeter Feiner } 1953b50efe3SPeter Feiner 1963b50efe3SPeter Feiner if (!(reason & VMX_ENTRY_FAILURE)) 1973b50efe3SPeter Feiner printf("\tVMX_ENTRY_FAILURE BIT NOT SET!\n"); 1983b50efe3SPeter Feiner 1993b50efe3SPeter Feiner if (reason & 0x7fff0000) 2003b50efe3SPeter Feiner printf("\tRESERVED BITS SET!\n"); 2013b50efe3SPeter Feiner } 2023b50efe3SPeter Feiner } 2033b50efe3SPeter Feiner 2043b50efe3SPeter Feiner 2059d7eaa29SArthur Chunqi Li static void test_vmclear(void) 2069d7eaa29SArthur Chunqi Li { 207daeec979SBandan Das struct vmcs *tmp_root; 208e2cf1c9dSEduardo Habkost int width = cpuid_maxphyaddr(); 209daeec979SBandan Das 210daeec979SBandan Das /* 211daeec979SBandan Das * Note- The tests below do not necessarily have a 212daeec979SBandan Das * valid VMCS, but that's ok since the invalid vmcs 213daeec979SBandan Das * is only used for a specific test and is discarded 214daeec979SBandan Das * without touching its contents 215daeec979SBandan Das */ 216daeec979SBandan Das 217daeec979SBandan Das /* Unaligned page access */ 218daeec979SBandan Das tmp_root = (struct vmcs *)((intptr_t)vmcs_root + 1); 219daeec979SBandan Das report("test vmclear with unaligned vmcs", 220daeec979SBandan Das vmcs_clear(tmp_root) == 1); 221daeec979SBandan Das 222daeec979SBandan Das /* gpa bits beyond physical address width are set*/ 223daeec979SBandan Das tmp_root = (struct vmcs *)((intptr_t)vmcs_root | 224daeec979SBandan Das ((u64)1 << (width+1))); 225daeec979SBandan Das report("test vmclear with vmcs address bits set beyond physical address width", 226daeec979SBandan Das vmcs_clear(tmp_root) == 1); 227daeec979SBandan Das 228daeec979SBandan Das /* Pass VMXON region */ 229daeec979SBandan Das tmp_root = (struct vmcs *)vmxon_region; 230daeec979SBandan Das report("test vmclear with vmxon region", 231daeec979SBandan Das vmcs_clear(tmp_root) == 1); 232daeec979SBandan Das 
233daeec979SBandan Das /* Valid VMCS */ 234daeec979SBandan Das report("test vmclear with valid vmcs region", vmcs_clear(vmcs_root) == 0); 235daeec979SBandan Das 2369d7eaa29SArthur Chunqi Li } 2379d7eaa29SArthur Chunqi Li 2389d7eaa29SArthur Chunqi Li static void test_vmxoff(void) 2399d7eaa29SArthur Chunqi Li { 2409d7eaa29SArthur Chunqi Li int ret; 2419d7eaa29SArthur Chunqi Li 2429d7eaa29SArthur Chunqi Li ret = vmx_off(); 2439d7eaa29SArthur Chunqi Li report("test vmxoff", !ret); 2449d7eaa29SArthur Chunqi Li } 2459d7eaa29SArthur Chunqi Li 2469d7eaa29SArthur Chunqi Li static void __attribute__((__used__)) guest_main(void) 2479d7eaa29SArthur Chunqi Li { 2489d7eaa29SArthur Chunqi Li current->guest_main(); 2499d7eaa29SArthur Chunqi Li } 2509d7eaa29SArthur Chunqi Li 2519d7eaa29SArthur Chunqi Li /* guest_entry */ 2529d7eaa29SArthur Chunqi Li asm( 2539d7eaa29SArthur Chunqi Li ".align 4, 0x90\n\t" 2549d7eaa29SArthur Chunqi Li ".globl entry_guest\n\t" 2559d7eaa29SArthur Chunqi Li "guest_entry:\n\t" 2569d7eaa29SArthur Chunqi Li " call guest_main\n\t" 2579d7eaa29SArthur Chunqi Li " mov $1, %edi\n\t" 2589d7eaa29SArthur Chunqi Li " call hypercall\n\t" 2599d7eaa29SArthur Chunqi Li ); 2609d7eaa29SArthur Chunqi Li 2616884af61SArthur Chunqi Li /* EPT paging structure related functions */ 26269c531c8SPeter Feiner /* split_large_ept_entry: Split a 2M/1G large page into 512 smaller PTEs. 
26369c531c8SPeter Feiner @ptep : large page table entry to split 26469c531c8SPeter Feiner @level : level of ptep (2 or 3) 26569c531c8SPeter Feiner */ 26669c531c8SPeter Feiner static void split_large_ept_entry(unsigned long *ptep, int level) 26769c531c8SPeter Feiner { 26869c531c8SPeter Feiner unsigned long *new_pt; 26969c531c8SPeter Feiner unsigned long gpa; 27069c531c8SPeter Feiner unsigned long pte; 27169c531c8SPeter Feiner unsigned long prototype; 27269c531c8SPeter Feiner int i; 27369c531c8SPeter Feiner 27469c531c8SPeter Feiner pte = *ptep; 27569c531c8SPeter Feiner assert(pte & EPT_PRESENT); 27669c531c8SPeter Feiner assert(pte & EPT_LARGE_PAGE); 27769c531c8SPeter Feiner assert(level == 2 || level == 3); 27869c531c8SPeter Feiner 27969c531c8SPeter Feiner new_pt = alloc_page(); 28069c531c8SPeter Feiner assert(new_pt); 28169c531c8SPeter Feiner memset(new_pt, 0, PAGE_SIZE); 28269c531c8SPeter Feiner 28369c531c8SPeter Feiner prototype = pte & ~EPT_ADDR_MASK; 28469c531c8SPeter Feiner if (level == 2) 28569c531c8SPeter Feiner prototype &= ~EPT_LARGE_PAGE; 28669c531c8SPeter Feiner 28769c531c8SPeter Feiner gpa = pte & EPT_ADDR_MASK; 28869c531c8SPeter Feiner for (i = 0; i < EPT_PGDIR_ENTRIES; i++) { 28969c531c8SPeter Feiner new_pt[i] = prototype | gpa; 29069c531c8SPeter Feiner gpa += 1ul << EPT_LEVEL_SHIFT(level - 1); 29169c531c8SPeter Feiner } 29269c531c8SPeter Feiner 29369c531c8SPeter Feiner pte &= ~EPT_LARGE_PAGE; 29469c531c8SPeter Feiner pte &= ~EPT_ADDR_MASK; 29569c531c8SPeter Feiner pte |= virt_to_phys(new_pt); 29669c531c8SPeter Feiner 29769c531c8SPeter Feiner *ptep = pte; 29869c531c8SPeter Feiner } 29969c531c8SPeter Feiner 3006884af61SArthur Chunqi Li /* install_ept_entry : Install a page to a given level in EPT 3016884af61SArthur Chunqi Li @pml4 : addr of pml4 table 3026884af61SArthur Chunqi Li @pte_level : level of PTE to set 3036884af61SArthur Chunqi Li @guest_addr : physical address of guest 3046884af61SArthur Chunqi Li @pte : pte value to set 3056884af61SArthur 
Chunqi Li @pt_page : address of page table, NULL for a new page 3066884af61SArthur Chunqi Li */ 3076884af61SArthur Chunqi Li void install_ept_entry(unsigned long *pml4, 3086884af61SArthur Chunqi Li int pte_level, 3096884af61SArthur Chunqi Li unsigned long guest_addr, 3106884af61SArthur Chunqi Li unsigned long pte, 3116884af61SArthur Chunqi Li unsigned long *pt_page) 3126884af61SArthur Chunqi Li { 3136884af61SArthur Chunqi Li int level; 3146884af61SArthur Chunqi Li unsigned long *pt = pml4; 3156884af61SArthur Chunqi Li unsigned offset; 3166884af61SArthur Chunqi Li 3176884af61SArthur Chunqi Li for (level = EPT_PAGE_LEVEL; level > pte_level; --level) { 318a969e087SPeter Feiner offset = (guest_addr >> EPT_LEVEL_SHIFT(level)) 3196884af61SArthur Chunqi Li & EPT_PGDIR_MASK; 3206884af61SArthur Chunqi Li if (!(pt[offset] & (EPT_PRESENT))) { 3216884af61SArthur Chunqi Li unsigned long *new_pt = pt_page; 3226884af61SArthur Chunqi Li if (!new_pt) 3236884af61SArthur Chunqi Li new_pt = alloc_page(); 3246884af61SArthur Chunqi Li else 3256884af61SArthur Chunqi Li pt_page = 0; 3266884af61SArthur Chunqi Li memset(new_pt, 0, PAGE_SIZE); 3276884af61SArthur Chunqi Li pt[offset] = virt_to_phys(new_pt) 3286884af61SArthur Chunqi Li | EPT_RA | EPT_WA | EPT_EA; 32969c531c8SPeter Feiner } else if (pt[offset] & EPT_LARGE_PAGE) 33069c531c8SPeter Feiner split_large_ept_entry(&pt[offset], level); 33100b5c590SPeter Feiner pt = phys_to_virt(pt[offset] & EPT_ADDR_MASK); 3326884af61SArthur Chunqi Li } 333a969e087SPeter Feiner offset = (guest_addr >> EPT_LEVEL_SHIFT(level)) & EPT_PGDIR_MASK; 3346884af61SArthur Chunqi Li pt[offset] = pte; 3356884af61SArthur Chunqi Li } 3366884af61SArthur Chunqi Li 3376884af61SArthur Chunqi Li /* Map a page, @perm is the permission of the page */ 3386884af61SArthur Chunqi Li void install_ept(unsigned long *pml4, 3396884af61SArthur Chunqi Li unsigned long phys, 3406884af61SArthur Chunqi Li unsigned long guest_addr, 3416884af61SArthur Chunqi Li u64 perm) 
3426884af61SArthur Chunqi Li { 3436884af61SArthur Chunqi Li install_ept_entry(pml4, 1, guest_addr, (phys & PAGE_MASK) | perm, 0); 3446884af61SArthur Chunqi Li } 3456884af61SArthur Chunqi Li 3466884af61SArthur Chunqi Li /* Map a 1G-size page */ 3476884af61SArthur Chunqi Li void install_1g_ept(unsigned long *pml4, 3486884af61SArthur Chunqi Li unsigned long phys, 3496884af61SArthur Chunqi Li unsigned long guest_addr, 3506884af61SArthur Chunqi Li u64 perm) 3516884af61SArthur Chunqi Li { 3526884af61SArthur Chunqi Li install_ept_entry(pml4, 3, guest_addr, 3536884af61SArthur Chunqi Li (phys & PAGE_MASK) | perm | EPT_LARGE_PAGE, 0); 3546884af61SArthur Chunqi Li } 3556884af61SArthur Chunqi Li 3566884af61SArthur Chunqi Li /* Map a 2M-size page */ 3576884af61SArthur Chunqi Li void install_2m_ept(unsigned long *pml4, 3586884af61SArthur Chunqi Li unsigned long phys, 3596884af61SArthur Chunqi Li unsigned long guest_addr, 3606884af61SArthur Chunqi Li u64 perm) 3616884af61SArthur Chunqi Li { 3626884af61SArthur Chunqi Li install_ept_entry(pml4, 2, guest_addr, 3636884af61SArthur Chunqi Li (phys & PAGE_MASK) | perm | EPT_LARGE_PAGE, 0); 3646884af61SArthur Chunqi Li } 3656884af61SArthur Chunqi Li 3666884af61SArthur Chunqi Li /* setup_ept_range : Setup a range of 1:1 mapped page to EPT paging structure. 
3676884af61SArthur Chunqi Li @start : start address of guest page 3686884af61SArthur Chunqi Li @len : length of address to be mapped 3696884af61SArthur Chunqi Li @map_1g : whether 1G page map is used 3706884af61SArthur Chunqi Li @map_2m : whether 2M page map is used 3716884af61SArthur Chunqi Li @perm : permission for every page 3726884af61SArthur Chunqi Li */ 373b947e241SJan Kiszka void setup_ept_range(unsigned long *pml4, unsigned long start, 3746884af61SArthur Chunqi Li unsigned long len, int map_1g, int map_2m, u64 perm) 3756884af61SArthur Chunqi Li { 3766884af61SArthur Chunqi Li u64 phys = start; 3776884af61SArthur Chunqi Li u64 max = (u64)len + (u64)start; 3786884af61SArthur Chunqi Li 3796884af61SArthur Chunqi Li if (map_1g) { 3806884af61SArthur Chunqi Li while (phys + PAGE_SIZE_1G <= max) { 3816884af61SArthur Chunqi Li install_1g_ept(pml4, phys, phys, perm); 3826884af61SArthur Chunqi Li phys += PAGE_SIZE_1G; 3836884af61SArthur Chunqi Li } 3846884af61SArthur Chunqi Li } 3856884af61SArthur Chunqi Li if (map_2m) { 3866884af61SArthur Chunqi Li while (phys + PAGE_SIZE_2M <= max) { 3876884af61SArthur Chunqi Li install_2m_ept(pml4, phys, phys, perm); 3886884af61SArthur Chunqi Li phys += PAGE_SIZE_2M; 3896884af61SArthur Chunqi Li } 3906884af61SArthur Chunqi Li } 3916884af61SArthur Chunqi Li while (phys + PAGE_SIZE <= max) { 3926884af61SArthur Chunqi Li install_ept(pml4, phys, phys, perm); 3936884af61SArthur Chunqi Li phys += PAGE_SIZE; 3946884af61SArthur Chunqi Li } 3956884af61SArthur Chunqi Li } 3966884af61SArthur Chunqi Li 3976884af61SArthur Chunqi Li /* get_ept_pte : Get the PTE of a given level in EPT, 3986884af61SArthur Chunqi Li @level == 1 means get the latest level*/ 3996884af61SArthur Chunqi Li unsigned long get_ept_pte(unsigned long *pml4, 4006884af61SArthur Chunqi Li unsigned long guest_addr, int level) 4016884af61SArthur Chunqi Li { 4026884af61SArthur Chunqi Li int l; 4036884af61SArthur Chunqi Li unsigned long *pt = pml4, pte; 4046884af61SArthur Chunqi Li 
unsigned offset; 4056884af61SArthur Chunqi Li 4062ca6f1f3SPaolo Bonzini if (level < 1 || level > 3) 4072ca6f1f3SPaolo Bonzini return -1; 4082ca6f1f3SPaolo Bonzini for (l = EPT_PAGE_LEVEL; ; --l) { 409a969e087SPeter Feiner offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 4106884af61SArthur Chunqi Li pte = pt[offset]; 4116884af61SArthur Chunqi Li if (!(pte & (EPT_PRESENT))) 4126884af61SArthur Chunqi Li return 0; 4136884af61SArthur Chunqi Li if (l == level) 4142ca6f1f3SPaolo Bonzini break; 4156884af61SArthur Chunqi Li if (l < 4 && (pte & EPT_LARGE_PAGE)) 4166884af61SArthur Chunqi Li return pte; 41700b5c590SPeter Feiner pt = (unsigned long *)(pte & EPT_ADDR_MASK); 4186884af61SArthur Chunqi Li } 419a969e087SPeter Feiner offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 4206884af61SArthur Chunqi Li pte = pt[offset]; 4216884af61SArthur Chunqi Li return pte; 4226884af61SArthur Chunqi Li } 4236884af61SArthur Chunqi Li 424521820dbSPaolo Bonzini static void clear_ept_ad_pte(unsigned long *pml4, unsigned long guest_addr) 425521820dbSPaolo Bonzini { 426521820dbSPaolo Bonzini int l; 427521820dbSPaolo Bonzini unsigned long *pt = pml4; 428521820dbSPaolo Bonzini u64 pte; 429521820dbSPaolo Bonzini unsigned offset; 430521820dbSPaolo Bonzini 431521820dbSPaolo Bonzini for (l = EPT_PAGE_LEVEL; ; --l) { 432521820dbSPaolo Bonzini offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 433521820dbSPaolo Bonzini pt[offset] &= ~(EPT_ACCESS_FLAG|EPT_DIRTY_FLAG); 434521820dbSPaolo Bonzini pte = pt[offset]; 435521820dbSPaolo Bonzini if (l == 1 || (l < 4 && (pte & EPT_LARGE_PAGE))) 436521820dbSPaolo Bonzini break; 437521820dbSPaolo Bonzini pt = (unsigned long *)(pte & EPT_ADDR_MASK); 438521820dbSPaolo Bonzini } 439521820dbSPaolo Bonzini } 440521820dbSPaolo Bonzini 441521820dbSPaolo Bonzini /* clear_ept_ad : Clear EPT A/D bits for the page table walk and the 442521820dbSPaolo Bonzini final GPA of a guest address. 
*/ 443521820dbSPaolo Bonzini void clear_ept_ad(unsigned long *pml4, u64 guest_cr3, 444521820dbSPaolo Bonzini unsigned long guest_addr) 445521820dbSPaolo Bonzini { 446521820dbSPaolo Bonzini int l; 447521820dbSPaolo Bonzini unsigned long *pt = (unsigned long *)guest_cr3, gpa; 448521820dbSPaolo Bonzini u64 pte, offset_in_page; 449521820dbSPaolo Bonzini unsigned offset; 450521820dbSPaolo Bonzini 451521820dbSPaolo Bonzini for (l = EPT_PAGE_LEVEL; ; --l) { 452521820dbSPaolo Bonzini offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 453521820dbSPaolo Bonzini 454521820dbSPaolo Bonzini clear_ept_ad_pte(pml4, (u64) &pt[offset]); 455521820dbSPaolo Bonzini pte = pt[offset]; 456521820dbSPaolo Bonzini if (l == 1 || (l < 4 && (pte & PT_PAGE_SIZE_MASK))) 457521820dbSPaolo Bonzini break; 458521820dbSPaolo Bonzini if (!(pte & PT_PRESENT_MASK)) 459521820dbSPaolo Bonzini return; 460521820dbSPaolo Bonzini pt = (unsigned long *)(pte & PT_ADDR_MASK); 461521820dbSPaolo Bonzini } 462521820dbSPaolo Bonzini 463521820dbSPaolo Bonzini offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 464521820dbSPaolo Bonzini offset_in_page = guest_addr & ((1 << EPT_LEVEL_SHIFT(l)) - 1); 465521820dbSPaolo Bonzini gpa = (pt[offset] & PT_ADDR_MASK) | (guest_addr & offset_in_page); 466521820dbSPaolo Bonzini clear_ept_ad_pte(pml4, gpa); 467521820dbSPaolo Bonzini } 468521820dbSPaolo Bonzini 469521820dbSPaolo Bonzini /* check_ept_ad : Check the content of EPT A/D bits for the page table 470521820dbSPaolo Bonzini walk and the final GPA of a guest address. 
*/ 471521820dbSPaolo Bonzini void check_ept_ad(unsigned long *pml4, u64 guest_cr3, 472521820dbSPaolo Bonzini unsigned long guest_addr, int expected_gpa_ad, 473521820dbSPaolo Bonzini int expected_pt_ad) 474521820dbSPaolo Bonzini { 475521820dbSPaolo Bonzini int l; 476521820dbSPaolo Bonzini unsigned long *pt = (unsigned long *)guest_cr3, gpa; 477521820dbSPaolo Bonzini u64 ept_pte, pte, offset_in_page; 478521820dbSPaolo Bonzini unsigned offset; 479521820dbSPaolo Bonzini bool bad_pt_ad = false; 480521820dbSPaolo Bonzini 481521820dbSPaolo Bonzini for (l = EPT_PAGE_LEVEL; ; --l) { 482521820dbSPaolo Bonzini offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 483521820dbSPaolo Bonzini 484521820dbSPaolo Bonzini ept_pte = get_ept_pte(pml4, (u64) &pt[offset], 1); 485521820dbSPaolo Bonzini if (ept_pte == 0) 486521820dbSPaolo Bonzini return; 487521820dbSPaolo Bonzini 488521820dbSPaolo Bonzini if (!bad_pt_ad) { 489521820dbSPaolo Bonzini bad_pt_ad |= (ept_pte & (EPT_ACCESS_FLAG|EPT_DIRTY_FLAG)) != expected_pt_ad; 490521820dbSPaolo Bonzini if (bad_pt_ad) 491521820dbSPaolo Bonzini report("EPT - guest level %d page table A=%d/D=%d", 492521820dbSPaolo Bonzini false, l, 493521820dbSPaolo Bonzini !!(expected_pt_ad & EPT_ACCESS_FLAG), 494521820dbSPaolo Bonzini !!(expected_pt_ad & EPT_DIRTY_FLAG)); 495521820dbSPaolo Bonzini } 496521820dbSPaolo Bonzini 497521820dbSPaolo Bonzini pte = pt[offset]; 498521820dbSPaolo Bonzini if (l == 1 || (l < 4 && (pte & PT_PAGE_SIZE_MASK))) 499521820dbSPaolo Bonzini break; 500521820dbSPaolo Bonzini if (!(pte & PT_PRESENT_MASK)) 501521820dbSPaolo Bonzini return; 502521820dbSPaolo Bonzini pt = (unsigned long *)(pte & PT_ADDR_MASK); 503521820dbSPaolo Bonzini } 504521820dbSPaolo Bonzini 505521820dbSPaolo Bonzini if (!bad_pt_ad) 506521820dbSPaolo Bonzini report("EPT - guest page table structures A=%d/D=%d", 507521820dbSPaolo Bonzini true, 508521820dbSPaolo Bonzini !!(expected_pt_ad & EPT_ACCESS_FLAG), 509521820dbSPaolo Bonzini !!(expected_pt_ad & 
EPT_DIRTY_FLAG)); 510521820dbSPaolo Bonzini 511521820dbSPaolo Bonzini offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 512521820dbSPaolo Bonzini offset_in_page = guest_addr & ((1 << EPT_LEVEL_SHIFT(l)) - 1); 513521820dbSPaolo Bonzini gpa = (pt[offset] & PT_ADDR_MASK) | (guest_addr & offset_in_page); 514521820dbSPaolo Bonzini 515521820dbSPaolo Bonzini ept_pte = get_ept_pte(pml4, gpa, 1); 516521820dbSPaolo Bonzini report("EPT - guest physical address A=%d/D=%d", 517521820dbSPaolo Bonzini (ept_pte & (EPT_ACCESS_FLAG|EPT_DIRTY_FLAG)) == expected_gpa_ad, 518521820dbSPaolo Bonzini !!(expected_gpa_ad & EPT_ACCESS_FLAG), 519521820dbSPaolo Bonzini !!(expected_gpa_ad & EPT_DIRTY_FLAG)); 520521820dbSPaolo Bonzini } 521521820dbSPaolo Bonzini 522521820dbSPaolo Bonzini 5232f888fccSBandan Das void ept_sync(int type, u64 eptp) 5242f888fccSBandan Das { 5252f888fccSBandan Das switch (type) { 5262f888fccSBandan Das case INVEPT_SINGLE: 5272f888fccSBandan Das if (ept_vpid.val & EPT_CAP_INVEPT_SINGLE) { 5282f888fccSBandan Das invept(INVEPT_SINGLE, eptp); 5292f888fccSBandan Das break; 5302f888fccSBandan Das } 5312f888fccSBandan Das /* else fall through */ 5322f888fccSBandan Das case INVEPT_GLOBAL: 5332f888fccSBandan Das if (ept_vpid.val & EPT_CAP_INVEPT_ALL) { 5342f888fccSBandan Das invept(INVEPT_GLOBAL, eptp); 5352f888fccSBandan Das break; 5362f888fccSBandan Das } 5372f888fccSBandan Das /* else fall through */ 5382f888fccSBandan Das default: 5392f888fccSBandan Das printf("WARNING: invept is not supported!\n"); 5402f888fccSBandan Das } 5412f888fccSBandan Das } 5422f888fccSBandan Das 5436884af61SArthur Chunqi Li int set_ept_pte(unsigned long *pml4, unsigned long guest_addr, 5446884af61SArthur Chunqi Li int level, u64 pte_val) 5456884af61SArthur Chunqi Li { 5466884af61SArthur Chunqi Li int l; 5476884af61SArthur Chunqi Li unsigned long *pt = pml4; 5486884af61SArthur Chunqi Li unsigned offset; 5496884af61SArthur Chunqi Li 5506884af61SArthur Chunqi Li if (level < 1 || level > 3) 
5516884af61SArthur Chunqi Li return -1; 5522ca6f1f3SPaolo Bonzini for (l = EPT_PAGE_LEVEL; ; --l) { 553a969e087SPeter Feiner offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 5542ca6f1f3SPaolo Bonzini if (l == level) 5552ca6f1f3SPaolo Bonzini break; 5566884af61SArthur Chunqi Li if (!(pt[offset] & (EPT_PRESENT))) 5576884af61SArthur Chunqi Li return -1; 55800b5c590SPeter Feiner pt = (unsigned long *)(pt[offset] & EPT_ADDR_MASK); 5596884af61SArthur Chunqi Li } 560a969e087SPeter Feiner offset = (guest_addr >> EPT_LEVEL_SHIFT(l)) & EPT_PGDIR_MASK; 5616884af61SArthur Chunqi Li pt[offset] = pte_val; 5626884af61SArthur Chunqi Li return 0; 5636884af61SArthur Chunqi Li } 5646884af61SArthur Chunqi Li 565b093c6ceSWanpeng Li void vpid_sync(int type, u16 vpid) 566b093c6ceSWanpeng Li { 567b093c6ceSWanpeng Li switch(type) { 568b093c6ceSWanpeng Li case INVVPID_SINGLE: 569b093c6ceSWanpeng Li if (ept_vpid.val & VPID_CAP_INVVPID_SINGLE) { 570b093c6ceSWanpeng Li invvpid(INVVPID_SINGLE, vpid, 0); 571b093c6ceSWanpeng Li break; 572b093c6ceSWanpeng Li } 573b093c6ceSWanpeng Li case INVVPID_ALL: 574b093c6ceSWanpeng Li if (ept_vpid.val & VPID_CAP_INVVPID_ALL) { 575b093c6ceSWanpeng Li invvpid(INVVPID_ALL, vpid, 0); 576b093c6ceSWanpeng Li break; 577b093c6ceSWanpeng Li } 578b093c6ceSWanpeng Li default: 579b093c6ceSWanpeng Li printf("WARNING: invvpid is not supported\n"); 580b093c6ceSWanpeng Li } 581b093c6ceSWanpeng Li } 5826884af61SArthur Chunqi Li 5839d7eaa29SArthur Chunqi Li static void init_vmcs_ctrl(void) 5849d7eaa29SArthur Chunqi Li { 5859d7eaa29SArthur Chunqi Li /* 26.2 CHECKS ON VMX CONTROLS AND HOST-STATE AREA */ 5869d7eaa29SArthur Chunqi Li /* 26.2.1.1 */ 5879d7eaa29SArthur Chunqi Li vmcs_write(PIN_CONTROLS, ctrl_pin); 5889d7eaa29SArthur Chunqi Li /* Disable VMEXIT of IO instruction */ 5899d7eaa29SArthur Chunqi Li vmcs_write(CPU_EXEC_CTRL0, ctrl_cpu[0]); 5909d7eaa29SArthur Chunqi Li if (ctrl_cpu_rev[0].set & CPU_SECONDARY) { 5916884af61SArthur Chunqi Li ctrl_cpu[1] = 
(ctrl_cpu[1] | ctrl_cpu_rev[1].set) & 5926884af61SArthur Chunqi Li ctrl_cpu_rev[1].clr; 5939d7eaa29SArthur Chunqi Li vmcs_write(CPU_EXEC_CTRL1, ctrl_cpu[1]); 5949d7eaa29SArthur Chunqi Li } 5959d7eaa29SArthur Chunqi Li vmcs_write(CR3_TARGET_COUNT, 0); 5969d7eaa29SArthur Chunqi Li vmcs_write(VPID, ++vpid_cnt); 5979d7eaa29SArthur Chunqi Li } 5989d7eaa29SArthur Chunqi Li 5999d7eaa29SArthur Chunqi Li static void init_vmcs_host(void) 6009d7eaa29SArthur Chunqi Li { 6019d7eaa29SArthur Chunqi Li /* 26.2 CHECKS ON VMX CONTROLS AND HOST-STATE AREA */ 6029d7eaa29SArthur Chunqi Li /* 26.2.1.2 */ 6039d7eaa29SArthur Chunqi Li vmcs_write(HOST_EFER, rdmsr(MSR_EFER)); 6049d7eaa29SArthur Chunqi Li 6059d7eaa29SArthur Chunqi Li /* 26.2.1.3 */ 6069d7eaa29SArthur Chunqi Li vmcs_write(ENT_CONTROLS, ctrl_enter); 6079d7eaa29SArthur Chunqi Li vmcs_write(EXI_CONTROLS, ctrl_exit); 6089d7eaa29SArthur Chunqi Li 6099d7eaa29SArthur Chunqi Li /* 26.2.2 */ 6109d7eaa29SArthur Chunqi Li vmcs_write(HOST_CR0, read_cr0()); 6119d7eaa29SArthur Chunqi Li vmcs_write(HOST_CR3, read_cr3()); 6129d7eaa29SArthur Chunqi Li vmcs_write(HOST_CR4, read_cr4()); 6139d7eaa29SArthur Chunqi Li vmcs_write(HOST_SYSENTER_EIP, (u64)(&entry_sysenter)); 61469d8fe0eSPaolo Bonzini vmcs_write(HOST_SYSENTER_CS, KERNEL_CS); 6159d7eaa29SArthur Chunqi Li 6169d7eaa29SArthur Chunqi Li /* 26.2.3 */ 61769d8fe0eSPaolo Bonzini vmcs_write(HOST_SEL_CS, KERNEL_CS); 61869d8fe0eSPaolo Bonzini vmcs_write(HOST_SEL_SS, KERNEL_DS); 61969d8fe0eSPaolo Bonzini vmcs_write(HOST_SEL_DS, KERNEL_DS); 62069d8fe0eSPaolo Bonzini vmcs_write(HOST_SEL_ES, KERNEL_DS); 62169d8fe0eSPaolo Bonzini vmcs_write(HOST_SEL_FS, KERNEL_DS); 62269d8fe0eSPaolo Bonzini vmcs_write(HOST_SEL_GS, KERNEL_DS); 62369d8fe0eSPaolo Bonzini vmcs_write(HOST_SEL_TR, TSS_MAIN); 624337166aaSJan Kiszka vmcs_write(HOST_BASE_TR, tss_descr.base); 625337166aaSJan Kiszka vmcs_write(HOST_BASE_GDTR, gdt64_desc.base); 626337166aaSJan Kiszka vmcs_write(HOST_BASE_IDTR, idt_descr.base); 6279d7eaa29SArthur 
Chunqi Li vmcs_write(HOST_BASE_FS, 0); 6289d7eaa29SArthur Chunqi Li vmcs_write(HOST_BASE_GS, 0); 6299d7eaa29SArthur Chunqi Li 6309d7eaa29SArthur Chunqi Li /* Set other vmcs area */ 6319d7eaa29SArthur Chunqi Li vmcs_write(PF_ERROR_MASK, 0); 6329d7eaa29SArthur Chunqi Li vmcs_write(PF_ERROR_MATCH, 0); 6339d7eaa29SArthur Chunqi Li vmcs_write(VMCS_LINK_PTR, ~0ul); 6349d7eaa29SArthur Chunqi Li vmcs_write(VMCS_LINK_PTR_HI, ~0ul); 6359d7eaa29SArthur Chunqi Li vmcs_write(HOST_RIP, (u64)(&vmx_return)); 6369d7eaa29SArthur Chunqi Li } 6379d7eaa29SArthur Chunqi Li 6389d7eaa29SArthur Chunqi Li static void init_vmcs_guest(void) 6399d7eaa29SArthur Chunqi Li { 6409d7eaa29SArthur Chunqi Li /* 26.3 CHECKING AND LOADING GUEST STATE */ 6419d7eaa29SArthur Chunqi Li ulong guest_cr0, guest_cr4, guest_cr3; 6429d7eaa29SArthur Chunqi Li /* 26.3.1.1 */ 6439d7eaa29SArthur Chunqi Li guest_cr0 = read_cr0(); 6449d7eaa29SArthur Chunqi Li guest_cr4 = read_cr4(); 6459d7eaa29SArthur Chunqi Li guest_cr3 = read_cr3(); 6469d7eaa29SArthur Chunqi Li if (ctrl_enter & ENT_GUEST_64) { 6479d7eaa29SArthur Chunqi Li guest_cr0 |= X86_CR0_PG; 6489d7eaa29SArthur Chunqi Li guest_cr4 |= X86_CR4_PAE; 6499d7eaa29SArthur Chunqi Li } 6509d7eaa29SArthur Chunqi Li if ((ctrl_enter & ENT_GUEST_64) == 0) 6519d7eaa29SArthur Chunqi Li guest_cr4 &= (~X86_CR4_PCIDE); 6529d7eaa29SArthur Chunqi Li if (guest_cr0 & X86_CR0_PG) 6539d7eaa29SArthur Chunqi Li guest_cr0 |= X86_CR0_PE; 6549d7eaa29SArthur Chunqi Li vmcs_write(GUEST_CR0, guest_cr0); 6559d7eaa29SArthur Chunqi Li vmcs_write(GUEST_CR3, guest_cr3); 6569d7eaa29SArthur Chunqi Li vmcs_write(GUEST_CR4, guest_cr4); 65769d8fe0eSPaolo Bonzini vmcs_write(GUEST_SYSENTER_CS, KERNEL_CS); 6589d7eaa29SArthur Chunqi Li vmcs_write(GUEST_SYSENTER_ESP, 6599d7eaa29SArthur Chunqi Li (u64)(guest_syscall_stack + PAGE_SIZE - 1)); 6609d7eaa29SArthur Chunqi Li vmcs_write(GUEST_SYSENTER_EIP, (u64)(&entry_sysenter)); 6619d7eaa29SArthur Chunqi Li vmcs_write(GUEST_DR7, 0); 6629d7eaa29SArthur Chunqi Li 
vmcs_write(GUEST_EFER, rdmsr(MSR_EFER)); 6639d7eaa29SArthur Chunqi Li 6649d7eaa29SArthur Chunqi Li /* 26.3.1.2 */ 66569d8fe0eSPaolo Bonzini vmcs_write(GUEST_SEL_CS, KERNEL_CS); 66669d8fe0eSPaolo Bonzini vmcs_write(GUEST_SEL_SS, KERNEL_DS); 66769d8fe0eSPaolo Bonzini vmcs_write(GUEST_SEL_DS, KERNEL_DS); 66869d8fe0eSPaolo Bonzini vmcs_write(GUEST_SEL_ES, KERNEL_DS); 66969d8fe0eSPaolo Bonzini vmcs_write(GUEST_SEL_FS, KERNEL_DS); 67069d8fe0eSPaolo Bonzini vmcs_write(GUEST_SEL_GS, KERNEL_DS); 67169d8fe0eSPaolo Bonzini vmcs_write(GUEST_SEL_TR, TSS_MAIN); 6729d7eaa29SArthur Chunqi Li vmcs_write(GUEST_SEL_LDTR, 0); 6739d7eaa29SArthur Chunqi Li 6749d7eaa29SArthur Chunqi Li vmcs_write(GUEST_BASE_CS, 0); 6759d7eaa29SArthur Chunqi Li vmcs_write(GUEST_BASE_ES, 0); 6769d7eaa29SArthur Chunqi Li vmcs_write(GUEST_BASE_SS, 0); 6779d7eaa29SArthur Chunqi Li vmcs_write(GUEST_BASE_DS, 0); 6789d7eaa29SArthur Chunqi Li vmcs_write(GUEST_BASE_FS, 0); 6799d7eaa29SArthur Chunqi Li vmcs_write(GUEST_BASE_GS, 0); 680337166aaSJan Kiszka vmcs_write(GUEST_BASE_TR, tss_descr.base); 6819d7eaa29SArthur Chunqi Li vmcs_write(GUEST_BASE_LDTR, 0); 6829d7eaa29SArthur Chunqi Li 6839d7eaa29SArthur Chunqi Li vmcs_write(GUEST_LIMIT_CS, 0xFFFFFFFF); 6849d7eaa29SArthur Chunqi Li vmcs_write(GUEST_LIMIT_DS, 0xFFFFFFFF); 6859d7eaa29SArthur Chunqi Li vmcs_write(GUEST_LIMIT_ES, 0xFFFFFFFF); 6869d7eaa29SArthur Chunqi Li vmcs_write(GUEST_LIMIT_SS, 0xFFFFFFFF); 6879d7eaa29SArthur Chunqi Li vmcs_write(GUEST_LIMIT_FS, 0xFFFFFFFF); 6889d7eaa29SArthur Chunqi Li vmcs_write(GUEST_LIMIT_GS, 0xFFFFFFFF); 6899d7eaa29SArthur Chunqi Li vmcs_write(GUEST_LIMIT_LDTR, 0xffff); 690337166aaSJan Kiszka vmcs_write(GUEST_LIMIT_TR, tss_descr.limit); 6919d7eaa29SArthur Chunqi Li 6929d7eaa29SArthur Chunqi Li vmcs_write(GUEST_AR_CS, 0xa09b); 6939d7eaa29SArthur Chunqi Li vmcs_write(GUEST_AR_DS, 0xc093); 6949d7eaa29SArthur Chunqi Li vmcs_write(GUEST_AR_ES, 0xc093); 6959d7eaa29SArthur Chunqi Li vmcs_write(GUEST_AR_FS, 0xc093); 6969d7eaa29SArthur 
Chunqi Li vmcs_write(GUEST_AR_GS, 0xc093); 6979d7eaa29SArthur Chunqi Li vmcs_write(GUEST_AR_SS, 0xc093); 6989d7eaa29SArthur Chunqi Li vmcs_write(GUEST_AR_LDTR, 0x82); 6999d7eaa29SArthur Chunqi Li vmcs_write(GUEST_AR_TR, 0x8b); 7009d7eaa29SArthur Chunqi Li 7019d7eaa29SArthur Chunqi Li /* 26.3.1.3 */ 702337166aaSJan Kiszka vmcs_write(GUEST_BASE_GDTR, gdt64_desc.base); 703337166aaSJan Kiszka vmcs_write(GUEST_BASE_IDTR, idt_descr.base); 704337166aaSJan Kiszka vmcs_write(GUEST_LIMIT_GDTR, gdt64_desc.limit); 705337166aaSJan Kiszka vmcs_write(GUEST_LIMIT_IDTR, idt_descr.limit); 7069d7eaa29SArthur Chunqi Li 7079d7eaa29SArthur Chunqi Li /* 26.3.1.4 */ 7089d7eaa29SArthur Chunqi Li vmcs_write(GUEST_RIP, (u64)(&guest_entry)); 7099d7eaa29SArthur Chunqi Li vmcs_write(GUEST_RSP, (u64)(guest_stack + PAGE_SIZE - 1)); 7109d7eaa29SArthur Chunqi Li vmcs_write(GUEST_RFLAGS, 0x2); 7119d7eaa29SArthur Chunqi Li 7129d7eaa29SArthur Chunqi Li /* 26.3.1.5 */ 71317ba0dd0SJan Kiszka vmcs_write(GUEST_ACTV_STATE, ACTV_ACTIVE); 7149d7eaa29SArthur Chunqi Li vmcs_write(GUEST_INTR_STATE, 0); 7159d7eaa29SArthur Chunqi Li } 7169d7eaa29SArthur Chunqi Li 7179d7eaa29SArthur Chunqi Li static int init_vmcs(struct vmcs **vmcs) 7189d7eaa29SArthur Chunqi Li { 7199d7eaa29SArthur Chunqi Li *vmcs = alloc_page(); 7209d7eaa29SArthur Chunqi Li memset(*vmcs, 0, PAGE_SIZE); 7219d7eaa29SArthur Chunqi Li (*vmcs)->revision_id = basic.revision; 7229d7eaa29SArthur Chunqi Li /* vmclear first to init vmcs */ 7239d7eaa29SArthur Chunqi Li if (vmcs_clear(*vmcs)) { 7249d7eaa29SArthur Chunqi Li printf("%s : vmcs_clear error\n", __func__); 7259d7eaa29SArthur Chunqi Li return 1; 7269d7eaa29SArthur Chunqi Li } 7279d7eaa29SArthur Chunqi Li 7289d7eaa29SArthur Chunqi Li if (make_vmcs_current(*vmcs)) { 7299d7eaa29SArthur Chunqi Li printf("%s : make_vmcs_current error\n", __func__); 7309d7eaa29SArthur Chunqi Li return 1; 7319d7eaa29SArthur Chunqi Li } 7329d7eaa29SArthur Chunqi Li 7339d7eaa29SArthur Chunqi Li /* All settings to 
pin/exit/enter/cpu 7349d7eaa29SArthur Chunqi Li control fields should be placed here */ 7359d7eaa29SArthur Chunqi Li ctrl_pin |= PIN_EXTINT | PIN_NMI | PIN_VIRT_NMI; 7369d7eaa29SArthur Chunqi Li ctrl_exit = EXI_LOAD_EFER | EXI_HOST_64; 7379d7eaa29SArthur Chunqi Li ctrl_enter = (ENT_LOAD_EFER | ENT_GUEST_64); 7389d7eaa29SArthur Chunqi Li /* DIsable IO instruction VMEXIT now */ 7399d7eaa29SArthur Chunqi Li ctrl_cpu[0] &= (~(CPU_IO | CPU_IO_BITMAP)); 7409d7eaa29SArthur Chunqi Li ctrl_cpu[1] = 0; 7419d7eaa29SArthur Chunqi Li 7429d7eaa29SArthur Chunqi Li ctrl_pin = (ctrl_pin | ctrl_pin_rev.set) & ctrl_pin_rev.clr; 7439d7eaa29SArthur Chunqi Li ctrl_enter = (ctrl_enter | ctrl_enter_rev.set) & ctrl_enter_rev.clr; 7449d7eaa29SArthur Chunqi Li ctrl_exit = (ctrl_exit | ctrl_exit_rev.set) & ctrl_exit_rev.clr; 7459d7eaa29SArthur Chunqi Li ctrl_cpu[0] = (ctrl_cpu[0] | ctrl_cpu_rev[0].set) & ctrl_cpu_rev[0].clr; 7469d7eaa29SArthur Chunqi Li 7479d7eaa29SArthur Chunqi Li init_vmcs_ctrl(); 7489d7eaa29SArthur Chunqi Li init_vmcs_host(); 7499d7eaa29SArthur Chunqi Li init_vmcs_guest(); 7509d7eaa29SArthur Chunqi Li return 0; 7519d7eaa29SArthur Chunqi Li } 7529d7eaa29SArthur Chunqi Li 7539d7eaa29SArthur Chunqi Li static void init_vmx(void) 7549d7eaa29SArthur Chunqi Li { 7553ee34093SArthur Chunqi Li ulong fix_cr0_set, fix_cr0_clr; 7563ee34093SArthur Chunqi Li ulong fix_cr4_set, fix_cr4_clr; 7573ee34093SArthur Chunqi Li 7589d7eaa29SArthur Chunqi Li vmxon_region = alloc_page(); 7599d7eaa29SArthur Chunqi Li memset(vmxon_region, 0, PAGE_SIZE); 7609d7eaa29SArthur Chunqi Li 7619d7eaa29SArthur Chunqi Li fix_cr0_set = rdmsr(MSR_IA32_VMX_CR0_FIXED0); 7629d7eaa29SArthur Chunqi Li fix_cr0_clr = rdmsr(MSR_IA32_VMX_CR0_FIXED1); 7639d7eaa29SArthur Chunqi Li fix_cr4_set = rdmsr(MSR_IA32_VMX_CR4_FIXED0); 7649d7eaa29SArthur Chunqi Li fix_cr4_clr = rdmsr(MSR_IA32_VMX_CR4_FIXED1); 7659d7eaa29SArthur Chunqi Li basic.val = rdmsr(MSR_IA32_VMX_BASIC); 7669d7eaa29SArthur Chunqi Li ctrl_pin_rev.val = 
rdmsr(basic.ctrl ? MSR_IA32_VMX_TRUE_PIN 7679d7eaa29SArthur Chunqi Li : MSR_IA32_VMX_PINBASED_CTLS); 7689d7eaa29SArthur Chunqi Li ctrl_exit_rev.val = rdmsr(basic.ctrl ? MSR_IA32_VMX_TRUE_EXIT 7699d7eaa29SArthur Chunqi Li : MSR_IA32_VMX_EXIT_CTLS); 7709d7eaa29SArthur Chunqi Li ctrl_enter_rev.val = rdmsr(basic.ctrl ? MSR_IA32_VMX_TRUE_ENTRY 7719d7eaa29SArthur Chunqi Li : MSR_IA32_VMX_ENTRY_CTLS); 7729d7eaa29SArthur Chunqi Li ctrl_cpu_rev[0].val = rdmsr(basic.ctrl ? MSR_IA32_VMX_TRUE_PROC 7739d7eaa29SArthur Chunqi Li : MSR_IA32_VMX_PROCBASED_CTLS); 7746884af61SArthur Chunqi Li if ((ctrl_cpu_rev[0].clr & CPU_SECONDARY) != 0) 7759d7eaa29SArthur Chunqi Li ctrl_cpu_rev[1].val = rdmsr(MSR_IA32_VMX_PROCBASED_CTLS2); 7766884af61SArthur Chunqi Li else 7776884af61SArthur Chunqi Li ctrl_cpu_rev[1].val = 0; 7786884af61SArthur Chunqi Li if ((ctrl_cpu_rev[1].clr & (CPU_EPT | CPU_VPID)) != 0) 7799d7eaa29SArthur Chunqi Li ept_vpid.val = rdmsr(MSR_IA32_VMX_EPT_VPID_CAP); 7806884af61SArthur Chunqi Li else 7816884af61SArthur Chunqi Li ept_vpid.val = 0; 7829d7eaa29SArthur Chunqi Li 7839d7eaa29SArthur Chunqi Li write_cr0((read_cr0() & fix_cr0_clr) | fix_cr0_set); 7849d7eaa29SArthur Chunqi Li write_cr4((read_cr4() & fix_cr4_clr) | fix_cr4_set | X86_CR4_VMXE); 7859d7eaa29SArthur Chunqi Li 7869d7eaa29SArthur Chunqi Li *vmxon_region = basic.revision; 7879d7eaa29SArthur Chunqi Li 7889d7eaa29SArthur Chunqi Li guest_stack = alloc_page(); 7899d7eaa29SArthur Chunqi Li memset(guest_stack, 0, PAGE_SIZE); 7909d7eaa29SArthur Chunqi Li guest_syscall_stack = alloc_page(); 7919d7eaa29SArthur Chunqi Li memset(guest_syscall_stack, 0, PAGE_SIZE); 7929d7eaa29SArthur Chunqi Li } 7939d7eaa29SArthur Chunqi Li 794e3f363c4SJan Kiszka static void do_vmxon_off(void *data) 7959d7eaa29SArthur Chunqi Li { 7963b127446SJan Kiszka vmx_on(); 7973b127446SJan Kiszka vmx_off(); 79803f37ef2SPaolo Bonzini } 7993b127446SJan Kiszka 800e3f363c4SJan Kiszka static void do_write_feature_control(void *data) 8013b127446SJan Kiszka { 
8023b127446SJan Kiszka wrmsr(MSR_IA32_FEATURE_CONTROL, 0); 80303f37ef2SPaolo Bonzini } 8043b127446SJan Kiszka 8053b127446SJan Kiszka static int test_vmx_feature_control(void) 8063b127446SJan Kiszka { 8073b127446SJan Kiszka u64 ia32_feature_control; 8083b127446SJan Kiszka bool vmx_enabled; 8093b127446SJan Kiszka 8103b127446SJan Kiszka ia32_feature_control = rdmsr(MSR_IA32_FEATURE_CONTROL); 8113b127446SJan Kiszka vmx_enabled = ((ia32_feature_control & 0x5) == 0x5); 8123b127446SJan Kiszka if ((ia32_feature_control & 0x5) == 0x5) { 8133b127446SJan Kiszka printf("VMX enabled and locked by BIOS\n"); 8143b127446SJan Kiszka return 0; 8153b127446SJan Kiszka } else if (ia32_feature_control & 0x1) { 8163b127446SJan Kiszka printf("ERROR: VMX locked out by BIOS!?\n"); 8173b127446SJan Kiszka return 1; 8183b127446SJan Kiszka } 8193b127446SJan Kiszka 8203b127446SJan Kiszka wrmsr(MSR_IA32_FEATURE_CONTROL, 0); 8213b127446SJan Kiszka report("test vmxon with FEATURE_CONTROL cleared", 822e3f363c4SJan Kiszka test_for_exception(GP_VECTOR, &do_vmxon_off, NULL)); 8233b127446SJan Kiszka 8243b127446SJan Kiszka wrmsr(MSR_IA32_FEATURE_CONTROL, 0x4); 8253b127446SJan Kiszka report("test vmxon without FEATURE_CONTROL lock", 826e3f363c4SJan Kiszka test_for_exception(GP_VECTOR, &do_vmxon_off, NULL)); 8273b127446SJan Kiszka 8283b127446SJan Kiszka wrmsr(MSR_IA32_FEATURE_CONTROL, 0x5); 8293b127446SJan Kiszka vmx_enabled = ((rdmsr(MSR_IA32_FEATURE_CONTROL) & 0x5) == 0x5); 8303b127446SJan Kiszka report("test enable VMX in FEATURE_CONTROL", vmx_enabled); 8313b127446SJan Kiszka 8323b127446SJan Kiszka report("test FEATURE_CONTROL lock bit", 833e3f363c4SJan Kiszka test_for_exception(GP_VECTOR, &do_write_feature_control, NULL)); 8343b127446SJan Kiszka 8353b127446SJan Kiszka return !vmx_enabled; 8369d7eaa29SArthur Chunqi Li } 8379d7eaa29SArthur Chunqi Li 8389d7eaa29SArthur Chunqi Li static int test_vmxon(void) 8399d7eaa29SArthur Chunqi Li { 840ce21d809SBandan Das int ret, ret1; 841ce21d809SBandan Das u64 
*tmp_region = vmxon_region; 842e2cf1c9dSEduardo Habkost int width = cpuid_maxphyaddr(); 8439d7eaa29SArthur Chunqi Li 844ce21d809SBandan Das /* Unaligned page access */ 845ce21d809SBandan Das vmxon_region = (u64 *)((intptr_t)vmxon_region + 1); 846ce21d809SBandan Das ret1 = vmx_on(); 847ce21d809SBandan Das report("test vmxon with unaligned vmxon region", ret1); 848ce21d809SBandan Das if (!ret1) { 849ce21d809SBandan Das ret = 1; 850ce21d809SBandan Das goto out; 851ce21d809SBandan Das } 852ce21d809SBandan Das 853ce21d809SBandan Das /* gpa bits beyond physical address width are set*/ 854ce21d809SBandan Das vmxon_region = (u64 *)((intptr_t)tmp_region | ((u64)1 << (width+1))); 855ce21d809SBandan Das ret1 = vmx_on(); 856ce21d809SBandan Das report("test vmxon with bits set beyond physical address width", ret1); 857ce21d809SBandan Das if (!ret1) { 858ce21d809SBandan Das ret = 1; 859ce21d809SBandan Das goto out; 860ce21d809SBandan Das } 861ce21d809SBandan Das 862ce21d809SBandan Das /* invalid revision indentifier */ 863ce21d809SBandan Das vmxon_region = tmp_region; 864ce21d809SBandan Das *vmxon_region = 0xba9da9; 865ce21d809SBandan Das ret1 = vmx_on(); 866ce21d809SBandan Das report("test vmxon with invalid revision identifier", ret1); 867ce21d809SBandan Das if (!ret1) { 868ce21d809SBandan Das ret = 1; 869ce21d809SBandan Das goto out; 870ce21d809SBandan Das } 871ce21d809SBandan Das 872ce21d809SBandan Das /* and finally a valid region */ 873ce21d809SBandan Das *vmxon_region = basic.revision; 8749d7eaa29SArthur Chunqi Li ret = vmx_on(); 875ce21d809SBandan Das report("test vmxon with valid vmxon region", !ret); 876ce21d809SBandan Das 877ce21d809SBandan Das out: 8789d7eaa29SArthur Chunqi Li return ret; 8799d7eaa29SArthur Chunqi Li } 8809d7eaa29SArthur Chunqi Li 8819d7eaa29SArthur Chunqi Li static void test_vmptrld(void) 8829d7eaa29SArthur Chunqi Li { 883daeec979SBandan Das struct vmcs *vmcs, *tmp_root; 884e2cf1c9dSEduardo Habkost int width = cpuid_maxphyaddr(); 8859d7eaa29SArthur 
Chunqi Li 8869d7eaa29SArthur Chunqi Li vmcs = alloc_page(); 8879d7eaa29SArthur Chunqi Li vmcs->revision_id = basic.revision; 888daeec979SBandan Das 889daeec979SBandan Das /* Unaligned page access */ 890daeec979SBandan Das tmp_root = (struct vmcs *)((intptr_t)vmcs + 1); 891daeec979SBandan Das report("test vmptrld with unaligned vmcs", 8929c305952SPaolo Bonzini make_vmcs_current(tmp_root) == 1); 893daeec979SBandan Das 894daeec979SBandan Das /* gpa bits beyond physical address width are set*/ 895daeec979SBandan Das tmp_root = (struct vmcs *)((intptr_t)vmcs | 896daeec979SBandan Das ((u64)1 << (width+1))); 897daeec979SBandan Das report("test vmptrld with vmcs address bits set beyond physical address width", 8989c305952SPaolo Bonzini make_vmcs_current(tmp_root) == 1); 899daeec979SBandan Das 900daeec979SBandan Das /* Pass VMXON region */ 901daeec979SBandan Das tmp_root = (struct vmcs *)vmxon_region; 902daeec979SBandan Das report("test vmptrld with vmxon region", 9039c305952SPaolo Bonzini make_vmcs_current(tmp_root) == 1); 904daeec979SBandan Das 905daeec979SBandan Das report("test vmptrld with valid vmcs region", make_vmcs_current(vmcs) == 0); 9069d7eaa29SArthur Chunqi Li } 9079d7eaa29SArthur Chunqi Li 9089d7eaa29SArthur Chunqi Li static void test_vmptrst(void) 9099d7eaa29SArthur Chunqi Li { 9109d7eaa29SArthur Chunqi Li int ret; 9119d7eaa29SArthur Chunqi Li struct vmcs *vmcs1, *vmcs2; 9129d7eaa29SArthur Chunqi Li 9139d7eaa29SArthur Chunqi Li vmcs1 = alloc_page(); 9149d7eaa29SArthur Chunqi Li memset(vmcs1, 0, PAGE_SIZE); 9159d7eaa29SArthur Chunqi Li init_vmcs(&vmcs1); 9169d7eaa29SArthur Chunqi Li ret = vmcs_save(&vmcs2); 9179d7eaa29SArthur Chunqi Li report("test vmptrst", (!ret) && (vmcs1 == vmcs2)); 9189d7eaa29SArthur Chunqi Li } 9199d7eaa29SArthur Chunqi Li 92069c8d31cSJan Kiszka struct vmx_ctl_msr { 92169c8d31cSJan Kiszka const char *name; 92269c8d31cSJan Kiszka u32 index, true_index; 92369c8d31cSJan Kiszka u32 default1; 92469c8d31cSJan Kiszka } vmx_ctl_msr[] = { 
92569c8d31cSJan Kiszka { "MSR_IA32_VMX_PINBASED_CTLS", MSR_IA32_VMX_PINBASED_CTLS, 92669c8d31cSJan Kiszka MSR_IA32_VMX_TRUE_PIN, 0x16 }, 92769c8d31cSJan Kiszka { "MSR_IA32_VMX_PROCBASED_CTLS", MSR_IA32_VMX_PROCBASED_CTLS, 92869c8d31cSJan Kiszka MSR_IA32_VMX_TRUE_PROC, 0x401e172 }, 92969c8d31cSJan Kiszka { "MSR_IA32_VMX_PROCBASED_CTLS2", MSR_IA32_VMX_PROCBASED_CTLS2, 93069c8d31cSJan Kiszka MSR_IA32_VMX_PROCBASED_CTLS2, 0 }, 93169c8d31cSJan Kiszka { "MSR_IA32_VMX_EXIT_CTLS", MSR_IA32_VMX_EXIT_CTLS, 93269c8d31cSJan Kiszka MSR_IA32_VMX_TRUE_EXIT, 0x36dff }, 93369c8d31cSJan Kiszka { "MSR_IA32_VMX_ENTRY_CTLS", MSR_IA32_VMX_ENTRY_CTLS, 93469c8d31cSJan Kiszka MSR_IA32_VMX_TRUE_ENTRY, 0x11ff }, 93569c8d31cSJan Kiszka }; 93669c8d31cSJan Kiszka 93769c8d31cSJan Kiszka static void test_vmx_caps(void) 93869c8d31cSJan Kiszka { 93969c8d31cSJan Kiszka u64 val, default1, fixed0, fixed1; 94069c8d31cSJan Kiszka union vmx_ctrl_msr ctrl, true_ctrl; 94169c8d31cSJan Kiszka unsigned int n; 94269c8d31cSJan Kiszka bool ok; 94369c8d31cSJan Kiszka 94469c8d31cSJan Kiszka printf("\nTest suite: VMX capability reporting\n"); 94569c8d31cSJan Kiszka 94669c8d31cSJan Kiszka report("MSR_IA32_VMX_BASIC", 94769c8d31cSJan Kiszka (basic.revision & (1ul << 31)) == 0 && 94869c8d31cSJan Kiszka basic.size > 0 && basic.size <= 4096 && 94969c8d31cSJan Kiszka (basic.type == 0 || basic.type == 6) && 95069c8d31cSJan Kiszka basic.reserved1 == 0 && basic.reserved2 == 0); 95169c8d31cSJan Kiszka 95269c8d31cSJan Kiszka val = rdmsr(MSR_IA32_VMX_MISC); 95369c8d31cSJan Kiszka report("MSR_IA32_VMX_MISC", 95469c8d31cSJan Kiszka (!(ctrl_cpu_rev[1].clr & CPU_URG) || val & (1ul << 5)) && 95569c8d31cSJan Kiszka ((val >> 16) & 0x1ff) <= 256 && 95669c8d31cSJan Kiszka (val & 0xc0007e00) == 0); 95769c8d31cSJan Kiszka 95869c8d31cSJan Kiszka for (n = 0; n < ARRAY_SIZE(vmx_ctl_msr); n++) { 95969c8d31cSJan Kiszka ctrl.val = rdmsr(vmx_ctl_msr[n].index); 96069c8d31cSJan Kiszka default1 = vmx_ctl_msr[n].default1; 96169c8d31cSJan Kiszka ok 
= (ctrl.set & default1) == default1; 96269c8d31cSJan Kiszka ok = ok && (ctrl.set & ~ctrl.clr) == 0; 96369c8d31cSJan Kiszka if (ok && basic.ctrl) { 96469c8d31cSJan Kiszka true_ctrl.val = rdmsr(vmx_ctl_msr[n].true_index); 96569c8d31cSJan Kiszka ok = ctrl.clr == true_ctrl.clr; 96669c8d31cSJan Kiszka ok = ok && ctrl.set == (true_ctrl.set | default1); 96769c8d31cSJan Kiszka } 96869c8d31cSJan Kiszka report(vmx_ctl_msr[n].name, ok); 96969c8d31cSJan Kiszka } 97069c8d31cSJan Kiszka 97169c8d31cSJan Kiszka fixed0 = rdmsr(MSR_IA32_VMX_CR0_FIXED0); 97269c8d31cSJan Kiszka fixed1 = rdmsr(MSR_IA32_VMX_CR0_FIXED1); 97369c8d31cSJan Kiszka report("MSR_IA32_VMX_IA32_VMX_CR0_FIXED0/1", 97469c8d31cSJan Kiszka ((fixed0 ^ fixed1) & ~fixed1) == 0); 97569c8d31cSJan Kiszka 97669c8d31cSJan Kiszka fixed0 = rdmsr(MSR_IA32_VMX_CR4_FIXED0); 97769c8d31cSJan Kiszka fixed1 = rdmsr(MSR_IA32_VMX_CR4_FIXED1); 97869c8d31cSJan Kiszka report("MSR_IA32_VMX_IA32_VMX_CR4_FIXED0/1", 97969c8d31cSJan Kiszka ((fixed0 ^ fixed1) & ~fixed1) == 0); 98069c8d31cSJan Kiszka 98169c8d31cSJan Kiszka val = rdmsr(MSR_IA32_VMX_VMCS_ENUM); 98269c8d31cSJan Kiszka report("MSR_IA32_VMX_VMCS_ENUM", 98369c8d31cSJan Kiszka (val & 0x3e) >= 0x2a && 98469c8d31cSJan Kiszka (val & 0xfffffffffffffc01Ull) == 0); 98569c8d31cSJan Kiszka 98669c8d31cSJan Kiszka val = rdmsr(MSR_IA32_VMX_EPT_VPID_CAP); 98769c8d31cSJan Kiszka report("MSR_IA32_VMX_EPT_VPID_CAP", 988625f52abSPaolo Bonzini (val & 0xfffff07ef98cbebeUll) == 0); 98969c8d31cSJan Kiszka } 99069c8d31cSJan Kiszka 9919d7eaa29SArthur Chunqi Li /* This function can only be called in guest */ 9929d7eaa29SArthur Chunqi Li static void __attribute__((__used__)) hypercall(u32 hypercall_no) 9939d7eaa29SArthur Chunqi Li { 9949d7eaa29SArthur Chunqi Li u64 val = 0; 9959d7eaa29SArthur Chunqi Li val = (hypercall_no & HYPERCALL_MASK) | HYPERCALL_BIT; 9969d7eaa29SArthur Chunqi Li hypercall_field = val; 9979d7eaa29SArthur Chunqi Li asm volatile("vmcall\n\t"); 9989d7eaa29SArthur Chunqi Li } 
9999d7eaa29SArthur Chunqi Li 10009d7eaa29SArthur Chunqi Li static bool is_hypercall() 10019d7eaa29SArthur Chunqi Li { 10029d7eaa29SArthur Chunqi Li ulong reason, hyper_bit; 10039d7eaa29SArthur Chunqi Li 10049d7eaa29SArthur Chunqi Li reason = vmcs_read(EXI_REASON) & 0xff; 10059d7eaa29SArthur Chunqi Li hyper_bit = hypercall_field & HYPERCALL_BIT; 10069d7eaa29SArthur Chunqi Li if (reason == VMX_VMCALL && hyper_bit) 10079d7eaa29SArthur Chunqi Li return true; 10089d7eaa29SArthur Chunqi Li return false; 10099d7eaa29SArthur Chunqi Li } 10109d7eaa29SArthur Chunqi Li 10119d7eaa29SArthur Chunqi Li static int handle_hypercall() 10129d7eaa29SArthur Chunqi Li { 10139d7eaa29SArthur Chunqi Li ulong hypercall_no; 10149d7eaa29SArthur Chunqi Li 10159d7eaa29SArthur Chunqi Li hypercall_no = hypercall_field & HYPERCALL_MASK; 10169d7eaa29SArthur Chunqi Li hypercall_field = 0; 10179d7eaa29SArthur Chunqi Li switch (hypercall_no) { 10189d7eaa29SArthur Chunqi Li case HYPERCALL_VMEXIT: 10199d7eaa29SArthur Chunqi Li return VMX_TEST_VMEXIT; 10209d7eaa29SArthur Chunqi Li default: 1021b006d7ebSAndrew Jones printf("ERROR : Invalid hypercall number : %ld\n", hypercall_no); 10229d7eaa29SArthur Chunqi Li } 10239d7eaa29SArthur Chunqi Li return VMX_TEST_EXIT; 10249d7eaa29SArthur Chunqi Li } 10259d7eaa29SArthur Chunqi Li 10269d7eaa29SArthur Chunqi Li static int exit_handler() 10279d7eaa29SArthur Chunqi Li { 10289d7eaa29SArthur Chunqi Li int ret; 10299d7eaa29SArthur Chunqi Li 10309d7eaa29SArthur Chunqi Li current->exits++; 10311d9284d0SArthur Chunqi Li regs.rflags = vmcs_read(GUEST_RFLAGS); 10329d7eaa29SArthur Chunqi Li if (is_hypercall()) 10339d7eaa29SArthur Chunqi Li ret = handle_hypercall(); 10349d7eaa29SArthur Chunqi Li else 10359d7eaa29SArthur Chunqi Li ret = current->exit_handler(); 10361d9284d0SArthur Chunqi Li vmcs_write(GUEST_RFLAGS, regs.rflags); 10373b50efe3SPeter Feiner 10389d7eaa29SArthur Chunqi Li return ret; 10399d7eaa29SArthur Chunqi Li } 10403b50efe3SPeter Feiner 10413b50efe3SPeter 
Feiner /* 10423b50efe3SPeter Feiner * Called if vmlaunch or vmresume fails. 10433b50efe3SPeter Feiner * @early - failure due to "VMX controls and host-state area" (26.2) 10443b50efe3SPeter Feiner * @vmlaunch - was this a vmlaunch or vmresume 10453b50efe3SPeter Feiner * @rflags - host rflags 10463b50efe3SPeter Feiner */ 10473b50efe3SPeter Feiner static int 10483b50efe3SPeter Feiner entry_failure_handler(struct vmentry_failure *failure) 10493b50efe3SPeter Feiner { 10503b50efe3SPeter Feiner if (current->entry_failure_handler) 10513b50efe3SPeter Feiner return current->entry_failure_handler(failure); 10523b50efe3SPeter Feiner else 10533b50efe3SPeter Feiner return VMX_TEST_EXIT; 10549d7eaa29SArthur Chunqi Li } 10559d7eaa29SArthur Chunqi Li 10569d7eaa29SArthur Chunqi Li static int vmx_run() 10579d7eaa29SArthur Chunqi Li { 1058897d8365SPeter Feiner unsigned long host_rflags; 10599d7eaa29SArthur Chunqi Li 10609d7eaa29SArthur Chunqi Li while (1) { 10613b50efe3SPeter Feiner u32 ret; 10623b50efe3SPeter Feiner u32 fail = 0; 10633b50efe3SPeter Feiner bool entered; 10643b50efe3SPeter Feiner struct vmentry_failure failure; 10654e809db5SPeter Feiner 10669d7eaa29SArthur Chunqi Li asm volatile ( 1067897d8365SPeter Feiner "mov %[HOST_RSP], %%rdi\n\t" 1068897d8365SPeter Feiner "vmwrite %%rsp, %%rdi\n\t" 10699d7eaa29SArthur Chunqi Li LOAD_GPR_C 107044417388SPaolo Bonzini "cmpb $0, %[launched]\n\t" 10719d7eaa29SArthur Chunqi Li "jne 1f\n\t" 10729d7eaa29SArthur Chunqi Li "vmlaunch\n\t" 10739d7eaa29SArthur Chunqi Li "jmp 2f\n\t" 10749d7eaa29SArthur Chunqi Li "1: " 10759d7eaa29SArthur Chunqi Li "vmresume\n\t" 10769d7eaa29SArthur Chunqi Li "2: " 1077f37cf4e2SPeter Feiner SAVE_GPR_C 1078897d8365SPeter Feiner "pushf\n\t" 1079897d8365SPeter Feiner "pop %%rdi\n\t" 1080897d8365SPeter Feiner "mov %%rdi, %[host_rflags]\n\t" 1081897d8365SPeter Feiner "movl $1, %[fail]\n\t" 1082f37cf4e2SPeter Feiner "jmp 3f\n\t" 10839d7eaa29SArthur Chunqi Li "vmx_return:\n\t" 10849d7eaa29SArthur Chunqi Li SAVE_GPR_C 
1085f37cf4e2SPeter Feiner "3: \n\t" 1086897d8365SPeter Feiner : [fail]"+m"(fail), [host_rflags]"=m"(host_rflags) 1087897d8365SPeter Feiner : [launched]"m"(launched), [HOST_RSP]"i"(HOST_RSP) 1088897d8365SPeter Feiner : "rdi", "memory", "cc" 10899d7eaa29SArthur Chunqi Li 10909d7eaa29SArthur Chunqi Li ); 10913b50efe3SPeter Feiner 10923b50efe3SPeter Feiner entered = !fail && !(vmcs_read(EXI_REASON) & VMX_ENTRY_FAILURE); 10933b50efe3SPeter Feiner 10943b50efe3SPeter Feiner if (entered) { 10953b50efe3SPeter Feiner /* 10963b50efe3SPeter Feiner * VMCS isn't in "launched" state if there's been any 10973b50efe3SPeter Feiner * entry failure (early or otherwise). 10983b50efe3SPeter Feiner */ 10999d7eaa29SArthur Chunqi Li launched = 1; 11009d7eaa29SArthur Chunqi Li ret = exit_handler(); 11013b50efe3SPeter Feiner } else { 11023b50efe3SPeter Feiner failure.flags = host_rflags; 11033b50efe3SPeter Feiner failure.vmlaunch = !launched; 11043b50efe3SPeter Feiner failure.instr = launched ? "vmresume" : "vmlaunch"; 11053b50efe3SPeter Feiner failure.early = fail; 11063b50efe3SPeter Feiner ret = entry_failure_handler(&failure); 11079d7eaa29SArthur Chunqi Li } 11083b50efe3SPeter Feiner 11099d7eaa29SArthur Chunqi Li switch (ret) { 11103b50efe3SPeter Feiner case VMX_TEST_RESUME: 11113b50efe3SPeter Feiner continue; 11129d7eaa29SArthur Chunqi Li case VMX_TEST_VMEXIT: 11139d7eaa29SArthur Chunqi Li return 0; 11143b50efe3SPeter Feiner case VMX_TEST_EXIT: 11159d7eaa29SArthur Chunqi Li break; 11169d7eaa29SArthur Chunqi Li default: 11173b50efe3SPeter Feiner printf("ERROR : Invalid %s_handler return val %d.\n", 11183b50efe3SPeter Feiner entered ? 
"exit" : "entry_failure", 11193b50efe3SPeter Feiner ret); 11209d7eaa29SArthur Chunqi Li break; 11219d7eaa29SArthur Chunqi Li } 11223b50efe3SPeter Feiner 11233b50efe3SPeter Feiner if (entered) 11243b50efe3SPeter Feiner print_vmexit_info(); 11253b50efe3SPeter Feiner else 11263b50efe3SPeter Feiner print_vmentry_failure_info(&failure); 11273b50efe3SPeter Feiner abort(); 11283b50efe3SPeter Feiner } 11299d7eaa29SArthur Chunqi Li } 11309d7eaa29SArthur Chunqi Li 11319d7eaa29SArthur Chunqi Li static int test_run(struct vmx_test *test) 11329d7eaa29SArthur Chunqi Li { 11339d7eaa29SArthur Chunqi Li if (test->name == NULL) 11349d7eaa29SArthur Chunqi Li test->name = "(no name)"; 11359d7eaa29SArthur Chunqi Li if (vmx_on()) { 11369d7eaa29SArthur Chunqi Li printf("%s : vmxon failed.\n", __func__); 11379d7eaa29SArthur Chunqi Li return 1; 11389d7eaa29SArthur Chunqi Li } 11399d7eaa29SArthur Chunqi Li init_vmcs(&(test->vmcs)); 11409d7eaa29SArthur Chunqi Li /* Directly call test->init is ok here, init_vmcs has done 11419d7eaa29SArthur Chunqi Li vmcs init, vmclear and vmptrld*/ 1142c592c151SJan Kiszka if (test->init && test->init(test->vmcs) != VMX_TEST_START) 1143a0e30e71SPaolo Bonzini goto out; 11449d7eaa29SArthur Chunqi Li test->exits = 0; 11459d7eaa29SArthur Chunqi Li current = test; 11469d7eaa29SArthur Chunqi Li regs = test->guest_regs; 11479d7eaa29SArthur Chunqi Li vmcs_write(GUEST_RFLAGS, regs.rflags | 0x2); 11489d7eaa29SArthur Chunqi Li launched = 0; 11499d7eaa29SArthur Chunqi Li printf("\nTest suite: %s\n", test->name); 11509d7eaa29SArthur Chunqi Li vmx_run(); 1151a0e30e71SPaolo Bonzini out: 11529d7eaa29SArthur Chunqi Li if (vmx_off()) { 11539d7eaa29SArthur Chunqi Li printf("%s : vmxoff failed.\n", __func__); 11549d7eaa29SArthur Chunqi Li return 1; 11559d7eaa29SArthur Chunqi Li } 11569d7eaa29SArthur Chunqi Li return 0; 11579d7eaa29SArthur Chunqi Li } 11589d7eaa29SArthur Chunqi Li 11593ee34093SArthur Chunqi Li extern struct vmx_test vmx_tests[]; 11609d7eaa29SArthur Chunqi Li 
1161*8029cac7SPeter Feiner /* Match name with wanted allowing underscores in place of spaces. */ 1162*8029cac7SPeter Feiner static bool test_name_wanted(const char *name, const char *wanted) 1163*8029cac7SPeter Feiner { 1164*8029cac7SPeter Feiner const char *n; 1165*8029cac7SPeter Feiner const char *w; 1166*8029cac7SPeter Feiner 1167*8029cac7SPeter Feiner for (n = name, w = wanted; *n != '\0' && *w != '\0'; n++, w++) { 1168*8029cac7SPeter Feiner if (*n != *w && !(*n == ' ' && *w == '_')) 1169*8029cac7SPeter Feiner return false; 1170*8029cac7SPeter Feiner } 1171*8029cac7SPeter Feiner return *n == '\0' && *w == '\0'; 1172*8029cac7SPeter Feiner } 1173*8029cac7SPeter Feiner 1174*8029cac7SPeter Feiner static bool test_wanted(struct vmx_test *test, char *wanted[], int nwanted) 1175*8029cac7SPeter Feiner { 1176*8029cac7SPeter Feiner int i; 1177*8029cac7SPeter Feiner 1178*8029cac7SPeter Feiner if (!nwanted) 1179*8029cac7SPeter Feiner return true; 1180*8029cac7SPeter Feiner 1181*8029cac7SPeter Feiner for (i = 0; i < nwanted; ++i) { 1182*8029cac7SPeter Feiner if (test_name_wanted(test->name, wanted[i])) 1183*8029cac7SPeter Feiner return true; 1184*8029cac7SPeter Feiner } 1185*8029cac7SPeter Feiner return false; 1186*8029cac7SPeter Feiner } 1187*8029cac7SPeter Feiner 1188*8029cac7SPeter Feiner int main(int argc, char *argv[]) 11899d7eaa29SArthur Chunqi Li { 11903ee34093SArthur Chunqi Li int i = 0; 1191*8029cac7SPeter Feiner int matched = 0; 11929d7eaa29SArthur Chunqi Li 11939d7eaa29SArthur Chunqi Li setup_vm(); 11949d7eaa29SArthur Chunqi Li setup_idt(); 11953ee34093SArthur Chunqi Li hypercall_field = 0; 11969d7eaa29SArthur Chunqi Li 11973b127446SJan Kiszka if (!(cpuid(1).c & (1 << 5))) { 11983b127446SJan Kiszka printf("WARNING: vmx not supported, add '-cpu host'\n"); 11999d7eaa29SArthur Chunqi Li goto exit; 12009d7eaa29SArthur Chunqi Li } 12019d7eaa29SArthur Chunqi Li init_vmx(); 12023b127446SJan Kiszka if (test_vmx_feature_control() != 0) 12033b127446SJan Kiszka goto exit; 
12049d7eaa29SArthur Chunqi Li /* Set basic test ctxt the same as "null" */ 12059d7eaa29SArthur Chunqi Li current = &vmx_tests[0]; 12069d7eaa29SArthur Chunqi Li if (test_vmxon() != 0) 12079d7eaa29SArthur Chunqi Li goto exit; 12089d7eaa29SArthur Chunqi Li test_vmptrld(); 12099d7eaa29SArthur Chunqi Li test_vmclear(); 12109d7eaa29SArthur Chunqi Li test_vmptrst(); 12119d7eaa29SArthur Chunqi Li init_vmcs(&vmcs_root); 12129d7eaa29SArthur Chunqi Li if (vmx_run()) { 12139d7eaa29SArthur Chunqi Li report("test vmlaunch", 0); 12149d7eaa29SArthur Chunqi Li goto exit; 12159d7eaa29SArthur Chunqi Li } 12169d7eaa29SArthur Chunqi Li test_vmxoff(); 121769c8d31cSJan Kiszka test_vmx_caps(); 12189d7eaa29SArthur Chunqi Li 1219*8029cac7SPeter Feiner while (vmx_tests[++i].name != NULL) { 1220*8029cac7SPeter Feiner if (!test_wanted(&vmx_tests[i], argv + 1, argc - 1)) 1221*8029cac7SPeter Feiner continue; 1222*8029cac7SPeter Feiner matched++; 12239d7eaa29SArthur Chunqi Li if (test_run(&vmx_tests[i])) 12249d7eaa29SArthur Chunqi Li goto exit; 1225*8029cac7SPeter Feiner } 1226*8029cac7SPeter Feiner 1227*8029cac7SPeter Feiner if (!matched) 1228*8029cac7SPeter Feiner report("command line didn't match any tests!", matched); 12299d7eaa29SArthur Chunqi Li 12309d7eaa29SArthur Chunqi Li exit: 1231f3cdd159SJan Kiszka return report_summary(); 12329d7eaa29SArthur Chunqi Li } 1233