1002d1830SGleb Natapov #include "fwcfg.h" 27d36db35SAvi Kivity #include "vm.h" 37d36db35SAvi Kivity #include "libcflat.h" 47d36db35SAvi Kivity 57d36db35SAvi Kivity #define PAGE_SIZE 4096ul 67d36db35SAvi Kivity #ifdef __x86_64__ 77d36db35SAvi Kivity #define LARGE_PAGE_SIZE (512 * PAGE_SIZE) 87d36db35SAvi Kivity #else 97d36db35SAvi Kivity #define LARGE_PAGE_SIZE (1024 * PAGE_SIZE) 107d36db35SAvi Kivity #endif 117d36db35SAvi Kivity 127d36db35SAvi Kivity static void *free = 0; 137d36db35SAvi Kivity static void *vfree_top = 0; 147d36db35SAvi Kivity 157d36db35SAvi Kivity static void free_memory(void *mem, unsigned long size) 167d36db35SAvi Kivity { 177d36db35SAvi Kivity while (size >= PAGE_SIZE) { 187d36db35SAvi Kivity *(void **)mem = free; 197d36db35SAvi Kivity free = mem; 207d36db35SAvi Kivity mem += PAGE_SIZE; 217d36db35SAvi Kivity size -= PAGE_SIZE; 227d36db35SAvi Kivity } 237d36db35SAvi Kivity } 247d36db35SAvi Kivity 257d36db35SAvi Kivity void *alloc_page() 267d36db35SAvi Kivity { 277d36db35SAvi Kivity void *p; 287d36db35SAvi Kivity 297d36db35SAvi Kivity if (!free) 307d36db35SAvi Kivity return 0; 317d36db35SAvi Kivity 327d36db35SAvi Kivity p = free; 337d36db35SAvi Kivity free = *(void **)free; 347d36db35SAvi Kivity 357d36db35SAvi Kivity return p; 367d36db35SAvi Kivity } 377d36db35SAvi Kivity 387d36db35SAvi Kivity void free_page(void *page) 397d36db35SAvi Kivity { 407d36db35SAvi Kivity *(void **)page = free; 417d36db35SAvi Kivity free = page; 427d36db35SAvi Kivity } 437d36db35SAvi Kivity 447d36db35SAvi Kivity extern char edata; 457d36db35SAvi Kivity static unsigned long end_of_memory; 467d36db35SAvi Kivity 477d36db35SAvi Kivity #ifdef __x86_64__ 487d36db35SAvi Kivity #define PAGE_LEVEL 4 497d36db35SAvi Kivity #define PGDIR_WIDTH 9 507d36db35SAvi Kivity #define PGDIR_MASK 511 517d36db35SAvi Kivity #else 527d36db35SAvi Kivity #define PAGE_LEVEL 2 537d36db35SAvi Kivity #define PGDIR_WIDTH 10 547d36db35SAvi Kivity #define PGDIR_MASK 1023 557d36db35SAvi Kivity #endif 567d36db35SAvi Kivity 577d36db35SAvi Kivity void install_pte(unsigned long *cr3, 587d36db35SAvi Kivity int pte_level, 597d36db35SAvi Kivity void *virt, 607d36db35SAvi Kivity unsigned long pte, 617d36db35SAvi Kivity unsigned long *pt_page) 627d36db35SAvi Kivity { 637d36db35SAvi Kivity int level; 647d36db35SAvi Kivity unsigned long *pt = cr3; 657d36db35SAvi Kivity unsigned offset; 667d36db35SAvi Kivity 677d36db35SAvi Kivity for (level = PAGE_LEVEL; level > pte_level; --level) { 687d36db35SAvi Kivity offset = ((unsigned long)virt >> ((level-1) * PGDIR_WIDTH + 12)) & PGDIR_MASK; 697d36db35SAvi Kivity if (!(pt[offset] & PTE_PRESENT)) { 707d36db35SAvi Kivity unsigned long *new_pt = pt_page; 717d36db35SAvi Kivity if (!new_pt) 727d36db35SAvi Kivity new_pt = alloc_page(); 737d36db35SAvi Kivity else 747d36db35SAvi Kivity pt_page = 0; 757d36db35SAvi Kivity memset(new_pt, 0, PAGE_SIZE); 76*333af1b4SPaolo Bonzini pt[offset] = virt_to_phys(new_pt) | PTE_PRESENT | PTE_WRITE | PTE_USER; 777d36db35SAvi Kivity } 787d36db35SAvi Kivity pt = phys_to_virt(pt[offset] & 0xffffffffff000ull); 797d36db35SAvi Kivity } 807d36db35SAvi Kivity offset = ((unsigned long)virt >> ((level-1) * PGDIR_WIDTH + 12)) & PGDIR_MASK; 817d36db35SAvi Kivity pt[offset] = pte; 827d36db35SAvi Kivity } 837d36db35SAvi Kivity 847d36db35SAvi Kivity static unsigned long get_pte(unsigned long *cr3, void *virt) 857d36db35SAvi Kivity { 867d36db35SAvi Kivity int level; 877d36db35SAvi Kivity unsigned long *pt = cr3, pte; 887d36db35SAvi Kivity unsigned offset; 897d36db35SAvi Kivity 907d36db35SAvi Kivity for (level = PAGE_LEVEL; level > 1; --level) { 917d36db35SAvi Kivity offset = ((unsigned long)virt >> (((level-1) * PGDIR_WIDTH) + 12)) & PGDIR_MASK; 927d36db35SAvi Kivity pte = pt[offset]; 937d36db35SAvi Kivity if (!(pte & PTE_PRESENT)) 947d36db35SAvi Kivity return 0; 957d36db35SAvi Kivity if (level == 2 && (pte & PTE_PSE)) 967d36db35SAvi Kivity return pte; 977d36db35SAvi Kivity pt = phys_to_virt(pte & 0xffffffffff000ull); 987d36db35SAvi Kivity } 997d36db35SAvi Kivity offset = ((unsigned long)virt >> (((level-1) * PGDIR_WIDTH) + 12)) & PGDIR_MASK; 1007d36db35SAvi Kivity pte = pt[offset]; 1017d36db35SAvi Kivity return pte; 1027d36db35SAvi Kivity } 1037d36db35SAvi Kivity 1047d36db35SAvi Kivity void install_large_page(unsigned long *cr3, 1057d36db35SAvi Kivity unsigned long phys, 1067d36db35SAvi Kivity void *virt) 1077d36db35SAvi Kivity { 108b01c8823SKevin Wolf install_pte(cr3, 2, virt, phys | PTE_PRESENT | PTE_WRITE | PTE_USER | PTE_PSE, 0); 1097d36db35SAvi Kivity } 1107d36db35SAvi Kivity 1117d36db35SAvi Kivity void install_page(unsigned long *cr3, 1127d36db35SAvi Kivity unsigned long phys, 1137d36db35SAvi Kivity void *virt) 1147d36db35SAvi Kivity { 115b01c8823SKevin Wolf install_pte(cr3, 1, virt, phys | PTE_PRESENT | PTE_WRITE | PTE_USER, 0); 1167d36db35SAvi Kivity } 1177d36db35SAvi Kivity 1187d36db35SAvi Kivity 11963254428SGleb Natapov static void setup_mmu_range(unsigned long *cr3, unsigned long start, 12063254428SGleb Natapov unsigned long len) 12163254428SGleb Natapov { 12263254428SGleb Natapov u64 max = (u64)len + (u64)start; 12363254428SGleb Natapov u64 phys = start; 12463254428SGleb Natapov 12563254428SGleb Natapov while (phys + LARGE_PAGE_SIZE <= max) { 12663254428SGleb Natapov install_large_page(cr3, phys, (void *)(ulong)phys); 12763254428SGleb Natapov phys += LARGE_PAGE_SIZE; 12863254428SGleb Natapov } 12963254428SGleb Natapov while (phys + PAGE_SIZE <= max) { 13063254428SGleb Natapov install_page(cr3, phys, (void *)(ulong)phys); 13163254428SGleb Natapov phys += PAGE_SIZE; 13263254428SGleb Natapov } 13363254428SGleb Natapov } 13463254428SGleb Natapov 1357d36db35SAvi Kivity static void setup_mmu(unsigned long len) 1367d36db35SAvi Kivity { 1377d36db35SAvi Kivity unsigned long *cr3 = alloc_page(); 1387d36db35SAvi Kivity 1397d36db35SAvi Kivity memset(cr3, 0, PAGE_SIZE); 14063254428SGleb Natapov 14163254428SGleb Natapov #ifdef __x86_64__ 14263254428SGleb Natapov if (len < (1ul << 32)) 14363254428SGleb Natapov len = (1ul << 32); /* map mmio 1:1 */ 14463254428SGleb Natapov 14563254428SGleb Natapov setup_mmu_range(cr3, 0, len); 14663254428SGleb Natapov #else 14763254428SGleb Natapov if (len > (1ul << 31)) 14863254428SGleb Natapov len = (1ul << 31); 14963254428SGleb Natapov 15063254428SGleb Natapov /* 0 - 2G memory, 2G-3G valloc area, 3G-4G mmio */ 15163254428SGleb Natapov setup_mmu_range(cr3, 0, len); 15263254428SGleb Natapov setup_mmu_range(cr3, 3ul << 30, (1ul << 30)); 15363254428SGleb Natapov vfree_top = (void*)(3ul << 30); 15463254428SGleb Natapov #endif 15563254428SGleb Natapov 1567d36db35SAvi Kivity write_cr3(virt_to_phys(cr3)); 1577d36db35SAvi Kivity #ifndef __x86_64__ 1587d36db35SAvi Kivity write_cr4(X86_CR4_PSE); 1597d36db35SAvi Kivity #endif 16097011120SGleb Natapov write_cr0(X86_CR0_PG |X86_CR0_PE | X86_CR0_WP); 1617d36db35SAvi Kivity 1627d36db35SAvi Kivity printf("paging enabled\n"); 1637d36db35SAvi Kivity printf("cr0 = %x\n", read_cr0()); 1647d36db35SAvi Kivity printf("cr3 = %x\n", read_cr3()); 1657d36db35SAvi Kivity printf("cr4 = %x\n", read_cr4()); 1667d36db35SAvi Kivity } 1677d36db35SAvi Kivity 1687d36db35SAvi Kivity void setup_vm() 1697d36db35SAvi Kivity { 170002d1830SGleb Natapov end_of_memory = fwcfg_get_u64(FW_CFG_RAM_SIZE); 1717d36db35SAvi Kivity free_memory(&edata, end_of_memory - (unsigned long)&edata); 1727d36db35SAvi Kivity setup_mmu(end_of_memory); 1737d36db35SAvi Kivity } 1747d36db35SAvi Kivity 1757d36db35SAvi Kivity void *vmalloc(unsigned long size) 1767d36db35SAvi Kivity { 1777d36db35SAvi Kivity void *mem, *p; 1787d36db35SAvi Kivity unsigned pages; 1797d36db35SAvi Kivity 1807d36db35SAvi Kivity size += sizeof(unsigned long); 1817d36db35SAvi Kivity 1827d36db35SAvi Kivity size = (size + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1); 1837d36db35SAvi Kivity vfree_top -= size; 1847d36db35SAvi Kivity mem = p = vfree_top; 1857d36db35SAvi Kivity pages = size / PAGE_SIZE; 1867d36db35SAvi Kivity while (pages--) { 1877d36db35SAvi Kivity install_page(phys_to_virt(read_cr3()), virt_to_phys(alloc_page()), p); 1887d36db35SAvi Kivity p += PAGE_SIZE; 1897d36db35SAvi Kivity } 1907d36db35SAvi Kivity *(unsigned long *)mem = size; 1917d36db35SAvi Kivity mem += sizeof(unsigned long); 1927d36db35SAvi Kivity return mem; 1937d36db35SAvi Kivity } 1947d36db35SAvi Kivity 195334cd2bfSGleb Natapov uint64_t virt_to_phys_cr3(void *mem) 196334cd2bfSGleb Natapov { 197334cd2bfSGleb Natapov return (get_pte(phys_to_virt(read_cr3()), mem) & PTE_ADDR) + ((ulong)mem & (PAGE_SIZE - 1)); 198334cd2bfSGleb Natapov } 199334cd2bfSGleb Natapov 2007d36db35SAvi Kivity void vfree(void *mem) 2017d36db35SAvi Kivity { 2027d36db35SAvi Kivity unsigned long size = ((unsigned long *)mem)[-1]; 2037d36db35SAvi Kivity 2047d36db35SAvi Kivity while (size) { 2057d36db35SAvi Kivity free_page(phys_to_virt(get_pte(phys_to_virt(read_cr3()), mem) & PTE_ADDR)); 2067d36db35SAvi Kivity mem += PAGE_SIZE; 2077d36db35SAvi Kivity size -= PAGE_SIZE; 2087d36db35SAvi Kivity } 2097d36db35SAvi Kivity } 2107d36db35SAvi Kivity 2117d36db35SAvi Kivity void *vmap(unsigned long long phys, unsigned long size) 2127d36db35SAvi Kivity { 2137d36db35SAvi Kivity void *mem, *p; 2147d36db35SAvi Kivity unsigned pages; 2157d36db35SAvi Kivity 2167d36db35SAvi Kivity size = (size + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1); 2177d36db35SAvi Kivity vfree_top -= size; 2187d36db35SAvi Kivity phys &= ~(unsigned long long)(PAGE_SIZE - 1); 2197d36db35SAvi Kivity 2207d36db35SAvi Kivity mem = p = vfree_top; 2217d36db35SAvi Kivity pages = size / PAGE_SIZE; 2227d36db35SAvi Kivity while (pages--) { 2237d36db35SAvi Kivity install_page(phys_to_virt(read_cr3()), phys, p); 2247d36db35SAvi Kivity phys += PAGE_SIZE; 2257d36db35SAvi Kivity p += PAGE_SIZE; 2267d36db35SAvi Kivity } 2277d36db35SAvi Kivity return mem; 2287d36db35SAvi Kivity } 229a4b87a16SGleb Natapov 230524ae896SAvi Kivity void *alloc_vpages(ulong nr) 231524ae896SAvi Kivity { 232524ae896SAvi Kivity vfree_top -= PAGE_SIZE * nr; 233524ae896SAvi Kivity return vfree_top; 234524ae896SAvi Kivity } 235524ae896SAvi Kivity 236a4b87a16SGleb Natapov void *alloc_vpage(void) 237a4b87a16SGleb Natapov { 238524ae896SAvi Kivity return alloc_vpages(1); 239a4b87a16SGleb Natapov } 240