17d36db35SAvi Kivity #include "vm.h" 27d36db35SAvi Kivity #include "libcflat.h" 37d36db35SAvi Kivity 47d36db35SAvi Kivity #define PAGE_SIZE 4096ul 57d36db35SAvi Kivity #ifdef __x86_64__ 67d36db35SAvi Kivity #define LARGE_PAGE_SIZE (512 * PAGE_SIZE) 77d36db35SAvi Kivity #else 87d36db35SAvi Kivity #define LARGE_PAGE_SIZE (1024 * PAGE_SIZE) 97d36db35SAvi Kivity #endif 107d36db35SAvi Kivity 117d36db35SAvi Kivity #define X86_CR0_PE 0x00000001 127d36db35SAvi Kivity #define X86_CR0_PG 0x80000000 137d36db35SAvi Kivity #define X86_CR4_PSE 0x00000010 147d36db35SAvi Kivity static void *free = 0; 157d36db35SAvi Kivity static void *vfree_top = 0; 167d36db35SAvi Kivity 177d36db35SAvi Kivity static void free_memory(void *mem, unsigned long size) 187d36db35SAvi Kivity { 197d36db35SAvi Kivity while (size >= PAGE_SIZE) { 207d36db35SAvi Kivity *(void **)mem = free; 217d36db35SAvi Kivity free = mem; 227d36db35SAvi Kivity mem += PAGE_SIZE; 237d36db35SAvi Kivity size -= PAGE_SIZE; 247d36db35SAvi Kivity } 257d36db35SAvi Kivity } 267d36db35SAvi Kivity 277d36db35SAvi Kivity void *alloc_page() 287d36db35SAvi Kivity { 297d36db35SAvi Kivity void *p; 307d36db35SAvi Kivity 317d36db35SAvi Kivity if (!free) 327d36db35SAvi Kivity return 0; 337d36db35SAvi Kivity 347d36db35SAvi Kivity p = free; 357d36db35SAvi Kivity free = *(void **)free; 367d36db35SAvi Kivity 377d36db35SAvi Kivity return p; 387d36db35SAvi Kivity } 397d36db35SAvi Kivity 407d36db35SAvi Kivity void free_page(void *page) 417d36db35SAvi Kivity { 427d36db35SAvi Kivity *(void **)page = free; 437d36db35SAvi Kivity free = page; 447d36db35SAvi Kivity } 457d36db35SAvi Kivity 467d36db35SAvi Kivity extern char edata; 477d36db35SAvi Kivity static unsigned long end_of_memory; 487d36db35SAvi Kivity 497d36db35SAvi Kivity #ifdef __x86_64__ 507d36db35SAvi Kivity #define PAGE_LEVEL 4 517d36db35SAvi Kivity #define PGDIR_WIDTH 9 527d36db35SAvi Kivity #define PGDIR_MASK 511 537d36db35SAvi Kivity #else 547d36db35SAvi Kivity #define PAGE_LEVEL 2 557d36db35SAvi Kivity #define PGDIR_WIDTH 10 567d36db35SAvi Kivity #define PGDIR_MASK 1023 577d36db35SAvi Kivity #endif 587d36db35SAvi Kivity 597d36db35SAvi Kivity void install_pte(unsigned long *cr3, 607d36db35SAvi Kivity int pte_level, 617d36db35SAvi Kivity void *virt, 627d36db35SAvi Kivity unsigned long pte, 637d36db35SAvi Kivity unsigned long *pt_page) 647d36db35SAvi Kivity { 657d36db35SAvi Kivity int level; 667d36db35SAvi Kivity unsigned long *pt = cr3; 677d36db35SAvi Kivity unsigned offset; 687d36db35SAvi Kivity 697d36db35SAvi Kivity for (level = PAGE_LEVEL; level > pte_level; --level) { 707d36db35SAvi Kivity offset = ((unsigned long)virt >> ((level-1) * PGDIR_WIDTH + 12)) & PGDIR_MASK; 717d36db35SAvi Kivity if (!(pt[offset] & PTE_PRESENT)) { 727d36db35SAvi Kivity unsigned long *new_pt = pt_page; 737d36db35SAvi Kivity if (!new_pt) 747d36db35SAvi Kivity new_pt = alloc_page(); 757d36db35SAvi Kivity else 767d36db35SAvi Kivity pt_page = 0; 777d36db35SAvi Kivity memset(new_pt, 0, PAGE_SIZE); 787d36db35SAvi Kivity pt[offset] = virt_to_phys(new_pt) | PTE_PRESENT | PTE_WRITE; 797d36db35SAvi Kivity } 807d36db35SAvi Kivity pt = phys_to_virt(pt[offset] & 0xffffffffff000ull); 817d36db35SAvi Kivity } 827d36db35SAvi Kivity offset = ((unsigned long)virt >> ((level-1) * PGDIR_WIDTH + 12)) & PGDIR_MASK; 837d36db35SAvi Kivity pt[offset] = pte; 847d36db35SAvi Kivity } 857d36db35SAvi Kivity 867d36db35SAvi Kivity static unsigned long get_pte(unsigned long *cr3, void *virt) 877d36db35SAvi Kivity { 887d36db35SAvi Kivity int level; 897d36db35SAvi Kivity unsigned long *pt = cr3, pte; 907d36db35SAvi Kivity unsigned offset; 917d36db35SAvi Kivity 927d36db35SAvi Kivity for (level = PAGE_LEVEL; level > 1; --level) { 937d36db35SAvi Kivity offset = ((unsigned long)virt >> (((level-1) * PGDIR_WIDTH) + 12)) & PGDIR_MASK; 947d36db35SAvi Kivity pte = pt[offset]; 957d36db35SAvi Kivity if (!(pte & PTE_PRESENT)) 967d36db35SAvi Kivity return 0; 977d36db35SAvi Kivity if (level == 2 && (pte & PTE_PSE)) 987d36db35SAvi Kivity return pte; 997d36db35SAvi Kivity pt = phys_to_virt(pte & 0xffffffffff000ull); 1007d36db35SAvi Kivity } 1017d36db35SAvi Kivity offset = ((unsigned long)virt >> (((level-1) * PGDIR_WIDTH) + 12)) & PGDIR_MASK; 1027d36db35SAvi Kivity pte = pt[offset]; 1037d36db35SAvi Kivity return pte; 1047d36db35SAvi Kivity } 1057d36db35SAvi Kivity 1067d36db35SAvi Kivity void install_large_page(unsigned long *cr3, 1077d36db35SAvi Kivity unsigned long phys, 1087d36db35SAvi Kivity void *virt) 1097d36db35SAvi Kivity { 1107d36db35SAvi Kivity install_pte(cr3, 2, virt, phys | PTE_PRESENT | PTE_WRITE | PTE_PSE, 0); 1117d36db35SAvi Kivity } 1127d36db35SAvi Kivity 1137d36db35SAvi Kivity void install_page(unsigned long *cr3, 1147d36db35SAvi Kivity unsigned long phys, 1157d36db35SAvi Kivity void *virt) 1167d36db35SAvi Kivity { 1177d36db35SAvi Kivity install_pte(cr3, 1, virt, phys | PTE_PRESENT | PTE_WRITE, 0); 1187d36db35SAvi Kivity } 1197d36db35SAvi Kivity 1207d36db35SAvi Kivity 1217d36db35SAvi Kivity static inline void load_gdt(unsigned long *table, int nent) 1227d36db35SAvi Kivity { 1237d36db35SAvi Kivity struct descriptor_table_ptr descr; 1247d36db35SAvi Kivity 1257d36db35SAvi Kivity descr.limit = nent * 8 - 1; 1267d36db35SAvi Kivity descr.base = (ulong)table; 1277d36db35SAvi Kivity lgdt(&descr); 1287d36db35SAvi Kivity } 1297d36db35SAvi Kivity 1307d36db35SAvi Kivity #define SEG_CS_32 8 1317d36db35SAvi Kivity #define SEG_CS_64 16 1327d36db35SAvi Kivity 1337d36db35SAvi Kivity struct ljmp { 1347d36db35SAvi Kivity void *ofs; 1357d36db35SAvi Kivity unsigned short seg; 1367d36db35SAvi Kivity }; 1377d36db35SAvi Kivity 138*63254428SGleb Natapov static void setup_mmu_range(unsigned long *cr3, unsigned long start, 139*63254428SGleb Natapov unsigned long len) 140*63254428SGleb Natapov { 141*63254428SGleb Natapov u64 max = (u64)len + (u64)start; 142*63254428SGleb Natapov u64 phys = start; 143*63254428SGleb Natapov 144*63254428SGleb Natapov while (phys + LARGE_PAGE_SIZE <= max) { 145*63254428SGleb Natapov install_large_page(cr3, phys, (void *)(ulong)phys); 146*63254428SGleb Natapov phys += LARGE_PAGE_SIZE; 147*63254428SGleb Natapov } 148*63254428SGleb Natapov while (phys + PAGE_SIZE <= max) { 149*63254428SGleb Natapov install_page(cr3, phys, (void *)(ulong)phys); 150*63254428SGleb Natapov phys += PAGE_SIZE; 151*63254428SGleb Natapov } 152*63254428SGleb Natapov } 153*63254428SGleb Natapov 1547d36db35SAvi Kivity static void setup_mmu(unsigned long len) 1557d36db35SAvi Kivity { 1567d36db35SAvi Kivity unsigned long *cr3 = alloc_page(); 1577d36db35SAvi Kivity 1587d36db35SAvi Kivity memset(cr3, 0, PAGE_SIZE); 159*63254428SGleb Natapov 160*63254428SGleb Natapov #ifdef __x86_64__ 161*63254428SGleb Natapov if (len < (1ul << 32)) 162*63254428SGleb Natapov len = (1ul << 32); /* map mmio 1:1 */ 163*63254428SGleb Natapov 164*63254428SGleb Natapov setup_mmu_range(cr3, 0, len); 165*63254428SGleb Natapov #else 166*63254428SGleb Natapov if (len > (1ul << 31)) 167*63254428SGleb Natapov len = (1ul << 31); 168*63254428SGleb Natapov 169*63254428SGleb Natapov /* 0 - 2G memory, 2G-3G valloc area, 3G-4G mmio */ 170*63254428SGleb Natapov setup_mmu_range(cr3, 0, len); 171*63254428SGleb Natapov setup_mmu_range(cr3, 3ul << 30, (1ul << 30)); 172*63254428SGleb Natapov vfree_top = (void*)(3ul << 30); 173*63254428SGleb Natapov #endif 174*63254428SGleb Natapov 1757d36db35SAvi Kivity write_cr3(virt_to_phys(cr3)); 1767d36db35SAvi Kivity #ifndef __x86_64__ 1777d36db35SAvi Kivity write_cr4(X86_CR4_PSE); 1787d36db35SAvi Kivity #endif 1797d36db35SAvi Kivity write_cr0(X86_CR0_PG |X86_CR0_PE); 1807d36db35SAvi Kivity 1817d36db35SAvi Kivity printf("paging enabled\n"); 1827d36db35SAvi Kivity printf("cr0 = %x\n", read_cr0()); 1837d36db35SAvi Kivity printf("cr3 = %x\n", read_cr3()); 1847d36db35SAvi Kivity printf("cr4 = %x\n", read_cr4()); 1857d36db35SAvi Kivity } 1867d36db35SAvi Kivity 1877d36db35SAvi Kivity static unsigned int inl(unsigned short port) 1887d36db35SAvi Kivity { 1897d36db35SAvi Kivity unsigned int val; 1907d36db35SAvi Kivity asm volatile("inl %w1, %0" : "=a"(val) : "Nd"(port)); 1917d36db35SAvi Kivity return val; 1927d36db35SAvi Kivity } 1937d36db35SAvi Kivity 1947d36db35SAvi Kivity void setup_vm() 1957d36db35SAvi Kivity { 1967d36db35SAvi Kivity end_of_memory = inl(0xd1); 1977d36db35SAvi Kivity free_memory(&edata, end_of_memory - (unsigned long)&edata); 1987d36db35SAvi Kivity setup_mmu(end_of_memory); 1997d36db35SAvi Kivity } 2007d36db35SAvi Kivity 2017d36db35SAvi Kivity void *vmalloc(unsigned long size) 2027d36db35SAvi Kivity { 2037d36db35SAvi Kivity void *mem, *p; 2047d36db35SAvi Kivity unsigned pages; 2057d36db35SAvi Kivity 2067d36db35SAvi Kivity size += sizeof(unsigned long); 2077d36db35SAvi Kivity 2087d36db35SAvi Kivity size = (size + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1); 2097d36db35SAvi Kivity vfree_top -= size; 2107d36db35SAvi Kivity mem = p = vfree_top; 2117d36db35SAvi Kivity pages = size / PAGE_SIZE; 2127d36db35SAvi Kivity while (pages--) { 2137d36db35SAvi Kivity install_page(phys_to_virt(read_cr3()), virt_to_phys(alloc_page()), p); 2147d36db35SAvi Kivity p += PAGE_SIZE; 2157d36db35SAvi Kivity } 2167d36db35SAvi Kivity *(unsigned long *)mem = size; 2177d36db35SAvi Kivity mem += sizeof(unsigned long); 2187d36db35SAvi Kivity return mem; 2197d36db35SAvi Kivity } 2207d36db35SAvi Kivity 2217d36db35SAvi Kivity void vfree(void *mem) 2227d36db35SAvi Kivity { 2237d36db35SAvi Kivity unsigned long size = ((unsigned long *)mem)[-1]; 2247d36db35SAvi Kivity 2257d36db35SAvi Kivity while (size) { 2267d36db35SAvi Kivity free_page(phys_to_virt(get_pte(phys_to_virt(read_cr3()), mem) & PTE_ADDR)); 2277d36db35SAvi Kivity mem += PAGE_SIZE; 2287d36db35SAvi Kivity size -= PAGE_SIZE; 2297d36db35SAvi Kivity } 2307d36db35SAvi Kivity } 2317d36db35SAvi Kivity 2327d36db35SAvi Kivity void *vmap(unsigned long long phys, unsigned long size) 2337d36db35SAvi Kivity { 2347d36db35SAvi Kivity void *mem, *p; 2357d36db35SAvi Kivity unsigned pages; 2367d36db35SAvi Kivity 2377d36db35SAvi Kivity size = (size + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1); 2387d36db35SAvi Kivity vfree_top -= size; 2397d36db35SAvi Kivity phys &= ~(unsigned long long)(PAGE_SIZE - 1); 2407d36db35SAvi Kivity 2417d36db35SAvi Kivity mem = p = vfree_top; 2427d36db35SAvi Kivity pages = size / PAGE_SIZE; 2437d36db35SAvi Kivity while (pages--) { 2447d36db35SAvi Kivity install_page(phys_to_virt(read_cr3()), phys, p); 2457d36db35SAvi Kivity phys += PAGE_SIZE; 2467d36db35SAvi Kivity p += PAGE_SIZE; 2477d36db35SAvi Kivity } 2487d36db35SAvi Kivity return mem; 2497d36db35SAvi Kivity } 250