17d36db35SAvi Kivity #include "vm.h" 27d36db35SAvi Kivity #include "libcflat.h" 37d36db35SAvi Kivity 47d36db35SAvi Kivity #define PAGE_SIZE 4096ul 57d36db35SAvi Kivity #ifdef __x86_64__ 67d36db35SAvi Kivity #define LARGE_PAGE_SIZE (512 * PAGE_SIZE) 77d36db35SAvi Kivity #else 87d36db35SAvi Kivity #define LARGE_PAGE_SIZE (1024 * PAGE_SIZE) 97d36db35SAvi Kivity #endif 107d36db35SAvi Kivity 117d36db35SAvi Kivity #define X86_CR0_PE 0x00000001 1297011120SGleb Natapov #define X86_CR0_WP 0x00010000 137d36db35SAvi Kivity #define X86_CR0_PG 0x80000000 147d36db35SAvi Kivity #define X86_CR4_PSE 0x00000010 157d36db35SAvi Kivity static void *free = 0; 167d36db35SAvi Kivity static void *vfree_top = 0; 177d36db35SAvi Kivity 187d36db35SAvi Kivity static void free_memory(void *mem, unsigned long size) 197d36db35SAvi Kivity { 207d36db35SAvi Kivity while (size >= PAGE_SIZE) { 217d36db35SAvi Kivity *(void **)mem = free; 227d36db35SAvi Kivity free = mem; 237d36db35SAvi Kivity mem += PAGE_SIZE; 247d36db35SAvi Kivity size -= PAGE_SIZE; 257d36db35SAvi Kivity } 267d36db35SAvi Kivity } 277d36db35SAvi Kivity 287d36db35SAvi Kivity void *alloc_page() 297d36db35SAvi Kivity { 307d36db35SAvi Kivity void *p; 317d36db35SAvi Kivity 327d36db35SAvi Kivity if (!free) 337d36db35SAvi Kivity return 0; 347d36db35SAvi Kivity 357d36db35SAvi Kivity p = free; 367d36db35SAvi Kivity free = *(void **)free; 377d36db35SAvi Kivity 387d36db35SAvi Kivity return p; 397d36db35SAvi Kivity } 407d36db35SAvi Kivity 417d36db35SAvi Kivity void free_page(void *page) 427d36db35SAvi Kivity { 437d36db35SAvi Kivity *(void **)page = free; 447d36db35SAvi Kivity free = page; 457d36db35SAvi Kivity } 467d36db35SAvi Kivity 477d36db35SAvi Kivity extern char edata; 487d36db35SAvi Kivity static unsigned long end_of_memory; 497d36db35SAvi Kivity 507d36db35SAvi Kivity #ifdef __x86_64__ 517d36db35SAvi Kivity #define PAGE_LEVEL 4 527d36db35SAvi Kivity #define PGDIR_WIDTH 9 537d36db35SAvi Kivity #define PGDIR_MASK 511 547d36db35SAvi Kivity #else 557d36db35SAvi Kivity #define PAGE_LEVEL 2 567d36db35SAvi Kivity #define PGDIR_WIDTH 10 577d36db35SAvi Kivity #define PGDIR_MASK 1023 587d36db35SAvi Kivity #endif 597d36db35SAvi Kivity 607d36db35SAvi Kivity void install_pte(unsigned long *cr3, 617d36db35SAvi Kivity int pte_level, 627d36db35SAvi Kivity void *virt, 637d36db35SAvi Kivity unsigned long pte, 647d36db35SAvi Kivity unsigned long *pt_page) 657d36db35SAvi Kivity { 667d36db35SAvi Kivity int level; 677d36db35SAvi Kivity unsigned long *pt = cr3; 687d36db35SAvi Kivity unsigned offset; 697d36db35SAvi Kivity 707d36db35SAvi Kivity for (level = PAGE_LEVEL; level > pte_level; --level) { 717d36db35SAvi Kivity offset = ((unsigned long)virt >> ((level-1) * PGDIR_WIDTH + 12)) & PGDIR_MASK; 727d36db35SAvi Kivity if (!(pt[offset] & PTE_PRESENT)) { 737d36db35SAvi Kivity unsigned long *new_pt = pt_page; 747d36db35SAvi Kivity if (!new_pt) 757d36db35SAvi Kivity new_pt = alloc_page(); 767d36db35SAvi Kivity else 777d36db35SAvi Kivity pt_page = 0; 787d36db35SAvi Kivity memset(new_pt, 0, PAGE_SIZE); 797d36db35SAvi Kivity pt[offset] = virt_to_phys(new_pt) | PTE_PRESENT | PTE_WRITE; 807d36db35SAvi Kivity } 817d36db35SAvi Kivity pt = phys_to_virt(pt[offset] & 0xffffffffff000ull); 827d36db35SAvi Kivity } 837d36db35SAvi Kivity offset = ((unsigned long)virt >> ((level-1) * PGDIR_WIDTH + 12)) & PGDIR_MASK; 847d36db35SAvi Kivity pt[offset] = pte; 857d36db35SAvi Kivity } 867d36db35SAvi Kivity 877d36db35SAvi Kivity static unsigned long get_pte(unsigned long *cr3, void *virt) 887d36db35SAvi Kivity { 897d36db35SAvi Kivity int level; 907d36db35SAvi Kivity unsigned long *pt = cr3, pte; 917d36db35SAvi Kivity unsigned offset; 927d36db35SAvi Kivity 937d36db35SAvi Kivity for (level = PAGE_LEVEL; level > 1; --level) { 947d36db35SAvi Kivity offset = ((unsigned long)virt >> (((level-1) * PGDIR_WIDTH) + 12)) & PGDIR_MASK; 957d36db35SAvi Kivity pte = pt[offset]; 967d36db35SAvi Kivity if (!(pte & PTE_PRESENT)) 977d36db35SAvi Kivity return 0; 987d36db35SAvi Kivity if (level == 2 && (pte & PTE_PSE)) 997d36db35SAvi Kivity return pte; 1007d36db35SAvi Kivity pt = phys_to_virt(pte & 0xffffffffff000ull); 1017d36db35SAvi Kivity } 1027d36db35SAvi Kivity offset = ((unsigned long)virt >> (((level-1) * PGDIR_WIDTH) + 12)) & PGDIR_MASK; 1037d36db35SAvi Kivity pte = pt[offset]; 1047d36db35SAvi Kivity return pte; 1057d36db35SAvi Kivity } 1067d36db35SAvi Kivity 1077d36db35SAvi Kivity void install_large_page(unsigned long *cr3, 1087d36db35SAvi Kivity unsigned long phys, 1097d36db35SAvi Kivity void *virt) 1107d36db35SAvi Kivity { 1117d36db35SAvi Kivity install_pte(cr3, 2, virt, phys | PTE_PRESENT | PTE_WRITE | PTE_PSE, 0); 1127d36db35SAvi Kivity } 1137d36db35SAvi Kivity 1147d36db35SAvi Kivity void install_page(unsigned long *cr3, 1157d36db35SAvi Kivity unsigned long phys, 1167d36db35SAvi Kivity void *virt) 1177d36db35SAvi Kivity { 1187d36db35SAvi Kivity install_pte(cr3, 1, virt, phys | PTE_PRESENT | PTE_WRITE, 0); 1197d36db35SAvi Kivity } 1207d36db35SAvi Kivity 1217d36db35SAvi Kivity 1227d36db35SAvi Kivity static inline void load_gdt(unsigned long *table, int nent) 1237d36db35SAvi Kivity { 1247d36db35SAvi Kivity struct descriptor_table_ptr descr; 1257d36db35SAvi Kivity 1267d36db35SAvi Kivity descr.limit = nent * 8 - 1; 1277d36db35SAvi Kivity descr.base = (ulong)table; 1287d36db35SAvi Kivity lgdt(&descr); 1297d36db35SAvi Kivity } 1307d36db35SAvi Kivity 1317d36db35SAvi Kivity #define SEG_CS_32 8 1327d36db35SAvi Kivity #define SEG_CS_64 16 1337d36db35SAvi Kivity 1347d36db35SAvi Kivity struct ljmp { 1357d36db35SAvi Kivity void *ofs; 1367d36db35SAvi Kivity unsigned short seg; 1377d36db35SAvi Kivity }; 1387d36db35SAvi Kivity 13963254428SGleb Natapov static void setup_mmu_range(unsigned long *cr3, unsigned long start, 14063254428SGleb Natapov unsigned long len) 14163254428SGleb Natapov { 14263254428SGleb Natapov u64 max = (u64)len + (u64)start; 14363254428SGleb Natapov u64 phys = start; 14463254428SGleb Natapov 14563254428SGleb Natapov while (phys + LARGE_PAGE_SIZE <= max) { 14663254428SGleb Natapov install_large_page(cr3, phys, (void *)(ulong)phys); 14763254428SGleb Natapov phys += LARGE_PAGE_SIZE; 14863254428SGleb Natapov } 14963254428SGleb Natapov while (phys + PAGE_SIZE <= max) { 15063254428SGleb Natapov install_page(cr3, phys, (void *)(ulong)phys); 15163254428SGleb Natapov phys += PAGE_SIZE; 15263254428SGleb Natapov } 15363254428SGleb Natapov } 15463254428SGleb Natapov 1557d36db35SAvi Kivity static void setup_mmu(unsigned long len) 1567d36db35SAvi Kivity { 1577d36db35SAvi Kivity unsigned long *cr3 = alloc_page(); 1587d36db35SAvi Kivity 1597d36db35SAvi Kivity memset(cr3, 0, PAGE_SIZE); 16063254428SGleb Natapov 16163254428SGleb Natapov #ifdef __x86_64__ 16263254428SGleb Natapov if (len < (1ul << 32)) 16363254428SGleb Natapov len = (1ul << 32); /* map mmio 1:1 */ 16463254428SGleb Natapov 16563254428SGleb Natapov setup_mmu_range(cr3, 0, len); 16663254428SGleb Natapov #else 16763254428SGleb Natapov if (len > (1ul << 31)) 16863254428SGleb Natapov len = (1ul << 31); 16963254428SGleb Natapov 17063254428SGleb Natapov /* 0 - 2G memory, 2G-3G valloc area, 3G-4G mmio */ 17163254428SGleb Natapov setup_mmu_range(cr3, 0, len); 17263254428SGleb Natapov setup_mmu_range(cr3, 3ul << 30, (1ul << 30)); 17363254428SGleb Natapov vfree_top = (void*)(3ul << 30); 17463254428SGleb Natapov #endif 17563254428SGleb Natapov 1767d36db35SAvi Kivity write_cr3(virt_to_phys(cr3)); 1777d36db35SAvi Kivity #ifndef __x86_64__ 1787d36db35SAvi Kivity write_cr4(X86_CR4_PSE); 1797d36db35SAvi Kivity #endif 18097011120SGleb Natapov write_cr0(X86_CR0_PG |X86_CR0_PE | X86_CR0_WP); 1817d36db35SAvi Kivity 1827d36db35SAvi Kivity printf("paging enabled\n"); 1837d36db35SAvi Kivity printf("cr0 = %x\n", read_cr0()); 1847d36db35SAvi Kivity printf("cr3 = %x\n", read_cr3()); 1857d36db35SAvi Kivity printf("cr4 = %x\n", read_cr4()); 1867d36db35SAvi Kivity } 1877d36db35SAvi Kivity 1887d36db35SAvi Kivity static unsigned int inl(unsigned short port) 1897d36db35SAvi Kivity { 1907d36db35SAvi Kivity unsigned int val; 1917d36db35SAvi Kivity asm volatile("inl %w1, %0" : "=a"(val) : "Nd"(port)); 1927d36db35SAvi Kivity return val; 1937d36db35SAvi Kivity } 1947d36db35SAvi Kivity 1957d36db35SAvi Kivity void setup_vm() 1967d36db35SAvi Kivity { 1977d36db35SAvi Kivity end_of_memory = inl(0xd1); 1987d36db35SAvi Kivity free_memory(&edata, end_of_memory - (unsigned long)&edata); 1997d36db35SAvi Kivity setup_mmu(end_of_memory); 2007d36db35SAvi Kivity } 2017d36db35SAvi Kivity 2027d36db35SAvi Kivity void *vmalloc(unsigned long size) 2037d36db35SAvi Kivity { 2047d36db35SAvi Kivity void *mem, *p; 2057d36db35SAvi Kivity unsigned pages; 2067d36db35SAvi Kivity 2077d36db35SAvi Kivity size += sizeof(unsigned long); 2087d36db35SAvi Kivity 2097d36db35SAvi Kivity size = (size + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1); 2107d36db35SAvi Kivity vfree_top -= size; 2117d36db35SAvi Kivity mem = p = vfree_top; 2127d36db35SAvi Kivity pages = size / PAGE_SIZE; 2137d36db35SAvi Kivity while (pages--) { 2147d36db35SAvi Kivity install_page(phys_to_virt(read_cr3()), virt_to_phys(alloc_page()), p); 2157d36db35SAvi Kivity p += PAGE_SIZE; 2167d36db35SAvi Kivity } 2177d36db35SAvi Kivity *(unsigned long *)mem = size; 2187d36db35SAvi Kivity mem += sizeof(unsigned long); 2197d36db35SAvi Kivity return mem; 2207d36db35SAvi Kivity } 2217d36db35SAvi Kivity 2227d36db35SAvi Kivity void vfree(void *mem) 2237d36db35SAvi Kivity { 2247d36db35SAvi Kivity unsigned long size = ((unsigned long *)mem)[-1]; 2257d36db35SAvi Kivity 2267d36db35SAvi Kivity while (size) { 2277d36db35SAvi Kivity free_page(phys_to_virt(get_pte(phys_to_virt(read_cr3()), mem) & PTE_ADDR)); 2287d36db35SAvi Kivity mem += PAGE_SIZE; 2297d36db35SAvi Kivity size -= PAGE_SIZE; 2307d36db35SAvi Kivity } 2317d36db35SAvi Kivity } 2327d36db35SAvi Kivity 2337d36db35SAvi Kivity void *vmap(unsigned long long phys, unsigned long size) 2347d36db35SAvi Kivity { 2357d36db35SAvi Kivity void *mem, *p; 2367d36db35SAvi Kivity unsigned pages; 2377d36db35SAvi Kivity 2387d36db35SAvi Kivity size = (size + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1); 2397d36db35SAvi Kivity vfree_top -= size; 2407d36db35SAvi Kivity phys &= ~(unsigned long long)(PAGE_SIZE - 1); 2417d36db35SAvi Kivity 2427d36db35SAvi Kivity mem = p = vfree_top; 2437d36db35SAvi Kivity pages = size / PAGE_SIZE; 2447d36db35SAvi Kivity while (pages--) { 2457d36db35SAvi Kivity install_page(phys_to_virt(read_cr3()), phys, p); 2467d36db35SAvi Kivity phys += PAGE_SIZE; 2477d36db35SAvi Kivity p += PAGE_SIZE; 2487d36db35SAvi Kivity } 2497d36db35SAvi Kivity return mem; 2507d36db35SAvi Kivity } 251*a4b87a16SGleb Natapov 252*a4b87a16SGleb Natapov void *alloc_vpage(void) 253*a4b87a16SGleb Natapov { 254*a4b87a16SGleb Natapov vfree_top -= PAGE_SIZE; 255*a4b87a16SGleb Natapov return vfree_top; 256*a4b87a16SGleb Natapov } 257