/* Origin: kvm-unit-tests lib/x86/vm.c (revision 632544282a5f59037f3d6f7edc86139b1e5ce098) */
17d36db35SAvi Kivity #include "vm.h"
27d36db35SAvi Kivity #include "libcflat.h"
37d36db35SAvi Kivity 
/* Size in bytes of a base page. */
#define PAGE_SIZE 4096ul

/*
 * Size in bytes of a large page (one level-2 entry with PTE_PSE set):
 * 512 base pages on x86_64, 1024 base pages on 32-bit builds.
 */
#ifdef __x86_64__
#define LARGE_PAGE_SIZE (512 * PAGE_SIZE)
#else
#define LARGE_PAGE_SIZE (1024 * PAGE_SIZE)
#endif

/* Control-register bits written by setup_mmu(). */
#define X86_CR0_PE      0x00000001
#define X86_CR0_PG      0x80000000
#define X86_CR4_PSE     0x00000010

/*
 * Head of the free-page list. The first word of every free page holds the
 * pointer to the next free page; 0 terminates the list.
 */
static void *free = 0;

/*
 * Lowest virtual address handed out so far by vmalloc()/vmap(); both carve
 * their ranges downwards from here.
 */
static void *vfree_top = 0;
167d36db35SAvi Kivity 
177d36db35SAvi Kivity static void free_memory(void *mem, unsigned long size)
187d36db35SAvi Kivity {
197d36db35SAvi Kivity     while (size >= PAGE_SIZE) {
207d36db35SAvi Kivity 	*(void **)mem = free;
217d36db35SAvi Kivity 	free = mem;
227d36db35SAvi Kivity 	mem += PAGE_SIZE;
237d36db35SAvi Kivity 	size -= PAGE_SIZE;
247d36db35SAvi Kivity     }
257d36db35SAvi Kivity }
267d36db35SAvi Kivity 
277d36db35SAvi Kivity void *alloc_page()
287d36db35SAvi Kivity {
297d36db35SAvi Kivity     void *p;
307d36db35SAvi Kivity 
317d36db35SAvi Kivity     if (!free)
327d36db35SAvi Kivity 	return 0;
337d36db35SAvi Kivity 
347d36db35SAvi Kivity     p = free;
357d36db35SAvi Kivity     free = *(void **)free;
367d36db35SAvi Kivity 
377d36db35SAvi Kivity     return p;
387d36db35SAvi Kivity }
397d36db35SAvi Kivity 
407d36db35SAvi Kivity void free_page(void *page)
417d36db35SAvi Kivity {
427d36db35SAvi Kivity     *(void **)page = free;
437d36db35SAvi Kivity     free = page;
447d36db35SAvi Kivity }
457d36db35SAvi Kivity 
/*
 * Symbol defined outside this file (presumably by the linker script);
 * setup_vm() uses its address as the start of the memory it gives to the
 * page allocator.
 */
extern char edata;

/* Value read from I/O port 0xd1 by setup_vm(); used as the end of memory. */
static unsigned long end_of_memory;
487d36db35SAvi Kivity 
/*
 * Page-table geometry used by install_pte() and get_pte():
 *   PAGE_LEVEL  - number of table levels walked, starting from the root
 *   PGDIR_WIDTH - virtual-address bits consumed per level
 *   PGDIR_MASK  - mask for one level's table index ((1 << PGDIR_WIDTH) - 1)
 */
#ifdef __x86_64__
#define	PAGE_LEVEL	4
#define	PGDIR_WIDTH	9
#define	PGDIR_MASK	511
#else
#define	PAGE_LEVEL	2
#define	PGDIR_WIDTH	10
#define	PGDIR_MASK	1023
#endif
587d36db35SAvi Kivity 
597d36db35SAvi Kivity void install_pte(unsigned long *cr3,
607d36db35SAvi Kivity 		 int pte_level,
617d36db35SAvi Kivity 		 void *virt,
627d36db35SAvi Kivity 		 unsigned long pte,
637d36db35SAvi Kivity 		 unsigned long *pt_page)
647d36db35SAvi Kivity {
657d36db35SAvi Kivity     int level;
667d36db35SAvi Kivity     unsigned long *pt = cr3;
677d36db35SAvi Kivity     unsigned offset;
687d36db35SAvi Kivity 
697d36db35SAvi Kivity     for (level = PAGE_LEVEL; level > pte_level; --level) {
707d36db35SAvi Kivity 	offset = ((unsigned long)virt >> ((level-1) * PGDIR_WIDTH + 12)) & PGDIR_MASK;
717d36db35SAvi Kivity 	if (!(pt[offset] & PTE_PRESENT)) {
727d36db35SAvi Kivity 	    unsigned long *new_pt = pt_page;
737d36db35SAvi Kivity             if (!new_pt)
747d36db35SAvi Kivity                 new_pt = alloc_page();
757d36db35SAvi Kivity             else
767d36db35SAvi Kivity                 pt_page = 0;
777d36db35SAvi Kivity 	    memset(new_pt, 0, PAGE_SIZE);
787d36db35SAvi Kivity 	    pt[offset] = virt_to_phys(new_pt) | PTE_PRESENT | PTE_WRITE;
797d36db35SAvi Kivity 	}
807d36db35SAvi Kivity 	pt = phys_to_virt(pt[offset] & 0xffffffffff000ull);
817d36db35SAvi Kivity     }
827d36db35SAvi Kivity     offset = ((unsigned long)virt >> ((level-1) * PGDIR_WIDTH + 12)) & PGDIR_MASK;
837d36db35SAvi Kivity     pt[offset] = pte;
847d36db35SAvi Kivity }
857d36db35SAvi Kivity 
867d36db35SAvi Kivity static unsigned long get_pte(unsigned long *cr3, void *virt)
877d36db35SAvi Kivity {
887d36db35SAvi Kivity     int level;
897d36db35SAvi Kivity     unsigned long *pt = cr3, pte;
907d36db35SAvi Kivity     unsigned offset;
917d36db35SAvi Kivity 
927d36db35SAvi Kivity     for (level = PAGE_LEVEL; level > 1; --level) {
937d36db35SAvi Kivity 	offset = ((unsigned long)virt >> (((level-1) * PGDIR_WIDTH) + 12)) & PGDIR_MASK;
947d36db35SAvi Kivity 	pte = pt[offset];
957d36db35SAvi Kivity 	if (!(pte & PTE_PRESENT))
967d36db35SAvi Kivity 	    return 0;
977d36db35SAvi Kivity 	if (level == 2 && (pte & PTE_PSE))
987d36db35SAvi Kivity 	    return pte;
997d36db35SAvi Kivity 	pt = phys_to_virt(pte & 0xffffffffff000ull);
1007d36db35SAvi Kivity     }
1017d36db35SAvi Kivity     offset = ((unsigned long)virt >> (((level-1) * PGDIR_WIDTH) + 12)) & PGDIR_MASK;
1027d36db35SAvi Kivity     pte = pt[offset];
1037d36db35SAvi Kivity     return pte;
1047d36db35SAvi Kivity }
1057d36db35SAvi Kivity 
1067d36db35SAvi Kivity void install_large_page(unsigned long *cr3,
1077d36db35SAvi Kivity                               unsigned long phys,
1087d36db35SAvi Kivity                               void *virt)
1097d36db35SAvi Kivity {
1107d36db35SAvi Kivity     install_pte(cr3, 2, virt, phys | PTE_PRESENT | PTE_WRITE | PTE_PSE, 0);
1117d36db35SAvi Kivity }
1127d36db35SAvi Kivity 
1137d36db35SAvi Kivity void install_page(unsigned long *cr3,
1147d36db35SAvi Kivity                   unsigned long phys,
1157d36db35SAvi Kivity                   void *virt)
1167d36db35SAvi Kivity {
1177d36db35SAvi Kivity     install_pte(cr3, 1, virt, phys | PTE_PRESENT | PTE_WRITE, 0);
1187d36db35SAvi Kivity }
1197d36db35SAvi Kivity 
1207d36db35SAvi Kivity 
1217d36db35SAvi Kivity static inline void load_gdt(unsigned long *table, int nent)
1227d36db35SAvi Kivity {
1237d36db35SAvi Kivity     struct descriptor_table_ptr descr;
1247d36db35SAvi Kivity 
1257d36db35SAvi Kivity     descr.limit = nent * 8 - 1;
1267d36db35SAvi Kivity     descr.base = (ulong)table;
1277d36db35SAvi Kivity     lgdt(&descr);
1287d36db35SAvi Kivity }
1297d36db35SAvi Kivity 
/*
 * NOTE(review): presumably the selectors of the 32-bit and 64-bit code
 * segments; neither is referenced in the visible part of this file.
 */
#define SEG_CS_32 8
#define SEG_CS_64 16
1327d36db35SAvi Kivity 
/*
 * Offset/segment pair.
 * NOTE(review): presumably the memory operand of a far jump; it is not used
 * in the visible part of this file - confirm before relying on the layout.
 */
struct ljmp {
    void *ofs;              /* target offset */
    unsigned short seg;     /* target segment selector */
};
1377d36db35SAvi Kivity 
138*63254428SGleb Natapov static void setup_mmu_range(unsigned long *cr3, unsigned long start,
139*63254428SGleb Natapov 			    unsigned long len)
140*63254428SGleb Natapov {
141*63254428SGleb Natapov 	u64 max = (u64)len + (u64)start;
142*63254428SGleb Natapov 	u64 phys = start;
143*63254428SGleb Natapov 
144*63254428SGleb Natapov 	while (phys + LARGE_PAGE_SIZE <= max) {
145*63254428SGleb Natapov 		install_large_page(cr3, phys, (void *)(ulong)phys);
146*63254428SGleb Natapov 		phys += LARGE_PAGE_SIZE;
147*63254428SGleb Natapov 	}
148*63254428SGleb Natapov 	while (phys + PAGE_SIZE <= max) {
149*63254428SGleb Natapov 		install_page(cr3, phys, (void *)(ulong)phys);
150*63254428SGleb Natapov 		phys += PAGE_SIZE;
151*63254428SGleb Natapov 	}
152*63254428SGleb Natapov }
153*63254428SGleb Natapov 
1547d36db35SAvi Kivity static void setup_mmu(unsigned long len)
1557d36db35SAvi Kivity {
1567d36db35SAvi Kivity     unsigned long *cr3 = alloc_page();
1577d36db35SAvi Kivity 
1587d36db35SAvi Kivity     memset(cr3, 0, PAGE_SIZE);
159*63254428SGleb Natapov 
160*63254428SGleb Natapov #ifdef __x86_64__
161*63254428SGleb Natapov     if (len < (1ul << 32))
162*63254428SGleb Natapov         len = (1ul << 32);  /* map mmio 1:1 */
163*63254428SGleb Natapov 
164*63254428SGleb Natapov     setup_mmu_range(cr3, 0, len);
165*63254428SGleb Natapov #else
166*63254428SGleb Natapov     if (len > (1ul << 31))
167*63254428SGleb Natapov 	    len = (1ul << 31);
168*63254428SGleb Natapov 
169*63254428SGleb Natapov     /* 0 - 2G memory, 2G-3G valloc area, 3G-4G mmio */
170*63254428SGleb Natapov     setup_mmu_range(cr3, 0, len);
171*63254428SGleb Natapov     setup_mmu_range(cr3, 3ul << 30, (1ul << 30));
172*63254428SGleb Natapov     vfree_top = (void*)(3ul << 30);
173*63254428SGleb Natapov #endif
174*63254428SGleb Natapov 
1757d36db35SAvi Kivity     write_cr3(virt_to_phys(cr3));
1767d36db35SAvi Kivity #ifndef __x86_64__
1777d36db35SAvi Kivity     write_cr4(X86_CR4_PSE);
1787d36db35SAvi Kivity #endif
1797d36db35SAvi Kivity     write_cr0(X86_CR0_PG |X86_CR0_PE);
1807d36db35SAvi Kivity 
1817d36db35SAvi Kivity     printf("paging enabled\n");
1827d36db35SAvi Kivity     printf("cr0 = %x\n", read_cr0());
1837d36db35SAvi Kivity     printf("cr3 = %x\n", read_cr3());
1847d36db35SAvi Kivity     printf("cr4 = %x\n", read_cr4());
1857d36db35SAvi Kivity }
1867d36db35SAvi Kivity 
1877d36db35SAvi Kivity static unsigned int inl(unsigned short port)
1887d36db35SAvi Kivity {
1897d36db35SAvi Kivity     unsigned int val;
1907d36db35SAvi Kivity     asm volatile("inl %w1, %0" : "=a"(val) : "Nd"(port));
1917d36db35SAvi Kivity     return val;
1927d36db35SAvi Kivity }
1937d36db35SAvi Kivity 
1947d36db35SAvi Kivity void setup_vm()
1957d36db35SAvi Kivity {
1967d36db35SAvi Kivity     end_of_memory = inl(0xd1);
1977d36db35SAvi Kivity     free_memory(&edata, end_of_memory - (unsigned long)&edata);
1987d36db35SAvi Kivity     setup_mmu(end_of_memory);
1997d36db35SAvi Kivity }
2007d36db35SAvi Kivity 
2017d36db35SAvi Kivity void *vmalloc(unsigned long size)
2027d36db35SAvi Kivity {
2037d36db35SAvi Kivity     void *mem, *p;
2047d36db35SAvi Kivity     unsigned pages;
2057d36db35SAvi Kivity 
2067d36db35SAvi Kivity     size += sizeof(unsigned long);
2077d36db35SAvi Kivity 
2087d36db35SAvi Kivity     size = (size + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1);
2097d36db35SAvi Kivity     vfree_top -= size;
2107d36db35SAvi Kivity     mem = p = vfree_top;
2117d36db35SAvi Kivity     pages = size / PAGE_SIZE;
2127d36db35SAvi Kivity     while (pages--) {
2137d36db35SAvi Kivity 	install_page(phys_to_virt(read_cr3()), virt_to_phys(alloc_page()), p);
2147d36db35SAvi Kivity 	p += PAGE_SIZE;
2157d36db35SAvi Kivity     }
2167d36db35SAvi Kivity     *(unsigned long *)mem = size;
2177d36db35SAvi Kivity     mem += sizeof(unsigned long);
2187d36db35SAvi Kivity     return mem;
2197d36db35SAvi Kivity }
2207d36db35SAvi Kivity 
2217d36db35SAvi Kivity void vfree(void *mem)
2227d36db35SAvi Kivity {
2237d36db35SAvi Kivity     unsigned long size = ((unsigned long *)mem)[-1];
2247d36db35SAvi Kivity 
2257d36db35SAvi Kivity     while (size) {
2267d36db35SAvi Kivity 	free_page(phys_to_virt(get_pte(phys_to_virt(read_cr3()), mem) & PTE_ADDR));
2277d36db35SAvi Kivity 	mem += PAGE_SIZE;
2287d36db35SAvi Kivity 	size -= PAGE_SIZE;
2297d36db35SAvi Kivity     }
2307d36db35SAvi Kivity }
2317d36db35SAvi Kivity 
2327d36db35SAvi Kivity void *vmap(unsigned long long phys, unsigned long size)
2337d36db35SAvi Kivity {
2347d36db35SAvi Kivity     void *mem, *p;
2357d36db35SAvi Kivity     unsigned pages;
2367d36db35SAvi Kivity 
2377d36db35SAvi Kivity     size = (size + PAGE_SIZE - 1) & ~(PAGE_SIZE - 1);
2387d36db35SAvi Kivity     vfree_top -= size;
2397d36db35SAvi Kivity     phys &= ~(unsigned long long)(PAGE_SIZE - 1);
2407d36db35SAvi Kivity 
2417d36db35SAvi Kivity     mem = p = vfree_top;
2427d36db35SAvi Kivity     pages = size / PAGE_SIZE;
2437d36db35SAvi Kivity     while (pages--) {
2447d36db35SAvi Kivity 	install_page(phys_to_virt(read_cr3()), phys, p);
2457d36db35SAvi Kivity 	phys += PAGE_SIZE;
2467d36db35SAvi Kivity 	p += PAGE_SIZE;
2477d36db35SAvi Kivity     }
2487d36db35SAvi Kivity     return mem;
2497d36db35SAvi Kivity }
250