13fa2d384SViktor Prutyanov /* 23fa2d384SViktor Prutyanov * Copyright (c) 2018 Virtuozzo International GmbH 33fa2d384SViktor Prutyanov * 43fa2d384SViktor Prutyanov * This work is licensed under the terms of the GNU GPL, version 2 or later. 53fa2d384SViktor Prutyanov * 63fa2d384SViktor Prutyanov */ 73fa2d384SViktor Prutyanov 83fa2d384SViktor Prutyanov #include "qemu/osdep.h" 93fa2d384SViktor Prutyanov #include "addrspace.h" 103fa2d384SViktor Prutyanov 113fa2d384SViktor Prutyanov static struct pa_block *pa_space_find_block(struct pa_space *ps, uint64_t pa) 123fa2d384SViktor Prutyanov { 133fa2d384SViktor Prutyanov size_t i; 1405adc48eSViktor Prutyanov 153fa2d384SViktor Prutyanov for (i = 0; i < ps->block_nr; i++) { 163fa2d384SViktor Prutyanov if (ps->block[i].paddr <= pa && 17*d5c27a53SViktor Prutyanov pa < ps->block[i].paddr + ps->block[i].size) { 183fa2d384SViktor Prutyanov return ps->block + i; 193fa2d384SViktor Prutyanov } 203fa2d384SViktor Prutyanov } 213fa2d384SViktor Prutyanov 223fa2d384SViktor Prutyanov return NULL; 233fa2d384SViktor Prutyanov } 243fa2d384SViktor Prutyanov 253fa2d384SViktor Prutyanov static uint8_t *pa_space_resolve(struct pa_space *ps, uint64_t pa) 263fa2d384SViktor Prutyanov { 273fa2d384SViktor Prutyanov struct pa_block *block = pa_space_find_block(ps, pa); 283fa2d384SViktor Prutyanov 293fa2d384SViktor Prutyanov if (!block) { 303fa2d384SViktor Prutyanov return NULL; 313fa2d384SViktor Prutyanov } 323fa2d384SViktor Prutyanov 333fa2d384SViktor Prutyanov return block->addr + (pa - block->paddr); 343fa2d384SViktor Prutyanov } 353fa2d384SViktor Prutyanov 36*d5c27a53SViktor Prutyanov static void pa_block_align(struct pa_block *b) 37*d5c27a53SViktor Prutyanov { 38*d5c27a53SViktor Prutyanov uint64_t low_align = ((b->paddr - 1) | ELF2DMP_PAGE_MASK) + 1 - b->paddr; 39*d5c27a53SViktor Prutyanov uint64_t high_align = (b->paddr + b->size) & ELF2DMP_PAGE_MASK; 40*d5c27a53SViktor Prutyanov 41*d5c27a53SViktor Prutyanov if (low_align == 0 && high_align == 0) { 42*d5c27a53SViktor Prutyanov return; 43*d5c27a53SViktor Prutyanov } 44*d5c27a53SViktor Prutyanov 45*d5c27a53SViktor Prutyanov if (low_align + high_align < b->size) { 46*d5c27a53SViktor Prutyanov printf("Block 0x%"PRIx64"+:0x%"PRIx64" will be aligned to " 47*d5c27a53SViktor Prutyanov "0x%"PRIx64"+:0x%"PRIx64"\n", b->paddr, b->size, 48*d5c27a53SViktor Prutyanov b->paddr + low_align, b->size - low_align - high_align); 49*d5c27a53SViktor Prutyanov b->size -= low_align + high_align; 50*d5c27a53SViktor Prutyanov } else { 51*d5c27a53SViktor Prutyanov printf("Block 0x%"PRIx64"+:0x%"PRIx64" is too small to align\n", 52*d5c27a53SViktor Prutyanov b->paddr, b->size); 53*d5c27a53SViktor Prutyanov b->size = 0; 54*d5c27a53SViktor Prutyanov } 55*d5c27a53SViktor Prutyanov 56*d5c27a53SViktor Prutyanov b->addr += low_align; 57*d5c27a53SViktor Prutyanov b->paddr += low_align; 58*d5c27a53SViktor Prutyanov } 59*d5c27a53SViktor Prutyanov 603fa2d384SViktor Prutyanov int pa_space_create(struct pa_space *ps, QEMU_Elf *qemu_elf) 613fa2d384SViktor Prutyanov { 623fa2d384SViktor Prutyanov Elf64_Half phdr_nr = elf_getphdrnum(qemu_elf->map); 633fa2d384SViktor Prutyanov Elf64_Phdr *phdr = elf64_getphdr(qemu_elf->map); 643fa2d384SViktor Prutyanov size_t block_i = 0; 653fa2d384SViktor Prutyanov size_t i; 663fa2d384SViktor Prutyanov 673fa2d384SViktor Prutyanov ps->block_nr = 0; 683fa2d384SViktor Prutyanov 693fa2d384SViktor Prutyanov for (i = 0; i < phdr_nr; i++) { 703fa2d384SViktor Prutyanov if (phdr[i].p_type == PT_LOAD) { 713fa2d384SViktor Prutyanov ps->block_nr++; 723fa2d384SViktor Prutyanov } 733fa2d384SViktor Prutyanov } 743fa2d384SViktor Prutyanov 753fa2d384SViktor Prutyanov ps->block = malloc(sizeof(*ps->block) * ps->block_nr); 763fa2d384SViktor Prutyanov if (!ps->block) { 773fa2d384SViktor Prutyanov return 1; 783fa2d384SViktor Prutyanov } 793fa2d384SViktor Prutyanov 803fa2d384SViktor Prutyanov for (i = 0; i < phdr_nr; i++) { 813fa2d384SViktor Prutyanov if (phdr[i].p_type == PT_LOAD) { 823fa2d384SViktor Prutyanov ps->block[block_i] = (struct pa_block) { 833fa2d384SViktor Prutyanov .addr = (uint8_t *)qemu_elf->map + phdr[i].p_offset, 843fa2d384SViktor Prutyanov .paddr = phdr[i].p_paddr, 853fa2d384SViktor Prutyanov .size = phdr[i].p_filesz, 863fa2d384SViktor Prutyanov }; 87*d5c27a53SViktor Prutyanov pa_block_align(&ps->block[block_i]); 88*d5c27a53SViktor Prutyanov block_i = ps->block[block_i].size ? (block_i + 1) : block_i; 893fa2d384SViktor Prutyanov } 903fa2d384SViktor Prutyanov } 913fa2d384SViktor Prutyanov 92*d5c27a53SViktor Prutyanov ps->block_nr = block_i; 93*d5c27a53SViktor Prutyanov 943fa2d384SViktor Prutyanov return 0; 953fa2d384SViktor Prutyanov } 963fa2d384SViktor Prutyanov 973fa2d384SViktor Prutyanov void pa_space_destroy(struct pa_space *ps) 983fa2d384SViktor Prutyanov { 993fa2d384SViktor Prutyanov ps->block_nr = 0; 1003fa2d384SViktor Prutyanov free(ps->block); 1013fa2d384SViktor Prutyanov } 1023fa2d384SViktor Prutyanov 1033fa2d384SViktor Prutyanov void va_space_set_dtb(struct va_space *vs, uint64_t dtb) 1043fa2d384SViktor Prutyanov { 1053fa2d384SViktor Prutyanov vs->dtb = dtb & 0x00ffffffffff000; 1063fa2d384SViktor Prutyanov } 1073fa2d384SViktor Prutyanov 1083fa2d384SViktor Prutyanov void va_space_create(struct va_space *vs, struct pa_space *ps, uint64_t dtb) 1093fa2d384SViktor Prutyanov { 1103fa2d384SViktor Prutyanov vs->ps = ps; 1113fa2d384SViktor Prutyanov va_space_set_dtb(vs, dtb); 1123fa2d384SViktor Prutyanov } 1133fa2d384SViktor Prutyanov 1143fa2d384SViktor Prutyanov static uint64_t get_pml4e(struct va_space *vs, uint64_t va) 1153fa2d384SViktor Prutyanov { 1163fa2d384SViktor Prutyanov uint64_t pa = (vs->dtb & 0xffffffffff000) | ((va & 0xff8000000000) >> 36); 1173fa2d384SViktor Prutyanov 1183fa2d384SViktor Prutyanov return *(uint64_t *)pa_space_resolve(vs->ps, pa); 1193fa2d384SViktor Prutyanov } 1203fa2d384SViktor Prutyanov 1213fa2d384SViktor Prutyanov static uint64_t get_pdpi(struct va_space *vs, uint64_t va, uint64_t pml4e) 1223fa2d384SViktor Prutyanov { 1233fa2d384SViktor Prutyanov uint64_t pdpte_paddr = (pml4e & 0xffffffffff000) | 1243fa2d384SViktor Prutyanov ((va & 0x7FC0000000) >> 27); 1253fa2d384SViktor Prutyanov 1263fa2d384SViktor Prutyanov return *(uint64_t *)pa_space_resolve(vs->ps, pdpte_paddr); 1273fa2d384SViktor Prutyanov } 1283fa2d384SViktor Prutyanov 1293fa2d384SViktor Prutyanov static uint64_t pde_index(uint64_t va) 1303fa2d384SViktor Prutyanov { 1313fa2d384SViktor Prutyanov return (va >> 21) & 0x1FF; 1323fa2d384SViktor Prutyanov } 1333fa2d384SViktor Prutyanov 1343fa2d384SViktor Prutyanov static uint64_t pdba_base(uint64_t pdpe) 1353fa2d384SViktor Prutyanov { 1363fa2d384SViktor Prutyanov return pdpe & 0xFFFFFFFFFF000; 1373fa2d384SViktor Prutyanov } 1383fa2d384SViktor Prutyanov 1393fa2d384SViktor Prutyanov static uint64_t get_pgd(struct va_space *vs, uint64_t va, uint64_t pdpe) 1403fa2d384SViktor Prutyanov { 1413fa2d384SViktor Prutyanov uint64_t pgd_entry = pdba_base(pdpe) + pde_index(va) * 8; 1423fa2d384SViktor Prutyanov 1433fa2d384SViktor Prutyanov return *(uint64_t *)pa_space_resolve(vs->ps, pgd_entry); 1443fa2d384SViktor Prutyanov } 1453fa2d384SViktor Prutyanov 1463fa2d384SViktor Prutyanov static uint64_t pte_index(uint64_t va) 1473fa2d384SViktor Prutyanov { 1483fa2d384SViktor Prutyanov return (va >> 12) & 0x1FF; 1493fa2d384SViktor Prutyanov } 1503fa2d384SViktor Prutyanov 1513fa2d384SViktor Prutyanov static uint64_t ptba_base(uint64_t pde) 1523fa2d384SViktor Prutyanov { 1533fa2d384SViktor Prutyanov return pde & 0xFFFFFFFFFF000; 1543fa2d384SViktor Prutyanov } 1553fa2d384SViktor Prutyanov 1563fa2d384SViktor Prutyanov static uint64_t get_pte(struct va_space *vs, uint64_t va, uint64_t pgd) 1573fa2d384SViktor Prutyanov { 1583fa2d384SViktor Prutyanov uint64_t pgd_val = ptba_base(pgd) + pte_index(va) * 8; 1593fa2d384SViktor Prutyanov 1603fa2d384SViktor Prutyanov return *(uint64_t *)pa_space_resolve(vs->ps, pgd_val); 1613fa2d384SViktor Prutyanov } 1623fa2d384SViktor Prutyanov 1633fa2d384SViktor Prutyanov static uint64_t get_paddr(uint64_t va, uint64_t pte) 1643fa2d384SViktor Prutyanov { 1653fa2d384SViktor Prutyanov return (pte & 0xFFFFFFFFFF000) | (va & 0xFFF); 1663fa2d384SViktor Prutyanov } 1673fa2d384SViktor Prutyanov 1683fa2d384SViktor Prutyanov static bool is_present(uint64_t entry) 1693fa2d384SViktor Prutyanov { 1703fa2d384SViktor Prutyanov return entry & 0x1; 1713fa2d384SViktor Prutyanov } 1723fa2d384SViktor Prutyanov 1733fa2d384SViktor Prutyanov static bool page_size_flag(uint64_t entry) 1743fa2d384SViktor Prutyanov { 1753fa2d384SViktor Prutyanov return entry & (1 << 7); 1763fa2d384SViktor Prutyanov } 1773fa2d384SViktor Prutyanov 1783fa2d384SViktor Prutyanov static uint64_t get_1GB_paddr(uint64_t va, uint64_t pdpte) 1793fa2d384SViktor Prutyanov { 1803fa2d384SViktor Prutyanov return (pdpte & 0xfffffc0000000) | (va & 0x3fffffff); 1813fa2d384SViktor Prutyanov } 1823fa2d384SViktor Prutyanov 1833fa2d384SViktor Prutyanov static uint64_t get_2MB_paddr(uint64_t va, uint64_t pgd_entry) 1843fa2d384SViktor Prutyanov { 1853fa2d384SViktor Prutyanov return (pgd_entry & 0xfffffffe00000) | (va & 0x00000001fffff); 1863fa2d384SViktor Prutyanov } 1873fa2d384SViktor Prutyanov 1883fa2d384SViktor Prutyanov static uint64_t va_space_va2pa(struct va_space *vs, uint64_t va) 1893fa2d384SViktor Prutyanov { 1903fa2d384SViktor Prutyanov uint64_t pml4e, pdpe, pgd, pte; 1913fa2d384SViktor Prutyanov 1923fa2d384SViktor Prutyanov pml4e = get_pml4e(vs, va); 1933fa2d384SViktor Prutyanov if (!is_present(pml4e)) { 1943fa2d384SViktor Prutyanov return INVALID_PA; 1953fa2d384SViktor Prutyanov } 1963fa2d384SViktor Prutyanov 1973fa2d384SViktor Prutyanov pdpe = get_pdpi(vs, va, pml4e); 1983fa2d384SViktor Prutyanov if (!is_present(pdpe)) { 1993fa2d384SViktor Prutyanov return INVALID_PA; 2003fa2d384SViktor Prutyanov } 2013fa2d384SViktor Prutyanov 2023fa2d384SViktor Prutyanov if (page_size_flag(pdpe)) { 2033fa2d384SViktor Prutyanov return get_1GB_paddr(va, pdpe); 2043fa2d384SViktor Prutyanov } 2053fa2d384SViktor Prutyanov 2063fa2d384SViktor Prutyanov pgd = get_pgd(vs, va, pdpe); 2073fa2d384SViktor Prutyanov if (!is_present(pgd)) { 2083fa2d384SViktor Prutyanov return INVALID_PA; 2093fa2d384SViktor Prutyanov } 2103fa2d384SViktor Prutyanov 2113fa2d384SViktor Prutyanov if (page_size_flag(pgd)) { 2123fa2d384SViktor Prutyanov return get_2MB_paddr(va, pgd); 2133fa2d384SViktor Prutyanov } 2143fa2d384SViktor Prutyanov 2153fa2d384SViktor Prutyanov pte = get_pte(vs, va, pgd); 2163fa2d384SViktor Prutyanov if (!is_present(pte)) { 2173fa2d384SViktor Prutyanov return INVALID_PA; 2183fa2d384SViktor Prutyanov } 2193fa2d384SViktor Prutyanov 2203fa2d384SViktor Prutyanov return get_paddr(va, pte); 2213fa2d384SViktor Prutyanov } 2223fa2d384SViktor Prutyanov 2233fa2d384SViktor Prutyanov void *va_space_resolve(struct va_space *vs, uint64_t va) 2243fa2d384SViktor Prutyanov { 2253fa2d384SViktor Prutyanov uint64_t pa = va_space_va2pa(vs, va); 2263fa2d384SViktor Prutyanov 2273fa2d384SViktor Prutyanov if (pa == INVALID_PA) { 2283fa2d384SViktor Prutyanov return NULL; 2293fa2d384SViktor Prutyanov } 2303fa2d384SViktor Prutyanov 2313fa2d384SViktor Prutyanov return pa_space_resolve(vs->ps, pa); 2323fa2d384SViktor Prutyanov } 2333fa2d384SViktor Prutyanov 2343fa2d384SViktor Prutyanov int va_space_rw(struct va_space *vs, uint64_t addr, 2353fa2d384SViktor Prutyanov void *buf, size_t size, int is_write) 2363fa2d384SViktor Prutyanov { 2373fa2d384SViktor Prutyanov while (size) { 2382d0fc797SJiaxun Yang uint64_t page = addr & ELF2DMP_PFN_MASK; 2392d0fc797SJiaxun Yang size_t s = (page + ELF2DMP_PAGE_SIZE) - addr; 2403fa2d384SViktor Prutyanov void *ptr; 2413fa2d384SViktor Prutyanov 2423fa2d384SViktor Prutyanov s = (s > size) ? size : s; 2433fa2d384SViktor Prutyanov 2443fa2d384SViktor Prutyanov ptr = va_space_resolve(vs, addr); 2453fa2d384SViktor Prutyanov if (!ptr) { 2463fa2d384SViktor Prutyanov return 1; 2473fa2d384SViktor Prutyanov } 2483fa2d384SViktor Prutyanov 2493fa2d384SViktor Prutyanov if (is_write) { 2503fa2d384SViktor Prutyanov memcpy(ptr, buf, s); 2513fa2d384SViktor Prutyanov } else { 2523fa2d384SViktor Prutyanov memcpy(buf, ptr, s); 2533fa2d384SViktor Prutyanov } 2543fa2d384SViktor Prutyanov 2553fa2d384SViktor Prutyanov size -= s; 2563fa2d384SViktor Prutyanov buf = (uint8_t *)buf + s; 2573fa2d384SViktor Prutyanov addr += s; 2583fa2d384SViktor Prutyanov } 2593fa2d384SViktor Prutyanov 2603fa2d384SViktor Prutyanov return 0; 2613fa2d384SViktor Prutyanov } 262