// SPDX-License-Identifier: GPL-2.0-only
/*
 * arch/arm64/mm/hugetlbpage.c
 *
 * Copyright (C) 2013 Linaro Ltd.
 *
 * Based on arch/x86/mm/hugetlbpage.c.
 */
9084bd298SSteve Capper
10084bd298SSteve Capper #include <linux/init.h>
11084bd298SSteve Capper #include <linux/fs.h>
12084bd298SSteve Capper #include <linux/mm.h>
13084bd298SSteve Capper #include <linux/hugetlb.h>
14084bd298SSteve Capper #include <linux/pagemap.h>
15084bd298SSteve Capper #include <linux/err.h>
16084bd298SSteve Capper #include <linux/sysctl.h>
17084bd298SSteve Capper #include <asm/mman.h>
18084bd298SSteve Capper #include <asm/tlb.h>
19084bd298SSteve Capper #include <asm/tlbflush.h>
20084bd298SSteve Capper
/*
 * HugeTLB Support Matrix
 *
 * ---------------------------------------------------
 * | Page Size | CONT PTE |  PMD  | CONT PMD |  PUD  |
 * ---------------------------------------------------
 * |     4K    |   64K    |   2M  |    32M   |   1G  |
 * |    16K    |    2M    |  32M  |     1G   |       |
 * |    64K    |    2M    | 512M  |    16G   |       |
 * ---------------------------------------------------
 */
32abb7962aSAnshuman Khandual
/*
 * When CMA is configured, ask hugetlb_cma_reserve() for an area sized
 * for the largest gigantic huge page handled here: PUD sized when
 * pud_sect_supported() returns true, contiguous-PMD sized otherwise.
 * Smaller gigantic huge pages could still be served from that area.
 */
#ifdef CONFIG_CMA
void __init arm64_hugetlb_cma_reserve(void)
{
	const int order = pud_sect_supported() ? PUD_SHIFT - PAGE_SHIFT
					       : CONT_PMD_SHIFT - PAGE_SHIFT;

	hugetlb_cma_reserve(order);
}
#endif /* CONFIG_CMA */
51abb7962aSAnshuman Khandual
__hugetlb_valid_size(unsigned long size)52a8a733b2SAnshuman Khandual static bool __hugetlb_valid_size(unsigned long size)
53a8a733b2SAnshuman Khandual {
54a8a733b2SAnshuman Khandual switch (size) {
55a8a733b2SAnshuman Khandual #ifndef __PAGETABLE_PMD_FOLDED
56a8a733b2SAnshuman Khandual case PUD_SIZE:
57a8a733b2SAnshuman Khandual return pud_sect_supported();
58a8a733b2SAnshuman Khandual #endif
59a8a733b2SAnshuman Khandual case CONT_PMD_SIZE:
60a8a733b2SAnshuman Khandual case PMD_SIZE:
61a8a733b2SAnshuman Khandual case CONT_PTE_SIZE:
62a8a733b2SAnshuman Khandual return true;
63a8a733b2SAnshuman Khandual }
64a8a733b2SAnshuman Khandual
65a8a733b2SAnshuman Khandual return false;
66a8a733b2SAnshuman Khandual }
67a8a733b2SAnshuman Khandual
685480280dSAnshuman Khandual #ifdef CONFIG_ARCH_ENABLE_HUGEPAGE_MIGRATION
arch_hugetlb_migration_supported(struct hstate * h)695480280dSAnshuman Khandual bool arch_hugetlb_migration_supported(struct hstate *h)
705480280dSAnshuman Khandual {
715480280dSAnshuman Khandual size_t pagesize = huge_page_size(h);
725480280dSAnshuman Khandual
73a8a733b2SAnshuman Khandual if (!__hugetlb_valid_size(pagesize)) {
745480280dSAnshuman Khandual pr_warn("%s: unrecognized huge page size 0x%lx\n",
755480280dSAnshuman Khandual __func__, pagesize);
765480280dSAnshuman Khandual return false;
775480280dSAnshuman Khandual }
78a8a733b2SAnshuman Khandual return true;
79a8a733b2SAnshuman Khandual }
805480280dSAnshuman Khandual #endif
815480280dSAnshuman Khandual
/*
 * Work out how many entries form the contiguous range @ptep belongs to,
 * and how much each of those entries maps.
 *
 * The tables of @mm are walked down to the PMD entry covering @addr. When
 * that entry is @ptep itself, the range is made of PMD entries: *@pgsize
 * is set to PMD_SIZE and CONT_PMDS is returned. Otherwise *@pgsize is set
 * to PAGE_SIZE and CONT_PTES is returned.
 */
static int find_num_contig(struct mm_struct *mm, unsigned long addr,
			   pte_t *ptep, size_t *pgsize)
{
	pgd_t *pgd_entry = pgd_offset(mm, addr);
	p4d_t *p4d_entry = p4d_offset(pgd_entry, addr);
	pud_t *pud_entry = pud_offset(p4d_entry, addr);
	pmd_t *pmd_entry = pmd_offset(pud_entry, addr);

	if (ptep != (pte_t *)pmd_entry) {
		*pgsize = PAGE_SIZE;
		return CONT_PTES;
	}

	*pgsize = PMD_SIZE;
	return CONT_PMDS;
}
10066b3923aSDavid Woods
/*
 * Translate a huge page @size into the number of table entries used to
 * map it (the return value) and the size mapped by each entry (*@pgsize).
 *
 *   CONT_PMD_SIZE -> CONT_PMDS entries of PMD_SIZE
 *   CONT_PTE_SIZE -> CONT_PTES entries of PAGE_SIZE
 *   anything else -> 1 entry of @size, with a WARN_ON() if
 *                    __hugetlb_valid_size() rejects @size
 */
static inline int num_contig_ptes(unsigned long size, size_t *pgsize)
{
	if (size == CONT_PMD_SIZE) {
		*pgsize = PMD_SIZE;
		return CONT_PMDS;
	}

	if (size == CONT_PTE_SIZE) {
		*pgsize = PAGE_SIZE;
		return CONT_PTES;
	}

	/* Not a contiguous size: a single entry covers all of it. */
	*pgsize = size;
	WARN_ON(!__hugetlb_valid_size(size));
	return 1;
}
122c3e4ed5cSPunit Agrawal
/*
 * Read the huge pte at @ptep.
 *
 * An entry that is not present, or does not have the contiguous bit set,
 * is returned exactly as read. For a present contiguous entry, every entry
 * of the range reported by find_num_contig() is read and the returned
 * value (based on the first entry) is marked dirty and/or young if any
 * entry in the range is.
 */
pte_t huge_ptep_get(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
{
	pte_t result = __ptep_get(ptep);
	size_t entry_size;
	int nr, idx;

	if (!(pte_present(result) && pte_cont(result)))
		return result;

	nr = find_num_contig(mm, addr, ptep, &entry_size);
	for (idx = 0; idx < nr; idx++) {
		pte_t cur = __ptep_get(ptep + idx);

		if (pte_dirty(cur))
			result = pte_mkdirty(result);

		if (pte_young(cur))
			result = pte_mkyoung(result);
	}

	return result;
}
144bc5dfb4fSBaolin Wang
145d8bdcff2SSteve Capper /*
146d8bdcff2SSteve Capper * Changing some bits of contiguous entries requires us to follow a
147d8bdcff2SSteve Capper * Break-Before-Make approach, breaking the whole contiguous set
148d8bdcff2SSteve Capper * before we can change any entries. See ARM DDI 0487A.k_iss10775,
149d8bdcff2SSteve Capper * "Misprogramming of the Contiguous bit", page D4-1762.
150d8bdcff2SSteve Capper *
151d8bdcff2SSteve Capper * This helper performs the break step.
152d8bdcff2SSteve Capper */
get_clear_contig(struct mm_struct * mm,unsigned long addr,pte_t * ptep,unsigned long pgsize,unsigned long ncontig)153fb396bb4SAnshuman Khandual static pte_t get_clear_contig(struct mm_struct *mm,
154d8bdcff2SSteve Capper unsigned long addr,
155d8bdcff2SSteve Capper pte_t *ptep,
156d8bdcff2SSteve Capper unsigned long pgsize,
157d8bdcff2SSteve Capper unsigned long ncontig)
158d8bdcff2SSteve Capper {
15949c87f76SRyan Roberts pte_t pte, tmp_pte;
16049c87f76SRyan Roberts bool present;
161d8bdcff2SSteve Capper
162a899b7d0SRyan Roberts pte = __ptep_get_and_clear_anysz(mm, ptep, pgsize);
16349c87f76SRyan Roberts present = pte_present(pte);
16449c87f76SRyan Roberts while (--ncontig) {
16549c87f76SRyan Roberts ptep++;
166a899b7d0SRyan Roberts tmp_pte = __ptep_get_and_clear_anysz(mm, ptep, pgsize);
16749c87f76SRyan Roberts if (present) {
16849c87f76SRyan Roberts if (pte_dirty(tmp_pte))
16949c87f76SRyan Roberts pte = pte_mkdirty(pte);
17049c87f76SRyan Roberts if (pte_young(tmp_pte))
17149c87f76SRyan Roberts pte = pte_mkyoung(pte);
172d8bdcff2SSteve Capper }
17349c87f76SRyan Roberts }
17449c87f76SRyan Roberts return pte;
175d8bdcff2SSteve Capper }
176d8bdcff2SSteve Capper
/*
 * Clear @ncontig entries of @pgsize starting at @ptep with
 * get_clear_contig(), then call __flush_hugetlb_tlb_range() on
 * [@addr, @addr + @pgsize * @ncontig).
 *
 * Returns the value produced by get_clear_contig().
 */
static pte_t get_clear_contig_flush(struct mm_struct *mm,
				    unsigned long addr,
				    pte_t *ptep,
				    unsigned long pgsize,
				    unsigned long ncontig)
{
	struct vm_area_struct vma = TLB_FLUSH_VMA(mm, 0);
	const unsigned long range_end = addr + (ncontig * pgsize);
	pte_t old_pte;

	old_pte = get_clear_contig(mm, addr, ptep, pgsize, ncontig);
	__flush_hugetlb_tlb_range(&vma, addr, range_end, pgsize, true);

	return old_pte;
}
19041098230SWill Deacon
191d8bdcff2SSteve Capper /*
192d8bdcff2SSteve Capper * Changing some bits of contiguous entries requires us to follow a
193d8bdcff2SSteve Capper * Break-Before-Make approach, breaking the whole contiguous set
194d8bdcff2SSteve Capper * before we can change any entries. See ARM DDI 0487A.k_iss10775,
195d8bdcff2SSteve Capper * "Misprogramming of the Contiguous bit", page D4-1762.
196d8bdcff2SSteve Capper *
197d8bdcff2SSteve Capper * This helper performs the break step for use cases where the
198d8bdcff2SSteve Capper * original pte is not needed.
199d8bdcff2SSteve Capper */
clear_flush(struct mm_struct * mm,unsigned long addr,pte_t * ptep,unsigned long pgsize,unsigned long ncontig)200d8bdcff2SSteve Capper static void clear_flush(struct mm_struct *mm,
201d8bdcff2SSteve Capper unsigned long addr,
202d8bdcff2SSteve Capper pte_t *ptep,
203d8bdcff2SSteve Capper unsigned long pgsize,
204d8bdcff2SSteve Capper unsigned long ncontig)
205d8bdcff2SSteve Capper {
2068b11ec1bSLinus Torvalds struct vm_area_struct vma = TLB_FLUSH_VMA(mm, 0);
207d8bdcff2SSteve Capper unsigned long i, saddr = addr;
208d8bdcff2SSteve Capper
209d8bdcff2SSteve Capper for (i = 0; i < ncontig; i++, addr += pgsize, ptep++)
210a899b7d0SRyan Roberts __ptep_get_and_clear_anysz(mm, ptep, pgsize);
211d8bdcff2SSteve Capper
212*06fc959fSRyan Roberts if (mm == &init_mm)
213*06fc959fSRyan Roberts flush_tlb_kernel_range(saddr, addr);
214*06fc959fSRyan Roberts else
2155b3f8917SRyan Roberts __flush_hugetlb_tlb_range(&vma, saddr, addr, pgsize, true);
216d8bdcff2SSteve Capper }
217d8bdcff2SSteve Capper
/*
 * Install the huge pte @pte for a huge page of size @sz at @ptep.
 *
 * num_contig_ptes() gives the number of entries and the per-entry size.
 * A non-present @pte is written, unchanged, into each entry one at a
 * time. A present @pte is written with a single __set_ptes_anysz() call
 * covering all entries; if @pte has the contiguous bit set and the entry
 * currently at @ptep is valid, the old entries are first cleared and
 * flushed with clear_flush().
 */
void set_huge_pte_at(struct mm_struct *mm, unsigned long addr,
		     pte_t *ptep, pte_t pte, unsigned long sz)
{
	size_t entry_size;
	int nr = num_contig_ptes(sz, &entry_size);
	int left;

	if (pte_present(pte)) {
		/* Only need to "break" if transitioning valid -> valid. */
		if (pte_cont(pte) && pte_valid(__ptep_get(ptep)))
			clear_flush(mm, addr, ptep, entry_size, nr);

		__set_ptes_anysz(mm, ptep, pte, nr, entry_size);
		return;
	}

	for (left = nr; left > 0; left--, ptep++)
		__set_ptes_anysz(mm, ptep, pte, 1, entry_size);
}
23966b3923aSDavid Woods
huge_pte_alloc(struct mm_struct * mm,struct vm_area_struct * vma,unsigned long addr,unsigned long sz)240aec44e0fSPeter Xu pte_t *huge_pte_alloc(struct mm_struct *mm, struct vm_area_struct *vma,
24166b3923aSDavid Woods unsigned long addr, unsigned long sz)
24266b3923aSDavid Woods {
24320a004e7SWill Deacon pgd_t *pgdp;
244e9f63768SMike Rapoport p4d_t *p4dp;
24520a004e7SWill Deacon pud_t *pudp;
24620a004e7SWill Deacon pmd_t *pmdp;
24720a004e7SWill Deacon pte_t *ptep = NULL;
24866b3923aSDavid Woods
24920a004e7SWill Deacon pgdp = pgd_offset(mm, addr);
250015a12a4SAnshuman Khandual p4dp = p4d_alloc(mm, pgdp, addr);
251015a12a4SAnshuman Khandual if (!p4dp)
252015a12a4SAnshuman Khandual return NULL;
253015a12a4SAnshuman Khandual
254e9f63768SMike Rapoport pudp = pud_alloc(mm, p4dp, addr);
25520a004e7SWill Deacon if (!pudp)
25666b3923aSDavid Woods return NULL;
25766b3923aSDavid Woods
25866b3923aSDavid Woods if (sz == PUD_SIZE) {
25920a004e7SWill Deacon ptep = (pte_t *)pudp;
260441a6278SAnshuman Khandual } else if (sz == (CONT_PTE_SIZE)) {
26120a004e7SWill Deacon pmdp = pmd_alloc(mm, pudp, addr);
262027d0c71SMark Rutland if (!pmdp)
263027d0c71SMark Rutland return NULL;
26466b3923aSDavid Woods
26566b3923aSDavid Woods WARN_ON(addr & (sz - 1));
266cafcb9caSHugh Dickins ptep = pte_alloc_huge(mm, pmdp, addr);
26766b3923aSDavid Woods } else if (sz == PMD_SIZE) {
268c1991e07SPeter Xu if (want_pmd_share(vma, addr) && pud_none(READ_ONCE(*pudp)))
269aec44e0fSPeter Xu ptep = huge_pmd_share(mm, vma, addr, pudp);
27066b3923aSDavid Woods else
27120a004e7SWill Deacon ptep = (pte_t *)pmd_alloc(mm, pudp, addr);
272441a6278SAnshuman Khandual } else if (sz == (CONT_PMD_SIZE)) {
27320a004e7SWill Deacon pmdp = pmd_alloc(mm, pudp, addr);
27466b3923aSDavid Woods WARN_ON(addr & (sz - 1));
27520a004e7SWill Deacon return (pte_t *)pmdp;
27666b3923aSDavid Woods }
27766b3923aSDavid Woods
27820a004e7SWill Deacon return ptep;
27966b3923aSDavid Woods }
28066b3923aSDavid Woods
huge_pte_offset(struct mm_struct * mm,unsigned long addr,unsigned long sz)2817868a208SPunit Agrawal pte_t *huge_pte_offset(struct mm_struct *mm,
2827868a208SPunit Agrawal unsigned long addr, unsigned long sz)
28366b3923aSDavid Woods {
28420a004e7SWill Deacon pgd_t *pgdp;
285e9f63768SMike Rapoport p4d_t *p4dp;
28620a004e7SWill Deacon pud_t *pudp, pud;
28720a004e7SWill Deacon pmd_t *pmdp, pmd;
28866b3923aSDavid Woods
28920a004e7SWill Deacon pgdp = pgd_offset(mm, addr);
29020a004e7SWill Deacon if (!pgd_present(READ_ONCE(*pgdp)))
29166b3923aSDavid Woods return NULL;
292f02ab08aSPunit Agrawal
293e9f63768SMike Rapoport p4dp = p4d_offset(pgdp, addr);
294e9f63768SMike Rapoport if (!p4d_present(READ_ONCE(*p4dp)))
295e9f63768SMike Rapoport return NULL;
296e9f63768SMike Rapoport
297e9f63768SMike Rapoport pudp = pud_offset(p4dp, addr);
29820a004e7SWill Deacon pud = READ_ONCE(*pudp);
29920a004e7SWill Deacon if (sz != PUD_SIZE && pud_none(pud))
30066b3923aSDavid Woods return NULL;
30130f3ac00SPunit Agrawal /* hugepage or swap? */
3021965e933SPeter Xu if (pud_leaf(pud) || !pud_present(pud))
30320a004e7SWill Deacon return (pte_t *)pudp;
304f02ab08aSPunit Agrawal /* table; check the next level */
30566b3923aSDavid Woods
30630f3ac00SPunit Agrawal if (sz == CONT_PMD_SIZE)
30730f3ac00SPunit Agrawal addr &= CONT_PMD_MASK;
30830f3ac00SPunit Agrawal
30920a004e7SWill Deacon pmdp = pmd_offset(pudp, addr);
31020a004e7SWill Deacon pmd = READ_ONCE(*pmdp);
31130f3ac00SPunit Agrawal if (!(sz == PMD_SIZE || sz == CONT_PMD_SIZE) &&
31220a004e7SWill Deacon pmd_none(pmd))
313f02ab08aSPunit Agrawal return NULL;
3141965e933SPeter Xu if (pmd_leaf(pmd) || !pmd_present(pmd))
31520a004e7SWill Deacon return (pte_t *)pmdp;
316f02ab08aSPunit Agrawal
31720a004e7SWill Deacon if (sz == CONT_PTE_SIZE)
318cafcb9caSHugh Dickins return pte_offset_huge(pmdp, (addr & CONT_PTE_MASK));
31930f3ac00SPunit Agrawal
32066b3923aSDavid Woods return NULL;
32166b3923aSDavid Woods }
32266b3923aSDavid Woods
hugetlb_mask_last_page(struct hstate * h)3231bcdb769SBaolin Wang unsigned long hugetlb_mask_last_page(struct hstate *h)
3241bcdb769SBaolin Wang {
3251bcdb769SBaolin Wang unsigned long hp_size = huge_page_size(h);
3261bcdb769SBaolin Wang
3271bcdb769SBaolin Wang switch (hp_size) {
3281bcdb769SBaolin Wang #ifndef __PAGETABLE_PMD_FOLDED
3291bcdb769SBaolin Wang case PUD_SIZE:
33034e8e63aSAnshuman Khandual if (pud_sect_supported())
3311bcdb769SBaolin Wang return PGDIR_SIZE - PUD_SIZE;
33234e8e63aSAnshuman Khandual break;
3331bcdb769SBaolin Wang #endif
3341bcdb769SBaolin Wang case CONT_PMD_SIZE:
3351bcdb769SBaolin Wang return PUD_SIZE - CONT_PMD_SIZE;
3361bcdb769SBaolin Wang case PMD_SIZE:
3371bcdb769SBaolin Wang return PUD_SIZE - PMD_SIZE;
3381bcdb769SBaolin Wang case CONT_PTE_SIZE:
3391bcdb769SBaolin Wang return PMD_SIZE - CONT_PTE_SIZE;
3401bcdb769SBaolin Wang default:
3411bcdb769SBaolin Wang break;
3421bcdb769SBaolin Wang }
3431bcdb769SBaolin Wang
3441bcdb769SBaolin Wang return 0UL;
3451bcdb769SBaolin Wang }
3461bcdb769SBaolin Wang
/*
 * Turn @entry into a huge page entry for a page of size 1UL << @shift.
 *
 *   PUD_SIZE      - marked huge at pud level (only when the PMD level is
 *                   not folded and pud_sect_supported() returns true)
 *   CONT_PMD_SIZE - marked contiguous and huge at pmd level
 *   PMD_SIZE      - marked huge at pmd level
 *   CONT_PTE_SIZE - marked contiguous
 *
 * For any other size a warning is logged and @entry is returned
 * unchanged. @flags is not used.
 */
pte_t arch_make_huge_pte(pte_t entry, unsigned int shift, vm_flags_t flags)
{
	/*
	 * unsigned long rather than size_t: the value is built from 1UL and
	 * is printed with "%lx" below, so keep the type and the format
	 * specifier in agreement.
	 */
	unsigned long pagesize = 1UL << shift;

	switch (pagesize) {
#ifndef __PAGETABLE_PMD_FOLDED
	case PUD_SIZE:
		if (pud_sect_supported())
			return pud_pte(pud_mkhuge(pte_pud(entry)));
		break;
#endif
	case CONT_PMD_SIZE:
		return pmd_pte(pmd_mkhuge(pmd_mkcont(pte_pmd(entry))));
	case PMD_SIZE:
		return pmd_pte(pmd_mkhuge(pte_pmd(entry)));
	case CONT_PTE_SIZE:
		return pte_mkcont(entry);
	default:
		break;
	}

	pr_warn("%s: unrecognized huge page size 0x%lx\n",
		__func__, pagesize);
	return entry;
}
37166b3923aSDavid Woods
/*
 * Clear every table entry backing the huge page of size @sz whose first
 * entry is @ptep, calling __pte_clear() once per entry with @addr advanced
 * by the per-entry size each time.
 */
void huge_pte_clear(struct mm_struct *mm, unsigned long addr,
		    pte_t *ptep, unsigned long sz)
{
	size_t entry_size;
	int left = num_contig_ptes(sz, &entry_size);

	while (left-- > 0) {
		__pte_clear(mm, addr, ptep);
		addr += entry_size;
		ptep++;
	}
}
383c3e4ed5cSPunit Agrawal
/*
 * Clear all entries backing the huge page of size @sz at @ptep and return
 * the value computed by get_clear_contig(). No TLB flush is issued by this
 * function itself.
 */
pte_t huge_ptep_get_and_clear(struct mm_struct *mm, unsigned long addr,
			      pte_t *ptep, unsigned long sz)
{
	size_t entry_size;
	int nr = num_contig_ptes(sz, &entry_size);

	return get_clear_contig(mm, addr, ptep, entry_size, nr);
}
39366b3923aSDavid Woods
394031e6e6bSSteve Capper /*
395031e6e6bSSteve Capper * huge_ptep_set_access_flags will update access flags (dirty, accesssed)
396031e6e6bSSteve Capper * and write permission.
397031e6e6bSSteve Capper *
398031e6e6bSSteve Capper * For a contiguous huge pte range we need to check whether or not write
399031e6e6bSSteve Capper * permission has to change only on the first pte in the set. Then for
400031e6e6bSSteve Capper * all the contiguous ptes we need to check whether or not there is a
401031e6e6bSSteve Capper * discrepancy between dirty or young.
402031e6e6bSSteve Capper */
__cont_access_flags_changed(pte_t * ptep,pte_t pte,int ncontig)403031e6e6bSSteve Capper static int __cont_access_flags_changed(pte_t *ptep, pte_t pte, int ncontig)
404031e6e6bSSteve Capper {
405031e6e6bSSteve Capper int i;
406031e6e6bSSteve Capper
4075a00bfd6SRyan Roberts if (pte_write(pte) != pte_write(__ptep_get(ptep)))
408031e6e6bSSteve Capper return 1;
409031e6e6bSSteve Capper
410031e6e6bSSteve Capper for (i = 0; i < ncontig; i++) {
4115a00bfd6SRyan Roberts pte_t orig_pte = __ptep_get(ptep + i);
412031e6e6bSSteve Capper
413031e6e6bSSteve Capper if (pte_dirty(pte) != pte_dirty(orig_pte))
414031e6e6bSSteve Capper return 1;
415031e6e6bSSteve Capper
416031e6e6bSSteve Capper if (pte_young(pte) != pte_young(orig_pte))
417031e6e6bSSteve Capper return 1;
418031e6e6bSSteve Capper }
419031e6e6bSSteve Capper
420031e6e6bSSteve Capper return 0;
421031e6e6bSSteve Capper }
422031e6e6bSSteve Capper
/*
 * Update the access flags / write permission of the huge pte at @ptep to
 * those of @pte.
 *
 * A @pte without the contiguous bit is handed straight to
 * __ptep_set_access_flags(). For a contiguous @pte, nothing is done (and 0
 * is returned) when __cont_access_flags_changed() finds no difference.
 * Otherwise the whole range is cleared and flushed, any dirty/young state
 * collected from the old entries is carried over into @pte, the range is
 * rewritten and 1 is returned.
 */
int huge_ptep_set_access_flags(struct vm_area_struct *vma,
			       unsigned long addr, pte_t *ptep,
			       pte_t pte, int dirty)
{
	struct mm_struct *mm = vma->vm_mm;
	size_t entry_size = 0;
	pte_t old_pte;
	int nr;

	VM_WARN_ON(!pte_present(pte));

	if (!pte_cont(pte))
		return __ptep_set_access_flags(vma, addr, ptep, pte, dirty);

	nr = num_contig_ptes(huge_page_size(hstate_vma(vma)), &entry_size);
	if (!__cont_access_flags_changed(ptep, pte, nr))
		return 0;

	old_pte = get_clear_contig_flush(mm, addr, ptep, entry_size, nr);
	VM_WARN_ON(!pte_present(old_pte));

	/* Make sure we don't lose the dirty or young state */
	if (pte_dirty(old_pte))
		pte = pte_mkdirty(pte);
	if (pte_young(old_pte))
		pte = pte_mkyoung(pte);

	__set_ptes_anysz(mm, ptep, pte, nr, entry_size);

	return 1;
}
45566b3923aSDavid Woods
/*
 * Write-protect the huge pte at @ptep.
 *
 * A non-contiguous entry is handled by __ptep_set_wrprotect(). For a
 * contiguous entry the whole range reported by find_num_contig() is
 * cleared and flushed, and the value obtained from that is write-protected
 * and written back over the range.
 */
void huge_ptep_set_wrprotect(struct mm_struct *mm,
			     unsigned long addr, pte_t *ptep)
{
	pte_t cur = __ptep_get(ptep);
	size_t entry_size;
	int nr;

	VM_WARN_ON(!pte_present(cur));

	if (pte_cont(cur)) {
		nr = find_num_contig(mm, addr, ptep, &entry_size);

		cur = get_clear_contig_flush(mm, addr, ptep, entry_size, nr);
		cur = pte_wrprotect(cur);

		__set_ptes_anysz(mm, ptep, cur, nr, entry_size);
		return;
	}

	__ptep_set_wrprotect(mm, addr, ptep);
}
47866b3923aSDavid Woods
/*
 * Clear and flush all entries backing the huge page at @ptep, using the
 * huge page size of @vma's hstate to find how many entries there are.
 *
 * Returns the value produced by get_clear_contig_flush().
 */
pte_t huge_ptep_clear_flush(struct vm_area_struct *vma,
			    unsigned long addr, pte_t *ptep)
{
	size_t entry_size;
	int nr = num_contig_ptes(huge_page_size(hstate_vma(vma)), &entry_size);

	return get_clear_contig_flush(vma->vm_mm, addr, ptep, entry_size, nr);
}
48966b3923aSDavid Woods
hugetlbpage_init(void)490a21b0b78SAllen Pais static int __init hugetlbpage_init(void)
491a21b0b78SAllen Pais {
4921e5823c8SAnshuman Khandual /*
4931e5823c8SAnshuman Khandual * HugeTLB pages are supported on maximum four page table
4941e5823c8SAnshuman Khandual * levels (PUD, CONT PMD, PMD, CONT PTE) for a given base
4951e5823c8SAnshuman Khandual * page size, corresponding to hugetlb_add_hstate() calls
4961e5823c8SAnshuman Khandual * here.
4971e5823c8SAnshuman Khandual *
4981e5823c8SAnshuman Khandual * HUGE_MAX_HSTATE should at least match maximum supported
4991e5823c8SAnshuman Khandual * HugeTLB page sizes on the platform. Any new addition to
5001e5823c8SAnshuman Khandual * supported HugeTLB page sizes will also require changing
5011e5823c8SAnshuman Khandual * HUGE_MAX_HSTATE as well.
5021e5823c8SAnshuman Khandual */
5031e5823c8SAnshuman Khandual BUILD_BUG_ON(HUGE_MAX_HSTATE < 4);
504f8b46c4bSAnshuman Khandual if (pud_sect_supported())
50538237830SMike Kravetz hugetlb_add_hstate(PUD_SHIFT - PAGE_SHIFT);
506f8b46c4bSAnshuman Khandual
507a1634a54SGavin Shan hugetlb_add_hstate(CONT_PMD_SHIFT - PAGE_SHIFT);
50838237830SMike Kravetz hugetlb_add_hstate(PMD_SHIFT - PAGE_SHIFT);
509a1634a54SGavin Shan hugetlb_add_hstate(CONT_PTE_SHIFT - PAGE_SHIFT);
510a21b0b78SAllen Pais
511a21b0b78SAllen Pais return 0;
512a21b0b78SAllen Pais }
513a21b0b78SAllen Pais arch_initcall(hugetlbpage_init);
514a21b0b78SAllen Pais
arch_hugetlb_valid_size(unsigned long size)515ae94da89SMike Kravetz bool __init arch_hugetlb_valid_size(unsigned long size)
516084bd298SSteve Capper {
517a8a733b2SAnshuman Khandual return __hugetlb_valid_size(size);
518ae94da89SMike Kravetz }
5195db568e7SAnshuman Khandual
/*
 * First half of a protection change on the huge pte at @ptep: clear the
 * entries and return the old value.
 *
 * Normally this is huge_ptep_get_and_clear(). When the
 * ARM64_WORKAROUND_2645198 capability is set and the current entry is user
 * executable, huge_ptep_clear_flush() is used instead.
 */
pte_t huge_ptep_modify_prot_start(struct vm_area_struct *vma, unsigned long addr, pte_t *ptep)
{
	/*
	 * Break-before-make (BBM) is required for all user space mappings
	 * when the permission changes from executable to non-executable
	 * in cases where cpu is affected with errata #2645198.
	 */
	if (alternative_has_cap_unlikely(ARM64_WORKAROUND_2645198) &&
	    pte_user_exec(__ptep_get(ptep)))
		return huge_ptep_clear_flush(vma, addr, ptep);

	return huge_ptep_get_and_clear(vma->vm_mm, addr, ptep,
				       huge_page_size(hstate_vma(vma)));
}
5355db568e7SAnshuman Khandual
/*
 * Second half of a protection change: install @pte at @ptep with
 * set_huge_pte_at(), using the huge page size of @vma's hstate.
 * @old_pte is not used.
 */
void huge_ptep_modify_prot_commit(struct vm_area_struct *vma, unsigned long addr, pte_t *ptep,
				  pte_t old_pte, pte_t pte)
{
	struct hstate *h = hstate_vma(vma);

	set_huge_pte_at(vma->vm_mm, addr, ptep, pte, huge_page_size(h));
}
543