Greg Kroah-Hartman | b244131 | 2017-11-01 15:07:57 +0100 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 2 | /* |
| 3 | * mm/pgtable-generic.c |
| 4 | * |
Mike Rapoport | ca5999f | 2020-06-08 21:32:38 -0700 | [diff] [blame] | 5 | * Generic pgtable methods declared in linux/pgtable.h |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 6 | * |
| 7 | * Copyright (C) 2010 Linus Torvalds |
| 8 | */ |
| 9 | |
Andrew Morton | f95ba94 | 2011-01-25 15:07:11 -0800 | [diff] [blame] | 10 | #include <linux/pagemap.h> |
Peter Zijlstra | a31acd3 | 2018-08-26 12:56:48 +0200 | [diff] [blame] | 11 | #include <linux/hugetlb.h> |
Mike Rapoport | ca5999f | 2020-06-08 21:32:38 -0700 | [diff] [blame] | 12 | #include <linux/pgtable.h> |
Arnd Bergmann | 36090de | 2022-01-14 14:06:10 -0800 | [diff] [blame] | 13 | #include <linux/mm_inline.h> |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 14 | #include <asm/tlb.h> |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 15 | |
Joonsoo Kim | bc4b444 | 2013-09-11 14:21:28 -0700 | [diff] [blame] | 16 | /* |
| 17 | * If a p?d_bad entry is found while walking page tables, report |
| 18 | * the error, before resetting entry to p?d_none. Usually (but |
| 19 | * very seldom) called out from the p?d_none_or_clear_bad macros. |
| 20 | */ |
| 21 | |
| 22 | void pgd_clear_bad(pgd_t *pgd) |
| 23 | { |
| 24 | pgd_ERROR(*pgd); |
| 25 | pgd_clear(pgd); |
| 26 | } |
| 27 | |
Vineet Gupta | f2400ab | 2019-11-30 17:51:20 -0800 | [diff] [blame] | 28 | #ifndef __PAGETABLE_P4D_FOLDED |
Kirill A. Shutemov | c2febaf | 2017-03-09 17:24:07 +0300 | [diff] [blame] | 29 | void p4d_clear_bad(p4d_t *p4d) |
| 30 | { |
| 31 | p4d_ERROR(*p4d); |
| 32 | p4d_clear(p4d); |
| 33 | } |
Vineet Gupta | f2400ab | 2019-11-30 17:51:20 -0800 | [diff] [blame] | 34 | #endif |
Kirill A. Shutemov | c2febaf | 2017-03-09 17:24:07 +0300 | [diff] [blame] | 35 | |
Vineet Gupta | f2400ab | 2019-11-30 17:51:20 -0800 | [diff] [blame] | 36 | #ifndef __PAGETABLE_PUD_FOLDED |
Joonsoo Kim | bc4b444 | 2013-09-11 14:21:28 -0700 | [diff] [blame] | 37 | void pud_clear_bad(pud_t *pud) |
| 38 | { |
| 39 | pud_ERROR(*pud); |
| 40 | pud_clear(pud); |
| 41 | } |
Vineet Gupta | f2400ab | 2019-11-30 17:51:20 -0800 | [diff] [blame] | 42 | #endif |
Joonsoo Kim | bc4b444 | 2013-09-11 14:21:28 -0700 | [diff] [blame] | 43 | |
Vineet Gupta | f2400ab | 2019-11-30 17:51:20 -0800 | [diff] [blame] | 44 | /* |
| 45 | * Note that the pmd variant below can't be stub'ed out just as for p4d/pud |
| 46 | * above. pmd folding is special and typically pmd_* macros refer to upper |
| 47 | * level even when folded |
| 48 | */ |
Joonsoo Kim | bc4b444 | 2013-09-11 14:21:28 -0700 | [diff] [blame] | 49 | void pmd_clear_bad(pmd_t *pmd) |
| 50 | { |
| 51 | pmd_ERROR(*pmd); |
| 52 | pmd_clear(pmd); |
| 53 | } |
| 54 | |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 55 | #ifndef __HAVE_ARCH_PTEP_SET_ACCESS_FLAGS |
| 56 | /* |
Mike Rapoport | ca5999f | 2020-06-08 21:32:38 -0700 | [diff] [blame] | 57 | * Only sets the access flags (dirty, accessed), as well as write |
Rik van Riel | cef23d9 | 2012-11-06 09:56:01 +0000 | [diff] [blame] | 58 | * permission. Furthermore, we know it always gets set to a "more |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 59 | * permissive" setting, which allows most architectures to optimize |
| 60 | * this. We return whether the PTE actually changed, which in turn |
| 61 | * instructs the caller to do things like update__mmu_cache. This |
| 62 | * used to be done in the caller, but sparc needs minor faults to |
| 63 | * force that call on sun4c so we changed this macro slightly |
| 64 | */ |
| 65 | int ptep_set_access_flags(struct vm_area_struct *vma, |
| 66 | unsigned long address, pte_t *ptep, |
| 67 | pte_t entry, int dirty) |
| 68 | { |
| 69 | int changed = !pte_same(*ptep, entry); |
| 70 | if (changed) { |
| 71 | set_pte_at(vma->vm_mm, address, ptep, entry); |
Rik van Riel | cef23d9 | 2012-11-06 09:56:01 +0000 | [diff] [blame] | 72 | flush_tlb_fix_spurious_fault(vma, address); |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 73 | } |
| 74 | return changed; |
| 75 | } |
| 76 | #endif |
| 77 | |
Vineet Gupta | 52585bc | 2015-07-09 17:19:30 +0530 | [diff] [blame] | 78 | #ifndef __HAVE_ARCH_PTEP_CLEAR_YOUNG_FLUSH |
| 79 | int ptep_clear_flush_young(struct vm_area_struct *vma, |
| 80 | unsigned long address, pte_t *ptep) |
| 81 | { |
| 82 | int young; |
| 83 | young = ptep_test_and_clear_young(vma, address, ptep); |
| 84 | if (young) |
| 85 | flush_tlb_page(vma, address); |
| 86 | return young; |
| 87 | } |
| 88 | #endif |
| 89 | |
| 90 | #ifndef __HAVE_ARCH_PTEP_CLEAR_FLUSH |
| 91 | pte_t ptep_clear_flush(struct vm_area_struct *vma, unsigned long address, |
| 92 | pte_t *ptep) |
| 93 | { |
| 94 | struct mm_struct *mm = (vma)->vm_mm; |
| 95 | pte_t pte; |
| 96 | pte = ptep_get_and_clear(mm, address, ptep); |
| 97 | if (pte_accessible(mm, pte)) |
| 98 | flush_tlb_page(vma, address); |
| 99 | return pte; |
| 100 | } |
| 101 | #endif |
| 102 | |
Vineet Gupta | bd5e88a | 2015-07-09 17:22:44 +0530 | [diff] [blame] | 103 | #ifdef CONFIG_TRANSPARENT_HUGEPAGE |
| 104 | |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 105 | #ifndef __HAVE_ARCH_PMDP_SET_ACCESS_FLAGS |
| 106 | int pmdp_set_access_flags(struct vm_area_struct *vma, |
| 107 | unsigned long address, pmd_t *pmdp, |
| 108 | pmd_t entry, int dirty) |
| 109 | { |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 110 | int changed = !pmd_same(*pmdp, entry); |
| 111 | VM_BUG_ON(address & ~HPAGE_PMD_MASK); |
| 112 | if (changed) { |
| 113 | set_pmd_at(vma->vm_mm, address, pmdp, entry); |
Vineet Gupta | 12ebc15 | 2015-02-20 10:36:28 +0530 | [diff] [blame] | 114 | flush_pmd_tlb_range(vma, address, address + HPAGE_PMD_SIZE); |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 115 | } |
| 116 | return changed; |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 117 | } |
| 118 | #endif |
| 119 | |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 120 | #ifndef __HAVE_ARCH_PMDP_CLEAR_YOUNG_FLUSH |
| 121 | int pmdp_clear_flush_young(struct vm_area_struct *vma, |
| 122 | unsigned long address, pmd_t *pmdp) |
| 123 | { |
| 124 | int young; |
Naoya Horiguchi | d8c37c4 | 2012-03-21 16:34:27 -0700 | [diff] [blame] | 125 | VM_BUG_ON(address & ~HPAGE_PMD_MASK); |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 126 | young = pmdp_test_and_clear_young(vma, address, pmdp); |
| 127 | if (young) |
Vineet Gupta | 12ebc15 | 2015-02-20 10:36:28 +0530 | [diff] [blame] | 128 | flush_pmd_tlb_range(vma, address, address + HPAGE_PMD_SIZE); |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 129 | return young; |
| 130 | } |
| 131 | #endif |
| 132 | |
Aneesh Kumar K.V | 8809aa2 | 2015-06-24 16:57:44 -0700 | [diff] [blame] | 133 | #ifndef __HAVE_ARCH_PMDP_HUGE_CLEAR_FLUSH |
Aneesh Kumar K.V | 8809aa2 | 2015-06-24 16:57:44 -0700 | [diff] [blame] | 134 | pmd_t pmdp_huge_clear_flush(struct vm_area_struct *vma, unsigned long address, |
| 135 | pmd_t *pmdp) |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 136 | { |
| 137 | pmd_t pmd; |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 138 | VM_BUG_ON(address & ~HPAGE_PMD_MASK); |
Hugh Dickins | 99fa8a4 | 2021-06-15 18:23:45 -0700 | [diff] [blame] | 139 | VM_BUG_ON(pmd_present(*pmdp) && !pmd_trans_huge(*pmdp) && |
| 140 | !pmd_devmap(*pmdp)); |
Aneesh Kumar K.V | 8809aa2 | 2015-06-24 16:57:44 -0700 | [diff] [blame] | 141 | pmd = pmdp_huge_get_and_clear(vma->vm_mm, address, pmdp); |
Vineet Gupta | 12ebc15 | 2015-02-20 10:36:28 +0530 | [diff] [blame] | 142 | flush_pmd_tlb_range(vma, address, address + HPAGE_PMD_SIZE); |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 143 | return pmd; |
| 144 | } |
Matthew Wilcox | a00cc7d | 2017-02-24 14:57:02 -0800 | [diff] [blame] | 145 | |
| 146 | #ifdef CONFIG_HAVE_ARCH_TRANSPARENT_HUGEPAGE_PUD |
| 147 | pud_t pudp_huge_clear_flush(struct vm_area_struct *vma, unsigned long address, |
| 148 | pud_t *pudp) |
| 149 | { |
| 150 | pud_t pud; |
| 151 | |
| 152 | VM_BUG_ON(address & ~HPAGE_PUD_MASK); |
| 153 | VM_BUG_ON(!pud_trans_huge(*pudp) && !pud_devmap(*pudp)); |
| 154 | pud = pudp_huge_get_and_clear(vma->vm_mm, address, pudp); |
| 155 | flush_pud_tlb_range(vma, address, address + HPAGE_PUD_SIZE); |
| 156 | return pud; |
| 157 | } |
| 158 | #endif |
Andrea Arcangeli | e2cda32 | 2011-01-13 15:46:40 -0800 | [diff] [blame] | 159 | #endif |
| 160 | |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 161 | #ifndef __HAVE_ARCH_PGTABLE_DEPOSIT |
Aneesh Kumar K.V | 6b0b50b | 2013-06-05 17:14:02 -0700 | [diff] [blame] | 162 | void pgtable_trans_huge_deposit(struct mm_struct *mm, pmd_t *pmdp, |
| 163 | pgtable_t pgtable) |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 164 | { |
Kirill A. Shutemov | c4088eb | 2013-11-14 14:31:04 -0800 | [diff] [blame] | 165 | assert_spin_locked(pmd_lockptr(mm, pmdp)); |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 166 | |
| 167 | /* FIFO */ |
Kirill A. Shutemov | c389a25 | 2013-11-14 14:30:59 -0800 | [diff] [blame] | 168 | if (!pmd_huge_pte(mm, pmdp)) |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 169 | INIT_LIST_HEAD(&pgtable->lru); |
| 170 | else |
Kirill A. Shutemov | c389a25 | 2013-11-14 14:30:59 -0800 | [diff] [blame] | 171 | list_add(&pgtable->lru, &pmd_huge_pte(mm, pmdp)->lru); |
| 172 | pmd_huge_pte(mm, pmdp) = pgtable; |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 173 | } |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 174 | #endif |
| 175 | |
| 176 | #ifndef __HAVE_ARCH_PGTABLE_WITHDRAW |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 177 | /* no "address" argument so destroys page coloring of some arch */ |
Aneesh Kumar K.V | 6b0b50b | 2013-06-05 17:14:02 -0700 | [diff] [blame] | 178 | pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm, pmd_t *pmdp) |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 179 | { |
| 180 | pgtable_t pgtable; |
| 181 | |
Kirill A. Shutemov | c4088eb | 2013-11-14 14:31:04 -0800 | [diff] [blame] | 182 | assert_spin_locked(pmd_lockptr(mm, pmdp)); |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 183 | |
| 184 | /* FIFO */ |
Kirill A. Shutemov | c389a25 | 2013-11-14 14:30:59 -0800 | [diff] [blame] | 185 | pgtable = pmd_huge_pte(mm, pmdp); |
Geliang Tang | 1466934 | 2016-01-14 15:19:32 -0800 | [diff] [blame] | 186 | pmd_huge_pte(mm, pmdp) = list_first_entry_or_null(&pgtable->lru, |
| 187 | struct page, lru); |
| 188 | if (pmd_huge_pte(mm, pmdp)) |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 189 | list_del(&pgtable->lru); |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 190 | return pgtable; |
| 191 | } |
Gerald Schaefer | e3ebcf64 | 2012-10-08 16:30:07 -0700 | [diff] [blame] | 192 | #endif |
Gerald Schaefer | 46dcde7 | 2012-10-08 16:30:09 -0700 | [diff] [blame] | 193 | |
| 194 | #ifndef __HAVE_ARCH_PMDP_INVALIDATE |
Kirill A. Shutemov | d52605d | 2018-01-31 16:18:16 -0800 | [diff] [blame] | 195 | pmd_t pmdp_invalidate(struct vm_area_struct *vma, unsigned long address, |
Gerald Schaefer | 46dcde7 | 2012-10-08 16:30:09 -0700 | [diff] [blame] | 196 | pmd_t *pmdp) |
| 197 | { |
Anshuman Khandual | 86ec2da | 2020-06-03 16:03:45 -0700 | [diff] [blame] | 198 | pmd_t old = pmdp_establish(vma, address, pmdp, pmd_mkinvalid(*pmdp)); |
Vineet Gupta | 12ebc15 | 2015-02-20 10:36:28 +0530 | [diff] [blame] | 199 | flush_pmd_tlb_range(vma, address, address + HPAGE_PMD_SIZE); |
Kirill A. Shutemov | d52605d | 2018-01-31 16:18:16 -0800 | [diff] [blame] | 200 | return old; |
Gerald Schaefer | 46dcde7 | 2012-10-08 16:30:09 -0700 | [diff] [blame] | 201 | } |
Gerald Schaefer | 46dcde7 | 2012-10-08 16:30:09 -0700 | [diff] [blame] | 202 | #endif |
Aneesh Kumar K.V | f28b6ff | 2015-06-24 16:57:42 -0700 | [diff] [blame] | 203 | |
| 204 | #ifndef pmdp_collapse_flush |
Aneesh Kumar K.V | f28b6ff | 2015-06-24 16:57:42 -0700 | [diff] [blame] | 205 | pmd_t pmdp_collapse_flush(struct vm_area_struct *vma, unsigned long address, |
| 206 | pmd_t *pmdp) |
| 207 | { |
Aneesh Kumar K.V | 8809aa2 | 2015-06-24 16:57:44 -0700 | [diff] [blame] | 208 | /* |
| 209 | * pmd and hugepage pte format are same. So we could |
| 210 | * use the same function. |
| 211 | */ |
Aneesh Kumar K.V | f28b6ff | 2015-06-24 16:57:42 -0700 | [diff] [blame] | 212 | pmd_t pmd; |
| 213 | |
| 214 | VM_BUG_ON(address & ~HPAGE_PMD_MASK); |
| 215 | VM_BUG_ON(pmd_trans_huge(*pmdp)); |
Aneesh Kumar K.V | 8809aa2 | 2015-06-24 16:57:44 -0700 | [diff] [blame] | 216 | pmd = pmdp_huge_get_and_clear(vma->vm_mm, address, pmdp); |
Vineet Gupta | 6a6ac72 | 2016-02-11 16:13:09 -0800 | [diff] [blame] | 217 | |
| 218 | /* collapse entails shooting down ptes not pmd */ |
| 219 | flush_tlb_range(vma, address, address + HPAGE_PMD_SIZE); |
Aneesh Kumar K.V | f28b6ff | 2015-06-24 16:57:42 -0700 | [diff] [blame] | 220 | return pmd; |
| 221 | } |
Aneesh Kumar K.V | f28b6ff | 2015-06-24 16:57:42 -0700 | [diff] [blame] | 222 | #endif |
Vineet Gupta | bd5e88a | 2015-07-09 17:22:44 +0530 | [diff] [blame] | 223 | #endif /* CONFIG_TRANSPARENT_HUGEPAGE */ |