Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 1 | /* |
| 2 | * MMU context allocation for 64-bit kernels. |
| 3 | * |
| 4 | * Copyright (C) 2004 Anton Blanchard, IBM Corp. <anton@samba.org> |
| 5 | * |
| 6 | * This program is free software; you can redistribute it and/or |
| 7 | * modify it under the terms of the GNU General Public License |
| 8 | * as published by the Free Software Foundation; either version |
| 9 | * 2 of the License, or (at your option) any later version. |
| 10 | * |
| 11 | */ |
| 12 | |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 13 | #include <linux/sched.h> |
| 14 | #include <linux/kernel.h> |
| 15 | #include <linux/errno.h> |
| 16 | #include <linux/string.h> |
| 17 | #include <linux/types.h> |
| 18 | #include <linux/mm.h> |
| 19 | #include <linux/spinlock.h> |
| 20 | #include <linux/idr.h> |
Paul Gortmaker | 4b16f8e | 2011-07-22 18:24:23 -0400 | [diff] [blame] | 21 | #include <linux/export.h> |
Tejun Heo | 5a0e3ad | 2010-03-24 17:04:11 +0900 | [diff] [blame] | 22 | #include <linux/gfp.h> |
Tseng-Hui (Frank) Lin | 851d2e2 | 2011-05-02 20:43:04 +0000 | [diff] [blame] | 23 | #include <linux/slab.h> |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 24 | |
| 25 | #include <asm/mmu_context.h> |
Aneesh Kumar K.V | 5c1f6ee | 2013-04-28 09:37:33 +0000 | [diff] [blame] | 26 | #include <asm/pgalloc.h> |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 27 | |
Jimi Xenidis | 9d67028 | 2011-09-29 10:55:12 +0000 | [diff] [blame] | 28 | #include "icswx.h" |
Tseng-Hui (Frank) Lin | 851d2e2 | 2011-05-02 20:43:04 +0000 | [diff] [blame] | 29 | |
/* Spinlock held around every ida_get_new_above()/ida_remove() call on mmu_context_ida in this file. */
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 30 | static DEFINE_SPINLOCK(mmu_context_lock); |
/* IDA from which MMU context ids are allocated and to which they are returned. */
Anton Blanchard | 7317ac8 | 2010-02-07 12:30:12 +0000 | [diff] [blame] | 31 | static DEFINE_IDA(mmu_context_ida); |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 32 | |
Michael Ellerman | c1ff840 | 2017-03-29 22:10:45 +1100 | [diff] [blame] | 33 | static int alloc_context_id(int min_id, int max_id) |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 34 | { |
Michael Ellerman | c1ff840 | 2017-03-29 22:10:45 +1100 | [diff] [blame] | 35 | int index, err; |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 36 | |
| 37 | again: |
Anton Blanchard | 7317ac8 | 2010-02-07 12:30:12 +0000 | [diff] [blame] | 38 | if (!ida_pre_get(&mmu_context_ida, GFP_KERNEL)) |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 39 | return -ENOMEM; |
| 40 | |
| 41 | spin_lock(&mmu_context_lock); |
Michael Ellerman | c1ff840 | 2017-03-29 22:10:45 +1100 | [diff] [blame] | 42 | err = ida_get_new_above(&mmu_context_ida, min_id, &index); |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 43 | spin_unlock(&mmu_context_lock); |
| 44 | |
| 45 | if (err == -EAGAIN) |
| 46 | goto again; |
| 47 | else if (err) |
| 48 | return err; |
| 49 | |
Michael Ellerman | c1ff840 | 2017-03-29 22:10:45 +1100 | [diff] [blame] | 50 | if (index > max_id) { |
Sonny Rao | f86c9747 | 2006-06-27 08:46:09 -0400 | [diff] [blame] | 51 | spin_lock(&mmu_context_lock); |
Anton Blanchard | 7317ac8 | 2010-02-07 12:30:12 +0000 | [diff] [blame] | 52 | ida_remove(&mmu_context_ida, index); |
Sonny Rao | f86c9747 | 2006-06-27 08:46:09 -0400 | [diff] [blame] | 53 | spin_unlock(&mmu_context_lock); |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 54 | return -ENOMEM; |
| 55 | } |
| 56 | |
Alexander Graf | e85a471 | 2009-11-02 12:02:30 +0000 | [diff] [blame] | 57 | return index; |
| 58 | } |
Michael Ellerman | a336f2f | 2017-03-29 22:00:46 +1100 | [diff] [blame] | 59 | |
Aneesh Kumar K.V | 82228e3 | 2017-03-22 09:07:00 +0530 | [diff] [blame] | 60 | void hash__reserve_context_id(int id) |
| 61 | { |
| 62 | int rc, result = 0; |
| 63 | |
| 64 | do { |
| 65 | if (!ida_pre_get(&mmu_context_ida, GFP_KERNEL)) |
| 66 | break; |
| 67 | |
| 68 | spin_lock(&mmu_context_lock); |
| 69 | rc = ida_get_new_above(&mmu_context_ida, id, &result); |
| 70 | spin_unlock(&mmu_context_lock); |
| 71 | } while (rc == -EAGAIN); |
| 72 | |
| 73 | WARN(result != id, "mmu: Failed to reserve context id %d (rc %d)\n", id, result); |
| 74 | } |
| 75 | |
Michael Ellerman | a336f2f | 2017-03-29 22:00:46 +1100 | [diff] [blame] | 76 | int hash__alloc_context_id(void) |
| 77 | { |
Aneesh Kumar K.V | e6f81a9 | 2017-03-29 17:21:53 +1100 | [diff] [blame] | 78 | unsigned long max; |
| 79 | |
| 80 | if (mmu_has_feature(MMU_FTR_68_BIT_VA)) |
| 81 | max = MAX_USER_CONTEXT; |
| 82 | else |
| 83 | max = MAX_USER_CONTEXT_65BIT_VA; |
| 84 | |
| 85 | return alloc_context_id(MIN_USER_CONTEXT, max); |
Michael Ellerman | a336f2f | 2017-03-29 22:00:46 +1100 | [diff] [blame] | 86 | } |
| 87 | EXPORT_SYMBOL_GPL(hash__alloc_context_id); |
| 88 | |
Michael Ellerman | 760573c | 2017-03-29 22:36:56 +1100 | [diff] [blame] | 89 | static int hash__init_new_context(struct mm_struct *mm) |
Alexander Graf | e85a471 | 2009-11-02 12:02:30 +0000 | [diff] [blame] | 90 | { |
| 91 | int index; |
| 92 | |
Michael Ellerman | c1ff840 | 2017-03-29 22:10:45 +1100 | [diff] [blame] | 93 | index = hash__alloc_context_id(); |
Alexander Graf | e85a471 | 2009-11-02 12:02:30 +0000 | [diff] [blame] | 94 | if (index < 0) |
| 95 | return index; |
| 96 | |
Michael Ellerman | 760573c | 2017-03-29 22:36:56 +1100 | [diff] [blame] | 97 | /* |
Aneesh Kumar K.V | 957b778 | 2017-03-22 09:06:58 +0530 | [diff] [blame] | 98 | * We do switch_slb() early in fork, even before we setup the |
| 99 | * mm->context.addr_limit. Default to max task size so that we copy the |
| 100 | * default values to paca which will help us to handle slb miss early. |
| 101 | */ |
Aneesh Kumar K.V | 92d9dfd | 2017-06-01 20:05:04 +0530 | [diff] [blame] | 102 | mm->context.addr_limit = DEFAULT_MAP_WINDOW_USER64; |
Aneesh Kumar K.V | 957b778 | 2017-03-22 09:06:58 +0530 | [diff] [blame] | 103 | |
| 104 | /* |
Michael Ellerman | 760573c | 2017-03-29 22:36:56 +1100 | [diff] [blame] | 105 | * The old code would re-promote on fork, we don't do that when using |
| 106 | * slices as it could cause problem promoting slices that have been |
| 107 | * forced down to 4K. |
| 108 | * |
| 109 | * For book3s we have MMU_NO_CONTEXT set to be ~0. Hence check |
| 110 | * explicitly against context.id == 0. This ensures that we properly |
| 111 | * initialize context slice details for newly allocated mm's (which will |
| 112 | * have id == 0) and don't alter context slice inherited via fork (which |
| 113 | * will have id != 0). |
| 114 | * |
| 115 | * We should not be calling init_new_context() on init_mm. Hence a |
| 116 | * check against 0 is OK. |
| 117 | */ |
| 118 | if (mm->context.id == 0) |
| 119 | slice_set_user_psize(mm, mmu_virtual_psize); |
Aneesh Kumar K.V | 7e381c0 | 2016-04-29 23:26:02 +1000 | [diff] [blame] | 120 | |
Michael Ellerman | 760573c | 2017-03-29 22:36:56 +1100 | [diff] [blame] | 121 | subpage_prot_init_new_context(mm); |
| 122 | |
| 123 | return index; |
| 124 | } |
| 125 | |
| 126 | static int radix__init_new_context(struct mm_struct *mm) |
| 127 | { |
| 128 | unsigned long rts_field; |
| 129 | int index; |
| 130 | |
| 131 | index = alloc_context_id(1, PRTB_ENTRIES - 1); |
| 132 | if (index < 0) |
| 133 | return index; |
| 134 | |
| 135 | /* |
| 136 | * set the process table entry, |
| 137 | */ |
| 138 | rts_field = radix__get_tree_size(); |
| 139 | process_tb[index].prtb0 = cpu_to_be64(rts_field | __pa(mm->pgd) | RADIX_PGD_INDEX_SIZE); |
| 140 | |
Alistair Popple | 1ab66d1 | 2017-04-03 19:51:44 +1000 | [diff] [blame] | 141 | mm->context.npu_context = NULL; |
| 142 | |
Michael Ellerman | 760573c | 2017-03-29 22:36:56 +1100 | [diff] [blame] | 143 | return index; |
| 144 | } |
| 145 | |
| 146 | int init_new_context(struct task_struct *tsk, struct mm_struct *mm) |
| 147 | { |
| 148 | int index; |
| 149 | |
| 150 | if (radix_enabled()) |
| 151 | index = radix__init_new_context(mm); |
| 152 | else |
| 153 | index = hash__init_new_context(mm); |
| 154 | |
| 155 | if (index < 0) |
| 156 | return index; |
| 157 | |
Stephen Rothwell | 9dfe5c53 | 2007-08-15 16:33:55 +1000 | [diff] [blame] | 158 | mm->context.id = index; |
Tseng-Hui (Frank) Lin | 851d2e2 | 2011-05-02 20:43:04 +0000 | [diff] [blame] | 159 | #ifdef CONFIG_PPC_ICSWX |
| 160 | mm->context.cop_lockp = kmalloc(sizeof(spinlock_t), GFP_KERNEL); |
| 161 | if (!mm->context.cop_lockp) { |
| 162 | __destroy_context(index); |
| 163 | subpage_prot_free(mm); |
Stephen Rothwell | 79af218 | 2011-05-06 10:39:08 +1000 | [diff] [blame] | 164 | mm->context.id = MMU_NO_CONTEXT; |
Tseng-Hui (Frank) Lin | 851d2e2 | 2011-05-02 20:43:04 +0000 | [diff] [blame] | 165 | return -ENOMEM; |
| 166 | } |
| 167 | spin_lock_init(mm->context.cop_lockp); |
| 168 | #endif /* CONFIG_PPC_ICSWX */ |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 169 | |
Aneesh Kumar K.V | 5c1f6ee | 2013-04-28 09:37:33 +0000 | [diff] [blame] | 170 | #ifdef CONFIG_PPC_64K_PAGES |
| 171 | mm->context.pte_frag = NULL; |
| 172 | #endif |
Alexey Kardashevskiy | 15b244a | 2015-06-05 16:35:24 +1000 | [diff] [blame] | 173 | #ifdef CONFIG_SPAPR_TCE_IOMMU |
Alexey Kardashevskiy | 88f54a3 | 2016-11-30 17:51:59 +1100 | [diff] [blame] | 174 | mm_iommu_init(mm); |
Alexey Kardashevskiy | 15b244a | 2015-06-05 16:35:24 +1000 | [diff] [blame] | 175 | #endif |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 176 | return 0; |
| 177 | } |
| 178 | |
Alexander Graf | e85a471 | 2009-11-02 12:02:30 +0000 | [diff] [blame] | 179 | void __destroy_context(int context_id) |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 180 | { |
| 181 | spin_lock(&mmu_context_lock); |
Anton Blanchard | 7317ac8 | 2010-02-07 12:30:12 +0000 | [diff] [blame] | 182 | ida_remove(&mmu_context_ida, context_id); |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 183 | spin_unlock(&mmu_context_lock); |
Alexander Graf | e85a471 | 2009-11-02 12:02:30 +0000 | [diff] [blame] | 184 | } |
| 185 | EXPORT_SYMBOL_GPL(__destroy_context); |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 186 | |
Aneesh Kumar K.V | 5c1f6ee | 2013-04-28 09:37:33 +0000 | [diff] [blame] | 187 | #ifdef CONFIG_PPC_64K_PAGES |
| 188 | static void destroy_pagetable_page(struct mm_struct *mm) |
| 189 | { |
| 190 | int count; |
| 191 | void *pte_frag; |
| 192 | struct page *page; |
| 193 | |
| 194 | pte_frag = mm->context.pte_frag; |
| 195 | if (!pte_frag) |
| 196 | return; |
| 197 | |
| 198 | page = virt_to_page(pte_frag); |
| 199 | /* drop all the pending references */ |
| 200 | count = ((unsigned long)pte_frag & ~PAGE_MASK) >> PTE_FRAG_SIZE_SHIFT; |
| 201 | /* We allow PTE_FRAG_NR fragments from a PTE page */ |
Joonsoo Kim | fe896d1 | 2016-03-17 14:19:26 -0700 | [diff] [blame] | 202 | if (page_ref_sub_and_test(page, PTE_FRAG_NR - count)) { |
Aneesh Kumar K.V | 5c1f6ee | 2013-04-28 09:37:33 +0000 | [diff] [blame] | 203 | pgtable_page_dtor(page); |
| 204 | free_hot_cold_page(page, 0); |
| 205 | } |
| 206 | } |
| 207 | |
| 208 | #else |
/* Variant used when CONFIG_PPC_64K_PAGES is not set: there is nothing to release. */
static inline void destroy_pagetable_page(struct mm_struct *mm)
{
}
| 213 | #endif |
| 214 | |
Alexander Graf | e85a471 | 2009-11-02 12:02:30 +0000 | [diff] [blame] | 215 | void destroy_context(struct mm_struct *mm) |
| 216 | { |
Alexey Kardashevskiy | 15b244a | 2015-06-05 16:35:24 +1000 | [diff] [blame] | 217 | #ifdef CONFIG_SPAPR_TCE_IOMMU |
Alexey Kardashevskiy | 4b6fad7 | 2016-11-30 17:52:05 +1100 | [diff] [blame] | 218 | WARN_ON_ONCE(!list_empty(&mm->context.iommu_group_mem_list)); |
Alexey Kardashevskiy | 15b244a | 2015-06-05 16:35:24 +1000 | [diff] [blame] | 219 | #endif |
Tseng-Hui (Frank) Lin | 851d2e2 | 2011-05-02 20:43:04 +0000 | [diff] [blame] | 220 | #ifdef CONFIG_PPC_ICSWX |
| 221 | drop_cop(mm->context.acop, mm); |
| 222 | kfree(mm->context.cop_lockp); |
| 223 | mm->context.cop_lockp = NULL; |
| 224 | #endif /* CONFIG_PPC_ICSWX */ |
Aneesh Kumar K.V | 5c1f6ee | 2013-04-28 09:37:33 +0000 | [diff] [blame] | 225 | |
Benjamin Herrenschmidt | c6bb0b8 | 2017-07-08 07:45:32 -0500 | [diff] [blame^] | 226 | if (radix_enabled()) { |
| 227 | /* |
| 228 | * Radix doesn't have a valid bit in the process table |
| 229 | * entries. However we know that at least P9 implementation |
| 230 | * will avoid caching an entry with an invalid RTS field, |
| 231 | * and 0 is invalid. So this will do. |
| 232 | */ |
| 233 | process_tb[mm->context.id].prtb0 = 0; |
| 234 | } else |
Aneesh Kumar K.V | 7e381c0 | 2016-04-29 23:26:02 +1000 | [diff] [blame] | 235 | subpage_prot_free(mm); |
Aneesh Kumar K.V | 5c1f6ee | 2013-04-28 09:37:33 +0000 | [diff] [blame] | 236 | destroy_pagetable_page(mm); |
Alexander Graf | e85a471 | 2009-11-02 12:02:30 +0000 | [diff] [blame] | 237 | __destroy_context(mm->context.id); |
Michael Ellerman | 5e8e7b4 | 2011-04-12 19:00:04 +0000 | [diff] [blame] | 238 | mm->context.id = MMU_NO_CONTEXT; |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 239 | } |
Aneesh Kumar K.V | 7e381c0 | 2016-04-29 23:26:02 +1000 | [diff] [blame] | 240 | |
| 241 | #ifdef CONFIG_PPC_RADIX_MMU |
| 242 | void radix__switch_mmu_context(struct mm_struct *prev, struct mm_struct *next) |
| 243 | { |
Benjamin Herrenschmidt | 74e27c6 | 2017-06-25 15:08:46 -0500 | [diff] [blame] | 244 | |
| 245 | if (cpu_has_feature(CPU_FTR_POWER9_DD1)) { |
| 246 | isync(); |
| 247 | mtspr(SPRN_PID, next->context.id); |
| 248 | isync(); |
| 249 | asm volatile(PPC_INVALIDATE_ERAT : : :"memory"); |
| 250 | } else { |
| 251 | mtspr(SPRN_PID, next->context.id); |
| 252 | isync(); |
| 253 | } |
Aneesh Kumar K.V | 7e381c0 | 2016-04-29 23:26:02 +1000 | [diff] [blame] | 254 | } |
| 255 | #endif |