Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 1 | /* |
| 2 | * PowerPC version |
| 3 | * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org) |
| 4 | * |
| 5 | * Modifications by Paul Mackerras (PowerMac) (paulus@cs.anu.edu.au) |
| 6 | * and Cort Dougan (PReP) (cort@cs.nmt.edu) |
| 7 | * Copyright (C) 1996 Paul Mackerras |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 8 | * PPC44x/36-bit changes by Matt Porter (mporter@mvista.com) |
| 9 | * |
| 10 | * Derived from "arch/i386/mm/init.c" |
| 11 | * Copyright (C) 1991, 1992, 1993, 1994 Linus Torvalds |
| 12 | * |
| 13 | * This program is free software; you can redistribute it and/or |
| 14 | * modify it under the terms of the GNU General Public License |
| 15 | * as published by the Free Software Foundation; either version |
| 16 | * 2 of the License, or (at your option) any later version. |
| 17 | * |
| 18 | */ |
| 19 | |
Paul Gortmaker | 4b16f8e | 2011-07-22 18:24:23 -0400 | [diff] [blame] | 20 | #include <linux/export.h> |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 21 | #include <linux/sched.h> |
| 22 | #include <linux/kernel.h> |
| 23 | #include <linux/errno.h> |
| 24 | #include <linux/string.h> |
Tejun Heo | 5a0e3ad | 2010-03-24 17:04:11 +0900 | [diff] [blame] | 25 | #include <linux/gfp.h> |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 26 | #include <linux/types.h> |
| 27 | #include <linux/mm.h> |
| 28 | #include <linux/stddef.h> |
| 29 | #include <linux/init.h> |
| 30 | #include <linux/bootmem.h> |
| 31 | #include <linux/highmem.h> |
| 32 | #include <linux/initrd.h> |
| 33 | #include <linux/pagemap.h> |
Johannes Berg | 4e8ad3e | 2007-05-08 19:25:00 +1000 | [diff] [blame] | 34 | #include <linux/suspend.h> |
Yinghai Lu | 95f72d1 | 2010-07-12 14:36:09 +1000 | [diff] [blame] | 35 | #include <linux/memblock.h> |
David Gibson | 0895ecd | 2009-10-26 19:24:31 +0000 | [diff] [blame] | 36 | #include <linux/hugetlb.h> |
Anton Blanchard | c40dd2f | 2011-11-02 14:56:12 +0000 | [diff] [blame] | 37 | #include <linux/slab.h> |
Anton Blanchard | 16d0f5c | 2014-10-14 22:17:47 +1100 | [diff] [blame] | 38 | #include <linux/vmalloc.h> |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 39 | |
| 40 | #include <asm/pgalloc.h> |
| 41 | #include <asm/prom.h> |
| 42 | #include <asm/io.h> |
| 43 | #include <asm/mmu_context.h> |
| 44 | #include <asm/pgtable.h> |
| 45 | #include <asm/mmu.h> |
| 46 | #include <asm/smp.h> |
| 47 | #include <asm/machdep.h> |
| 48 | #include <asm/btext.h> |
| 49 | #include <asm/tlb.h> |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 50 | #include <asm/sections.h> |
Tony Breeds | db7f37d | 2008-07-01 11:30:06 +1000 | [diff] [blame] | 51 | #include <asm/sparsemem.h> |
Paul Mackerras | ab1f9da | 2005-10-10 21:58:35 +1000 | [diff] [blame] | 52 | #include <asm/vdso.h> |
Kumar Gala | 2c419bd | 2008-04-23 23:05:20 +1000 | [diff] [blame] | 53 | #include <asm/fixmap.h> |
FUJITA Tomonori | a932729 | 2010-03-16 13:16:25 +0000 | [diff] [blame] | 54 | #include <asm/swiotlb.h> |
sukadev@linux.vnet.ibm.com | 8a3e3d3 | 2011-12-02 12:26:23 +0000 | [diff] [blame] | 55 | #include <asm/rtas.h> |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 56 | |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 57 | #include "mmu_decl.h" |
| 58 | |
| 59 | #ifndef CPU_FTR_COHERENT_ICACHE |
| 60 | #define CPU_FTR_COHERENT_ICACHE 0 /* XXX for now */ |
| 61 | #define CPU_FTR_NOEXECUTE 0 |
| 62 | #endif |
| 63 | |
Suzuki Poulose | a84fcd4 | 2012-08-21 01:42:33 +0000 | [diff] [blame] | 64 | unsigned long long memory_limit; |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 65 | |
Kumar Gala | 2c419bd | 2008-04-23 23:05:20 +1000 | [diff] [blame] | 66 | #ifdef CONFIG_HIGHMEM |
| 67 | pte_t *kmap_pte; |
Kumar Gala | 2c419bd | 2008-04-23 23:05:20 +1000 | [diff] [blame] | 68 | EXPORT_SYMBOL(kmap_pte); |
Valentina Manea | 8040bda | 2013-03-10 03:22:39 +0000 | [diff] [blame] | 69 | pgprot_t kmap_prot; |
| 70 | EXPORT_SYMBOL(kmap_prot); |
Kumar Gala | 2c419bd | 2008-04-23 23:05:20 +1000 | [diff] [blame] | 71 | |
| 72 | static inline pte_t *virt_to_kpte(unsigned long vaddr) |
| 73 | { |
| 74 | return pte_offset_kernel(pmd_offset(pud_offset(pgd_offset_k(vaddr), |
| 75 | vaddr), vaddr), vaddr); |
| 76 | } |
| 77 | #endif |
| 78 | |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 79 | int page_is_ram(unsigned long pfn) |
| 80 | { |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 81 | #ifndef CONFIG_PPC64 /* XXX for now */ |
Roland Dreier | a880e76 | 2008-09-15 10:43:35 +0000 | [diff] [blame] | 82 | return pfn < max_pfn; |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 83 | #else |
Roland Dreier | a880e76 | 2008-09-15 10:43:35 +0000 | [diff] [blame] | 84 | unsigned long paddr = (pfn << PAGE_SHIFT); |
Benjamin Herrenschmidt | 28be707 | 2010-08-04 13:43:53 +1000 | [diff] [blame] | 85 | struct memblock_region *reg; |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 86 | |
Benjamin Herrenschmidt | 28be707 | 2010-08-04 13:43:53 +1000 | [diff] [blame] | 87 | for_each_memblock(memory, reg) |
| 88 | if (paddr >= reg->base && paddr < (reg->base + reg->size)) |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 89 | return 1; |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 90 | return 0; |
| 91 | #endif |
| 92 | } |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 93 | |
Roland Dreier | 8b15047 | 2005-10-28 17:46:18 -0700 | [diff] [blame] | 94 | pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn, |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 95 | unsigned long size, pgprot_t vma_prot) |
| 96 | { |
| 97 | if (ppc_md.phys_mem_access_prot) |
Roland Dreier | 8b15047 | 2005-10-28 17:46:18 -0700 | [diff] [blame] | 98 | return ppc_md.phys_mem_access_prot(file, pfn, size, vma_prot); |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 99 | |
Roland Dreier | 8b15047 | 2005-10-28 17:46:18 -0700 | [diff] [blame] | 100 | if (!page_is_ram(pfn)) |
Benjamin Herrenschmidt | 64b3d0e | 2008-12-18 19:13:51 +0000 | [diff] [blame] | 101 | vma_prot = pgprot_noncached(vma_prot); |
| 102 | |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 103 | return vma_prot; |
| 104 | } |
| 105 | EXPORT_SYMBOL(phys_mem_access_prot); |
| 106 | |
Paul Mackerras | 23fd077 | 2005-10-31 13:37:12 +1100 | [diff] [blame] | 107 | #ifdef CONFIG_MEMORY_HOTPLUG |
| 108 | |
Yasunori Goto | bc02af9 | 2006-06-27 02:53:30 -0700 | [diff] [blame] | 109 | #ifdef CONFIG_NUMA |
| 110 | int memory_add_physaddr_to_nid(u64 start) |
| 111 | { |
| 112 | return hot_add_scn_to_nid(start); |
| 113 | } |
| 114 | #endif |
| 115 | |
Dan Williams | 033fbae | 2015-08-09 15:29:06 -0400 | [diff] [blame] | 116 | int arch_add_memory(int nid, u64 start, u64 size, bool for_device) |
Paul Mackerras | 23fd077 | 2005-10-31 13:37:12 +1100 | [diff] [blame] | 117 | { |
Mike Kravetz | 237a0989 | 2005-12-05 12:06:42 -0800 | [diff] [blame] | 118 | struct pglist_data *pgdata; |
Paul Mackerras | 23fd077 | 2005-10-31 13:37:12 +1100 | [diff] [blame] | 119 | struct zone *zone; |
| 120 | unsigned long start_pfn = start >> PAGE_SHIFT; |
| 121 | unsigned long nr_pages = size >> PAGE_SHIFT; |
| 122 | |
Mike Kravetz | 237a0989 | 2005-12-05 12:06:42 -0800 | [diff] [blame] | 123 | pgdata = NODE_DATA(nid); |
| 124 | |
Andrew Morton | 2d0eee1 | 2006-03-21 23:00:05 -0800 | [diff] [blame] | 125 | start = (unsigned long)__va(start); |
Anton Blanchard | a119409 | 2011-08-10 20:44:24 +0000 | [diff] [blame] | 126 | if (create_section_mapping(start, start + size)) |
| 127 | return -EINVAL; |
Mike Kravetz | 54b7924 | 2005-11-07 16:25:48 -0800 | [diff] [blame] | 128 | |
Paul Mackerras | 23fd077 | 2005-10-31 13:37:12 +1100 | [diff] [blame] | 129 | /* this should work for most non-highmem platforms */ |
Wang Nan | f51202d | 2014-08-06 16:07:45 -0700 | [diff] [blame] | 130 | zone = pgdata->node_zones + |
Dan Williams | 033fbae | 2015-08-09 15:29:06 -0400 | [diff] [blame] | 131 | zone_for_memory(nid, start, size, 0, for_device); |
Paul Mackerras | 23fd077 | 2005-10-31 13:37:12 +1100 | [diff] [blame] | 132 | |
Gary Hade | c04fc58 | 2009-01-06 14:39:14 -0800 | [diff] [blame] | 133 | return __add_pages(nid, zone, start_pfn, nr_pages); |
Paul Mackerras | 23fd077 | 2005-10-31 13:37:12 +1100 | [diff] [blame] | 134 | } |
Wen Congyang | 24d335c | 2013-02-22 16:32:58 -0800 | [diff] [blame] | 135 | |
| 136 | #ifdef CONFIG_MEMORY_HOTREMOVE |
| 137 | int arch_remove_memory(u64 start, u64 size) |
| 138 | { |
| 139 | unsigned long start_pfn = start >> PAGE_SHIFT; |
| 140 | unsigned long nr_pages = size >> PAGE_SHIFT; |
| 141 | struct zone *zone; |
Nathan Fontenot | 9ac8cde | 2014-01-27 10:54:06 -0600 | [diff] [blame] | 142 | int ret; |
Wen Congyang | 24d335c | 2013-02-22 16:32:58 -0800 | [diff] [blame] | 143 | |
| 144 | zone = page_zone(pfn_to_page(start_pfn)); |
Nathan Fontenot | 9ac8cde | 2014-01-27 10:54:06 -0600 | [diff] [blame] | 145 | ret = __remove_pages(zone, start_pfn, nr_pages); |
Anton Blanchard | 16d0f5c | 2014-10-14 22:17:47 +1100 | [diff] [blame] | 146 | if (ret) |
| 147 | return ret; |
| 148 | |
| 149 | /* Remove htab bolted mappings for this section of memory */ |
| 150 | start = (unsigned long)__va(start); |
| 151 | ret = remove_section_mapping(start, start + size); |
| 152 | |
| 153 | /* Ensure all vmalloc mappings are flushed in case they also |
| 154 | * hit that section of memory |
| 155 | */ |
| 156 | vm_unmap_aliases(); |
Nathan Fontenot | 9ac8cde | 2014-01-27 10:54:06 -0600 | [diff] [blame] | 157 | |
| 158 | return ret; |
Wen Congyang | 24d335c | 2013-02-22 16:32:58 -0800 | [diff] [blame] | 159 | } |
| 160 | #endif |
Nathan Lynch | 0d57994 | 2008-06-04 08:30:54 +1000 | [diff] [blame] | 161 | #endif /* CONFIG_MEMORY_HOTPLUG */ |
Badari Pulavarty | a99824f | 2008-02-05 00:10:18 -0800 | [diff] [blame] | 162 | |
| 163 | /* |
| 164 | * walk_memory_resource() needs to make sure there is no holes in a given |
Badari Pulavarty | 9d88a2e | 2008-04-18 13:33:53 -0700 | [diff] [blame] | 165 | * memory range. PPC64 does not maintain the memory layout in /proc/iomem. |
Yinghai Lu | 95f72d1 | 2010-07-12 14:36:09 +1000 | [diff] [blame] | 166 | * Instead it maintains it in memblock.memory structures. Walk through the |
Badari Pulavarty | 9d88a2e | 2008-04-18 13:33:53 -0700 | [diff] [blame] | 167 | * memory regions, find holes and callback for contiguous regions. |
Badari Pulavarty | a99824f | 2008-02-05 00:10:18 -0800 | [diff] [blame] | 168 | */ |
| 169 | int |
KAMEZAWA Hiroyuki | 908eedc | 2009-09-22 16:45:46 -0700 | [diff] [blame] | 170 | walk_system_ram_range(unsigned long start_pfn, unsigned long nr_pages, |
| 171 | void *arg, int (*func)(unsigned long, unsigned long, void *)) |
Badari Pulavarty | a99824f | 2008-02-05 00:10:18 -0800 | [diff] [blame] | 172 | { |
Benjamin Herrenschmidt | 28be707 | 2010-08-04 13:43:53 +1000 | [diff] [blame] | 173 | struct memblock_region *reg; |
| 174 | unsigned long end_pfn = start_pfn + nr_pages; |
| 175 | unsigned long tstart, tend; |
Badari Pulavarty | 9d88a2e | 2008-04-18 13:33:53 -0700 | [diff] [blame] | 176 | int ret = -1; |
| 177 | |
Benjamin Herrenschmidt | 28be707 | 2010-08-04 13:43:53 +1000 | [diff] [blame] | 178 | for_each_memblock(memory, reg) { |
Yinghai Lu | c7fc2de | 2010-10-12 14:07:09 -0700 | [diff] [blame] | 179 | tstart = max(start_pfn, memblock_region_memory_base_pfn(reg)); |
| 180 | tend = min(end_pfn, memblock_region_memory_end_pfn(reg)); |
Benjamin Herrenschmidt | 28be707 | 2010-08-04 13:43:53 +1000 | [diff] [blame] | 181 | if (tstart >= tend) |
| 182 | continue; |
| 183 | ret = (*func)(tstart, tend - tstart, arg); |
Badari Pulavarty | 9d88a2e | 2008-04-18 13:33:53 -0700 | [diff] [blame] | 184 | if (ret) |
| 185 | break; |
Badari Pulavarty | 9d88a2e | 2008-04-18 13:33:53 -0700 | [diff] [blame] | 186 | } |
| 187 | return ret; |
Badari Pulavarty | a99824f | 2008-02-05 00:10:18 -0800 | [diff] [blame] | 188 | } |
KAMEZAWA Hiroyuki | 908eedc | 2009-09-22 16:45:46 -0700 | [diff] [blame] | 189 | EXPORT_SYMBOL_GPL(walk_system_ram_range); |
Badari Pulavarty | a99824f | 2008-02-05 00:10:18 -0800 | [diff] [blame] | 190 | |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 191 | #ifndef CONFIG_NEED_MULTIPLE_NODES |
Anton Blanchard | 1023973 | 2014-09-17 22:15:33 +1000 | [diff] [blame] | 192 | void __init initmem_init(void) |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 193 | { |
Yinghai Lu | 95f72d1 | 2010-07-12 14:36:09 +1000 | [diff] [blame] | 194 | max_low_pfn = max_pfn = memblock_end_of_DRAM() >> PAGE_SHIFT; |
Anton Blanchard | 1023973 | 2014-09-17 22:15:33 +1000 | [diff] [blame] | 195 | min_low_pfn = MEMORY_START >> PAGE_SHIFT; |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 196 | #ifdef CONFIG_HIGHMEM |
Kumar Gala | d7917ba | 2008-04-16 05:52:22 +1000 | [diff] [blame] | 197 | max_low_pfn = lowmem_end_addr >> PAGE_SHIFT; |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 198 | #endif |
| 199 | |
Cody P Schafer | 4e8309b | 2013-01-09 12:40:18 +0000 | [diff] [blame] | 200 | /* Place all memblock_regions in the same node and merge contiguous |
| 201 | * memblock_regions |
| 202 | */ |
Tang Chen | e7e8de5 | 2014-01-21 15:49:26 -0800 | [diff] [blame] | 203 | memblock_set_node(0, (phys_addr_t)ULLONG_MAX, &memblock.memory, 0); |
Mel Gorman | c67c3cb | 2006-09-27 01:49:49 -0700 | [diff] [blame] | 204 | |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 205 | /* XXX need to clip this if using highmem? */ |
Mel Gorman | c67c3cb | 2006-09-27 01:49:49 -0700 | [diff] [blame] | 206 | sparse_memory_present_with_active_regions(0); |
Anton Blanchard | 21098b9 | 2014-09-17 22:15:36 +1000 | [diff] [blame] | 207 | sparse_init(); |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 208 | } |
| 209 | |
Johannes Berg | 4e8ad3e | 2007-05-08 19:25:00 +1000 | [diff] [blame] | 210 | /* mark pages that don't exist as nosave */ |
| 211 | static int __init mark_nonram_nosave(void) |
| 212 | { |
Benjamin Herrenschmidt | 28be707 | 2010-08-04 13:43:53 +1000 | [diff] [blame] | 213 | struct memblock_region *reg, *prev = NULL; |
Johannes Berg | 4e8ad3e | 2007-05-08 19:25:00 +1000 | [diff] [blame] | 214 | |
Benjamin Herrenschmidt | 28be707 | 2010-08-04 13:43:53 +1000 | [diff] [blame] | 215 | for_each_memblock(memory, reg) { |
| 216 | if (prev && |
Yinghai Lu | c7fc2de | 2010-10-12 14:07:09 -0700 | [diff] [blame] | 217 | memblock_region_memory_end_pfn(prev) < memblock_region_memory_base_pfn(reg)) |
| 218 | register_nosave_region(memblock_region_memory_end_pfn(prev), |
| 219 | memblock_region_memory_base_pfn(reg)); |
Benjamin Herrenschmidt | 28be707 | 2010-08-04 13:43:53 +1000 | [diff] [blame] | 220 | prev = reg; |
Johannes Berg | 4e8ad3e | 2007-05-08 19:25:00 +1000 | [diff] [blame] | 221 | } |
Johannes Berg | 4e8ad3e | 2007-05-08 19:25:00 +1000 | [diff] [blame] | 222 | return 0; |
| 223 | } |
Scott Wood | 6db35ad | 2014-09-18 14:05:02 -0500 | [diff] [blame] | 224 | #else /* CONFIG_NEED_MULTIPLE_NODES */ |
| 225 | static int __init mark_nonram_nosave(void) |
| 226 | { |
| 227 | return 0; |
| 228 | } |
| 229 | #endif |
Johannes Berg | 4e8ad3e | 2007-05-08 19:25:00 +1000 | [diff] [blame] | 230 | |
Scott Wood | 1c98025 | 2014-08-08 18:40:42 -0500 | [diff] [blame] | 231 | static bool zone_limits_final; |
| 232 | |
| 233 | static unsigned long max_zone_pfns[MAX_NR_ZONES] = { |
| 234 | [0 ... MAX_NR_ZONES - 1] = ~0UL |
| 235 | }; |
| 236 | |
| 237 | /* |
| 238 | * Restrict the specified zone and all more restrictive zones |
| 239 | * to be below the specified pfn. May not be called after |
| 240 | * paging_init(). |
| 241 | */ |
| 242 | void __init limit_zone_pfn(enum zone_type zone, unsigned long pfn_limit) |
| 243 | { |
| 244 | int i; |
| 245 | |
| 246 | if (WARN_ON(zone_limits_final)) |
| 247 | return; |
| 248 | |
| 249 | for (i = zone; i >= 0; i--) { |
| 250 | if (max_zone_pfns[i] > pfn_limit) |
| 251 | max_zone_pfns[i] = pfn_limit; |
| 252 | } |
| 253 | } |
| 254 | |
| 255 | /* |
| 256 | * Find the least restrictive zone that is entirely below the |
| 257 | * specified pfn limit. Returns < 0 if no suitable zone is found. |
| 258 | * |
| 259 | * pfn_limit must be u64 because it can exceed 32 bits even on 32-bit |
| 260 | * systems -- the DMA limit can be higher than any possible real pfn. |
| 261 | */ |
| 262 | int dma_pfn_limit_to_zone(u64 pfn_limit) |
| 263 | { |
| 264 | enum zone_type top_zone = ZONE_NORMAL; |
| 265 | int i; |
| 266 | |
| 267 | #ifdef CONFIG_HIGHMEM |
| 268 | top_zone = ZONE_HIGHMEM; |
| 269 | #endif |
| 270 | |
| 271 | for (i = top_zone; i >= 0; i--) { |
| 272 | if (max_zone_pfns[i] <= pfn_limit) |
| 273 | return i; |
| 274 | } |
| 275 | |
| 276 | return -EPERM; |
| 277 | } |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 278 | |
| 279 | /* |
| 280 | * paging_init() sets up the page tables - in fact we've already done this. |
| 281 | */ |
| 282 | void __init paging_init(void) |
| 283 | { |
Tony Breeds | f7ba299 | 2011-07-04 18:44:19 +0000 | [diff] [blame] | 284 | unsigned long long total_ram = memblock_phys_mem_size(); |
Yinghai Lu | 95f72d1 | 2010-07-12 14:36:09 +1000 | [diff] [blame] | 285 | phys_addr_t top_of_ram = memblock_end_of_DRAM(); |
Scott Wood | 1c98025 | 2014-08-08 18:40:42 -0500 | [diff] [blame] | 286 | enum zone_type top_zone; |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 287 | |
Kumar Gala | 2c419bd | 2008-04-23 23:05:20 +1000 | [diff] [blame] | 288 | #ifdef CONFIG_PPC32 |
| 289 | unsigned long v = __fix_to_virt(__end_of_fixed_addresses - 1); |
| 290 | unsigned long end = __fix_to_virt(FIX_HOLE); |
| 291 | |
| 292 | for (; v < end; v += PAGE_SIZE) |
| 293 | map_page(v, 0, 0); /* XXX gross */ |
| 294 | #endif |
| 295 | |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 296 | #ifdef CONFIG_HIGHMEM |
| 297 | map_page(PKMAP_BASE, 0, 0); /* XXX gross */ |
Kumar Gala | 2c419bd | 2008-04-23 23:05:20 +1000 | [diff] [blame] | 298 | pkmap_page_table = virt_to_kpte(PKMAP_BASE); |
| 299 | |
| 300 | kmap_pte = virt_to_kpte(__fix_to_virt(FIX_KMAP_BEGIN)); |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 301 | kmap_prot = PAGE_KERNEL; |
| 302 | #endif /* CONFIG_HIGHMEM */ |
| 303 | |
Tony Breeds | f7ba299 | 2011-07-04 18:44:19 +0000 | [diff] [blame] | 304 | printk(KERN_DEBUG "Top of RAM: 0x%llx, Total RAM: 0x%llx\n", |
Tony Breeds | fb61063 | 2008-07-31 13:51:42 +1000 | [diff] [blame] | 305 | (unsigned long long)top_of_ram, total_ram); |
Olof Johansson | e110b28 | 2006-04-12 15:25:01 -0500 | [diff] [blame] | 306 | printk(KERN_DEBUG "Memory hole size: %ldMB\n", |
Stefan Roese | 2bf3016 | 2008-07-10 01:09:23 +1000 | [diff] [blame] | 307 | (long int)((top_of_ram - total_ram) >> 20)); |
Scott Wood | 1c98025 | 2014-08-08 18:40:42 -0500 | [diff] [blame] | 308 | |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 309 | #ifdef CONFIG_HIGHMEM |
Scott Wood | 1c98025 | 2014-08-08 18:40:42 -0500 | [diff] [blame] | 310 | top_zone = ZONE_HIGHMEM; |
| 311 | limit_zone_pfn(ZONE_NORMAL, lowmem_end_addr >> PAGE_SHIFT); |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 312 | #else |
Scott Wood | 1c98025 | 2014-08-08 18:40:42 -0500 | [diff] [blame] | 313 | top_zone = ZONE_NORMAL; |
Mel Gorman | c67c3cb | 2006-09-27 01:49:49 -0700 | [diff] [blame] | 314 | #endif |
Scott Wood | 1c98025 | 2014-08-08 18:40:42 -0500 | [diff] [blame] | 315 | |
| 316 | limit_zone_pfn(top_zone, top_of_ram >> PAGE_SHIFT); |
| 317 | zone_limits_final = true; |
Mel Gorman | c67c3cb | 2006-09-27 01:49:49 -0700 | [diff] [blame] | 318 | free_area_init_nodes(max_zone_pfns); |
Johannes Berg | 4e8ad3e | 2007-05-08 19:25:00 +1000 | [diff] [blame] | 319 | |
| 320 | mark_nonram_nosave(); |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 321 | } |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 322 | |
| 323 | void __init mem_init(void) |
| 324 | { |
Scott Wood | 28efc35 | 2013-10-11 19:22:38 -0500 | [diff] [blame] | 325 | /* |
| 326 | * book3s is limited to 16 page sizes due to encoding this in |
| 327 | * a 4-bit field for slices. |
| 328 | */ |
| 329 | BUILD_BUG_ON(MMU_PAGE_COUNT > 16); |
| 330 | |
FUJITA Tomonori | a932729 | 2010-03-16 13:16:25 +0000 | [diff] [blame] | 331 | #ifdef CONFIG_SWIOTLB |
Jia Hongtao | 688ba1d | 2012-08-03 18:14:10 +0800 | [diff] [blame] | 332 | swiotlb_init(0); |
FUJITA Tomonori | a932729 | 2010-03-16 13:16:25 +0000 | [diff] [blame] | 333 | #endif |
| 334 | |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 335 | high_memory = (void *) __va(max_low_pfn * PAGE_SIZE); |
Jiang Liu | 602ddc7 | 2013-07-03 15:04:32 -0700 | [diff] [blame] | 336 | set_max_mapnr(max_pfn); |
Jiang Liu | 0c98853 | 2013-07-03 15:03:24 -0700 | [diff] [blame] | 337 | free_all_bootmem(); |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 338 | |
| 339 | #ifdef CONFIG_HIGHMEM |
| 340 | { |
| 341 | unsigned long pfn, highmem_mapnr; |
| 342 | |
Kumar Gala | d7917ba | 2008-04-16 05:52:22 +1000 | [diff] [blame] | 343 | highmem_mapnr = lowmem_end_addr >> PAGE_SHIFT; |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 344 | for (pfn = highmem_mapnr; pfn < max_mapnr; ++pfn) { |
Becky Bruce | 3d41e0f | 2011-06-28 09:54:46 +0000 | [diff] [blame] | 345 | phys_addr_t paddr = (phys_addr_t)pfn << PAGE_SHIFT; |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 346 | struct page *page = pfn_to_page(pfn); |
Jiang Liu | 369a9d8 | 2013-07-03 15:04:09 -0700 | [diff] [blame] | 347 | if (!memblock_is_reserved(paddr)) |
| 348 | free_highmem_page(page); |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 349 | } |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 350 | } |
| 351 | #endif /* CONFIG_HIGHMEM */ |
| 352 | |
Becky Bruce | 3160b09 | 2011-06-28 14:54:47 -0500 | [diff] [blame] | 353 | #if defined(CONFIG_PPC_FSL_BOOK3E) && !defined(CONFIG_SMP) |
| 354 | /* |
| 355 | * If smp is enabled, next_tlbcam_idx is initialized in the cpu up |
| 356 | * functions.... do it here for the non-smp case. |
| 357 | */ |
| 358 | per_cpu(next_tlbcam_idx, smp_processor_id()) = |
| 359 | (mfspr(SPRN_TLB1CFG) & TLBnCFG_N_ENTRY) - 1; |
| 360 | #endif |
| 361 | |
Jiang Liu | 369a9d8 | 2013-07-03 15:04:09 -0700 | [diff] [blame] | 362 | mem_init_print_info(NULL); |
Benjamin Herrenschmidt | f637a49 | 2009-05-27 13:44:50 +1000 | [diff] [blame] | 363 | #ifdef CONFIG_PPC32 |
| 364 | pr_info("Kernel virtual memory layout:\n"); |
| 365 | pr_info(" * 0x%08lx..0x%08lx : fixmap\n", FIXADDR_START, FIXADDR_TOP); |
| 366 | #ifdef CONFIG_HIGHMEM |
| 367 | pr_info(" * 0x%08lx..0x%08lx : highmem PTEs\n", |
| 368 | PKMAP_BASE, PKMAP_ADDR(LAST_PKMAP)); |
| 369 | #endif /* CONFIG_HIGHMEM */ |
Benjamin Herrenschmidt | 8b31e49 | 2009-05-27 13:50:33 +1000 | [diff] [blame] | 370 | #ifdef CONFIG_NOT_COHERENT_CACHE |
| 371 | pr_info(" * 0x%08lx..0x%08lx : consistent mem\n", |
| 372 | IOREMAP_TOP, IOREMAP_TOP + CONFIG_CONSISTENT_SIZE); |
| 373 | #endif /* CONFIG_NOT_COHERENT_CACHE */ |
Benjamin Herrenschmidt | f637a49 | 2009-05-27 13:44:50 +1000 | [diff] [blame] | 374 | pr_info(" * 0x%08lx..0x%08lx : early ioremap\n", |
| 375 | ioremap_bot, IOREMAP_TOP); |
| 376 | pr_info(" * 0x%08lx..0x%08lx : vmalloc & ioremap\n", |
| 377 | VMALLOC_START, VMALLOC_END); |
| 378 | #endif /* CONFIG_PPC32 */ |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 379 | } |
| 380 | |
Dave Carroll | 2773fcc | 2011-06-18 07:36:39 +0000 | [diff] [blame] | 381 | void free_initmem(void) |
| 382 | { |
Dave Carroll | a9c0f41 | 2011-06-18 07:36:40 +0000 | [diff] [blame] | 383 | ppc_md.progress = ppc_printk_progress; |
Jiang Liu | 5d585e5 | 2013-04-29 15:06:47 -0700 | [diff] [blame] | 384 | free_initmem_default(POISON_FREE_INITMEM); |
Dave Carroll | 2773fcc | 2011-06-18 07:36:39 +0000 | [diff] [blame] | 385 | } |
| 386 | |
Benjamin Herrenschmidt | 307cfe7 | 2011-06-09 16:52:38 +1000 | [diff] [blame] | 387 | #ifdef CONFIG_BLK_DEV_INITRD |
| 388 | void __init free_initrd_mem(unsigned long start, unsigned long end) |
| 389 | { |
Jiang Liu | dbe67df | 2013-07-03 15:02:51 -0700 | [diff] [blame] | 390 | free_reserved_area((void *)start, (void *)end, -1, "initrd"); |
Benjamin Herrenschmidt | 307cfe7 | 2011-06-09 16:52:38 +1000 | [diff] [blame] | 391 | } |
| 392 | #endif |
| 393 | |
Paul Mackerras | 7c8c6b9 | 2005-10-06 12:23:33 +1000 | [diff] [blame] | 394 | /* |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 395 | * This is called when a page has been modified by the kernel. |
| 396 | * It just marks the page as not i-cache clean. We do the i-cache |
| 397 | * flush later when the page is given to a user process, if necessary. |
| 398 | */ |
| 399 | void flush_dcache_page(struct page *page) |
| 400 | { |
| 401 | if (cpu_has_feature(CPU_FTR_COHERENT_ICACHE)) |
| 402 | return; |
| 403 | /* avoid an atomic op if possible */ |
| 404 | if (test_bit(PG_arch_1, &page->flags)) |
| 405 | clear_bit(PG_arch_1, &page->flags); |
| 406 | } |
| 407 | EXPORT_SYMBOL(flush_dcache_page); |
| 408 | |
| 409 | void flush_dcache_icache_page(struct page *page) |
| 410 | { |
David Gibson | 0895ecd | 2009-10-26 19:24:31 +0000 | [diff] [blame] | 411 | #ifdef CONFIG_HUGETLB_PAGE |
| 412 | if (PageCompound(page)) { |
| 413 | flush_dcache_icache_hugepage(page); |
| 414 | return; |
| 415 | } |
| 416 | #endif |
Scott Wood | 2f7d2b7 | 2015-04-15 19:40:23 -0500 | [diff] [blame] | 417 | #if defined(CONFIG_8xx) || defined(CONFIG_PPC64) |
| 418 | /* On 8xx there is no need to kmap since highmem is not supported */ |
| 419 | __flush_dcache_icache(page_address(page)); |
| 420 | #else |
| 421 | if (IS_ENABLED(CONFIG_BOOKE) || sizeof(phys_addr_t) > sizeof(void *)) { |
Cong Wang | 2480b20 | 2011-11-25 23:14:16 +0800 | [diff] [blame] | 422 | void *start = kmap_atomic(page); |
David Gibson | 0895ecd | 2009-10-26 19:24:31 +0000 | [diff] [blame] | 423 | __flush_dcache_icache(start); |
Cong Wang | 2480b20 | 2011-11-25 23:14:16 +0800 | [diff] [blame] | 424 | kunmap_atomic(start); |
Scott Wood | 2f7d2b7 | 2015-04-15 19:40:23 -0500 | [diff] [blame] | 425 | } else { |
| 426 | __flush_dcache_icache_phys(page_to_pfn(page) << PAGE_SHIFT); |
David Gibson | 0895ecd | 2009-10-26 19:24:31 +0000 | [diff] [blame] | 427 | } |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 428 | #endif |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 429 | } |
Alexander Graf | 249ba1e | 2012-08-03 13:56:33 +0200 | [diff] [blame] | 430 | EXPORT_SYMBOL(flush_dcache_icache_page); |
David Gibson | 0895ecd | 2009-10-26 19:24:31 +0000 | [diff] [blame] | 431 | |
/*
 * Zero the page mapped at kernel address @page and mark its struct page
 * @pg as not i-cache clean.  @vaddr is not used.
 *
 * We shouldn't have to do the second step, but some versions of glibc
 * require it (ld.so assumes zero filled pages are icache clean)
 * - Anton
 */
void clear_user_page(void *page, unsigned long vaddr, struct page *pg)
{
	clear_page(page);
	flush_dcache_page(pg);
}
| 443 | EXPORT_SYMBOL(clear_user_page); |
| 444 | |
/*
 * Copy one page from @vfrom to @vto and mark the destination's struct
 * page @pg as not i-cache clean.  @vaddr is not used.
 */
void copy_user_page(void *vto, void *vfrom, unsigned long vaddr,
		    struct page *pg)
{
	copy_page(vto, vfrom);

	/*
	 * We should be able to skip the flush for anonymous, non-executable
	 * mappings (the disabled check below), however there are two
	 * problems.
	 * Firstly a bug in some versions of binutils meant PLT sections
	 * were not marked executable.
	 * Secondly the first word in the GOT section is blrl, used
	 * to establish the GOT address. Until recently the GOT was
	 * not marked executable.
	 * - Anton
	 */
#if 0
	if (!vma->vm_file && ((vma->vm_flags & VM_EXEC) == 0))
		return;
#endif

	flush_dcache_page(pg);
}
| 467 | |
| 468 | void flush_icache_user_range(struct vm_area_struct *vma, struct page *page, |
| 469 | unsigned long addr, int len) |
| 470 | { |
| 471 | unsigned long maddr; |
| 472 | |
| 473 | maddr = (unsigned long) kmap(page) + (addr & ~PAGE_MASK); |
| 474 | flush_icache_range(maddr, maddr + len); |
| 475 | kunmap(page); |
| 476 | } |
| 477 | EXPORT_SYMBOL(flush_icache_user_range); |
| 478 | |
| 479 | /* |
| 480 | * This is called at the end of handling a user page fault, when the |
| 481 | * fault has been handled by updating a PTE in the linux page tables. |
| 482 | * We use it to preload an HPTE into the hash table corresponding to |
| 483 | * the updated linux PTE. |
| 484 | * |
Hugh Dickins | 01edcd8 | 2005-11-23 13:37:39 -0800 | [diff] [blame] | 485 | * This must always be called with the pte lock held. |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 486 | */ |
| 487 | void update_mmu_cache(struct vm_area_struct *vma, unsigned long address, |
Russell King | 4b3073e | 2009-12-18 16:40:18 +0000 | [diff] [blame] | 488 | pte_t *ptep) |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 489 | { |
Benjamin Herrenschmidt | 3c726f8 | 2005-11-07 11:06:55 +1100 | [diff] [blame] | 490 | #ifdef CONFIG_PPC_STD_MMU |
Aneesh Kumar K.V | 0ac52dd | 2013-06-20 14:30:22 +0530 | [diff] [blame] | 491 | /* |
| 492 | * We don't need to worry about _PAGE_PRESENT here because we are |
| 493 | * called with either mm->page_table_lock held or ptl lock held |
| 494 | */ |
Benjamin Herrenschmidt | 3c726f8 | 2005-11-07 11:06:55 +1100 | [diff] [blame] | 495 | unsigned long access = 0, trap; |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 496 | |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 497 | /* We only want HPTEs for linux PTEs that have _PAGE_ACCESSED set */ |
Russell King | 4b3073e | 2009-12-18 16:40:18 +0000 | [diff] [blame] | 498 | if (!pte_young(*ptep) || address >= TASK_SIZE) |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 499 | return; |
Benjamin Herrenschmidt | 3c726f8 | 2005-11-07 11:06:55 +1100 | [diff] [blame] | 500 | |
| 501 | /* We try to figure out if we are coming from an instruction |
| 502 | * access fault and pass that down to __hash_page so we avoid |
| 503 | * double-faulting on execution of fresh text. We have to test |
| 504 | * for regs NULL since init will get here first thing at boot |
| 505 | * |
| 506 | * We also avoid filling the hash if not coming from a fault |
| 507 | */ |
| 508 | if (current->thread.regs == NULL) |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 509 | return; |
Benjamin Herrenschmidt | 3c726f8 | 2005-11-07 11:06:55 +1100 | [diff] [blame] | 510 | trap = TRAP(current->thread.regs); |
| 511 | if (trap == 0x400) |
| 512 | access |= _PAGE_EXEC; |
| 513 | else if (trap != 0x300) |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 514 | return; |
Benjamin Herrenschmidt | 3c726f8 | 2005-11-07 11:06:55 +1100 | [diff] [blame] | 515 | hash_preload(vma->vm_mm, address, access, trap); |
| 516 | #endif /* CONFIG_PPC_STD_MMU */ |
Becky Bruce | 41151e7 | 2011-06-28 09:54:48 +0000 | [diff] [blame] | 517 | #if (defined(CONFIG_PPC_BOOK3E_64) || defined(CONFIG_PPC_FSL_BOOK3E)) \ |
| 518 | && defined(CONFIG_HUGETLB_PAGE) |
| 519 | if (is_vm_hugetlb_page(vma)) |
Becky Bruce | d93e4d7 | 2011-11-28 14:43:33 +0000 | [diff] [blame] | 520 | book3e_hugetlb_preload(vma, address, *ptep); |
Becky Bruce | 41151e7 | 2011-06-28 09:54:48 +0000 | [diff] [blame] | 521 | #endif |
Paul Mackerras | 14cf11a | 2005-09-26 16:04:21 +1000 | [diff] [blame] | 522 | } |
Anton Blanchard | c40dd2f | 2011-11-02 14:56:12 +0000 | [diff] [blame] | 523 | |
| 524 | /* |
| 525 | * System memory should not be in /proc/iomem but various tools expect it |
| 526 | * (eg kdump). |
| 527 | */ |
Geert Uytterhoeven | 4f77092 | 2013-09-15 11:39:36 +0200 | [diff] [blame] | 528 | static int __init add_system_ram_resources(void) |
Anton Blanchard | c40dd2f | 2011-11-02 14:56:12 +0000 | [diff] [blame] | 529 | { |
| 530 | struct memblock_region *reg; |
| 531 | |
| 532 | for_each_memblock(memory, reg) { |
| 533 | struct resource *res; |
| 534 | unsigned long base = reg->base; |
| 535 | unsigned long size = reg->size; |
| 536 | |
| 537 | res = kzalloc(sizeof(struct resource), GFP_KERNEL); |
| 538 | WARN_ON(!res); |
| 539 | |
| 540 | if (res) { |
| 541 | res->name = "System RAM"; |
| 542 | res->start = base; |
| 543 | res->end = base + size - 1; |
Nathan Fontenot | f748eda | 2013-08-19 21:52:20 -0500 | [diff] [blame] | 544 | res->flags = IORESOURCE_MEM | IORESOURCE_BUSY; |
Anton Blanchard | c40dd2f | 2011-11-02 14:56:12 +0000 | [diff] [blame] | 545 | WARN_ON(request_resource(&iomem_resource, res) < 0); |
| 546 | } |
| 547 | } |
| 548 | |
| 549 | return 0; |
| 550 | } |
| 551 | subsys_initcall(add_system_ram_resources); |
sukadev@linux.vnet.ibm.com | 1d54cf2 | 2011-08-30 09:19:17 +0000 | [diff] [blame] | 552 | |
| 553 | #ifdef CONFIG_STRICT_DEVMEM |
/*
 * devmem_is_allowed(): check to see if /dev/mem access to a certain address
 * is valid. The argument is a physical page number.
 *
 * Access has to be given to non-kernel-ram areas as well, these contain the
 * PCI mmio resources as well as potential bios/acpi data regions.
 *
 * Returns 0 (denied) for exclusive iomem regions and for RAM pages,
 * except RAM pages that belong to the RTAS user buffer; returns 1
 * (allowed) otherwise.
 */
int devmem_is_allowed(unsigned long pfn)
{
	if (iomem_is_exclusive(PFN_PHYS(pfn)))
		return 0;

	return !page_is_ram(pfn) || page_is_rtas_user_buf(pfn);
}
| 571 | #endif /* CONFIG_STRICT_DEVMEM */ |