blob: d1b867101e5f01e74d296e52cdbd0d4801dd43e5 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * Re-map IO memory to kernel address space so that we can access it.
3 * This is needed for high PCI addresses that aren't mapped in the
4 * 640k-1MB IO memory area on PC's
5 *
6 * (C) Copyright 1995 1996 Linus Torvalds
7 */
8
Thomas Gleixnere9332ca2008-01-30 13:34:05 +01009#include <linux/bootmem.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070010#include <linux/init.h>
Haavard Skinnemoena148ecf2006-09-30 23:29:17 -070011#include <linux/io.h>
Thomas Gleixner3cbd09e2008-01-30 13:34:05 +010012#include <linux/module.h>
13#include <linux/slab.h>
14#include <linux/vmalloc.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070015
Thomas Gleixner3cbd09e2008-01-30 13:34:05 +010016#include <asm/cacheflush.h>
17#include <asm/e820.h>
18#include <asm/fixmap.h>
19#include <asm/pgtable.h>
20#include <asm/tlbflush.h>
Jeremy Fitzhardingef6df72e2008-01-30 13:34:11 +010021#include <asm/pgalloc.h>
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -070022#include <asm/pat.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023
Thomas Gleixner240d3a72008-01-30 13:34:05 +010024#ifdef CONFIG_X86_64
25
26unsigned long __phys_addr(unsigned long x)
27{
28 if (x >= __START_KERNEL_map)
29 return x - __START_KERNEL_map + phys_base;
30 return x - PAGE_OFFSET;
31}
32EXPORT_SYMBOL(__phys_addr);
33
Thomas Gleixnere3100c82008-02-27 20:57:40 +010034static inline int phys_addr_valid(unsigned long addr)
35{
36 return addr < (1UL << boot_cpu_data.x86_phys_bits);
37}
38
39#else
40
/* Without CONFIG_X86_64 every physical address is accepted. */
static inline int phys_addr_valid(unsigned long addr)
{
	(void)addr;

	return 1;
}
45
Thomas Gleixner240d3a72008-01-30 13:34:05 +010046#endif
47
Thomas Gleixner5f5192b2008-01-30 13:34:06 +010048int page_is_ram(unsigned long pagenr)
49{
Ingo Molnar756a6c62008-03-25 08:31:17 +010050 resource_size_t addr, end;
Thomas Gleixner5f5192b2008-01-30 13:34:06 +010051 int i;
52
Arjan van de Vend8a9e6a2008-02-18 09:54:33 -080053 /*
54 * A special case is the first 4Kb of memory;
55 * This is a BIOS owned area, not kernel ram, but generally
56 * not listed as such in the E820 table.
57 */
58 if (pagenr == 0)
59 return 0;
60
Arjan van de Ven156fbc32008-02-18 09:58:45 -080061 /*
62 * Second special case: Some BIOSen report the PC BIOS
63 * area (640->1Mb) as ram even though it is not.
64 */
65 if (pagenr >= (BIOS_BEGIN >> PAGE_SHIFT) &&
66 pagenr < (BIOS_END >> PAGE_SHIFT))
67 return 0;
Arjan van de Vend8a9e6a2008-02-18 09:54:33 -080068
Thomas Gleixner5f5192b2008-01-30 13:34:06 +010069 for (i = 0; i < e820.nr_map; i++) {
70 /*
71 * Not usable memory:
72 */
73 if (e820.map[i].type != E820_RAM)
74 continue;
Thomas Gleixner5f5192b2008-01-30 13:34:06 +010075 addr = (e820.map[i].addr + PAGE_SIZE-1) >> PAGE_SHIFT;
76 end = (e820.map[i].addr + e820.map[i].size) >> PAGE_SHIFT;
Thomas Gleixner950f9d92008-01-30 13:34:06 +010077
Thomas Gleixner950f9d92008-01-30 13:34:06 +010078
Thomas Gleixner5f5192b2008-01-30 13:34:06 +010079 if ((pagenr >= addr) && (pagenr < end))
80 return 1;
81 }
82 return 0;
83}
84
Linus Torvalds1da177e2005-04-16 15:20:36 -070085/*
Thomas Gleixnere9332ca2008-01-30 13:34:05 +010086 * Fix up the linear direct mapping of the kernel to avoid cache attribute
87 * conflicts.
88 */
venkatesh.pallipadi@intel.com3a96ce82008-03-18 17:00:16 -070089int ioremap_change_attr(unsigned long vaddr, unsigned long size,
90 unsigned long prot_val)
Thomas Gleixnere9332ca2008-01-30 13:34:05 +010091{
Thomas Gleixnerd806e5e2008-01-30 13:34:06 +010092 unsigned long nrpages = size >> PAGE_SHIFT;
Harvey Harrison93809be2008-02-01 17:49:43 +010093 int err;
Thomas Gleixnere9332ca2008-01-30 13:34:05 +010094
venkatesh.pallipadi@intel.com3a96ce82008-03-18 17:00:16 -070095 switch (prot_val) {
96 case _PAGE_CACHE_UC:
Thomas Gleixnerd806e5e2008-01-30 13:34:06 +010097 default:
venkatesh.pallipadi@intel.com12193332008-03-18 17:00:18 -070098 err = _set_memory_uc(vaddr, nrpages);
Thomas Gleixnerd806e5e2008-01-30 13:34:06 +010099 break;
venkatesh.pallipadi@intel.comb310f381d2008-03-18 17:00:24 -0700100 case _PAGE_CACHE_WC:
101 err = _set_memory_wc(vaddr, nrpages);
102 break;
venkatesh.pallipadi@intel.com3a96ce82008-03-18 17:00:16 -0700103 case _PAGE_CACHE_WB:
venkatesh.pallipadi@intel.com12193332008-03-18 17:00:18 -0700104 err = _set_memory_wb(vaddr, nrpages);
Thomas Gleixnerd806e5e2008-01-30 13:34:06 +0100105 break;
106 }
Thomas Gleixnere9332ca2008-01-30 13:34:05 +0100107
108 return err;
109}
110
111/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 * Remap an arbitrary physical address space into the kernel virtual
113 * address space. Needed when the kernel wants to access high addresses
114 * directly.
115 *
116 * NOTE! We need to allow non-page-aligned mappings too: we will obviously
117 * have to convert them into an offset in a page-aligned mapping, but the
118 * caller shouldn't need to know that small detail.
119 */
Christoph Lameter23016962008-04-28 02:12:42 -0700120static void __iomem *__ioremap_caller(resource_size_t phys_addr,
121 unsigned long size, unsigned long prot_val, void *caller)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700122{
Ingo Molnar756a6c62008-03-25 08:31:17 +0100123 unsigned long pfn, offset, vaddr;
124 resource_size_t last_addr;
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100125 struct vm_struct *area;
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700126 unsigned long new_prot_val;
Thomas Gleixnerd806e5e2008-01-30 13:34:06 +0100127 pgprot_t prot;
Venki Pallipadidee7cbb2008-03-24 14:39:55 -0700128 int retval;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700129
130 /* Don't allow wraparound or zero size */
131 last_addr = phys_addr + size - 1;
132 if (!size || last_addr < phys_addr)
133 return NULL;
134
Thomas Gleixnere3100c82008-02-27 20:57:40 +0100135 if (!phys_addr_valid(phys_addr)) {
venkatesh.pallipadi@intel.com6997ab42008-03-18 17:00:25 -0700136 printk(KERN_WARNING "ioremap: invalid physical address %llx\n",
Randy Dunlap4c8337a2008-04-10 15:09:50 -0700137 (unsigned long long)phys_addr);
Thomas Gleixnere3100c82008-02-27 20:57:40 +0100138 WARN_ON_ONCE(1);
139 return NULL;
140 }
141
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142 /*
143 * Don't remap the low PCI/ISA area, it's always mapped..
144 */
145 if (phys_addr >= ISA_START_ADDRESS && last_addr < ISA_END_ADDRESS)
Thomas Gleixner4b40fce2008-01-30 13:34:05 +0100146 return (__force void __iomem *)phys_to_virt(phys_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700147
148 /*
149 * Don't allow anybody to remap normal RAM that we're using..
150 */
Andres Salomoncb8ab682008-04-30 11:30:24 -0400151 for (pfn = phys_addr >> PAGE_SHIFT;
152 (pfn << PAGE_SHIFT) < (last_addr & PAGE_MASK);
153 pfn++) {
Ingo Molnarbdd3cee2008-02-28 14:10:49 +0100154
Ingo Molnarba748d22008-03-03 09:37:41 +0100155 int is_ram = page_is_ram(pfn);
156
157 if (is_ram && pfn_valid(pfn) && !PageReserved(pfn_to_page(pfn)))
Thomas Gleixner266b9f82008-01-30 13:34:06 +0100158 return NULL;
Ingo Molnarba748d22008-03-03 09:37:41 +0100159 WARN_ON_ONCE(is_ram);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160 }
161
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700162 /*
163 * Mappings have to be page-aligned
164 */
165 offset = phys_addr & ~PAGE_MASK;
166 phys_addr &= PAGE_MASK;
167 size = PAGE_ALIGN(last_addr+1) - phys_addr;
168
Venki Pallipadidee7cbb2008-03-24 14:39:55 -0700169 retval = reserve_memtype(phys_addr, phys_addr + size,
170 prot_val, &new_prot_val);
171 if (retval) {
Venki Pallipadib450e5e2008-03-25 16:51:26 -0700172 pr_debug("Warning: reserve_memtype returned %d\n", retval);
Venki Pallipadidee7cbb2008-03-24 14:39:55 -0700173 return NULL;
174 }
175
176 if (prot_val != new_prot_val) {
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700177 /*
178 * Do not fallback to certain memory types with certain
179 * requested type:
Suresh Siddhade33c442008-04-25 17:07:22 -0700180 * - request is uc-, return cannot be write-back
181 * - request is uc-, return cannot be write-combine
venkatesh.pallipadi@intel.comb310f381d2008-03-18 17:00:24 -0700182 * - request is write-combine, return cannot be write-back
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700183 */
Suresh Siddhade33c442008-04-25 17:07:22 -0700184 if ((prot_val == _PAGE_CACHE_UC_MINUS &&
venkatesh.pallipadi@intel.comb310f381d2008-03-18 17:00:24 -0700185 (new_prot_val == _PAGE_CACHE_WB ||
186 new_prot_val == _PAGE_CACHE_WC)) ||
187 (prot_val == _PAGE_CACHE_WC &&
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700188 new_prot_val == _PAGE_CACHE_WB)) {
Venki Pallipadib450e5e2008-03-25 16:51:26 -0700189 pr_debug(
venkatesh.pallipadi@intel.com6997ab42008-03-18 17:00:25 -0700190 "ioremap error for 0x%llx-0x%llx, requested 0x%lx, got 0x%lx\n",
Randy Dunlap4c8337a2008-04-10 15:09:50 -0700191 (unsigned long long)phys_addr,
192 (unsigned long long)(phys_addr + size),
venkatesh.pallipadi@intel.com6997ab42008-03-18 17:00:25 -0700193 prot_val, new_prot_val);
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700194 free_memtype(phys_addr, phys_addr + size);
195 return NULL;
196 }
197 prot_val = new_prot_val;
198 }
199
venkatesh.pallipadi@intel.com3a96ce82008-03-18 17:00:16 -0700200 switch (prot_val) {
201 case _PAGE_CACHE_UC:
Thomas Gleixnerd806e5e2008-01-30 13:34:06 +0100202 default:
Ingo Molnar55c62682008-03-26 06:19:45 +0100203 prot = PAGE_KERNEL_NOCACHE;
Thomas Gleixnerd806e5e2008-01-30 13:34:06 +0100204 break;
Suresh Siddhade33c442008-04-25 17:07:22 -0700205 case _PAGE_CACHE_UC_MINUS:
206 prot = PAGE_KERNEL_UC_MINUS;
207 break;
venkatesh.pallipadi@intel.comb310f381d2008-03-18 17:00:24 -0700208 case _PAGE_CACHE_WC:
209 prot = PAGE_KERNEL_WC;
210 break;
venkatesh.pallipadi@intel.com3a96ce82008-03-18 17:00:16 -0700211 case _PAGE_CACHE_WB:
Thomas Gleixnerd806e5e2008-01-30 13:34:06 +0100212 prot = PAGE_KERNEL;
213 break;
214 }
Haavard Skinnemoena148ecf2006-09-30 23:29:17 -0700215
Linus Torvalds1da177e2005-04-16 15:20:36 -0700216 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217 * Ok, go for it..
218 */
Christoph Lameter23016962008-04-28 02:12:42 -0700219 area = get_vm_area_caller(size, VM_IOREMAP, caller);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 if (!area)
221 return NULL;
222 area->phys_addr = phys_addr;
Thomas Gleixnere66aadb2008-02-04 16:48:05 +0100223 vaddr = (unsigned long) area->addr;
224 if (ioremap_page_range(vaddr, vaddr + size, phys_addr, prot)) {
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700225 free_memtype(phys_addr, phys_addr + size);
Ingo Molnarb16bf712008-02-28 14:02:08 +0100226 free_vm_area(area);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 return NULL;
228 }
Thomas Gleixnere9332ca2008-01-30 13:34:05 +0100229
venkatesh.pallipadi@intel.com3a96ce82008-03-18 17:00:16 -0700230 if (ioremap_change_attr(vaddr, size, prot_val) < 0) {
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700231 free_memtype(phys_addr, phys_addr + size);
Thomas Gleixnere66aadb2008-02-04 16:48:05 +0100232 vunmap(area->addr);
Thomas Gleixnere9332ca2008-01-30 13:34:05 +0100233 return NULL;
234 }
235
Thomas Gleixnere66aadb2008-02-04 16:48:05 +0100236 return (void __iomem *) (vaddr + offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700237}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238
239/**
240 * ioremap_nocache - map bus memory into CPU space
241 * @offset: bus address of the memory
242 * @size: size of the resource to map
243 *
244 * ioremap_nocache performs a platform specific sequence of operations to
245 * make bus memory CPU accessible via the readb/readw/readl/writeb/
246 * writew/writel functions and the other mmio helpers. The returned
247 * address is not guaranteed to be usable directly as a virtual
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100248 * address.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 *
250 * This version of ioremap ensures that the memory is marked uncachable
251 * on the CPU as well as honouring existing caching rules from things like
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100252 * the PCI bus. Note that there are other caches and buffers on many
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253 * busses. In particular driver authors should read up on PCI writes
254 *
255 * It's useful if some control registers are in such an area and
256 * write combining or read caching is not desirable:
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100257 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258 * Must be freed with iounmap.
259 */
Linus Torvaldsb9e76a02008-03-24 11:22:39 -0700260void __iomem *ioremap_nocache(resource_size_t phys_addr, unsigned long size)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261{
Suresh Siddhade33c442008-04-25 17:07:22 -0700262 /*
263 * Ideally, this should be:
264 * pat_wc_enabled ? _PAGE_CACHE_UC : _PAGE_CACHE_UC_MINUS;
265 *
266 * Till we fix all X drivers to use ioremap_wc(), we will use
267 * UC MINUS.
268 */
269 unsigned long val = _PAGE_CACHE_UC_MINUS;
270
271 return __ioremap_caller(phys_addr, size, val,
Christoph Lameter23016962008-04-28 02:12:42 -0700272 __builtin_return_address(0));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273}
Alexey Dobriyan129f6942005-06-23 00:08:33 -0700274EXPORT_SYMBOL(ioremap_nocache);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275
venkatesh.pallipadi@intel.comb310f381d2008-03-18 17:00:24 -0700276/**
277 * ioremap_wc - map memory into CPU space write combined
278 * @offset: bus address of the memory
279 * @size: size of the resource to map
280 *
281 * This version of ioremap ensures that the memory is marked write combining.
282 * Write combining allows faster writes to some hardware devices.
283 *
284 * Must be freed with iounmap.
285 */
286void __iomem *ioremap_wc(unsigned long phys_addr, unsigned long size)
287{
288 if (pat_wc_enabled)
Christoph Lameter23016962008-04-28 02:12:42 -0700289 return __ioremap_caller(phys_addr, size, _PAGE_CACHE_WC,
290 __builtin_return_address(0));
venkatesh.pallipadi@intel.comb310f381d2008-03-18 17:00:24 -0700291 else
292 return ioremap_nocache(phys_addr, size);
293}
294EXPORT_SYMBOL(ioremap_wc);
295
Linus Torvaldsb9e76a02008-03-24 11:22:39 -0700296void __iomem *ioremap_cache(resource_size_t phys_addr, unsigned long size)
Thomas Gleixner5f868152008-01-30 13:34:06 +0100297{
Christoph Lameter23016962008-04-28 02:12:42 -0700298 return __ioremap_caller(phys_addr, size, _PAGE_CACHE_WB,
299 __builtin_return_address(0));
Thomas Gleixner5f868152008-01-30 13:34:06 +0100300}
301EXPORT_SYMBOL(ioremap_cache);
302
Venkatesh Pallipadia361ee52008-07-10 10:09:59 +0200303static void __iomem *ioremap_default(resource_size_t phys_addr,
304 unsigned long size)
305{
306 unsigned long flags;
307 void *ret;
308 int err;
309
310 /*
311 * - WB for WB-able memory and no other conflicting mappings
312 * - UC_MINUS for non-WB-able memory with no other conflicting mappings
313 * - Inherit from confliting mappings otherwise
314 */
315 err = reserve_memtype(phys_addr, phys_addr + size, -1, &flags);
316 if (err < 0)
317 return NULL;
318
319 ret = (void *) __ioremap_caller(phys_addr, size, flags,
320 __builtin_return_address(0));
321
322 free_memtype(phys_addr, phys_addr + size);
323 return (void __iomem *)ret;
324}
325
Andi Kleenbf5421c2005-12-12 22:17:09 -0800326/**
327 * iounmap - Free a IO remapping
328 * @addr: virtual address from ioremap_*
329 *
330 * Caller must ensure there is only one unmapping for the same pointer.
331 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332void iounmap(volatile void __iomem *addr)
333{
Andi Kleenbf5421c2005-12-12 22:17:09 -0800334 struct vm_struct *p, *o;
Andrew Mortonc23a4e962005-07-07 17:56:02 -0700335
336 if ((void __force *)addr <= high_memory)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337 return;
338
339 /*
340 * __ioremap special-cases the PCI/ISA range by not instantiating a
341 * vm_area and by simply returning an address into the kernel mapping
342 * of ISA space. So handle that here.
343 */
344 if (addr >= phys_to_virt(ISA_START_ADDRESS) &&
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100345 addr < phys_to_virt(ISA_END_ADDRESS))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346 return;
347
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100348 addr = (volatile void __iomem *)
349 (PAGE_MASK & (unsigned long __force)addr);
Andi Kleenbf5421c2005-12-12 22:17:09 -0800350
351 /* Use the vm area unlocked, assuming the caller
352 ensures there isn't another iounmap for the same address
353 in parallel. Reuse of the virtual address is prevented by
354 leaving it in the global lists until we're done with it.
355 cpa takes care of the direct mappings. */
356 read_lock(&vmlist_lock);
357 for (p = vmlist; p; p = p->next) {
358 if (p->addr == addr)
359 break;
360 }
361 read_unlock(&vmlist_lock);
362
363 if (!p) {
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100364 printk(KERN_ERR "iounmap: bad address %p\n", addr);
Andrew Mortonc23a4e962005-07-07 17:56:02 -0700365 dump_stack();
Andi Kleenbf5421c2005-12-12 22:17:09 -0800366 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367 }
368
venkatesh.pallipadi@intel.comd7677d42008-03-18 17:00:17 -0700369 free_memtype(p->phys_addr, p->phys_addr + get_vm_area_size(p));
370
Andi Kleenbf5421c2005-12-12 22:17:09 -0800371 /* Finally remove it */
372 o = remove_vm_area((void *)addr);
373 BUG_ON(p != o || o == NULL);
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100374 kfree(p);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700375}
Alexey Dobriyan129f6942005-06-23 00:08:33 -0700376EXPORT_SYMBOL(iounmap);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700377
venkatesh.pallipadi@intel.come045fb22008-03-18 17:00:15 -0700378/*
379 * Convert a physical pointer to a virtual kernel pointer for /dev/mem
380 * access
381 */
382void *xlate_dev_mem_ptr(unsigned long phys)
383{
384 void *addr;
385 unsigned long start = phys & PAGE_MASK;
386
387 /* If page is RAM, we can use __va. Otherwise ioremap and unmap. */
388 if (page_is_ram(start >> PAGE_SHIFT))
389 return __va(phys);
390
Venkatesh Pallipadia361ee52008-07-10 10:09:59 +0200391 addr = (void *)ioremap_default(start, PAGE_SIZE);
venkatesh.pallipadi@intel.come045fb22008-03-18 17:00:15 -0700392 if (addr)
393 addr = (void *)((unsigned long)addr | (phys & ~PAGE_MASK));
394
395 return addr;
396}
397
398void unxlate_dev_mem_ptr(unsigned long phys, void *addr)
399{
400 if (page_is_ram(phys >> PAGE_SHIFT))
401 return;
402
403 iounmap((void __iomem *)((unsigned long)addr & PAGE_MASK));
404 return;
405}
406
Thomas Gleixner240d3a72008-01-30 13:34:05 +0100407#ifdef CONFIG_X86_32
Ingo Molnard18d6d62008-01-30 13:33:45 +0100408
409int __initdata early_ioremap_debug;
410
411static int __init early_ioremap_debug_setup(char *str)
412{
413 early_ioremap_debug = 1;
414
Huang, Ying793b24a2008-01-30 13:33:45 +0100415 return 0;
Ingo Molnard18d6d62008-01-30 13:33:45 +0100416}
Huang, Ying793b24a2008-01-30 13:33:45 +0100417early_param("early_ioremap_debug", early_ioremap_debug_setup);
Ingo Molnard18d6d62008-01-30 13:33:45 +0100418
Huang, Ying0947b2f2008-01-30 13:33:44 +0100419static __initdata int after_paging_init;
Ian Campbellc92a7a52008-02-17 19:09:42 +0000420static pte_t bm_pte[PAGE_SIZE/sizeof(pte_t)]
421 __section(.bss.page_aligned);
Huang, Ying0947b2f2008-01-30 13:33:44 +0100422
Ian Campbell551889a62008-02-09 23:24:09 +0100423static inline pmd_t * __init early_ioremap_pmd(unsigned long addr)
Huang, Ying0947b2f2008-01-30 13:33:44 +0100424{
Jeremy Fitzhardinge37cc8d72008-02-13 16:20:35 +0100425 /* Don't assume we're using swapper_pg_dir at this point */
426 pgd_t *base = __va(read_cr3());
427 pgd_t *pgd = &base[pgd_index(addr)];
Ian Campbell551889a62008-02-09 23:24:09 +0100428 pud_t *pud = pud_offset(pgd, addr);
429 pmd_t *pmd = pmd_offset(pud, addr);
430
431 return pmd;
Huang, Ying0947b2f2008-01-30 13:33:44 +0100432}
433
Ian Campbell551889a62008-02-09 23:24:09 +0100434static inline pte_t * __init early_ioremap_pte(unsigned long addr)
Huang, Ying0947b2f2008-01-30 13:33:44 +0100435{
Ian Campbell551889a62008-02-09 23:24:09 +0100436 return &bm_pte[pte_index(addr)];
Huang, Ying0947b2f2008-01-30 13:33:44 +0100437}
438
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100439void __init early_ioremap_init(void)
Huang, Ying0947b2f2008-01-30 13:33:44 +0100440{
Ian Campbell551889a62008-02-09 23:24:09 +0100441 pmd_t *pmd;
Huang, Ying0947b2f2008-01-30 13:33:44 +0100442
Ingo Molnard18d6d62008-01-30 13:33:45 +0100443 if (early_ioremap_debug)
Ingo Molnaradafdf62008-01-30 13:34:08 +0100444 printk(KERN_INFO "early_ioremap_init()\n");
Ingo Molnard18d6d62008-01-30 13:33:45 +0100445
Ian Campbell551889a62008-02-09 23:24:09 +0100446 pmd = early_ioremap_pmd(fix_to_virt(FIX_BTMAP_BEGIN));
Huang, Ying0947b2f2008-01-30 13:33:44 +0100447 memset(bm_pte, 0, sizeof(bm_pte));
Ian Campbellb6fbb662008-02-09 23:24:09 +0100448 pmd_populate_kernel(&init_mm, pmd, bm_pte);
Ian Campbell551889a62008-02-09 23:24:09 +0100449
Ingo Molnar0e3a9542008-01-30 13:33:49 +0100450 /*
Ian Campbell551889a62008-02-09 23:24:09 +0100451 * The boot-ioremap range spans multiple pmds, for which
Ingo Molnar0e3a9542008-01-30 13:33:49 +0100452 * we are not prepared:
453 */
Ian Campbell551889a62008-02-09 23:24:09 +0100454 if (pmd != early_ioremap_pmd(fix_to_virt(FIX_BTMAP_END))) {
Ingo Molnar0e3a9542008-01-30 13:33:49 +0100455 WARN_ON(1);
Ian Campbell551889a62008-02-09 23:24:09 +0100456 printk(KERN_WARNING "pmd %p != %p\n",
457 pmd, early_ioremap_pmd(fix_to_virt(FIX_BTMAP_END)));
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100458 printk(KERN_WARNING "fix_to_virt(FIX_BTMAP_BEGIN): %08lx\n",
Ian Campbell551889a62008-02-09 23:24:09 +0100459 fix_to_virt(FIX_BTMAP_BEGIN));
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100460 printk(KERN_WARNING "fix_to_virt(FIX_BTMAP_END): %08lx\n",
Ian Campbell551889a62008-02-09 23:24:09 +0100461 fix_to_virt(FIX_BTMAP_END));
Ingo Molnar0e3a9542008-01-30 13:33:49 +0100462
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100463 printk(KERN_WARNING "FIX_BTMAP_END: %d\n", FIX_BTMAP_END);
464 printk(KERN_WARNING "FIX_BTMAP_BEGIN: %d\n",
465 FIX_BTMAP_BEGIN);
Ingo Molnar0e3a9542008-01-30 13:33:49 +0100466 }
Huang, Ying0947b2f2008-01-30 13:33:44 +0100467}
468
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100469void __init early_ioremap_clear(void)
Huang, Ying0947b2f2008-01-30 13:33:44 +0100470{
Ian Campbell551889a62008-02-09 23:24:09 +0100471 pmd_t *pmd;
Huang, Ying0947b2f2008-01-30 13:33:44 +0100472
Ingo Molnard18d6d62008-01-30 13:33:45 +0100473 if (early_ioremap_debug)
Ingo Molnaradafdf62008-01-30 13:34:08 +0100474 printk(KERN_INFO "early_ioremap_clear()\n");
Ingo Molnard18d6d62008-01-30 13:33:45 +0100475
Ian Campbell551889a62008-02-09 23:24:09 +0100476 pmd = early_ioremap_pmd(fix_to_virt(FIX_BTMAP_BEGIN));
477 pmd_clear(pmd);
Jeremy Fitzhardinge6944a9c2008-03-17 16:37:01 -0700478 paravirt_release_pte(__pa(bm_pte) >> PAGE_SHIFT);
Huang, Ying0947b2f2008-01-30 13:33:44 +0100479 __flush_tlb_all();
480}
481
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100482void __init early_ioremap_reset(void)
Huang, Ying0947b2f2008-01-30 13:33:44 +0100483{
484 enum fixed_addresses idx;
Ian Campbell551889a62008-02-09 23:24:09 +0100485 unsigned long addr, phys;
486 pte_t *pte;
Huang, Ying0947b2f2008-01-30 13:33:44 +0100487
488 after_paging_init = 1;
Huang, Ying64a8f852008-01-30 13:33:44 +0100489 for (idx = FIX_BTMAP_BEGIN; idx >= FIX_BTMAP_END; idx--) {
Huang, Ying0947b2f2008-01-30 13:33:44 +0100490 addr = fix_to_virt(idx);
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100491 pte = early_ioremap_pte(addr);
Ian Campbell551889a62008-02-09 23:24:09 +0100492 if (pte_present(*pte)) {
493 phys = pte_val(*pte) & PAGE_MASK;
Huang, Ying0947b2f2008-01-30 13:33:44 +0100494 set_fixmap(idx, phys);
495 }
496 }
497}
498
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100499static void __init __early_set_fixmap(enum fixed_addresses idx,
Huang, Ying0947b2f2008-01-30 13:33:44 +0100500 unsigned long phys, pgprot_t flags)
501{
Ian Campbell551889a62008-02-09 23:24:09 +0100502 unsigned long addr = __fix_to_virt(idx);
503 pte_t *pte;
Huang, Ying0947b2f2008-01-30 13:33:44 +0100504
505 if (idx >= __end_of_fixed_addresses) {
506 BUG();
507 return;
508 }
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100509 pte = early_ioremap_pte(addr);
Huang, Ying0947b2f2008-01-30 13:33:44 +0100510 if (pgprot_val(flags))
Ian Campbell551889a62008-02-09 23:24:09 +0100511 set_pte(pte, pfn_pte(phys >> PAGE_SHIFT, flags));
Huang, Ying0947b2f2008-01-30 13:33:44 +0100512 else
Ian Campbell551889a62008-02-09 23:24:09 +0100513 pte_clear(NULL, addr, pte);
Huang, Ying0947b2f2008-01-30 13:33:44 +0100514 __flush_tlb_one(addr);
515}
516
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100517static inline void __init early_set_fixmap(enum fixed_addresses idx,
Huang, Ying0947b2f2008-01-30 13:33:44 +0100518 unsigned long phys)
519{
520 if (after_paging_init)
521 set_fixmap(idx, phys);
522 else
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100523 __early_set_fixmap(idx, phys, PAGE_KERNEL);
Huang, Ying0947b2f2008-01-30 13:33:44 +0100524}
525
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100526static inline void __init early_clear_fixmap(enum fixed_addresses idx)
Huang, Ying0947b2f2008-01-30 13:33:44 +0100527{
528 if (after_paging_init)
529 clear_fixmap(idx);
530 else
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100531 __early_set_fixmap(idx, 0, __pgprot(0));
Huang, Ying0947b2f2008-01-30 13:33:44 +0100532}
533
Ingo Molnar1b42f512008-01-30 13:33:45 +0100534
535int __initdata early_ioremap_nested;
536
Ingo Molnard690b2a2008-01-30 13:33:47 +0100537static int __init check_early_ioremap_leak(void)
538{
539 if (!early_ioremap_nested)
540 return 0;
541
542 printk(KERN_WARNING
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100543 "Debug warning: early ioremap leak of %d areas detected.\n",
544 early_ioremap_nested);
Ingo Molnard690b2a2008-01-30 13:33:47 +0100545 printk(KERN_WARNING
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100546 "please boot with early_ioremap_debug and report the dmesg.\n");
Ingo Molnard690b2a2008-01-30 13:33:47 +0100547 WARN_ON(1);
548
549 return 1;
550}
551late_initcall(check_early_ioremap_leak);
552
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100553void __init *early_ioremap(unsigned long phys_addr, unsigned long size)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700554{
555 unsigned long offset, last_addr;
Ingo Molnar1b42f512008-01-30 13:33:45 +0100556 unsigned int nrpages, nesting;
557 enum fixed_addresses idx0, idx;
558
559 WARN_ON(system_state != SYSTEM_BOOTING);
560
561 nesting = early_ioremap_nested;
Ingo Molnard18d6d62008-01-30 13:33:45 +0100562 if (early_ioremap_debug) {
Ingo Molnaradafdf62008-01-30 13:34:08 +0100563 printk(KERN_INFO "early_ioremap(%08lx, %08lx) [%d] => ",
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100564 phys_addr, size, nesting);
Ingo Molnard18d6d62008-01-30 13:33:45 +0100565 dump_stack();
566 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700567
568 /* Don't allow wraparound or zero size */
569 last_addr = phys_addr + size - 1;
Ingo Molnarbd796ed2008-01-30 13:33:45 +0100570 if (!size || last_addr < phys_addr) {
571 WARN_ON(1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700572 return NULL;
Ingo Molnarbd796ed2008-01-30 13:33:45 +0100573 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700574
Ingo Molnarbd796ed2008-01-30 13:33:45 +0100575 if (nesting >= FIX_BTMAPS_NESTING) {
576 WARN_ON(1);
Ingo Molnar1b42f512008-01-30 13:33:45 +0100577 return NULL;
Ingo Molnarbd796ed2008-01-30 13:33:45 +0100578 }
Ingo Molnar1b42f512008-01-30 13:33:45 +0100579 early_ioremap_nested++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580 /*
581 * Mappings have to be page-aligned
582 */
583 offset = phys_addr & ~PAGE_MASK;
584 phys_addr &= PAGE_MASK;
585 size = PAGE_ALIGN(last_addr) - phys_addr;
586
587 /*
588 * Mappings have to fit in the FIX_BTMAP area.
589 */
590 nrpages = size >> PAGE_SHIFT;
Ingo Molnarbd796ed2008-01-30 13:33:45 +0100591 if (nrpages > NR_FIX_BTMAPS) {
592 WARN_ON(1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593 return NULL;
Ingo Molnarbd796ed2008-01-30 13:33:45 +0100594 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595
596 /*
597 * Ok, go for it..
598 */
Ingo Molnar1b42f512008-01-30 13:33:45 +0100599 idx0 = FIX_BTMAP_BEGIN - NR_FIX_BTMAPS*nesting;
600 idx = idx0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601 while (nrpages > 0) {
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100602 early_set_fixmap(idx, phys_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700603 phys_addr += PAGE_SIZE;
604 --idx;
605 --nrpages;
606 }
Ingo Molnard18d6d62008-01-30 13:33:45 +0100607 if (early_ioremap_debug)
608 printk(KERN_CONT "%08lx + %08lx\n", offset, fix_to_virt(idx0));
Ingo Molnar1b42f512008-01-30 13:33:45 +0100609
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100610 return (void *) (offset + fix_to_virt(idx0));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700611}
612
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100613void __init early_iounmap(void *addr, unsigned long size)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700614{
615 unsigned long virt_addr;
616 unsigned long offset;
617 unsigned int nrpages;
618 enum fixed_addresses idx;
Ingo Molnar226e9a92008-05-27 09:56:49 +0200619 int nesting;
Ingo Molnar1b42f512008-01-30 13:33:45 +0100620
621 nesting = --early_ioremap_nested;
Ingo Molnar226e9a92008-05-27 09:56:49 +0200622 if (WARN_ON(nesting < 0))
623 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700624
Ingo Molnard18d6d62008-01-30 13:33:45 +0100625 if (early_ioremap_debug) {
Ingo Molnaradafdf62008-01-30 13:34:08 +0100626 printk(KERN_INFO "early_iounmap(%p, %08lx) [%d]\n", addr,
Thomas Gleixner91eebf42008-01-30 13:34:05 +0100627 size, nesting);
Ingo Molnard18d6d62008-01-30 13:33:45 +0100628 dump_stack();
629 }
630
Linus Torvalds1da177e2005-04-16 15:20:36 -0700631 virt_addr = (unsigned long)addr;
Ingo Molnarbd796ed2008-01-30 13:33:45 +0100632 if (virt_addr < fix_to_virt(FIX_BTMAP_BEGIN)) {
633 WARN_ON(1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634 return;
Ingo Molnarbd796ed2008-01-30 13:33:45 +0100635 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700636 offset = virt_addr & ~PAGE_MASK;
637 nrpages = PAGE_ALIGN(offset + size - 1) >> PAGE_SHIFT;
638
Ingo Molnar1b42f512008-01-30 13:33:45 +0100639 idx = FIX_BTMAP_BEGIN - NR_FIX_BTMAPS*nesting;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700640 while (nrpages > 0) {
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100641 early_clear_fixmap(idx);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700642 --idx;
643 --nrpages;
644 }
645}
Ingo Molnar1b42f512008-01-30 13:33:45 +0100646
/*
 * Emits a warning and does nothing else.
 * NOTE(review): presumably the out-of-line target of the fixmap index
 * checks in <asm/fixmap.h> - confirm against that header.
 */
void __this_fixmap_does_not_exist(void)
{
	WARN_ON(1);
}
Thomas Gleixner240d3a72008-01-30 13:34:05 +0100651
652#endif /* CONFIG_X86_32 */