Blame - include/asm-generic/tlb.h - SHIFTPHONES/kernel/shift/mainline

blob: 256c9de71fdba7b0558e21df43935db73c6ebe8a [file] [log] [blame]

Uwe Zeisberger	f30c226	2006-10-03 23:01:26 +0200	[diff] [blame]	1	/* include/asm-generic/tlb.h
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2	*
				3	* Generic TLB shootdown code
				4	*
				5	* Copyright 2001 Red Hat, Inc.
				6	* Based on code from mm/memory.c Copyright Linus Torvalds and others.
				7	*
Peter Zijlstra	90eec10	2015-11-16 11:08:45 +0100	[diff] [blame]	8	* Copyright 2011 Red Hat, Inc., Peter Zijlstra
Peter Zijlstra	d16dfc5	2011-05-24 17:11:45 -0700	[diff] [blame]	9	*
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	10	* This program is free software; you can redistribute it and/or
				11	* modify it under the terms of the GNU General Public License
				12	* as published by the Free Software Foundation; either version
				13	* 2 of the License, or (at your option) any later version.
				14	*/
				15	#ifndef _ASM_GENERIC__TLB_H
				16	#define _ASM_GENERIC__TLB_H
				17
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	18	#include <linux/swap.h>
Ingo Molnar	62152d0	2008-01-31 22:05:48 +0100	[diff] [blame]	19	#include <asm/pgalloc.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	20	#include <asm/tlbflush.h>
				21
Peter Zijlstra	2672391	2011-05-24 17:12:00 -0700	[diff] [blame]	22	#ifdef CONFIG_HAVE_RCU_TABLE_FREE
				23	/*
				24	* Semi RCU freeing of the page directories.
				25	*
				26	* This is needed by some architectures to implement software pagetable walkers.
				27	*
				28	* gup_fast() and other software pagetable walkers do a lockless page-table
				29	* walk and therefore need some synchronization with the freeing of the page
				30	* directories. The chosen means to accomplish that is by disabling IRQs over
				31	* the walk.
				32	*
				33	* Architectures that use IPIs to flush TLBs will then automagically DTRT,
				34	* since we unlink the page, flush TLBs, free the page. Since the disabling of
				35	* IRQs delays the completion of the TLB flush we can never observe an already
				36	* freed page.
				37	*
				38	* Architectures that do not have this (PPC) need to delay the freeing by some
				39	* other means, this is that means.
				40	*
				41	* What we do is batch the freed directory pages (tables) and RCU free them.
				42	* We use the sched RCU variant, as that guarantees that IRQ/preempt disabling
				43	* holds off grace periods.
				44	*
				45	* However, in order to batch these pages we need to allocate storage, this
				46	* allocation is deep inside the MM code and can thus easily fail on memory
				47	* pressure. To guarantee progress we fall back to single table freeing, see
				48	* the implementation of tlb_remove_table_one().
				49	*
				50	*/
				51	struct mmu_table_batch {
				52	struct rcu_head rcu;
				53	unsigned int nr;
				54	void *tables[0];
				55	};
				56
				57	#define MAX_TABLE_BATCH \
				58	((PAGE_SIZE - sizeof(struct mmu_table_batch)) / sizeof(void *))
				59
				60	extern void tlb_table_flush(struct mmu_gather *tlb);
				61	extern void tlb_remove_table(struct mmu_gather tlb, void table);
				62
				63	#endif
				64
/*
 * Size of the small on-stack page-pointer array that is used when no page
 * can be allocated for a full-sized batch.
 */
#define MMU_GATHER_BUNDLE	8
				70
/*
 * struct mmu_gather_batch - one link in a chain of gathered page pointers.
 * @next:  following batch in the chain.
 * @nr:    presumably the number of entries used in @pages.
 * @max:   presumably the capacity of @pages for this batch.
 * @pages: trailing storage for the gathered pages.
 *
 * NOTE(review): struct mmu_gather embeds one of these ("local") directly
 * in front of its __pages[] array, so @pages is kept as a zero-length
 * array here rather than a flexible array member.
 */
struct mmu_gather_batch {
	struct mmu_gather_batch	*next;
	unsigned int		nr, max;
	struct page		*pages[0];
};
				77
				78	#define MAX_GATHER_BATCH \
				79	((PAGE_SIZE - sizeof(struct mmu_gather_batch)) / sizeof(void *))
				80
/*
 * Cap on the number of mmu_gather batches. Zapping a lot of memory during
 * unmap on a huge machine could otherwise trigger soft lockups on
 * non-preemptible kernels; freeing about 10K pages in one go is considered
 * safe even without a preemption point.
 */
#define MAX_GATHER_BATCH_COUNT	(10000UL/MAX_GATHER_BATCH)
				88
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	89	/* struct mmu_gather is an opaque type used by the mm code for passing around
Hugh Dickins	15a23ff	2005-10-29 18:16:01 -0700	[diff] [blame]	90	* any data needed by arch specific code for tlb_remove_page.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	91	*/
				92	struct mmu_gather {
				93	struct mm_struct *mm;
Peter Zijlstra	2672391	2011-05-24 17:12:00 -0700	[diff] [blame]	94	#ifdef CONFIG_HAVE_RCU_TABLE_FREE
				95	struct mmu_table_batch *batch;
				96	#endif
Alex Shi	597e1c3	2012-06-28 09:02:21 +0800	[diff] [blame]	97	unsigned long start;
				98	unsigned long end;
Dave Hansen	1de14c3	2013-04-12 16:23:54 -0700	[diff] [blame]	99	/* we are in the middle of an operation to clear
				100	* a full mm and can make some optimizations */
Will Deacon	fb7332a	2014-10-29 10:03:09 +0000	[diff] [blame]	101	unsigned int fullmm : 1,
Dave Hansen	1de14c3	2013-04-12 16:23:54 -0700	[diff] [blame]	102	/* we have performed an operation which
				103	* requires a complete flush of the tlb */
				104	need_flush_all : 1;
Peter Zijlstra	e303297	2011-05-24 17:12:01 -0700	[diff] [blame]	105
				106	struct mmu_gather_batch *active;
				107	struct mmu_gather_batch local;
				108	struct page *__pages[MMU_GATHER_BUNDLE];
Michal Hocko	53a59fc	2013-01-04 15:35:12 -0800	[diff] [blame]	109	unsigned int batch_count;
Aneesh Kumar K.V	e9d55e1	2016-07-26 15:24:09 -0700	[diff] [blame]	110	/*
				111	* __tlb_adjust_range will track the new addr here,
				112	* that that we can adjust the range after the flush
				113	*/
				114	unsigned long addr;
Aneesh Kumar K.V	e77b085	2016-07-26 15:24:12 -0700	[diff] [blame]	115	int page_size;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	116	};
				117
#define HAVE_GENERIC_MMU_GATHER

/*
 * Generic mmu_gather API; these functions are defined outside this header.
 *
 * __tlb_remove_page_size() returns true when the caller has to flush
 * (tlb_flush_mmu()) and retry, as tlb_remove_page_size() does.
 */
void tlb_gather_mmu(struct mmu_gather *tlb, struct mm_struct *mm,
		    unsigned long start, unsigned long end);
void tlb_flush_mmu(struct mmu_gather *tlb);
void tlb_finish_mmu(struct mmu_gather *tlb, unsigned long start,
		    unsigned long end);
extern bool __tlb_remove_page_size(struct mmu_gather *tlb, struct page *page,
				   int page_size);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	126
Will Deacon	fb7332a	2014-10-29 10:03:09 +0000	[diff] [blame]	127	static inline void __tlb_adjust_range(struct mmu_gather *tlb,
Aneesh Kumar K.V	b5bc66b	2016-12-12 16:42:34 -0800	[diff] [blame]	128	unsigned long address,
				129	unsigned int range_size)
Will Deacon	fb7332a	2014-10-29 10:03:09 +0000	[diff] [blame]	130	{
				131	tlb->start = min(tlb->start, address);
Aneesh Kumar K.V	b5bc66b	2016-12-12 16:42:34 -0800	[diff] [blame]	132	tlb->end = max(tlb->end, address + range_size);
Aneesh Kumar K.V	e9d55e1	2016-07-26 15:24:09 -0700	[diff] [blame]	133	/*
				134	* Track the last address with which we adjusted the range. This
				135	* will be used later to adjust again after a mmu_flush due to
				136	* failed __tlb_remove_page
				137	*/
				138	tlb->addr = address;
Will Deacon	fb7332a	2014-10-29 10:03:09 +0000	[diff] [blame]	139	}
				140
				141	static inline void __tlb_reset_range(struct mmu_gather *tlb)
				142	{
Will Deacon	721c21c	2015-01-12 19:10:55 +0000	[diff] [blame]	143	if (tlb->fullmm) {
				144	tlb->start = tlb->end = ~0;
				145	} else {
				146	tlb->start = TASK_SIZE;
				147	tlb->end = 0;
				148	}
Will Deacon	fb7332a	2014-10-29 10:03:09 +0000	[diff] [blame]	149	}
				150
Aneesh Kumar K.V	e77b085	2016-07-26 15:24:12 -0700	[diff] [blame]	151	static inline void tlb_remove_page_size(struct mmu_gather *tlb,
				152	struct page *page, int page_size)
				153	{
				154	if (__tlb_remove_page_size(tlb, page, page_size)) {
				155	tlb_flush_mmu(tlb);
				156	tlb->page_size = page_size;
Aneesh Kumar K.V	b5bc66b	2016-12-12 16:42:34 -0800	[diff] [blame]	157	__tlb_adjust_range(tlb, tlb->addr, page_size);
Aneesh Kumar K.V	e77b085	2016-07-26 15:24:12 -0700	[diff] [blame]	158	__tlb_remove_page_size(tlb, page, page_size);
				159	}
				160	}
				161
				162	static bool __tlb_remove_page(struct mmu_gather tlb, struct page page)
				163	{
				164	return __tlb_remove_page_size(tlb, page, PAGE_SIZE);
				165	}
				166
Aneesh Kumar K.V	e9d55e1	2016-07-26 15:24:09 -0700	[diff] [blame]	167	/* tlb_remove_page
				168	* Similar to __tlb_remove_page but will call tlb_flush_mmu() itself when
				169	* required.
				170	*/
				171	static inline void tlb_remove_page(struct mmu_gather tlb, struct page page)
				172	{
Aneesh Kumar K.V	e77b085	2016-07-26 15:24:12 -0700	[diff] [blame]	173	return tlb_remove_page_size(tlb, page, PAGE_SIZE);
Aneesh Kumar K.V	e9d55e1	2016-07-26 15:24:09 -0700	[diff] [blame]	174	}
				175
				176	static inline bool __tlb_remove_pte_page(struct mmu_gather tlb, struct page page)
				177	{
				178	/* active->nr should be zero when we call this */
				179	VM_BUG_ON_PAGE(tlb->active->nr, page);
Aneesh Kumar K.V	e77b085	2016-07-26 15:24:12 -0700	[diff] [blame]	180	tlb->page_size = PAGE_SIZE;
Aneesh Kumar K.V	b5bc66b	2016-12-12 16:42:34 -0800	[diff] [blame]	181	__tlb_adjust_range(tlb, tlb->addr, PAGE_SIZE);
Aneesh Kumar K.V	e9d55e1	2016-07-26 15:24:09 -0700	[diff] [blame]	182	return __tlb_remove_page(tlb, page);
				183	}
				184
#ifndef tlb_remove_check_page_size_change
#define tlb_remove_check_page_size_change tlb_remove_check_page_size_change
/*
 * Default handler for a page size change: the change itself is ignored.
 * With CONFIG_DEBUG_VM the gather's page_size is still updated so that the
 * debug checks do not raise a false warning.
 */
static inline void tlb_remove_check_page_size_change(struct mmu_gather *tlb,
						     unsigned int page_size)
{
#ifdef CONFIG_DEBUG_VM
	tlb->page_size = page_size;
#endif
}
#endif
				200
Will Deacon	fb7332a	2014-10-29 10:03:09 +0000	[diff] [blame]	201	/*
				202	* In the case of tlb vma handling, we can optimise these away in the
				203	* case where we're doing a full MM flush. When we're doing a munmap,
				204	* the vmas are adjusted to only cover the region to be torn down.
				205	*/
				206	#ifndef tlb_start_vma
				207	#define tlb_start_vma(tlb, vma) do { } while (0)
				208	#endif
				209
				210	#define __tlb_end_vma(tlb, vma) \
				211	do { \
				212	if (!tlb->fullmm && tlb->end) { \
				213	tlb_flush(tlb); \
				214	__tlb_reset_range(tlb); \
				215	} \
				216	} while (0)
				217
				218	#ifndef tlb_end_vma
				219	#define tlb_end_vma __tlb_end_vma
				220	#endif
				221
				222	#ifndef __tlb_remove_tlb_entry
				223	#define __tlb_remove_tlb_entry(tlb, ptep, address) do { } while (0)
				224	#endif
				225
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	226	/**
				227	* tlb_remove_tlb_entry - remember a pte unmapping for later tlb invalidation.
				228	*
Will Deacon	fb7332a	2014-10-29 10:03:09 +0000	[diff] [blame]	229	* Record the fact that pte's were really unmapped by updating the range,
				230	* so we can later optimise away the tlb invalidate. This helps when
				231	* userspace is unmapping already-unmapped pages, which happens quite a lot.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	232	*/
				233	#define tlb_remove_tlb_entry(tlb, ptep, address) \
				234	do { \
Aneesh Kumar K.V	b5bc66b	2016-12-12 16:42:34 -0800	[diff] [blame]	235	__tlb_adjust_range(tlb, address, PAGE_SIZE); \
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	236	__tlb_remove_tlb_entry(tlb, ptep, address); \
				237	} while (0)
				238
/*
 * Same as tlb_remove_tlb_entry(), but the range grows by the huge page
 * size of hstate @h instead of PAGE_SIZE.
 */
#define tlb_remove_huge_tlb_entry(h, tlb, ptep, address)		\
	do {								\
		__tlb_adjust_range(tlb, address, huge_page_size(h));	\
		__tlb_remove_tlb_entry(tlb, ptep, address);		\
	} while (0)
				244
/**
 * tlb_remove_pmd_tlb_entry - remember a pmd mapping for later tlb invalidation
 *
 * The per-entry hook is a nop so far, because only x86 needs it.
 */
#ifndef __tlb_remove_pmd_tlb_entry
#define __tlb_remove_pmd_tlb_entry(tlb, pmdp, address)	do {} while (0)
#endif

/* Grow the range by HPAGE_PMD_SIZE, then run the per-entry hook. */
#define tlb_remove_pmd_tlb_entry(tlb, pmdp, address)			\
	do {								\
		__tlb_adjust_range(tlb, address, HPAGE_PMD_SIZE);	\
		__tlb_remove_pmd_tlb_entry(tlb, pmdp, address);		\
	} while (0)
				258
Aneesh Kumar K.V	b5bc66b	2016-12-12 16:42:34 -0800	[diff] [blame]	259	/*
				260	* For things like page tables caches (ie caching addresses "inside" the
				261	* page tables, like x86 does), for legacy reasons, flushing an
				262	* individual page had better flush the page table caches behind it. This
				263	* is definitely how x86 works, for example. And if you have an
				264	* architected non-legacy page table cache (which I'm not aware of
				265	* anybody actually doing), you're going to have some architecturally
				266	* explicit flushing for that, likely separate from a regular TLB entry
				267	* flush, and thus you'd need more than just some range expansion..
				268	*
				269	* So if we ever find an architecture
				270	* that would want something that odd, I think it is up to that
				271	* architecture to do its own odd thing, not cause pain for others
				272	* http://lkml.kernel.org/r/CA+55aFzBggoXtNXQeng5d_mRoDnaMBE5Y+URs+PHR67nUpMtaw@mail.gmail.com
				273	*
				274	* For now w.r.t page table cache, mark the range_size as PAGE_SIZE
				275	*/
				276
/* Free a pte table: extend the range by PAGE_SIZE, then call __pte_free_tlb(). */
#define pte_free_tlb(tlb, ptep, address)			\
	do {							\
		__tlb_adjust_range(tlb, address, PAGE_SIZE);	\
		__pte_free_tlb(tlb, ptep, address);		\
	} while (0)
				282
				283	#ifndef __ARCH_HAS_4LEVEL_HACK
Benjamin Herrenschmidt	9e1b32c	2009-07-22 15:44:28 +1000	[diff] [blame]	284	#define pud_free_tlb(tlb, pudp, address) \
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	285	do { \
Aneesh Kumar K.V	b5bc66b	2016-12-12 16:42:34 -0800	[diff] [blame]	286	__tlb_adjust_range(tlb, address, PAGE_SIZE); \
Benjamin Herrenschmidt	9e1b32c	2009-07-22 15:44:28 +1000	[diff] [blame]	287	__pud_free_tlb(tlb, pudp, address); \
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	288	} while (0)
				289	#endif
				290
/* Free a pmd table: extend the range by PAGE_SIZE, then call __pmd_free_tlb(). */
#define pmd_free_tlb(tlb, pmdp, address)			\
	do {							\
		__tlb_adjust_range(tlb, address, PAGE_SIZE);	\
		__pmd_free_tlb(tlb, pmdp, address);		\
	} while (0)
				296
				297	#define tlb_migrate_finish(mm) do {} while (0)
				298
				299	#endif /* _ASM_GENERIC__TLB_H */