Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | #ifndef _LINUX_RMAP_H |
| 2 | #define _LINUX_RMAP_H |
| 3 | /* |
| 4 | * Declarations for Reverse Mapping functions in mm/rmap.c |
| 5 | */ |
| 6 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 7 | #include <linux/list.h> |
| 8 | #include <linux/slab.h> |
| 9 | #include <linux/mm.h> |
Ingo Molnar | 5a50508 | 2012-12-02 19:56:46 +0000 | [diff] [blame] | 10 | #include <linux/rwsem.h> |
Balbir Singh | bed7161 | 2008-02-07 00:14:01 -0800 | [diff] [blame] | 11 | #include <linux/memcontrol.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 12 | |
| 13 | /* |
| 14 | * The anon_vma heads a list of private "related" vmas, to scan if |
| 15 | * an anonymous page pointing to this anon_vma needs to be unmapped: |
| 16 | * the vmas on the list will be related by forking, or by splitting. |
| 17 | * |
| 18 | * Since vmas come and go as they are split and merged (particularly |
| 19 | * in mprotect), the mapping field of an anonymous page cannot point |
| 20 | * directly to a vma: instead it points to an anon_vma, on whose list |
| 21 | * the related vmas can be easily linked or unlinked. |
| 22 | * |
| 23 | * After unlinking the last vma on the list, we must garbage collect |
| 24 | * the anon_vma object itself: we're guaranteed no page can be |
| 25 | * pointing to this anon_vma once its vma list is empty. |
| 26 | */ |
| 27 | struct anon_vma { |
Ingo Molnar | 5a50508 | 2012-12-02 19:56:46 +0000 | [diff] [blame] | 28 | struct anon_vma *root; /* Root of this anon_vma tree */ |
| 29 | struct rw_semaphore rwsem; /* W: modification, R: walking the list */ |
Mel Gorman | 7f60c21 | 2010-05-24 14:32:18 -0700 | [diff] [blame] | 30 | /* |
Peter Zijlstra | 8381326 | 2011-03-22 16:32:48 -0700 | [diff] [blame] | 31 | * The refcount is taken on an anon_vma when there is no |
Mel Gorman | 7f60c21 | 2010-05-24 14:32:18 -0700 | [diff] [blame] | 32 | * guarantee that the vma of page tables will exist for |
| 33 | * the duration of the operation. A caller that takes |
| 34 | * the reference is responsible for clearing up the |
| 35 | * anon_vma if they are the last user on release |
| 36 | */ |
Peter Zijlstra | 8381326 | 2011-03-22 16:32:48 -0700 | [diff] [blame] | 37 | atomic_t refcount; |
| 38 | |
Andrea Arcangeli | 7906d00 | 2008-07-28 15:46:26 -0700 | [diff] [blame] | 39 | /* |
Michel Lespinasse | bf181b9 | 2012-10-08 16:31:39 -0700 | [diff] [blame] | 40 | * NOTE: the LSB of the rb_root.rb_node is set by |
Andrea Arcangeli | 7906d00 | 2008-07-28 15:46:26 -0700 | [diff] [blame] | 41 | * mm_take_all_locks() _after_ taking the above lock. So the |
Michel Lespinasse | bf181b9 | 2012-10-08 16:31:39 -0700 | [diff] [blame] | 42 | * rb_root must only be read/written after taking the above lock |
Andrea Arcangeli | 7906d00 | 2008-07-28 15:46:26 -0700 | [diff] [blame] | 43 | * to be sure to see a valid next pointer. The LSB bit itself |
| 44 | * is serialized by a system wide lock only visible to |
| 45 | * mm_take_all_locks() (mm_all_locks_mutex). |
| 46 | */ |
Michel Lespinasse | bf181b9 | 2012-10-08 16:31:39 -0700 | [diff] [blame] | 47 | struct rb_root rb_root; /* Interval tree of private "related" vmas */ |
Rik van Riel | 5beb493 | 2010-03-05 13:42:07 -0800 | [diff] [blame] | 48 | }; |
| 49 | |
| 50 | /* |
| 51 | * The copy-on-write semantics of fork mean that an anon_vma |
| 52 | * can become associated with multiple processes. Furthermore, |
| 53 | * each child process will have its own anon_vma, where new |
| 54 | * pages for that process are instantiated. |
| 55 | * |
| 56 | * This structure allows us to find the anon_vmas associated |
| 57 | * with a VMA, or the VMAs associated with an anon_vma. |
| 58 | * The "same_vma" list contains the anon_vma_chains linking |
| 59 | * all the anon_vmas associated with this VMA. |
Michel Lespinasse | bf181b9 | 2012-10-08 16:31:39 -0700 | [diff] [blame] | 60 | * The "rb" field indexes on an interval tree the anon_vma_chains |
Rik van Riel | 5beb493 | 2010-03-05 13:42:07 -0800 | [diff] [blame] | 61 | * which link all the VMAs associated with this anon_vma. |
| 62 | */ |
| 63 | struct anon_vma_chain { |
| 64 | struct vm_area_struct *vma; |
| 65 | struct anon_vma *anon_vma; |
| 66 | struct list_head same_vma; /* locked by mmap_sem & page_table_lock */ |
Ingo Molnar | 5a50508 | 2012-12-02 19:56:46 +0000 | [diff] [blame] | 67 | struct rb_node rb; /* locked by anon_vma->rwsem */ |
Michel Lespinasse | bf181b9 | 2012-10-08 16:31:39 -0700 | [diff] [blame] | 68 | unsigned long rb_subtree_last; |
Michel Lespinasse | ed8ea81 | 2012-10-08 16:31:45 -0700 | [diff] [blame] | 69 | #ifdef CONFIG_DEBUG_VM_RB |
| 70 | unsigned long cached_vma_start, cached_vma_last; |
| 71 | #endif |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 72 | }; |
| 73 | |
/*
 * Flags handed to try_to_unmap(): one of the modes below, optionally
 * combined with the modifier bits that start at bit 8.
 */
enum ttu_flags {
	/* modes */
	TTU_UNMAP		= 1 << 0,	/* unmap mode */
	TTU_MIGRATION		= 1 << 1,	/* migration mode */
	TTU_MUNLOCK		= 1 << 2,	/* munlock mode */

	/* modifiers */
	TTU_IGNORE_MLOCK	= 1 << 8,	/* ignore mlock */
	TTU_IGNORE_ACCESS	= 1 << 9,	/* don't age */
	TTU_IGNORE_HWPOISON	= 1 << 10,	/* corrupted page is recoverable */
};
| 83 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 84 | #ifdef CONFIG_MMU |
Rik van Riel | 7654506 | 2010-08-09 17:18:41 -0700 | [diff] [blame] | 85 | static inline void get_anon_vma(struct anon_vma *anon_vma) |
| 86 | { |
Peter Zijlstra | 8381326 | 2011-03-22 16:32:48 -0700 | [diff] [blame] | 87 | atomic_inc(&anon_vma->refcount); |
Rik van Riel | 7654506 | 2010-08-09 17:18:41 -0700 | [diff] [blame] | 88 | } |
| 89 | |
Peter Zijlstra | 01d8b20 | 2011-03-22 16:32:49 -0700 | [diff] [blame] | 90 | void __put_anon_vma(struct anon_vma *anon_vma); |
| 91 | |
| 92 | static inline void put_anon_vma(struct anon_vma *anon_vma) |
| 93 | { |
| 94 | if (atomic_dec_and_test(&anon_vma->refcount)) |
| 95 | __put_anon_vma(anon_vma); |
| 96 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 97 | |
Hugh Dickins | 3ca7b3c | 2009-12-14 17:58:57 -0800 | [diff] [blame] | 98 | static inline struct anon_vma *page_anon_vma(struct page *page) |
| 99 | { |
| 100 | if (((unsigned long)page->mapping & PAGE_MAPPING_FLAGS) != |
| 101 | PAGE_MAPPING_ANON) |
| 102 | return NULL; |
| 103 | return page_rmapping(page); |
| 104 | } |
| 105 | |
Rik van Riel | bb4a340 | 2010-08-09 17:18:37 -0700 | [diff] [blame] | 106 | static inline void vma_lock_anon_vma(struct vm_area_struct *vma) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 107 | { |
| 108 | struct anon_vma *anon_vma = vma->anon_vma; |
| 109 | if (anon_vma) |
Ingo Molnar | 5a50508 | 2012-12-02 19:56:46 +0000 | [diff] [blame] | 110 | down_write(&anon_vma->root->rwsem); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 111 | } |
| 112 | |
Rik van Riel | bb4a340 | 2010-08-09 17:18:37 -0700 | [diff] [blame] | 113 | static inline void vma_unlock_anon_vma(struct vm_area_struct *vma) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 114 | { |
| 115 | struct anon_vma *anon_vma = vma->anon_vma; |
| 116 | if (anon_vma) |
Ingo Molnar | 5a50508 | 2012-12-02 19:56:46 +0000 | [diff] [blame] | 117 | up_write(&anon_vma->root->rwsem); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 118 | } |
| 119 | |
Ingo Molnar | 4fc3f1d | 2012-12-02 19:56:50 +0000 | [diff] [blame] | 120 | static inline void anon_vma_lock_write(struct anon_vma *anon_vma) |
Rik van Riel | cba48b9 | 2010-08-09 17:18:38 -0700 | [diff] [blame] | 121 | { |
Ingo Molnar | 5a50508 | 2012-12-02 19:56:46 +0000 | [diff] [blame] | 122 | down_write(&anon_vma->root->rwsem); |
Rik van Riel | cba48b9 | 2010-08-09 17:18:38 -0700 | [diff] [blame] | 123 | } |
| 124 | |
Konstantin Khlebnikov | 08b5270 | 2013-02-22 16:34:40 -0800 | [diff] [blame] | 125 | static inline void anon_vma_unlock_write(struct anon_vma *anon_vma) |
Rik van Riel | cba48b9 | 2010-08-09 17:18:38 -0700 | [diff] [blame] | 126 | { |
Ingo Molnar | 5a50508 | 2012-12-02 19:56:46 +0000 | [diff] [blame] | 127 | up_write(&anon_vma->root->rwsem); |
Rik van Riel | cba48b9 | 2010-08-09 17:18:38 -0700 | [diff] [blame] | 128 | } |
| 129 | |
Ingo Molnar | 4fc3f1d | 2012-12-02 19:56:50 +0000 | [diff] [blame] | 130 | static inline void anon_vma_lock_read(struct anon_vma *anon_vma) |
| 131 | { |
| 132 | down_read(&anon_vma->root->rwsem); |
| 133 | } |
| 134 | |
| 135 | static inline void anon_vma_unlock_read(struct anon_vma *anon_vma) |
| 136 | { |
| 137 | up_read(&anon_vma->root->rwsem); |
| 138 | } |
| 139 | |
| 140 | |
/*
 * anon_vma helper functions.
 */

/* create anon_vma_cachep */
void anon_vma_init(void);

int anon_vma_prepare(struct vm_area_struct *vma);
void unlink_anon_vmas(struct vm_area_struct *vma);
int anon_vma_clone(struct vm_area_struct *dst, struct vm_area_struct *src);
int anon_vma_fork(struct vm_area_struct *vma, struct vm_area_struct *pvma);
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 149 | |
Rik van Riel | 5beb493 | 2010-03-05 13:42:07 -0800 | [diff] [blame] | 150 | static inline void anon_vma_merge(struct vm_area_struct *vma, |
| 151 | struct vm_area_struct *next) |
| 152 | { |
| 153 | VM_BUG_ON(vma->anon_vma != next->anon_vma); |
| 154 | unlink_anon_vmas(next); |
| 155 | } |
| 156 | |
/* Implemented out of line; see mm/rmap.c. */
struct anon_vma *page_get_anon_vma(struct page *page);
| 158 | |
/*
 * rmap interfaces called when adding or removing pte of page
 */
void page_move_anon_rmap(struct page *page, struct vm_area_struct *vma,
			 unsigned long address);
void page_add_anon_rmap(struct page *page, struct vm_area_struct *vma,
			unsigned long address);
void do_page_add_anon_rmap(struct page *page, struct vm_area_struct *vma,
			   unsigned long address, int exclusive);
void page_add_new_anon_rmap(struct page *page, struct vm_area_struct *vma,
			    unsigned long address);
void page_add_file_rmap(struct page *page);
void page_remove_rmap(struct page *page);
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 169 | |
/* Huge page counterparts of the anon rmap interfaces. */
void hugepage_add_anon_rmap(struct page *page, struct vm_area_struct *vma,
			    unsigned long address);
void hugepage_add_new_anon_rmap(struct page *page, struct vm_area_struct *vma,
				unsigned long address);
| 174 | |
Hugh Dickins | 21333b2 | 2009-09-21 17:01:59 -0700 | [diff] [blame] | 175 | static inline void page_dup_rmap(struct page *page) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 176 | { |
| 177 | atomic_inc(&page->_mapcount); |
| 178 | } |
| 179 | |
/*
 * Called from mm/vmscan.c to handle paging out
 */
int page_referenced(struct page *page, int is_locked,
		    struct mem_cgroup *memcg, unsigned long *vm_flags);
Hugh Dickins | 5ad6468 | 2009-12-14 17:59:24 -0800 | [diff] [blame] | 185 | |
/*
 * Mask covering the low byte of a ttu_flags value.  The modes
 * (TTU_UNMAP, TTU_MIGRATION, TTU_MUNLOCK) have the values 1, 2 and 4
 * and so fall inside it, while the TTU_IGNORE_* modifiers start at
 * bit 8 and are stripped.
 *
 * TTU_ACTION() expands to this name, which had no definition, so any
 * use of the macro failed to compile.
 */
#define TTU_ACTION_MASK	0xff

/* Extract the mode bits from a ttu_flags value, dropping the modifiers. */
#define TTU_ACTION(x)	((x) & TTU_ACTION_MASK)
| 187 | |
/* Returns one of the SWAP_* codes. */
int try_to_unmap(struct page *page, enum ttu_flags flags);
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 189 | |
| 190 | /* |
Carsten Otte | ceffc07 | 2005-06-23 22:05:25 -0700 | [diff] [blame] | 191 | * Called from mm/filemap_xip.c to unmap empty zero page |
| 192 | */ |
Namhyung Kim | e9a81a8 | 2010-10-26 14:22:01 -0700 | [diff] [blame] | 193 | pte_t *__page_check_address(struct page *, struct mm_struct *, |
Nick Piggin | 479db0b | 2008-08-20 14:09:18 -0700 | [diff] [blame] | 194 | unsigned long, spinlock_t **, int); |
Carsten Otte | ceffc07 | 2005-06-23 22:05:25 -0700 | [diff] [blame] | 195 | |
Namhyung Kim | e9a81a8 | 2010-10-26 14:22:01 -0700 | [diff] [blame] | 196 | static inline pte_t *page_check_address(struct page *page, struct mm_struct *mm, |
| 197 | unsigned long address, |
| 198 | spinlock_t **ptlp, int sync) |
| 199 | { |
| 200 | pte_t *ptep; |
| 201 | |
| 202 | __cond_lock(*ptlp, ptep = __page_check_address(page, mm, address, |
| 203 | ptlp, sync)); |
| 204 | return ptep; |
| 205 | } |
| 206 | |
/*
 * Used by swapoff to help locate where page is expected in vma.
 */
unsigned long page_address_in_vma(struct page *page,
				  struct vm_area_struct *vma);
| 211 | |
/*
 * Cleans the PTEs of shared mappings.
 * (and since clean PTEs should also be readonly, write protects them too)
 *
 * Returns the number of cleaned PTEs.
 */
int page_mkclean(struct page *page);
| 219 | |
/*
 * Called in the munlock()/munmap() path to check for other vmas
 * holding the page mlocked.
 */
int try_to_munlock(struct page *page);
Nick Piggin | b291f00 | 2008-10-18 20:26:44 -0700 | [diff] [blame] | 225 | |
/*
 * Called by memory-failure.c to kill processes.
 */
struct anon_vma *page_lock_anon_vma_read(struct page *page);
void page_unlock_anon_vma_read(struct anon_vma *anon_vma);
int page_mapped_in_vma(struct page *page, struct vm_area_struct *vma);
Andi Kleen | 10be22d | 2009-09-16 11:50:04 +0200 | [diff] [blame] | 232 | |
/*
 * rmap_walk_control: To control rmap traversing for specific needs
 */
struct rmap_walk_control {
	/* passed to rmap_one() and invalid_vma() */
	void *arg;

	/* executed on each vma where page is mapped */
	int (*rmap_one)(struct page *page, struct vm_area_struct *vma,
			unsigned long addr, void *arg);

	/* for checking traversing termination condition */
	int (*done)(struct page *page);

	/*
	 * for handling file nonlinear mapping
	 * NOTE(review): also takes an arg pointer; presumably the same
	 * ->arg as above -- confirm against the walker.
	 */
	int (*file_nonlinear)(struct page *, struct address_space *,
			      void *arg);

	/* for getting anon_lock by optimized way rather than default */
	struct anon_vma *(*anon_lock)(struct page *page);

	/* for skipping uninterested vma */
	bool (*invalid_vma)(struct vm_area_struct *vma, void *arg);
};
| 252 | |
/* Walk the reverse mappings of @page as directed by @rwc. */
int rmap_walk(struct page *page, struct rmap_walk_control *rwc);
Hugh Dickins | e9995ef | 2009-12-14 17:59:31 -0800 | [diff] [blame] | 254 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 255 | #else /* !CONFIG_MMU */ |
| 256 | |
/* Without an MMU the anon_vma helpers collapse to no-ops. */
#define anon_vma_init()		do {} while (0)
#define anon_vma_prepare(vma)	(0)
#define anon_vma_link(vma)	do {} while (0)
| 260 | |
/*
 * !CONFIG_MMU stub: clears *vm_flags and always returns 0.
 */
static inline int page_referenced(struct page *page, int is_locked,
				  struct mem_cgroup *memcg,
				  unsigned long *vm_flags)
{
	const int nr_referenced = 0;

	*vm_flags = 0;
	return nr_referenced;
}
| 268 | |
/* !CONFIG_MMU stub: always evaluates to SWAP_FAIL. */
#define try_to_unmap(page, flags)	SWAP_FAIL
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 270 | |
/* !CONFIG_MMU stub: always returns 0. */
static inline int page_mkclean(struct page *page)
{
	const int nr_cleaned = 0;

	return nr_cleaned;
}
| 275 | |
| 276 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 277 | #endif /* CONFIG_MMU */ |
| 278 | |
/*
 * Return values of try_to_unmap
 */
#define SWAP_SUCCESS		0
#define SWAP_AGAIN		1
#define SWAP_FAIL		2
#define SWAP_MLOCK		3
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 286 | |
| 287 | #endif /* _LINUX_RMAP_H */ |