blob: d5ceb2839a2ded8ccf49524d76a5eedd666b1cd1 [file] [log] [blame]
Greg Kroah-Hartmanb2441312017-11-01 15:07:57 +01001/* SPDX-License-Identifier: GPL-2.0 */
Dave Chinnera38e4082013-08-28 10:17:58 +10002/*
3 * Copyright (c) 2013 Red Hat, Inc. and Parallels Inc. All rights reserved.
4 * Authors: David Chinner and Glauber Costa
5 *
6 * Generic LRU infrastructure
7 */
8#ifndef _LRU_LIST_H
9#define _LRU_LIST_H
10
11#include <linux/list.h>
Dave Chinner3b1d58a2013-08-28 10:18:00 +100012#include <linux/nodemask.h>
Vladimir Davydov503c3582015-02-12 14:58:47 -080013#include <linux/shrinker.h>
Dave Chinnera38e4082013-08-28 10:17:58 +100014
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080015struct mem_cgroup;
16
/*
 * Verdict returned by a list_lru_walk_cb callback for the item it was
 * handed. The callback must always return one of these values.
 */
enum lru_status {
	LRU_REMOVED,		/* item removed from list */
	LRU_REMOVED_RETRY,	/* item removed, but lock has been
				   dropped and reacquired */
	LRU_ROTATE,		/* item referenced, give another pass */
	LRU_SKIP,		/* item cannot be locked, skip */
	LRU_RETRY,		/* item not freeable. May drop the lock
				   internally, but has to return locked. */
};
27
/* A single LRU list together with its item counter. */
struct list_lru_one {
	/* head of the list of items */
	struct list_head	list;
	/* may become negative during memcg reparenting */
	long			nr_items;
};
33
34struct list_lru_memcg {
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -070035 struct rcu_head rcu;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080036 /* array of per cgroup lists, indexed by memcg_cache_id */
37 struct list_lru_one *lru[0];
38};
39
/*
 * Per-node part of a list_lru: one lock, the global list and, for cgroup
 * aware lrus, a pointer to the per cgroup lists.
 */
struct list_lru_node {
	/* protects all lists on the node, including per cgroup */
	spinlock_t		lock;
	/* global list, used for the root cgroup in cgroup aware lrus */
	struct list_lru_one	lru;
#ifdef CONFIG_MEMCG_KMEM
	/* for cgroup aware lrus points to per cgroup lists, otherwise NULL */
	struct list_lru_memcg	__rcu *memcg_lrus;
#endif
	/*
	 * NOTE(review): presumably the total number of items on this node
	 * across the global and per cgroup lists - confirm in list_lru.c
	 */
	long nr_items;
} ____cacheline_aligned_in_smp;
51
/* Top-level LRU handle passed to every list_lru_*() function. */
struct list_lru {
	/*
	 * NOTE(review): presumably an array with one entry per NUMA node,
	 * indexed by the nid arguments of the API - confirm in list_lru.c
	 */
	struct list_lru_node	*node;
#ifdef CONFIG_MEMCG_KMEM
	/* NOTE(review): presumably links this lru into a global list - confirm */
	struct list_head	list;
	/* NOTE(review): presumably the id of the shrinker given at init - confirm */
	int			shrinker_id;
	/* NOTE(review): presumably mirrors the memcg_aware init argument - confirm */
	bool			memcg_aware;
#endif
};
60
/*
 * list_lru_destroy() is the teardown counterpart of __list_lru_init().
 *
 * __list_lru_init() is the common initialiser behind the list_lru_init*()
 * wrapper macros; @key and @shrinker may be NULL (the wrappers pass NULL
 * for whichever they do not need).
 * NOTE(review): the int return is presumably 0 or a negative errno - confirm.
 */
void list_lru_destroy(struct list_lru *lru);
int __list_lru_init(struct list_lru *lru, bool memcg_aware,
		    struct lock_class_key *key, struct shrinker *shrinker);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080064
/*
 * Convenience wrappers around __list_lru_init():
 *   list_lru_init()       - not memcg aware, no lock class key, no shrinker
 *   list_lru_init_key()   - not memcg aware, caller-supplied lock class key
 *   list_lru_init_memcg() - memcg aware, caller-supplied shrinker
 *
 * Every macro argument is parenthesized in the expansion.
 */
#define list_lru_init(lru)				\
	__list_lru_init((lru), false, NULL, NULL)
#define list_lru_init_key(lru, key)			\
	__list_lru_init((lru), false, (key), NULL)
#define list_lru_init_memcg(lru, shrinker)		\
	__list_lru_init((lru), true, NULL, (shrinker))
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080071
/*
 * Hooks for the memory cgroup code.
 * NOTE(review): presumably memcg_update_all_list_lrus() resizes the per
 * cgroup arrays to @num_memcgs entries and memcg_drain_all_list_lrus() moves
 * the items of cgroup index @src_idx over to @dst_memcg - confirm against
 * the implementation.
 */
int memcg_update_all_list_lrus(int num_memcgs);
void memcg_drain_all_list_lrus(int src_idx, struct mem_cgroup *dst_memcg);
Dave Chinnera38e4082013-08-28 10:17:58 +100074
/**
 * list_lru_add: add an element to the lru list's tail
 * @lru: the lru pointer
 * @item: the item to be added.
 *
 * If the element is already part of a list, this function returns doing
 * nothing. Therefore the caller does not need to keep state about whether or
 * not the element already belongs in the list and is allowed to lazy update
 * it. Note however that this is valid for *a* list, not *this* list. If
 * the caller organizes itself in a way that elements can be in more than
 * one type of list, it is up to the caller to fully remove the item from
 * the previous list (with list_lru_del() for instance) before moving it
 * to @lru.
 *
 * Return value: true if the list was updated, false otherwise
 */
bool list_lru_add(struct list_lru *lru, struct list_head *item);
92
/**
 * list_lru_del: delete an element from the lru list
 * @lru: the lru pointer
 * @item: the item to be deleted.
 *
 * This function works analogously to list_lru_add() in terms of list
 * manipulation. The comments about an element already belonging to
 * a list are also valid for list_lru_del().
 *
 * Return value: true if the list was updated, false otherwise
 */
bool list_lru_del(struct list_lru *lru, struct list_head *item);
105
/**
 * list_lru_count_one: return the number of objects currently held by @lru
 * @lru: the lru pointer.
 * @nid: the node id to count from.
 * @memcg: the cgroup to count from.
 *
 * Always returns a non-negative number, 0 for empty lists. There is no
 * guarantee that the list is not updated while the count is being computed.
 * Callers that want such a guarantee need to provide an outer lock.
 *
 * list_lru_count_node() is the variant without a @memcg argument.
 * NOTE(review): presumably it counts every list on node @nid - confirm.
 */
unsigned long list_lru_count_one(struct list_lru *lru,
				 int nid, struct mem_cgroup *memcg);
unsigned long list_lru_count_node(struct list_lru *lru, int nid);
Vladimir Davydov503c3582015-02-12 14:58:47 -0800119
120static inline unsigned long list_lru_shrink_count(struct list_lru *lru,
121 struct shrink_control *sc)
122{
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800123 return list_lru_count_one(lru, sc->nid, sc->memcg);
Vladimir Davydov503c3582015-02-12 14:58:47 -0800124}
125
Glauber Costa6a4f4962013-08-28 10:18:02 +1000126static inline unsigned long list_lru_count(struct list_lru *lru)
127{
128 long count = 0;
129 int nid;
130
Vladimir Davydovff0b67e2015-02-12 14:59:04 -0800131 for_each_node_state(nid, N_NORMAL_MEMORY)
Glauber Costa6a4f4962013-08-28 10:18:02 +1000132 count += list_lru_count_node(lru, nid);
133
134 return count;
135}
Dave Chinnera38e4082013-08-28 10:17:58 +1000136
/*
 * Helpers operating on a single list_lru_one, the same type a
 * list_lru_walk_cb callback receives.
 * NOTE(review): presumably meant to be called from such a callback with the
 * list lock held: list_lru_isolate() unlinks @item from @list, and
 * list_lru_isolate_move() additionally moves it onto @head - confirm against
 * the implementation.
 */
void list_lru_isolate(struct list_lru_one *list, struct list_head *item);
void list_lru_isolate_move(struct list_lru_one *list, struct list_head *item,
			   struct list_head *head);
140
/*
 * Callback type used by the list_lru_walk*() functions. It is called with the
 * item being scanned, the list it sits on, the spinlock protecting that list
 * and the caller-provided opaque argument, and returns an enum lru_status
 * telling the walker what to do with the item.
 */
typedef enum lru_status (*list_lru_walk_cb)(struct list_head *item,
		struct list_lru_one *list, spinlock_t *lock, void *cb_arg);
143
/**
 * list_lru_walk_one: walk a list_lru, isolating and disposing freeable items.
 * @lru: the lru pointer.
 * @nid: the node id to scan from.
 * @memcg: the cgroup to scan from.
 * @isolate: callback function that is responsible for deciding what to do with
 *  the item currently being scanned
 * @cb_arg: opaque type that will be passed to @isolate
 * @nr_to_walk: how many items to scan.
 *
 * This function will scan all elements in a particular list_lru, calling the
 * @isolate callback for each of those items, along with the current list
 * spinlock and a caller-provided opaque. The @isolate callback can choose to
 * drop the lock internally, but *must* return with the lock held. The callback
 * will return an enum lru_status telling the list_lru infrastructure what to
 * do with the object being scanned.
 *
 * Please note that nr_to_walk does not mean how many objects will be freed,
 * just how many objects will be scanned.
 *
 * Return value: the number of objects effectively removed from the LRU.
 */
unsigned long list_lru_walk_one(struct list_lru *lru,
				int nid, struct mem_cgroup *memcg,
				list_lru_walk_cb isolate, void *cb_arg,
				unsigned long *nr_to_walk);
/**
 * list_lru_walk_one_irq: walk a list_lru, isolating and disposing freeable items.
 * @lru: the lru pointer.
 * @nid: the node id to scan from.
 * @memcg: the cgroup to scan from.
 * @isolate: callback function that is responsible for deciding what to do with
 *  the item currently being scanned
 * @cb_arg: opaque type that will be passed to @isolate
 * @nr_to_walk: how many items to scan.
 *
 * Same as list_lru_walk_one() except that the spinlock is acquired with
 * spin_lock_irq().
 */
unsigned long list_lru_walk_one_irq(struct list_lru *lru,
				    int nid, struct mem_cgroup *memcg,
				    list_lru_walk_cb isolate, void *cb_arg,
				    unsigned long *nr_to_walk);
/*
 * Variant of list_lru_walk_one() that takes no memcg argument; the remaining
 * parameters have the same meaning.
 * NOTE(review): presumably walks every list on node @nid, including the per
 * cgroup ones - confirm against the implementation.
 */
unsigned long list_lru_walk_node(struct list_lru *lru, int nid,
				 list_lru_walk_cb isolate, void *cb_arg,
				 unsigned long *nr_to_walk);
190
191static inline unsigned long
Vladimir Davydov503c3582015-02-12 14:58:47 -0800192list_lru_shrink_walk(struct list_lru *lru, struct shrink_control *sc,
193 list_lru_walk_cb isolate, void *cb_arg)
194{
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800195 return list_lru_walk_one(lru, sc->nid, sc->memcg, isolate, cb_arg,
196 &sc->nr_to_scan);
Vladimir Davydov503c3582015-02-12 14:58:47 -0800197}
198
199static inline unsigned long
Sebastian Andrzej Siewior6b51e882018-08-17 15:49:55 -0700200list_lru_shrink_walk_irq(struct list_lru *lru, struct shrink_control *sc,
201 list_lru_walk_cb isolate, void *cb_arg)
202{
203 return list_lru_walk_one_irq(lru, sc->nid, sc->memcg, isolate, cb_arg,
204 &sc->nr_to_scan);
205}
206
207static inline unsigned long
Glauber Costa6a4f4962013-08-28 10:18:02 +1000208list_lru_walk(struct list_lru *lru, list_lru_walk_cb isolate,
209 void *cb_arg, unsigned long nr_to_walk)
210{
211 long isolated = 0;
212 int nid;
213
Vladimir Davydovff0b67e2015-02-12 14:59:04 -0800214 for_each_node_state(nid, N_NORMAL_MEMORY) {
Glauber Costa6a4f4962013-08-28 10:18:02 +1000215 isolated += list_lru_walk_node(lru, nid, isolate,
216 cb_arg, &nr_to_walk);
217 if (nr_to_walk <= 0)
218 break;
219 }
220 return isolated;
221}
Dave Chinnera38e4082013-08-28 10:17:58 +1000222#endif /* _LRU_LIST_H */