/* SPDX-License-Identifier: GPL-2.0 */
/*
 * Copyright (c) 2013 Red Hat, Inc. and Parallels Inc. All rights reserved.
 * Authors: David Chinner and Glauber Costa
 *
 * Generic LRU infrastructure
 */
#ifndef _LRU_LIST_H
#define _LRU_LIST_H

#include <linux/list.h>
#include <linux/nodemask.h>
#include <linux/shrinker.h>
#include <linux/xarray.h>

struct mem_cgroup;

/* list_lru_walk_cb has to always return one of those */
enum lru_status {
	LRU_REMOVED,		/* item removed from list */
	LRU_REMOVED_RETRY,	/* item removed, but lock has been
				   dropped and reacquired */
	LRU_ROTATE,		/* item referenced, give another pass */
	LRU_SKIP,		/* item cannot be locked, skip */
	LRU_RETRY,		/* item not freeable. May drop the lock
				   internally, but has to return locked. */
	LRU_STOP,		/* stop lru list walking. May drop the lock
				   internally, but has to return locked. */
};

struct list_lru_one {
	struct list_head	list;
	/* may become negative during memcg reparenting */
	long			nr_items;
	/* protects all fields above */
	spinlock_t		lock;
};

struct list_lru_memcg {
	struct rcu_head		rcu;
	/* array of per cgroup per node lists, indexed by node id */
	struct list_lru_one	node[];
};

struct list_lru_node {
	/* global list, used for the root cgroup in cgroup aware lrus */
	struct list_lru_one	lru;
	atomic_long_t		nr_items;
} ____cacheline_aligned_in_smp;

struct list_lru {
	struct list_lru_node	*node;
#ifdef CONFIG_MEMCG
	struct list_head	list;
	int			shrinker_id;
	bool			memcg_aware;
	struct xarray		xa;
#endif
#ifdef CONFIG_LOCKDEP
	struct lock_class_key	*key;
#endif
};

void list_lru_destroy(struct list_lru *lru);
int __list_lru_init(struct list_lru *lru, bool memcg_aware,
		    struct shrinker *shrinker);

#define list_lru_init(lru)				\
	__list_lru_init((lru), false, NULL)
#define list_lru_init_memcg(lru, shrinker)		\
	__list_lru_init((lru), true, shrinker)

static inline int list_lru_init_memcg_key(struct list_lru *lru, struct shrinker *shrinker,
					  struct lock_class_key *key)
{
#ifdef CONFIG_LOCKDEP
	lru->key = key;
#endif
	return list_lru_init_memcg(lru, shrinker);
}
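
/*
 * Example (illustrative sketch only, hypothetical names): a memcg-aware
 * cache typically allocates its shrinker first and hands it to the lru so
 * per-memcg shrinking can be wired up; a non-memcg-aware user would just
 * call list_lru_init() instead, and pair either variant with
 * list_lru_destroy() on teardown.
 *
 *	static struct shrinker *my_cache_shrinker;
 *	static struct list_lru my_cache_lru;
 *
 *	static int __init my_cache_init(void)
 *	{
 *		int err;
 *
 *		my_cache_shrinker = shrinker_alloc(SHRINKER_MEMCG_AWARE |
 *						   SHRINKER_NUMA_AWARE,
 *						   "my-cache");
 *		if (!my_cache_shrinker)
 *			return -ENOMEM;
 *
 *		err = list_lru_init_memcg(&my_cache_lru, my_cache_shrinker);
 *		if (err) {
 *			shrinker_free(my_cache_shrinker);
 *			return err;
 *		}
 *
 *		// set count_objects/scan_objects, then shrinker_register()
 *		return 0;
 *	}
 */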

int memcg_list_lru_alloc(struct mem_cgroup *memcg, struct list_lru *lru,
			 gfp_t gfp);
void memcg_reparent_list_lrus(struct mem_cgroup *memcg, struct mem_cgroup *parent);

/**
 * list_lru_add: add an element to the lru list's tail
 * @lru: the lru pointer
 * @item: the item to be added.
 * @nid: the node id of the sublist to add the item to.
 * @memcg: the cgroup of the sublist to add the item to.
 *
 * If the element is already part of a list, this function returns without
 * doing anything. This means that it is not necessary to keep state about
 * whether or not the element already belongs in the list. That said, this
 * logic only works if the item is in *this* list. If the item might be in
 * some other list, then you cannot rely on this check and you must remove it
 * from the other list before trying to insert it.
 *
 * The lru list consists of many sublists internally; the @nid and @memcg
 * parameters are used to determine which sublist to insert the item into.
 * It's important to use the right value of @nid and @memcg when deleting the
 * item, since it might otherwise get deleted from the wrong sublist.
 *
 * This also applies when attempting to insert the item multiple times - if
 * the item is currently in one sublist and you call list_lru_add() again, you
 * must pass the right @nid and @memcg parameters so that the same sublist is
 * used.
 *
 * You must ensure that the memcg is not freed during this call (e.g., with
 * rcu or by taking a css refcnt).
 *
 * Return: true if the list was updated, false otherwise
 */
bool list_lru_add(struct list_lru *lru, struct list_head *item, int nid,
		    struct mem_cgroup *memcg);
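
/*
 * Example (illustrative sketch, hypothetical my_object): a caller that
 * tracks the node and memcg of each object itself must pass the same
 * @nid/@memcg pair to list_lru_add() and later to list_lru_del(), so that
 * both operate on the same sublist:
 *
 *	struct my_object {
 *		struct list_head	lru;	// linked into the list_lru
 *		int			nid;	// node recorded at allocation
 *		struct mem_cgroup	*memcg;	// pinned via a css reference
 *	};
 *
 *	// no-op (returns false) if obj->lru is already on this lru
 *	list_lru_add(lru, &obj->lru, obj->nid, obj->memcg);
 */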

/**
 * list_lru_add_obj: add an element to the lru list's tail
 * @lru: the lru pointer
 * @item: the item to be added.
 *
 * This function is similar to list_lru_add(), but the NUMA node and the
 * memcg of the sublist are determined from the @item list_head. This
 * assumption is valid for slab object LRUs such as dentries, inodes, etc.
 *
 * Return: true if the list was updated, false otherwise
 */
bool list_lru_add_obj(struct list_lru *lru, struct list_head *item);

/**
 * list_lru_del: delete an element from the lru list
 * @lru: the lru pointer
 * @item: the item to be deleted.
 * @nid: the node id of the sublist to delete the item from.
 * @memcg: the cgroup of the sublist to delete the item from.
 *
 * This function works analogously to list_lru_add() in terms of list
 * manipulation.
 *
 * The comments in list_lru_add() about an element already being in a list are
 * also valid for list_lru_del(), that is, you can delete an item that has
 * already been removed or never been added. However, if the item is in a
 * list, it must be in *this* list, and you must pass the right value of @nid
 * and @memcg so that the right sublist is used.
 *
 * You must ensure that the memcg is not freed during this call (e.g., with
 * rcu or by taking a css refcnt). When a memcg is deleted, list_lru entries
 * are automatically moved to the parent memcg. This is done in a race-free
 * way, so during deletion of a memcg both the old and new memcg will resolve
 * to the same sublist internally.
 *
 * Return: true if the list was updated, false otherwise
 */
bool list_lru_del(struct list_lru *lru, struct list_head *item, int nid,
		    struct mem_cgroup *memcg);

/**
 * list_lru_del_obj: delete an element from the lru list
 * @lru: the lru pointer
 * @item: the item to be deleted.
 *
 * This function is similar to list_lru_del(), but the NUMA node and the
 * memcg of the sublist are determined from the @item list_head. This
 * assumption is valid for slab object LRUs such as dentries, inodes, etc.
 *
 * Return: true if the list was updated, false otherwise.
 */
bool list_lru_del_obj(struct list_lru *lru, struct list_head *item);
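
/*
 * Example (illustrative sketch, hypothetical names): for slab-allocated
 * objects the *_obj variants look up the node and memcg from the object
 * itself, so callers such as the dcache or inode cache only pass the
 * embedded list_head and act on the return value:
 *
 *	// my_lru_link and nr_unused are hypothetical
 *	if (list_lru_add_obj(lru, &inode->my_lru_link))
 *		atomic_long_inc(&nr_unused);
 *	...
 *	if (list_lru_del_obj(lru, &inode->my_lru_link))
 *		atomic_long_dec(&nr_unused);
 */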

/**
 * list_lru_count_one: return the number of objects currently held by @lru
 * @lru: the lru pointer.
 * @nid: the node id to count from.
 * @memcg: the cgroup to count from.
 *
 * There is no guarantee that the list is not updated while the count is being
 * computed. Callers that want such a guarantee need to provide an outer lock.
 *
 * Return: 0 for empty lists, otherwise the number of objects
 * currently held by @lru.
 */
unsigned long list_lru_count_one(struct list_lru *lru,
				 int nid, struct mem_cgroup *memcg);
unsigned long list_lru_count_node(struct list_lru *lru, int nid);

static inline unsigned long list_lru_shrink_count(struct list_lru *lru,
						  struct shrink_control *sc)
{
	return list_lru_count_one(lru, sc->nid, sc->memcg);
}

static inline unsigned long list_lru_count(struct list_lru *lru)
{
	long count = 0;
	int nid;

	for_each_node_state(nid, N_NORMAL_MEMORY)
		count += list_lru_count_node(lru, nid);

	return count;
}

void list_lru_isolate(struct list_lru_one *list, struct list_head *item);
void list_lru_isolate_move(struct list_lru_one *list, struct list_head *item,
			   struct list_head *head);

typedef enum lru_status (*list_lru_walk_cb)(struct list_head *item,
		struct list_lru_one *list, void *cb_arg);
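
/*
 * Example (illustrative sketch, hypothetical my_object and dispose list): a
 * typical @isolate callback decides the fate of one item while the sublist
 * lock (&list->lock) is held and maps each outcome to an lru_status:
 *
 *	static enum lru_status my_isolate(struct list_head *item,
 *					  struct list_lru_one *list, void *arg)
 *	{
 *		struct list_head *dispose = arg;
 *		struct my_object *obj = container_of(item, struct my_object,
 *						     lru);
 *
 *		if (!spin_trylock(&obj->lock))
 *			return LRU_SKIP;	// revisit on a later walk
 *
 *		if (obj->refcount) {
 *			spin_unlock(&obj->lock);
 *			return LRU_ROTATE;	// referenced, give another pass
 *		}
 *
 *		// take it off the lru and collect it for later freeing
 *		list_lru_isolate_move(list, item, dispose);
 *		spin_unlock(&obj->lock);
 *		return LRU_REMOVED;
 *	}
 */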

/**
 * list_lru_walk_one: walk a @lru, isolating and disposing freeable items.
 * @lru: the lru pointer.
 * @nid: the node id to scan from.
 * @memcg: the cgroup to scan from.
 * @isolate: callback function that is responsible for deciding what to do with
 *  the item currently being scanned
 * @cb_arg: opaque argument that will be passed to @isolate
 * @nr_to_walk: how many items to scan.
 *
 * This function will scan all elements in a particular @lru, calling the
 * @isolate callback for each of those items, along with the current list
 * spinlock and a caller-provided opaque argument. The @isolate callback can
 * choose to drop the lock internally, but *must* return with the lock held.
 * The callback will return an enum lru_status telling the @lru infrastructure
 * what to do with the object being scanned.
 *
 * Please note that @nr_to_walk does not mean how many objects will be freed,
 * just how many objects will be scanned.
 *
 * Return: the number of objects effectively removed from the LRU.
 */
unsigned long list_lru_walk_one(struct list_lru *lru,
				int nid, struct mem_cgroup *memcg,
				list_lru_walk_cb isolate, void *cb_arg,
				unsigned long *nr_to_walk);
/**
 * list_lru_walk_one_irq: walk a @lru, isolating and disposing freeable items.
 * @lru: the lru pointer.
 * @nid: the node id to scan from.
 * @memcg: the cgroup to scan from.
 * @isolate: callback function that is responsible for deciding what to do with
 *  the item currently being scanned
 * @cb_arg: opaque argument that will be passed to @isolate
 * @nr_to_walk: how many items to scan.
 *
 * Same as list_lru_walk_one() except that the spinlock is acquired with
 * spin_lock_irq().
 */
unsigned long list_lru_walk_one_irq(struct list_lru *lru,
				    int nid, struct mem_cgroup *memcg,
				    list_lru_walk_cb isolate, void *cb_arg,
				    unsigned long *nr_to_walk);
unsigned long list_lru_walk_node(struct list_lru *lru, int nid,
				 list_lru_walk_cb isolate, void *cb_arg,
				 unsigned long *nr_to_walk);

static inline unsigned long
list_lru_shrink_walk(struct list_lru *lru, struct shrink_control *sc,
		     list_lru_walk_cb isolate, void *cb_arg)
{
	return list_lru_walk_one(lru, sc->nid, sc->memcg, isolate, cb_arg,
				 &sc->nr_to_scan);
}

static inline unsigned long
list_lru_shrink_walk_irq(struct list_lru *lru, struct shrink_control *sc,
			 list_lru_walk_cb isolate, void *cb_arg)
{
	return list_lru_walk_one_irq(lru, sc->nid, sc->memcg, isolate, cb_arg,
				     &sc->nr_to_scan);
}
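
/*
 * Example (illustrative sketch, hypothetical names, reusing the my_isolate
 * callback sketched above): the shrink helpers are meant to be called from
 * a shrinker's callbacks, which carry the node, memcg and scan budget in
 * struct shrink_control:
 *
 *	static unsigned long my_cache_count(struct shrinker *shrink,
 *					    struct shrink_control *sc)
 *	{
 *		return list_lru_shrink_count(&my_cache_lru, sc);
 *	}
 *
 *	static unsigned long my_cache_scan(struct shrinker *shrink,
 *					   struct shrink_control *sc)
 *	{
 *		LIST_HEAD(dispose);
 *		unsigned long freed;
 *
 *		freed = list_lru_shrink_walk(&my_cache_lru, sc,
 *					     my_isolate, &dispose);
 *		// free everything collected on the dispose list here
 *		return freed;
 *	}
 *
 * These would be wired up as my_cache_shrinker->count_objects and
 * ->scan_objects, much like the superblock shrinker drives the per-sb
 * dentry and inode lrus.
 */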

static inline unsigned long
list_lru_walk(struct list_lru *lru, list_lru_walk_cb isolate,
	      void *cb_arg, unsigned long nr_to_walk)
{
	long isolated = 0;
	int nid;

	for_each_node_state(nid, N_NORMAL_MEMORY) {
		isolated += list_lru_walk_node(lru, nid, isolate,
					       cb_arg, &nr_to_walk);
		if (nr_to_walk <= 0)
			break;
	}
	return isolated;
}
#endif /* _LRU_LIST_H */