blob: d12c1943f6f3936a4eb486b73de9acfa2656605e [file] [log] [blame]
// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (c) 2013 Red Hat, Inc. and Parallels Inc. All rights reserved.
 * Authors: David Chinner and Glauber Costa
 *
 * Generic LRU infrastructure
 */
8#include <linux/kernel.h>
9#include <linux/module.h>
Dave Chinner3b1d58a2013-08-28 10:18:00 +100010#include <linux/mm.h>
Dave Chinnera38e4082013-08-28 10:17:58 +100011#include <linux/list_lru.h>
Glauber Costa5ca302c2013-08-28 10:18:18 +100012#include <linux/slab.h>
Vladimir Davydovc0a5b5602015-02-12 14:59:07 -080013#include <linux/mutex.h>
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080014#include <linux/memcontrol.h>
Roman Gushchin4d96ba32019-07-11 20:56:31 -070015#include "slab.h"
Vladimir Davydovc0a5b5602015-02-12 14:59:07 -080016
Kirill Tkhai84c07d12018-08-17 15:47:25 -070017#ifdef CONFIG_MEMCG_KMEM
/* Held around every traversal or modification of the list_lrus registry. */
static DEFINE_MUTEX(list_lrus_mutex);
/* Registry of list_lru instances, linked through list_lru::list. */
static LIST_HEAD(list_lrus);
20
21static void list_lru_register(struct list_lru *lru)
22{
23 mutex_lock(&list_lrus_mutex);
24 list_add(&lru->list, &list_lrus);
25 mutex_unlock(&list_lrus_mutex);
26}
27
28static void list_lru_unregister(struct list_lru *lru)
29{
30 mutex_lock(&list_lrus_mutex);
31 list_del(&lru->list);
32 mutex_unlock(&list_lrus_mutex);
33}
Vladimir Davydovc0a5b5602015-02-12 14:59:07 -080034
Kirill Tkhaifae91d62018-08-17 15:48:10 -070035static int lru_shrinker_id(struct list_lru *lru)
36{
37 return lru->shrinker_id;
38}
39
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080040static inline bool list_lru_memcg_aware(struct list_lru *lru)
41{
Jiri Slaby3e858992019-05-31 22:30:26 -070042 return lru->memcg_aware;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080043}
44
45static inline struct list_lru_one *
46list_lru_from_memcg_idx(struct list_lru_node *nlru, int idx)
47{
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -070048 struct list_lru_memcg *memcg_lrus;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080049 /*
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -070050 * Either lock or RCU protects the array of per cgroup lists
51 * from relocation (see memcg_update_list_lru_node).
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080052 */
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -070053 memcg_lrus = rcu_dereference_check(nlru->memcg_lrus,
54 lockdep_is_held(&nlru->lock));
55 if (memcg_lrus && idx >= 0)
56 return memcg_lrus->lru[idx];
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080057 return &nlru->lru;
58}
59
Vladimir Davydovdf406552015-11-05 18:49:04 -080060static __always_inline struct mem_cgroup *mem_cgroup_from_kmem(void *ptr)
61{
62 struct page *page;
63
64 if (!memcg_kmem_enabled())
65 return NULL;
66 page = virt_to_head_page(ptr);
Roman Gushchin4d96ba32019-07-11 20:56:31 -070067 return memcg_from_slab_page(page);
Vladimir Davydovdf406552015-11-05 18:49:04 -080068}
69
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080070static inline struct list_lru_one *
Kirill Tkhai44bd4a42018-08-17 15:47:54 -070071list_lru_from_kmem(struct list_lru_node *nlru, void *ptr,
72 struct mem_cgroup **memcg_ptr)
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080073{
Kirill Tkhai44bd4a42018-08-17 15:47:54 -070074 struct list_lru_one *l = &nlru->lru;
75 struct mem_cgroup *memcg = NULL;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080076
77 if (!nlru->memcg_lrus)
Kirill Tkhai44bd4a42018-08-17 15:47:54 -070078 goto out;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080079
80 memcg = mem_cgroup_from_kmem(ptr);
81 if (!memcg)
Kirill Tkhai44bd4a42018-08-17 15:47:54 -070082 goto out;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080083
Kirill Tkhai44bd4a42018-08-17 15:47:54 -070084 l = list_lru_from_memcg_idx(nlru, memcg_cache_id(memcg));
85out:
86 if (memcg_ptr)
87 *memcg_ptr = memcg;
88 return l;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080089}
90#else
/* !CONFIG_MEMCG_KMEM: no registry is kept, so there is nothing to do. */
static void list_lru_register(struct list_lru *lru)
{
}
94
/* !CONFIG_MEMCG_KMEM: no registry is kept, so there is nothing to do. */
static void list_lru_unregister(struct list_lru *lru)
{
}
98
/* !CONFIG_MEMCG_KMEM: always reports -1 as the shrinker id. */
static int lru_shrinker_id(struct list_lru *lru)
{
	const int no_shrinker = -1;

	return no_shrinker;
}
103
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800104static inline bool list_lru_memcg_aware(struct list_lru *lru)
105{
106 return false;
107}
108
109static inline struct list_lru_one *
110list_lru_from_memcg_idx(struct list_lru_node *nlru, int idx)
111{
112 return &nlru->lru;
113}
114
115static inline struct list_lru_one *
Kirill Tkhai44bd4a42018-08-17 15:47:54 -0700116list_lru_from_kmem(struct list_lru_node *nlru, void *ptr,
117 struct mem_cgroup **memcg_ptr)
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800118{
Kirill Tkhai44bd4a42018-08-17 15:47:54 -0700119 if (memcg_ptr)
120 *memcg_ptr = NULL;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800121 return &nlru->lru;
122}
Kirill Tkhai84c07d12018-08-17 15:47:25 -0700123#endif /* CONFIG_MEMCG_KMEM */
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800124
Dave Chinnera38e4082013-08-28 10:17:58 +1000125bool list_lru_add(struct list_lru *lru, struct list_head *item)
126{
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000127 int nid = page_to_nid(virt_to_page(item));
128 struct list_lru_node *nlru = &lru->node[nid];
Kirill Tkhaifae91d62018-08-17 15:48:10 -0700129 struct mem_cgroup *memcg;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800130 struct list_lru_one *l;
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000131
132 spin_lock(&nlru->lock);
Dave Chinnera38e4082013-08-28 10:17:58 +1000133 if (list_empty(item)) {
Kirill Tkhaifae91d62018-08-17 15:48:10 -0700134 l = list_lru_from_kmem(nlru, item, &memcg);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800135 list_add_tail(item, &l->list);
Kirill Tkhaifae91d62018-08-17 15:48:10 -0700136 /* Set shrinker bit if the first element was added */
137 if (!l->nr_items++)
138 memcg_set_shrinker_bit(memcg, nid,
139 lru_shrinker_id(lru));
Sahitya Tummala2c80cd52017-07-10 15:49:57 -0700140 nlru->nr_items++;
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000141 spin_unlock(&nlru->lock);
Dave Chinnera38e4082013-08-28 10:17:58 +1000142 return true;
143 }
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000144 spin_unlock(&nlru->lock);
Dave Chinnera38e4082013-08-28 10:17:58 +1000145 return false;
146}
147EXPORT_SYMBOL_GPL(list_lru_add);
148
149bool list_lru_del(struct list_lru *lru, struct list_head *item)
150{
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000151 int nid = page_to_nid(virt_to_page(item));
152 struct list_lru_node *nlru = &lru->node[nid];
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800153 struct list_lru_one *l;
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000154
155 spin_lock(&nlru->lock);
Dave Chinnera38e4082013-08-28 10:17:58 +1000156 if (!list_empty(item)) {
Kirill Tkhai44bd4a42018-08-17 15:47:54 -0700157 l = list_lru_from_kmem(nlru, item, NULL);
Dave Chinnera38e4082013-08-28 10:17:58 +1000158 list_del_init(item);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800159 l->nr_items--;
Sahitya Tummala2c80cd52017-07-10 15:49:57 -0700160 nlru->nr_items--;
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000161 spin_unlock(&nlru->lock);
Dave Chinnera38e4082013-08-28 10:17:58 +1000162 return true;
163 }
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000164 spin_unlock(&nlru->lock);
Dave Chinnera38e4082013-08-28 10:17:58 +1000165 return false;
166}
167EXPORT_SYMBOL_GPL(list_lru_del);
168
Vladimir Davydov3f97b162015-02-12 14:59:35 -0800169void list_lru_isolate(struct list_lru_one *list, struct list_head *item)
170{
171 list_del_init(item);
172 list->nr_items--;
173}
174EXPORT_SYMBOL_GPL(list_lru_isolate);
175
176void list_lru_isolate_move(struct list_lru_one *list, struct list_head *item,
177 struct list_head *head)
178{
179 list_move(item, head);
180 list->nr_items--;
181}
182EXPORT_SYMBOL_GPL(list_lru_isolate_move);
183
Andrew Morton930eaac2018-08-17 15:46:11 -0700184unsigned long list_lru_count_one(struct list_lru *lru,
185 int nid, struct mem_cgroup *memcg)
Dave Chinnera38e4082013-08-28 10:17:58 +1000186{
Glauber Costa6a4f4962013-08-28 10:18:02 +1000187 struct list_lru_node *nlru = &lru->node[nid];
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800188 struct list_lru_one *l;
189 unsigned long count;
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000190
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700191 rcu_read_lock();
Andrew Morton930eaac2018-08-17 15:46:11 -0700192 l = list_lru_from_memcg_idx(nlru, memcg_cache_id(memcg));
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800193 count = l->nr_items;
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700194 rcu_read_unlock();
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000195
196 return count;
197}
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800198EXPORT_SYMBOL_GPL(list_lru_count_one);
199
200unsigned long list_lru_count_node(struct list_lru *lru, int nid)
201{
Sahitya Tummala2c80cd52017-07-10 15:49:57 -0700202 struct list_lru_node *nlru;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800203
Sahitya Tummala2c80cd52017-07-10 15:49:57 -0700204 nlru = &lru->node[nid];
205 return nlru->nr_items;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800206}
Glauber Costa6a4f4962013-08-28 10:18:02 +1000207EXPORT_SYMBOL_GPL(list_lru_count_node);
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000208
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800209static unsigned long
Sebastian Andrzej Siewior6e018962018-08-17 15:49:51 -0700210__list_lru_walk_one(struct list_lru_node *nlru, int memcg_idx,
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800211 list_lru_walk_cb isolate, void *cb_arg,
212 unsigned long *nr_to_walk)
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000213{
214
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800215 struct list_lru_one *l;
Dave Chinnera38e4082013-08-28 10:17:58 +1000216 struct list_head *item, *n;
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000217 unsigned long isolated = 0;
Dave Chinnera38e4082013-08-28 10:17:58 +1000218
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800219 l = list_lru_from_memcg_idx(nlru, memcg_idx);
Dave Chinnera38e4082013-08-28 10:17:58 +1000220restart:
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800221 list_for_each_safe(item, n, &l->list) {
Dave Chinnera38e4082013-08-28 10:17:58 +1000222 enum lru_status ret;
Dave Chinner5cedf7212013-08-28 10:18:01 +1000223
224 /*
225 * decrement nr_to_walk first so that we don't livelock if we
226 * get stuck on large numbesr of LRU_RETRY items
227 */
Russell Kingc56b0972013-10-30 14:16:16 +0000228 if (!*nr_to_walk)
Dave Chinner5cedf7212013-08-28 10:18:01 +1000229 break;
Russell Kingc56b0972013-10-30 14:16:16 +0000230 --*nr_to_walk;
Dave Chinner5cedf7212013-08-28 10:18:01 +1000231
Vladimir Davydov3f97b162015-02-12 14:59:35 -0800232 ret = isolate(item, l, &nlru->lock, cb_arg);
Dave Chinnera38e4082013-08-28 10:17:58 +1000233 switch (ret) {
Johannes Weiner449dd692014-04-03 14:47:56 -0700234 case LRU_REMOVED_RETRY:
235 assert_spin_locked(&nlru->lock);
Gustavo A. R. Silva5b568ac2017-11-15 17:38:49 -0800236 /* fall through */
Dave Chinnera38e4082013-08-28 10:17:58 +1000237 case LRU_REMOVED:
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000238 isolated++;
Sahitya Tummala2c80cd52017-07-10 15:49:57 -0700239 nlru->nr_items--;
Johannes Weiner449dd692014-04-03 14:47:56 -0700240 /*
241 * If the lru lock has been dropped, our list
242 * traversal is now invalid and so we have to
243 * restart from scratch.
244 */
245 if (ret == LRU_REMOVED_RETRY)
246 goto restart;
Dave Chinnera38e4082013-08-28 10:17:58 +1000247 break;
248 case LRU_ROTATE:
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800249 list_move_tail(item, &l->list);
Dave Chinnera38e4082013-08-28 10:17:58 +1000250 break;
251 case LRU_SKIP:
252 break;
253 case LRU_RETRY:
Dave Chinner5cedf7212013-08-28 10:18:01 +1000254 /*
255 * The lru lock has been dropped, our list traversal is
256 * now invalid and so we have to restart from scratch.
257 */
Johannes Weiner449dd692014-04-03 14:47:56 -0700258 assert_spin_locked(&nlru->lock);
Dave Chinnera38e4082013-08-28 10:17:58 +1000259 goto restart;
260 default:
261 BUG();
262 }
Dave Chinnera38e4082013-08-28 10:17:58 +1000263 }
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000264 return isolated;
265}
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800266
267unsigned long
268list_lru_walk_one(struct list_lru *lru, int nid, struct mem_cgroup *memcg,
269 list_lru_walk_cb isolate, void *cb_arg,
270 unsigned long *nr_to_walk)
271{
Sebastian Andrzej Siewior6cfe57a2018-08-17 15:49:48 -0700272 struct list_lru_node *nlru = &lru->node[nid];
273 unsigned long ret;
274
275 spin_lock(&nlru->lock);
Sebastian Andrzej Siewior6e018962018-08-17 15:49:51 -0700276 ret = __list_lru_walk_one(nlru, memcg_cache_id(memcg), isolate, cb_arg,
277 nr_to_walk);
Sebastian Andrzej Siewior6cfe57a2018-08-17 15:49:48 -0700278 spin_unlock(&nlru->lock);
279 return ret;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800280}
281EXPORT_SYMBOL_GPL(list_lru_walk_one);
282
Sebastian Andrzej Siewior6b51e882018-08-17 15:49:55 -0700283unsigned long
284list_lru_walk_one_irq(struct list_lru *lru, int nid, struct mem_cgroup *memcg,
285 list_lru_walk_cb isolate, void *cb_arg,
286 unsigned long *nr_to_walk)
287{
288 struct list_lru_node *nlru = &lru->node[nid];
289 unsigned long ret;
290
291 spin_lock_irq(&nlru->lock);
292 ret = __list_lru_walk_one(nlru, memcg_cache_id(memcg), isolate, cb_arg,
293 nr_to_walk);
294 spin_unlock_irq(&nlru->lock);
295 return ret;
296}
297
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800298unsigned long list_lru_walk_node(struct list_lru *lru, int nid,
299 list_lru_walk_cb isolate, void *cb_arg,
300 unsigned long *nr_to_walk)
301{
302 long isolated = 0;
303 int memcg_idx;
304
Sebastian Andrzej Siewior87a5ffc2018-08-17 15:49:45 -0700305 isolated += list_lru_walk_one(lru, nid, NULL, isolate, cb_arg,
306 nr_to_walk);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800307 if (*nr_to_walk > 0 && list_lru_memcg_aware(lru)) {
308 for_each_memcg_cache_index(memcg_idx) {
Sebastian Andrzej Siewior6cfe57a2018-08-17 15:49:48 -0700309 struct list_lru_node *nlru = &lru->node[nid];
310
311 spin_lock(&nlru->lock);
Sebastian Andrzej Siewior6e018962018-08-17 15:49:51 -0700312 isolated += __list_lru_walk_one(nlru, memcg_idx,
313 isolate, cb_arg,
314 nr_to_walk);
Sebastian Andrzej Siewior6cfe57a2018-08-17 15:49:48 -0700315 spin_unlock(&nlru->lock);
316
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800317 if (*nr_to_walk <= 0)
318 break;
319 }
320 }
321 return isolated;
322}
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000323EXPORT_SYMBOL_GPL(list_lru_walk_node);
324
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800325static void init_one_lru(struct list_lru_one *l)
326{
327 INIT_LIST_HEAD(&l->list);
328 l->nr_items = 0;
329}
330
Kirill Tkhai84c07d12018-08-17 15:47:25 -0700331#ifdef CONFIG_MEMCG_KMEM
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800332static void __memcg_destroy_list_lru_node(struct list_lru_memcg *memcg_lrus,
333 int begin, int end)
334{
335 int i;
336
337 for (i = begin; i < end; i++)
338 kfree(memcg_lrus->lru[i]);
339}
340
341static int __memcg_init_list_lru_node(struct list_lru_memcg *memcg_lrus,
342 int begin, int end)
343{
344 int i;
345
346 for (i = begin; i < end; i++) {
347 struct list_lru_one *l;
348
349 l = kmalloc(sizeof(struct list_lru_one), GFP_KERNEL);
350 if (!l)
351 goto fail;
352
353 init_one_lru(l);
354 memcg_lrus->lru[i] = l;
355 }
356 return 0;
357fail:
Shakeel Butt35109552019-06-13 15:55:49 -0700358 __memcg_destroy_list_lru_node(memcg_lrus, begin, i);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800359 return -ENOMEM;
360}
361
362static int memcg_init_list_lru_node(struct list_lru_node *nlru)
363{
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700364 struct list_lru_memcg *memcg_lrus;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800365 int size = memcg_nr_cache_ids;
366
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700367 memcg_lrus = kvmalloc(sizeof(*memcg_lrus) +
368 size * sizeof(void *), GFP_KERNEL);
369 if (!memcg_lrus)
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800370 return -ENOMEM;
371
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700372 if (__memcg_init_list_lru_node(memcg_lrus, 0, size)) {
373 kvfree(memcg_lrus);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800374 return -ENOMEM;
375 }
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700376 RCU_INIT_POINTER(nlru->memcg_lrus, memcg_lrus);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800377
378 return 0;
379}
380
381static void memcg_destroy_list_lru_node(struct list_lru_node *nlru)
382{
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700383 struct list_lru_memcg *memcg_lrus;
384 /*
385 * This is called when shrinker has already been unregistered,
386 * and nobody can use it. So, there is no need to use kvfree_rcu().
387 */
388 memcg_lrus = rcu_dereference_protected(nlru->memcg_lrus, true);
389 __memcg_destroy_list_lru_node(memcg_lrus, 0, memcg_nr_cache_ids);
390 kvfree(memcg_lrus);
391}
392
393static void kvfree_rcu(struct rcu_head *head)
394{
395 struct list_lru_memcg *mlru;
396
397 mlru = container_of(head, struct list_lru_memcg, rcu);
398 kvfree(mlru);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800399}
400
401static int memcg_update_list_lru_node(struct list_lru_node *nlru,
402 int old_size, int new_size)
403{
404 struct list_lru_memcg *old, *new;
405
406 BUG_ON(old_size > new_size);
407
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700408 old = rcu_dereference_protected(nlru->memcg_lrus,
409 lockdep_is_held(&list_lrus_mutex));
410 new = kvmalloc(sizeof(*new) + new_size * sizeof(void *), GFP_KERNEL);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800411 if (!new)
412 return -ENOMEM;
413
414 if (__memcg_init_list_lru_node(new, old_size, new_size)) {
Johannes Weinerf80c7da2017-10-03 16:16:10 -0700415 kvfree(new);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800416 return -ENOMEM;
417 }
418
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700419 memcpy(&new->lru, &old->lru, old_size * sizeof(void *));
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800420
421 /*
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700422 * The locking below allows readers that hold nlru->lock avoid taking
423 * rcu_read_lock (see list_lru_from_memcg_idx).
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800424 *
425 * Since list_lru_{add,del} may be called under an IRQ-safe lock,
426 * we have to use IRQ-safe primitives here to avoid deadlock.
427 */
428 spin_lock_irq(&nlru->lock);
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700429 rcu_assign_pointer(nlru->memcg_lrus, new);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800430 spin_unlock_irq(&nlru->lock);
431
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700432 call_rcu(&old->rcu, kvfree_rcu);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800433 return 0;
434}
435
436static void memcg_cancel_update_list_lru_node(struct list_lru_node *nlru,
437 int old_size, int new_size)
438{
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700439 struct list_lru_memcg *memcg_lrus;
440
441 memcg_lrus = rcu_dereference_protected(nlru->memcg_lrus,
442 lockdep_is_held(&list_lrus_mutex));
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800443 /* do not bother shrinking the array back to the old size, because we
444 * cannot handle allocation failures here */
Kirill Tkhai0c7c1be2018-04-05 16:25:08 -0700445 __memcg_destroy_list_lru_node(memcg_lrus, old_size, new_size);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800446}
447
448static int memcg_init_list_lru(struct list_lru *lru, bool memcg_aware)
449{
450 int i;
451
Jiri Slaby3e858992019-05-31 22:30:26 -0700452 lru->memcg_aware = memcg_aware;
453
Raghavendra K T145949a2015-11-05 18:46:26 -0800454 if (!memcg_aware)
455 return 0;
456
457 for_each_node(i) {
458 if (memcg_init_list_lru_node(&lru->node[i]))
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800459 goto fail;
460 }
461 return 0;
462fail:
Raghavendra K T145949a2015-11-05 18:46:26 -0800463 for (i = i - 1; i >= 0; i--) {
464 if (!lru->node[i].memcg_lrus)
465 continue;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800466 memcg_destroy_list_lru_node(&lru->node[i]);
Raghavendra K T145949a2015-11-05 18:46:26 -0800467 }
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800468 return -ENOMEM;
469}
470
471static void memcg_destroy_list_lru(struct list_lru *lru)
472{
473 int i;
474
475 if (!list_lru_memcg_aware(lru))
476 return;
477
Raghavendra K T145949a2015-11-05 18:46:26 -0800478 for_each_node(i)
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800479 memcg_destroy_list_lru_node(&lru->node[i]);
480}
481
482static int memcg_update_list_lru(struct list_lru *lru,
483 int old_size, int new_size)
484{
485 int i;
486
487 if (!list_lru_memcg_aware(lru))
488 return 0;
489
Raghavendra K T145949a2015-11-05 18:46:26 -0800490 for_each_node(i) {
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800491 if (memcg_update_list_lru_node(&lru->node[i],
492 old_size, new_size))
493 goto fail;
494 }
495 return 0;
496fail:
Raghavendra K T145949a2015-11-05 18:46:26 -0800497 for (i = i - 1; i >= 0; i--) {
498 if (!lru->node[i].memcg_lrus)
499 continue;
500
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800501 memcg_cancel_update_list_lru_node(&lru->node[i],
502 old_size, new_size);
Raghavendra K T145949a2015-11-05 18:46:26 -0800503 }
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800504 return -ENOMEM;
505}
506
507static void memcg_cancel_update_list_lru(struct list_lru *lru,
508 int old_size, int new_size)
509{
510 int i;
511
512 if (!list_lru_memcg_aware(lru))
513 return;
514
Raghavendra K T145949a2015-11-05 18:46:26 -0800515 for_each_node(i)
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800516 memcg_cancel_update_list_lru_node(&lru->node[i],
517 old_size, new_size);
518}
519
520int memcg_update_all_list_lrus(int new_size)
521{
522 int ret = 0;
523 struct list_lru *lru;
524 int old_size = memcg_nr_cache_ids;
525
526 mutex_lock(&list_lrus_mutex);
527 list_for_each_entry(lru, &list_lrus, list) {
528 ret = memcg_update_list_lru(lru, old_size, new_size);
529 if (ret)
530 goto fail;
531 }
532out:
533 mutex_unlock(&list_lrus_mutex);
534 return ret;
535fail:
536 list_for_each_entry_continue_reverse(lru, &list_lrus, list)
537 memcg_cancel_update_list_lru(lru, old_size, new_size);
538 goto out;
539}
Vladimir Davydov2788cf02015-02-12 14:59:38 -0800540
Kirill Tkhai3b82c4d2018-08-17 15:48:01 -0700541static void memcg_drain_list_lru_node(struct list_lru *lru, int nid,
Kirill Tkhai9bec5c32018-08-17 15:47:58 -0700542 int src_idx, struct mem_cgroup *dst_memcg)
Vladimir Davydov2788cf02015-02-12 14:59:38 -0800543{
Kirill Tkhai3b82c4d2018-08-17 15:48:01 -0700544 struct list_lru_node *nlru = &lru->node[nid];
Kirill Tkhai9bec5c32018-08-17 15:47:58 -0700545 int dst_idx = dst_memcg->kmemcg_id;
Vladimir Davydov2788cf02015-02-12 14:59:38 -0800546 struct list_lru_one *src, *dst;
547
548 /*
549 * Since list_lru_{add,del} may be called under an IRQ-safe lock,
550 * we have to use IRQ-safe primitives here to avoid deadlock.
551 */
552 spin_lock_irq(&nlru->lock);
553
554 src = list_lru_from_memcg_idx(nlru, src_idx);
555 dst = list_lru_from_memcg_idx(nlru, dst_idx);
556
557 list_splice_init(&src->list, &dst->list);
Yang Shi48700042020-12-05 22:14:48 -0800558
559 if (src->nr_items) {
560 dst->nr_items += src->nr_items;
Kirill Tkhaifae91d62018-08-17 15:48:10 -0700561 memcg_set_shrinker_bit(dst_memcg, nid, lru_shrinker_id(lru));
Yang Shi48700042020-12-05 22:14:48 -0800562 src->nr_items = 0;
563 }
Vladimir Davydov2788cf02015-02-12 14:59:38 -0800564
565 spin_unlock_irq(&nlru->lock);
566}
567
568static void memcg_drain_list_lru(struct list_lru *lru,
Kirill Tkhai9bec5c32018-08-17 15:47:58 -0700569 int src_idx, struct mem_cgroup *dst_memcg)
Vladimir Davydov2788cf02015-02-12 14:59:38 -0800570{
571 int i;
572
573 if (!list_lru_memcg_aware(lru))
574 return;
575
Raghavendra K T145949a2015-11-05 18:46:26 -0800576 for_each_node(i)
Kirill Tkhai3b82c4d2018-08-17 15:48:01 -0700577 memcg_drain_list_lru_node(lru, i, src_idx, dst_memcg);
Vladimir Davydov2788cf02015-02-12 14:59:38 -0800578}
579
Kirill Tkhai9bec5c32018-08-17 15:47:58 -0700580void memcg_drain_all_list_lrus(int src_idx, struct mem_cgroup *dst_memcg)
Vladimir Davydov2788cf02015-02-12 14:59:38 -0800581{
582 struct list_lru *lru;
583
584 mutex_lock(&list_lrus_mutex);
585 list_for_each_entry(lru, &list_lrus, list)
Kirill Tkhai9bec5c32018-08-17 15:47:58 -0700586 memcg_drain_list_lru(lru, src_idx, dst_memcg);
Vladimir Davydov2788cf02015-02-12 14:59:38 -0800587 mutex_unlock(&list_lrus_mutex);
588}
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800589#else
590static int memcg_init_list_lru(struct list_lru *lru, bool memcg_aware)
591{
592 return 0;
593}
594
/* !CONFIG_MEMCG_KMEM: nothing was set up, so nothing to tear down. */
static void memcg_destroy_list_lru(struct list_lru *lru)
{
}
Kirill Tkhai84c07d12018-08-17 15:47:25 -0700598#endif /* CONFIG_MEMCG_KMEM */
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800599
600int __list_lru_init(struct list_lru *lru, bool memcg_aware,
Kirill Tkhaic92e8e12018-08-17 15:47:50 -0700601 struct lock_class_key *key, struct shrinker *shrinker)
Dave Chinnera38e4082013-08-28 10:17:58 +1000602{
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000603 int i;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800604 int err = -ENOMEM;
605
Kirill Tkhaic92e8e12018-08-17 15:47:50 -0700606#ifdef CONFIG_MEMCG_KMEM
607 if (shrinker)
608 lru->shrinker_id = shrinker->id;
609 else
610 lru->shrinker_id = -1;
611#endif
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800612 memcg_get_cache_ids();
Glauber Costa5ca302c2013-08-28 10:18:18 +1000613
Alexey Dobriyanb9726c22019-03-05 15:48:26 -0800614 lru->node = kcalloc(nr_node_ids, sizeof(*lru->node), GFP_KERNEL);
Glauber Costa5ca302c2013-08-28 10:18:18 +1000615 if (!lru->node)
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800616 goto out;
Dave Chinnera38e4082013-08-28 10:17:58 +1000617
Raghavendra K T145949a2015-11-05 18:46:26 -0800618 for_each_node(i) {
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000619 spin_lock_init(&lru->node[i].lock);
Johannes Weiner449dd692014-04-03 14:47:56 -0700620 if (key)
621 lockdep_set_class(&lru->node[i].lock, key);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800622 init_one_lru(&lru->node[i].lru);
Dave Chinner3b1d58a2013-08-28 10:18:00 +1000623 }
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800624
625 err = memcg_init_list_lru(lru, memcg_aware);
626 if (err) {
627 kfree(lru->node);
Alexander Polakov1bc11d72016-10-27 17:46:27 -0700628 /* Do this so a list_lru_destroy() doesn't crash: */
629 lru->node = NULL;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800630 goto out;
631 }
632
Vladimir Davydovc0a5b5602015-02-12 14:59:07 -0800633 list_lru_register(lru);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800634out:
635 memcg_put_cache_ids();
636 return err;
Dave Chinnera38e4082013-08-28 10:17:58 +1000637}
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800638EXPORT_SYMBOL_GPL(__list_lru_init);
Glauber Costa5ca302c2013-08-28 10:18:18 +1000639
640void list_lru_destroy(struct list_lru *lru)
641{
Vladimir Davydovc0a5b5602015-02-12 14:59:07 -0800642 /* Already destroyed or not yet initialized? */
643 if (!lru->node)
644 return;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800645
646 memcg_get_cache_ids();
647
Vladimir Davydovc0a5b5602015-02-12 14:59:07 -0800648 list_lru_unregister(lru);
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800649
650 memcg_destroy_list_lru(lru);
Glauber Costa5ca302c2013-08-28 10:18:18 +1000651 kfree(lru->node);
Vladimir Davydovc0a5b5602015-02-12 14:59:07 -0800652 lru->node = NULL;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800653
Kirill Tkhaic92e8e12018-08-17 15:47:50 -0700654#ifdef CONFIG_MEMCG_KMEM
655 lru->shrinker_id = -1;
656#endif
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800657 memcg_put_cache_ids();
Glauber Costa5ca302c2013-08-28 10:18:18 +1000658}
659EXPORT_SYMBOL_GPL(list_lru_destroy);