blob: 305b598abac2a75a76bac26b4d081a18f88af36c [file] [log] [blame]
/*
 * Copyright (c) 2013 Red Hat, Inc. and Parallels Inc. All rights reserved.
 * Authors: David Chinner and Glauber Costa
 *
 * Generic LRU infrastructure
 */
7#ifndef _LRU_LIST_H
8#define _LRU_LIST_H
9
10#include <linux/list.h>
Dave Chinner3b1d58a2013-08-28 10:18:00 +100011#include <linux/nodemask.h>
Vladimir Davydov503c3582015-02-12 14:58:47 -080012#include <linux/shrinker.h>
Dave Chinnera38e4082013-08-28 10:17:58 +100013
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080014struct mem_cgroup;
15
/*
 * Verdict a list_lru_walk_cb callback hands back for the item it was given.
 * The callback has to always return one of these values.
 */
enum lru_status {
	LRU_REMOVED,		/* item removed from list */
	LRU_REMOVED_RETRY,	/* item removed, but lock has been
				   dropped and reacquired */
	LRU_ROTATE,		/* item referenced, give another pass */
	LRU_SKIP,		/* item cannot be locked, skip */
	LRU_RETRY,		/* item not freeable. May drop the lock
				   internally, but has to return locked. */
};
26
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080027struct list_lru_one {
Dave Chinnera38e4082013-08-28 10:17:58 +100028 struct list_head list;
29 /* kept as signed so we can catch imbalance bugs */
30 long nr_items;
Vladimir Davydov60d3fd32015-02-12 14:59:10 -080031};
32
/* Table of per cgroup LRU lists. */
struct list_lru_memcg {
	/*
	 * array of per cgroup lists, indexed by memcg_cache_id
	 *
	 * Declared as a zero-length array (GNU C extension) and not as a C99
	 * flexible array member: ISO C does not allow a flexible array member
	 * in a structure that has no other named member.
	 */
	struct list_lru_one	*lru[0];
};
37
38struct list_lru_node {
39 /* protects all lists on the node, including per cgroup */
40 spinlock_t lock;
41 /* global list, used for the root cgroup in cgroup aware lrus */
42 struct list_lru_one lru;
43#ifdef CONFIG_MEMCG_KMEM
44 /* for cgroup aware lrus points to per cgroup lists, otherwise NULL */
45 struct list_lru_memcg *memcg_lrus;
46#endif
Dave Chinner3b1d58a2013-08-28 10:18:00 +100047} ____cacheline_aligned_in_smp;
48
/* Handle that every list_lru_*() function in this header operates on. */
struct list_lru {
	/*
	 * Per node state.
	 * NOTE(review): presumably an array indexed by node id, since the API
	 * selects lists by @nid - confirm against the implementation.
	 */
	struct list_lru_node	*node;
#ifdef CONFIG_MEMCG_KMEM
	/*
	 * NOTE(review): presumably links this lru into a list of all lrus so
	 * that memcg_update_all_list_lrus() can find it - confirm against the
	 * implementation.
	 */
	struct list_head	list;
#endif
};
55
/*
 * Tear down @lru.
 * NOTE(review): presumably releases what __list_lru_init() set up - confirm
 * against the definition.
 */
void list_lru_destroy(struct list_lru *lru);

/*
 * Set up @lru.  Usually reached through the list_lru_init*() wrapper macros.
 * @lru: the lru to initialise
 * @memcg_aware: whether the lru should be cgroup aware
 * @key: lock class key, or NULL
 *
 * NOTE(review): the int return is presumably 0 on success and a negative
 * errno on failure - confirm against the definition.
 */
int __list_lru_init(struct list_lru *lru, bool memcg_aware,
		    struct lock_class_key *key);
59
/*
 * Convenience wrappers around __list_lru_init():
 *   list_lru_init()       - not memcg aware, no lock class key
 *   list_lru_init_key()   - not memcg aware, caller supplied lock class key
 *   list_lru_init_memcg() - memcg aware, no lock class key
 */
#define list_lru_init(lru)		__list_lru_init((lru), false, NULL)
#define list_lru_init_key(lru, key)	__list_lru_init((lru), false, (key))
#define list_lru_init_memcg(lru)	__list_lru_init((lru), true, NULL)
63
/*
 * NOTE(review): presumably resizes the per cgroup list arrays of every
 * cgroup aware lru so they can hold @num_memcgs entries, returning 0 or a
 * negative errno - confirm against the definition.
 */
int memcg_update_all_list_lrus(int num_memcgs);
Dave Chinnera38e4082013-08-28 10:17:58 +100065
/**
 * list_lru_add: add an element to the lru list's tail
 * @lru: the lru pointer
 * @item: the item to be added.
 *
 * If the element is already part of a list, this function returns doing
 * nothing. Therefore the caller does not need to keep state about whether or
 * not the element already belongs in the list and is allowed to lazy update
 * it. Note however that this is valid for *a* list, not *this* list. If
 * the caller organizes itself in a way that elements can be in more than
 * one type of list, it is up to the caller to fully remove the item from
 * the previous list (with list_lru_del() for instance) before moving it
 * to @lru.
 *
 * Return value: true if the list was updated, false otherwise
 */
bool list_lru_add(struct list_lru *lru, struct list_head *item);
83
/**
 * list_lru_del: delete an element from the lru list
 * @lru: the lru pointer
 * @item: the item to be deleted.
 *
 * This function works analogously to list_lru_add() in terms of list
 * manipulation. The comments about an element already pertaining to
 * a list are also valid for list_lru_del().
 *
 * Return value: true if the list was updated, false otherwise
 */
bool list_lru_del(struct list_lru *lru, struct list_head *item);
96
/**
 * list_lru_count_one: return the number of objects currently held by @lru
 * @lru: the lru pointer.
 * @nid: the node id to count from.
 * @memcg: the cgroup to count from.
 *
 * Always return a non-negative number, 0 for empty lists. There is no
 * guarantee that the list is not updated while the count is being computed.
 * Callers that want such a guarantee need to provide an outer lock.
 */
unsigned long list_lru_count_one(struct list_lru *lru,
				 int nid, struct mem_cgroup *memcg);

/*
 * Variant of the above that takes only a node id.
 * NOTE(review): presumably the count for the whole node regardless of
 * cgroup - confirm against the definition.
 */
unsigned long list_lru_count_node(struct list_lru *lru, int nid);
Vladimir Davydov503c3582015-02-12 14:58:47 -0800110
111static inline unsigned long list_lru_shrink_count(struct list_lru *lru,
112 struct shrink_control *sc)
113{
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800114 return list_lru_count_one(lru, sc->nid, sc->memcg);
Vladimir Davydov503c3582015-02-12 14:58:47 -0800115}
116
Glauber Costa6a4f4962013-08-28 10:18:02 +1000117static inline unsigned long list_lru_count(struct list_lru *lru)
118{
119 long count = 0;
120 int nid;
121
Vladimir Davydovff0b67e2015-02-12 14:59:04 -0800122 for_each_node_state(nid, N_NORMAL_MEMORY)
Glauber Costa6a4f4962013-08-28 10:18:02 +1000123 count += list_lru_count_node(lru, nid);
124
125 return count;
126}
Dave Chinnera38e4082013-08-28 10:17:58 +1000127
128typedef enum lru_status
129(*list_lru_walk_cb)(struct list_head *item, spinlock_t *lock, void *cb_arg);
130/**
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800131 * list_lru_walk_one: walk a list_lru, isolating and disposing freeable items.
Dave Chinnera38e4082013-08-28 10:17:58 +1000132 * @lru: the lru pointer.
Glauber Costa6a4f4962013-08-28 10:18:02 +1000133 * @nid: the node id to scan from.
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800134 * @memcg: the cgroup to scan from.
Dave Chinnera38e4082013-08-28 10:17:58 +1000135 * @isolate: callback function that is resposible for deciding what to do with
136 * the item currently being scanned
137 * @cb_arg: opaque type that will be passed to @isolate
138 * @nr_to_walk: how many items to scan.
139 *
140 * This function will scan all elements in a particular list_lru, calling the
141 * @isolate callback for each of those items, along with the current list
142 * spinlock and a caller-provided opaque. The @isolate callback can choose to
143 * drop the lock internally, but *must* return with the lock held. The callback
144 * will return an enum lru_status telling the list_lru infrastructure what to
145 * do with the object being scanned.
146 *
147 * Please note that nr_to_walk does not mean how many objects will be freed,
148 * just how many objects will be scanned.
149 *
150 * Return value: the number of objects effectively removed from the LRU.
151 */
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800152unsigned long list_lru_walk_one(struct list_lru *lru,
153 int nid, struct mem_cgroup *memcg,
154 list_lru_walk_cb isolate, void *cb_arg,
155 unsigned long *nr_to_walk);
Glauber Costa6a4f4962013-08-28 10:18:02 +1000156unsigned long list_lru_walk_node(struct list_lru *lru, int nid,
157 list_lru_walk_cb isolate, void *cb_arg,
158 unsigned long *nr_to_walk);
159
160static inline unsigned long
Vladimir Davydov503c3582015-02-12 14:58:47 -0800161list_lru_shrink_walk(struct list_lru *lru, struct shrink_control *sc,
162 list_lru_walk_cb isolate, void *cb_arg)
163{
Vladimir Davydov60d3fd32015-02-12 14:59:10 -0800164 return list_lru_walk_one(lru, sc->nid, sc->memcg, isolate, cb_arg,
165 &sc->nr_to_scan);
Vladimir Davydov503c3582015-02-12 14:58:47 -0800166}
167
168static inline unsigned long
Glauber Costa6a4f4962013-08-28 10:18:02 +1000169list_lru_walk(struct list_lru *lru, list_lru_walk_cb isolate,
170 void *cb_arg, unsigned long nr_to_walk)
171{
172 long isolated = 0;
173 int nid;
174
Vladimir Davydovff0b67e2015-02-12 14:59:04 -0800175 for_each_node_state(nid, N_NORMAL_MEMORY) {
Glauber Costa6a4f4962013-08-28 10:18:02 +1000176 isolated += list_lru_walk_node(lru, nid, isolate,
177 cb_arg, &nr_to_walk);
178 if (nr_to_walk <= 0)
179 break;
180 }
181 return isolated;
182}
Dave Chinnera38e4082013-08-28 10:17:58 +1000183#endif /* _LRU_LIST_H */