Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 1 | /* drivers/misc/lowmemorykiller.c |
| 2 | * |
| 3 | * The lowmemorykiller driver lets user-space specify a set of memory thresholds |
David Rientjes | 940f77b | 2012-02-13 19:28:49 -0800 | [diff] [blame] | 4 | * where processes with a range of oom_score_adj values will get killed. Specify |
| 5 | * the minimum oom_score_adj values in |
| 6 | * /sys/module/lowmemorykiller/parameters/adj and the number of free pages in |
| 7 | * /sys/module/lowmemorykiller/parameters/minfree. Both files take a comma |
| 8 | * separated list of numbers in ascending order. |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 9 | * |
| 10 | * For example, write "0,8" to /sys/module/lowmemorykiller/parameters/adj and |
Marco Navarra | 3bf5d65 | 2011-12-22 13:28:23 +0100 | [diff] [blame] | 11 | * "1024,4096" to /sys/module/lowmemorykiller/parameters/minfree to kill |
David Rientjes | 940f77b | 2012-02-13 19:28:49 -0800 | [diff] [blame] | 12 | * processes with an oom_score_adj value of 8 or higher when the free memory |
| 13 | * drops below 4096 pages and kill processes with an oom_score_adj value of 0 or |
| 14 | * higher when the free memory drops below 1024 pages. |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 15 | * |
| 16 | * The driver considers memory used for caches to be free, but if a large |
| 17 | * percentage of the cached memory is locked this can be very inaccurate |
| 18 | * and processes may not get killed until the normal oom killer is triggered. |
| 19 | * |
| 20 | * Copyright (C) 2007-2008 Google, Inc. |
| 21 | * |
| 22 | * This software is licensed under the terms of the GNU General Public |
| 23 | * License version 2, as published by the Free Software Foundation, and |
| 24 | * may be copied, distributed, and modified under those terms. |
| 25 | * |
| 26 | * This program is distributed in the hope that it will be useful, |
| 27 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 28 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 29 | * GNU General Public License for more details. |
| 30 | * |
| 31 | */ |
| 32 | |
Dmitry Voytik | 6b83f91 | 2013-03-16 11:37:26 +0400 | [diff] [blame] | 33 | #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt |
| 34 | |
Paul Gortmaker | 380b654 | 2015-10-11 15:47:32 -0400 | [diff] [blame] | 35 | #include <linux/init.h> |
| 36 | #include <linux/moduleparam.h> |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 37 | #include <linux/kernel.h> |
| 38 | #include <linux/mm.h> |
| 39 | #include <linux/oom.h> |
| 40 | #include <linux/sched.h> |
Arve Hjønnevåg | eeb0f4f | 2013-02-26 22:07:35 -0800 | [diff] [blame] | 41 | #include <linux/swap.h> |
Anton Vorontsov | 294b271 | 2012-02-06 20:29:41 +0400 | [diff] [blame] | 42 | #include <linux/rcupdate.h> |
San Mehat | 4755b72 | 2010-05-05 11:38:42 -0700 | [diff] [blame] | 43 | #include <linux/profile.h> |
| 44 | #include <linux/notifier.h> |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 45 | |
Ioana Ciornei | 36f16ff | 2015-11-01 16:38:21 +0200 | [diff] [blame] | 46 | static u32 lowmem_debug_level = 1; |
David Rientjes | a9c58b90 | 2012-12-11 16:02:54 -0800 | [diff] [blame] | 47 | static short lowmem_adj[6] = { |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 48 | 0, |
| 49 | 1, |
| 50 | 6, |
| 51 | 12, |
| 52 | }; |
Sandeep Jain | b33061f | 2016-02-29 18:48:30 +0530 | [diff] [blame] | 53 | |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 54 | static int lowmem_adj_size = 4; |
Greg Kroah-Hartman | 624b225 | 2012-03-07 13:21:23 -0800 | [diff] [blame] | 55 | static int lowmem_minfree[6] = { |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 56 | 3 * 512, /* 6MB */ |
| 57 | 2 * 1024, /* 8MB */ |
| 58 | 4 * 1024, /* 16MB */ |
| 59 | 16 * 1024, /* 64MB */ |
| 60 | }; |
Sandeep Jain | b33061f | 2016-02-29 18:48:30 +0530 | [diff] [blame] | 61 | |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 62 | static int lowmem_minfree_size = 4; |
| 63 | |
Arve Hjønnevåg | e5d7965 | 2012-01-13 22:21:25 +0400 | [diff] [blame] | 64 | static unsigned long lowmem_deathpending_timeout; |
San Mehat | 4755b72 | 2010-05-05 11:38:42 -0700 | [diff] [blame] | 65 | |
/*
 * Emit a pr_info() message only when lowmem_debug_level is at least @level.
 * @fmt and the trailing arguments are passed to pr_info() unchanged.
 */
#define lowmem_print(level, fmt, ...)				\
	do {							\
		if ((level) <= lowmem_debug_level)		\
			pr_info(fmt, ##__VA_ARGS__);		\
	} while (0)
| 71 | |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 72 | static unsigned long lowmem_count(struct shrinker *s, |
| 73 | struct shrink_control *sc) |
| 74 | { |
Mel Gorman | 599d0c9 | 2016-07-28 15:45:31 -0700 | [diff] [blame] | 75 | return global_node_page_state(NR_ACTIVE_ANON) + |
| 76 | global_node_page_state(NR_ACTIVE_FILE) + |
| 77 | global_node_page_state(NR_INACTIVE_ANON) + |
| 78 | global_node_page_state(NR_INACTIVE_FILE); |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 79 | } |
| 80 | |
| 81 | static unsigned long lowmem_scan(struct shrinker *s, struct shrink_control *sc) |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 82 | { |
Anton Vorontsov | 9567000 | 2012-02-06 20:29:47 +0400 | [diff] [blame] | 83 | struct task_struct *tsk; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 84 | struct task_struct *selected = NULL; |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 85 | unsigned long rem = 0; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 86 | int tasksize; |
| 87 | int i; |
David Rientjes | a9c58b90 | 2012-12-11 16:02:54 -0800 | [diff] [blame] | 88 | short min_score_adj = OOM_SCORE_ADJ_MAX + 1; |
Colin Cross | cc635da | 2016-01-29 22:07:33 -0800 | [diff] [blame] | 89 | int minfree = 0; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 90 | int selected_tasksize = 0; |
David Rientjes | a9c58b90 | 2012-12-11 16:02:54 -0800 | [diff] [blame] | 91 | short selected_oom_score_adj; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 92 | int array_size = ARRAY_SIZE(lowmem_adj); |
Arve Hjønnevåg | eeb0f4f | 2013-02-26 22:07:35 -0800 | [diff] [blame] | 93 | int other_free = global_page_state(NR_FREE_PAGES) - totalreserve_pages; |
Mel Gorman | 11fb998 | 2016-07-28 15:46:20 -0700 | [diff] [blame] | 94 | int other_file = global_node_page_state(NR_FILE_PAGES) - |
Anson Jacob | 9924e5d | 2016-08-25 11:10:25 -0400 | [diff] [blame] | 95 | global_node_page_state(NR_SHMEM) - |
| 96 | total_swapcache_pages(); |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 97 | |
| 98 | if (lowmem_adj_size < array_size) |
| 99 | array_size = lowmem_adj_size; |
| 100 | if (lowmem_minfree_size < array_size) |
| 101 | array_size = lowmem_minfree_size; |
| 102 | for (i = 0; i < array_size; i++) { |
Colin Cross | cc635da | 2016-01-29 22:07:33 -0800 | [diff] [blame] | 103 | minfree = lowmem_minfree[i]; |
| 104 | if (other_free < minfree && other_file < minfree) { |
David Rientjes | 940f77b | 2012-02-13 19:28:49 -0800 | [diff] [blame] | 105 | min_score_adj = lowmem_adj[i]; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 106 | break; |
| 107 | } |
| 108 | } |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 109 | |
| 110 | lowmem_print(3, "lowmem_scan %lu, %x, ofree %d %d, ma %hd\n", |
Ioana Ciornei | f8b053e | 2015-11-01 16:38:22 +0200 | [diff] [blame] | 111 | sc->nr_to_scan, sc->gfp_mask, other_free, |
| 112 | other_file, min_score_adj); |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 113 | |
| 114 | if (min_score_adj == OOM_SCORE_ADJ_MAX + 1) { |
| 115 | lowmem_print(5, "lowmem_scan %lu, %x, return 0\n", |
| 116 | sc->nr_to_scan, sc->gfp_mask); |
| 117 | return 0; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 118 | } |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 119 | |
David Rientjes | 940f77b | 2012-02-13 19:28:49 -0800 | [diff] [blame] | 120 | selected_oom_score_adj = min_score_adj; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 121 | |
Anton Vorontsov | 294b271 | 2012-02-06 20:29:41 +0400 | [diff] [blame] | 122 | rcu_read_lock(); |
Anton Vorontsov | 9567000 | 2012-02-06 20:29:47 +0400 | [diff] [blame] | 123 | for_each_process(tsk) { |
| 124 | struct task_struct *p; |
David Rientjes | a9c58b90 | 2012-12-11 16:02:54 -0800 | [diff] [blame] | 125 | short oom_score_adj; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 126 | |
Anton Vorontsov | 9823ec9 | 2012-02-06 20:30:01 +0400 | [diff] [blame] | 127 | if (tsk->flags & PF_KTHREAD) |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 128 | continue; |
Anton Vorontsov | 9823ec9 | 2012-02-06 20:30:01 +0400 | [diff] [blame] | 129 | |
Anton Vorontsov | 9567000 | 2012-02-06 20:29:47 +0400 | [diff] [blame] | 130 | p = find_lock_task_mm(tsk); |
| 131 | if (!p) |
| 132 | continue; |
| 133 | |
Dan Carpenter | ae25d43 | 2016-04-08 16:02:35 +0300 | [diff] [blame] | 134 | if (task_lmk_waiting(p) && |
David Rientjes | 83dbbdb | 2012-04-09 16:56:18 -0700 | [diff] [blame] | 135 | time_before_eq(jiffies, lowmem_deathpending_timeout)) { |
| 136 | task_unlock(p); |
| 137 | rcu_read_unlock(); |
| 138 | return 0; |
| 139 | } |
David Rientjes | 940f77b | 2012-02-13 19:28:49 -0800 | [diff] [blame] | 140 | oom_score_adj = p->signal->oom_score_adj; |
| 141 | if (oom_score_adj < min_score_adj) { |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 142 | task_unlock(p); |
| 143 | continue; |
| 144 | } |
Anton Vorontsov | 9567000 | 2012-02-06 20:29:47 +0400 | [diff] [blame] | 145 | tasksize = get_mm_rss(p->mm); |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 146 | task_unlock(p); |
| 147 | if (tasksize <= 0) |
| 148 | continue; |
| 149 | if (selected) { |
David Rientjes | 940f77b | 2012-02-13 19:28:49 -0800 | [diff] [blame] | 150 | if (oom_score_adj < selected_oom_score_adj) |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 151 | continue; |
David Rientjes | 940f77b | 2012-02-13 19:28:49 -0800 | [diff] [blame] | 152 | if (oom_score_adj == selected_oom_score_adj && |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 153 | tasksize <= selected_tasksize) |
| 154 | continue; |
| 155 | } |
| 156 | selected = p; |
| 157 | selected_tasksize = tasksize; |
David Rientjes | 940f77b | 2012-02-13 19:28:49 -0800 | [diff] [blame] | 158 | selected_oom_score_adj = oom_score_adj; |
Colin Cross | cc635da | 2016-01-29 22:07:33 -0800 | [diff] [blame] | 159 | lowmem_print(2, "select '%s' (%d), adj %hd, size %d, to kill\n", |
| 160 | p->comm, p->pid, oom_score_adj, tasksize); |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 161 | } |
| 162 | if (selected) { |
David Rientjes | e1099a6 | 2015-04-28 15:50:46 -0700 | [diff] [blame] | 163 | task_lock(selected); |
Tetsuo Handa | 3a81fc2 | 2015-09-06 14:25:35 +0900 | [diff] [blame] | 164 | send_sig(SIGKILL, selected, 0); |
Tetsuo Handa | 3a81fc2 | 2015-09-06 14:25:35 +0900 | [diff] [blame] | 165 | if (selected->mm) |
Tetsuo Handa | 77ed2c5 | 2016-03-08 20:01:32 +0900 | [diff] [blame] | 166 | task_set_lmk_waiting(selected); |
David Rientjes | e1099a6 | 2015-04-28 15:50:46 -0700 | [diff] [blame] | 167 | task_unlock(selected); |
Colin Cross | cc635da | 2016-01-29 22:07:33 -0800 | [diff] [blame] | 168 | lowmem_print(1, "Killing '%s' (%d), adj %hd,\n" |
| 169 | " to free %ldkB on behalf of '%s' (%d) because\n" |
| 170 | " cache %ldkB is below limit %ldkB for oom_score_adj %hd\n" |
| 171 | " Free memory is %ldkB above reserved\n", |
| 172 | selected->comm, selected->pid, |
| 173 | selected_oom_score_adj, |
| 174 | selected_tasksize * (long)(PAGE_SIZE / 1024), |
| 175 | current->comm, current->pid, |
| 176 | other_file * (long)(PAGE_SIZE / 1024), |
| 177 | minfree * (long)(PAGE_SIZE / 1024), |
| 178 | min_score_adj, |
| 179 | other_free * (long)(PAGE_SIZE / 1024)); |
David Rientjes | e1099a6 | 2015-04-28 15:50:46 -0700 | [diff] [blame] | 180 | lowmem_deathpending_timeout = jiffies + HZ; |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 181 | rem += selected_tasksize; |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 182 | } |
Tetsuo Handa | 3a81fc2 | 2015-09-06 14:25:35 +0900 | [diff] [blame] | 183 | |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 184 | lowmem_print(4, "lowmem_scan %lu, %x, return %lu\n", |
Colin Cross | cae9bf1 | 2011-06-22 16:05:47 -0700 | [diff] [blame] | 185 | sc->nr_to_scan, sc->gfp_mask, rem); |
Anton Vorontsov | 294b271 | 2012-02-06 20:29:41 +0400 | [diff] [blame] | 186 | rcu_read_unlock(); |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 187 | return rem; |
| 188 | } |
| 189 | |
| 190 | static struct shrinker lowmem_shrinker = { |
Dave Chinner | 7dc19d5 | 2013-08-28 10:18:11 +1000 | [diff] [blame] | 191 | .scan_objects = lowmem_scan, |
| 192 | .count_objects = lowmem_count, |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 193 | .seeks = DEFAULT_SEEKS * 16 |
| 194 | }; |
| 195 | |
| 196 | static int __init lowmem_init(void) |
| 197 | { |
| 198 | register_shrinker(&lowmem_shrinker); |
| 199 | return 0; |
| 200 | } |
Paul Gortmaker | 380b654 | 2015-10-11 15:47:32 -0400 | [diff] [blame] | 201 | device_initcall(lowmem_init); |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 202 | |
Paul Gortmaker | 380b654 | 2015-10-11 15:47:32 -0400 | [diff] [blame] | 203 | /* |
| 204 | * not really modular, but the easiest way to keep compat with existing |
| 205 | * bootargs behaviour is to continue using module_param here. |
| 206 | */ |
Eric Salem | 8abcae4 | 2016-09-25 22:33:34 -0500 | [diff] [blame] | 207 | module_param_named(cost, lowmem_shrinker.seeks, int, 0644); |
| 208 | module_param_array_named(adj, lowmem_adj, short, &lowmem_adj_size, 0644); |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 209 | module_param_array_named(minfree, lowmem_minfree, uint, &lowmem_minfree_size, |
Eric Salem | 8abcae4 | 2016-09-25 22:33:34 -0500 | [diff] [blame] | 210 | 0644); |
| 211 | module_param_named(debug_level, lowmem_debug_level, uint, 0644); |
Greg Kroah-Hartman | 355b050 | 2011-11-30 20:18:14 +0900 | [diff] [blame] | 212 | |