/* lowmemorykiller.c revision 294b27119f2e20643e71a0c1a1b511320a11e4c3 */
1/* drivers/misc/lowmemorykiller.c 2 * 3 * The lowmemorykiller driver lets user-space specify a set of memory thresholds 4 * where processes with a range of oom_adj values will get killed. Specify the 5 * minimum oom_adj values in /sys/module/lowmemorykiller/parameters/adj and the 6 * number of free pages in /sys/module/lowmemorykiller/parameters/minfree. Both 7 * files take a comma separated list of numbers in ascending order. 8 * 9 * For example, write "0,8" to /sys/module/lowmemorykiller/parameters/adj and 10 * "1024,4096" to /sys/module/lowmemorykiller/parameters/minfree to kill 11 * processes with a oom_adj value of 8 or higher when the free memory drops 12 * below 4096 pages and kill processes with a oom_adj value of 0 or higher 13 * when the free memory drops below 1024 pages. 14 * 15 * The driver considers memory used for caches to be free, but if a large 16 * percentage of the cached memory is locked this can be very inaccurate 17 * and processes may not get killed until the normal oom killer is triggered. 18 * 19 * Copyright (C) 2007-2008 Google, Inc. 20 * 21 * This software is licensed under the terms of the GNU General Public 22 * License version 2, as published by the Free Software Foundation, and 23 * may be copied, distributed, and modified under those terms. 24 * 25 * This program is distributed in the hope that it will be useful, 26 * but WITHOUT ANY WARRANTY; without even the implied warranty of 27 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 28 * GNU General Public License for more details. 
29 * 30 */ 31 32#include <linux/module.h> 33#include <linux/kernel.h> 34#include <linux/mm.h> 35#include <linux/oom.h> 36#include <linux/sched.h> 37#include <linux/rcupdate.h> 38#include <linux/profile.h> 39#include <linux/notifier.h> 40 41static uint32_t lowmem_debug_level = 2; 42static int lowmem_adj[6] = { 43 0, 44 1, 45 6, 46 12, 47}; 48static int lowmem_adj_size = 4; 49static size_t lowmem_minfree[6] = { 50 3 * 512, /* 6MB */ 51 2 * 1024, /* 8MB */ 52 4 * 1024, /* 16MB */ 53 16 * 1024, /* 64MB */ 54}; 55static int lowmem_minfree_size = 4; 56 57static struct task_struct *lowmem_deathpending; 58 59#define lowmem_print(level, x...) \ 60 do { \ 61 if (lowmem_debug_level >= (level)) \ 62 printk(x); \ 63 } while (0) 64 65static int 66task_notify_func(struct notifier_block *self, unsigned long val, void *data); 67 68static struct notifier_block task_nb = { 69 .notifier_call = task_notify_func, 70}; 71 72static int 73task_notify_func(struct notifier_block *self, unsigned long val, void *data) 74{ 75 struct task_struct *task = data; 76 if (task == lowmem_deathpending) { 77 lowmem_deathpending = NULL; 78 task_handoff_unregister(&task_nb); 79 } 80 return NOTIFY_OK; 81} 82 83static int lowmem_shrink(struct shrinker *s, struct shrink_control *sc) 84{ 85 struct task_struct *p; 86 struct task_struct *selected = NULL; 87 int rem = 0; 88 int tasksize; 89 int i; 90 int min_adj = OOM_ADJUST_MAX + 1; 91 int selected_tasksize = 0; 92 int selected_oom_adj; 93 int array_size = ARRAY_SIZE(lowmem_adj); 94 int other_free = global_page_state(NR_FREE_PAGES); 95 int other_file = global_page_state(NR_FILE_PAGES) - 96 global_page_state(NR_SHMEM); 97 98 /* 99 * If we already have a death outstanding, then 100 * bail out right away; indicating to vmscan 101 * that we have nothing further to offer on 102 * this pass. 103 * 104 * Note: Currently you need CONFIG_PROFILING 105 * for this to work correctly. 
106 */ 107 if (lowmem_deathpending) 108 return 0; 109 110 if (lowmem_adj_size < array_size) 111 array_size = lowmem_adj_size; 112 if (lowmem_minfree_size < array_size) 113 array_size = lowmem_minfree_size; 114 for (i = 0; i < array_size; i++) { 115 if (other_free < lowmem_minfree[i] && 116 other_file < lowmem_minfree[i]) { 117 min_adj = lowmem_adj[i]; 118 break; 119 } 120 } 121 if (sc->nr_to_scan > 0) 122 lowmem_print(3, "lowmem_shrink %lu, %x, ofree %d %d, ma %d\n", 123 sc->nr_to_scan, sc->gfp_mask, other_free, 124 other_file, min_adj); 125 rem = global_page_state(NR_ACTIVE_ANON) + 126 global_page_state(NR_ACTIVE_FILE) + 127 global_page_state(NR_INACTIVE_ANON) + 128 global_page_state(NR_INACTIVE_FILE); 129 if (sc->nr_to_scan <= 0 || min_adj == OOM_ADJUST_MAX + 1) { 130 lowmem_print(5, "lowmem_shrink %lu, %x, return %d\n", 131 sc->nr_to_scan, sc->gfp_mask, rem); 132 return rem; 133 } 134 selected_oom_adj = min_adj; 135 136 rcu_read_lock(); 137 for_each_process(p) { 138 struct mm_struct *mm; 139 struct signal_struct *sig; 140 int oom_adj; 141 142 task_lock(p); 143 mm = p->mm; 144 sig = p->signal; 145 if (!mm || !sig) { 146 task_unlock(p); 147 continue; 148 } 149 oom_adj = sig->oom_adj; 150 if (oom_adj < min_adj) { 151 task_unlock(p); 152 continue; 153 } 154 tasksize = get_mm_rss(mm); 155 task_unlock(p); 156 if (tasksize <= 0) 157 continue; 158 if (selected) { 159 if (oom_adj < selected_oom_adj) 160 continue; 161 if (oom_adj == selected_oom_adj && 162 tasksize <= selected_tasksize) 163 continue; 164 } 165 selected = p; 166 selected_tasksize = tasksize; 167 selected_oom_adj = oom_adj; 168 lowmem_print(2, "select %d (%s), adj %d, size %d, to kill\n", 169 p->pid, p->comm, oom_adj, tasksize); 170 } 171 if (selected) { 172 lowmem_print(1, "send sigkill to %d (%s), adj %d, size %d\n", 173 selected->pid, selected->comm, 174 selected_oom_adj, selected_tasksize); 175 /* 176 * If CONFIG_PROFILING is off, then task_handoff_register() 177 * is a nop. 
In that case we don't want to stall the killer 178 * by setting lowmem_deathpending. 179 */ 180#ifdef CONFIG_PROFILING 181 lowmem_deathpending = selected; 182 task_handoff_register(&task_nb); 183#endif 184 send_sig(SIGKILL, selected, 0); 185 rem -= selected_tasksize; 186 } 187 lowmem_print(4, "lowmem_shrink %lu, %x, return %d\n", 188 sc->nr_to_scan, sc->gfp_mask, rem); 189 rcu_read_unlock(); 190 return rem; 191} 192 193static struct shrinker lowmem_shrinker = { 194 .shrink = lowmem_shrink, 195 .seeks = DEFAULT_SEEKS * 16 196}; 197 198static int __init lowmem_init(void) 199{ 200 register_shrinker(&lowmem_shrinker); 201 return 0; 202} 203 204static void __exit lowmem_exit(void) 205{ 206 unregister_shrinker(&lowmem_shrinker); 207} 208 209module_param_named(cost, lowmem_shrinker.seeks, int, S_IRUGO | S_IWUSR); 210module_param_array_named(adj, lowmem_adj, int, &lowmem_adj_size, 211 S_IRUGO | S_IWUSR); 212module_param_array_named(minfree, lowmem_minfree, uint, &lowmem_minfree_size, 213 S_IRUGO | S_IWUSR); 214module_param_named(debug_level, lowmem_debug_level, uint, S_IRUGO | S_IWUSR); 215 216module_init(lowmem_init); 217module_exit(lowmem_exit); 218 219MODULE_LICENSE("GPL"); 220 221