1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
34
35#include <linux/init.h>
36#include <linux/moduleparam.h>
37#include <linux/kernel.h>
38#include <linux/mm.h>
39#include <linux/oom.h>
40#include <linux/sched.h>
41#include <linux/swap.h>
42#include <linux/rcupdate.h>
43#include <linux/profile.h>
44#include <linux/notifier.h>
45
46static u32 lowmem_debug_level = 1;
47static short lowmem_adj[6] = {
48 0,
49 1,
50 6,
51 12,
52};
53
54static int lowmem_adj_size = 4;
55static int lowmem_minfree[6] = {
56 3 * 512,
57 2 * 1024,
58 4 * 1024,
59 16 * 1024,
60};
61
62static int lowmem_minfree_size = 4;
63
64static unsigned long lowmem_deathpending_timeout;
65
/*
 * Log through pr_info(), but only when the message's @level does not exceed
 * the current lowmem_debug_level.
 */
#define lowmem_print(level, fmt, ...)				\
	do {							\
		if ((level) <= lowmem_debug_level)		\
			pr_info(fmt, ##__VA_ARGS__);		\
	} while (0)
71
72static unsigned long lowmem_count(struct shrinker *s,
73 struct shrink_control *sc)
74{
75 return global_page_state(NR_ACTIVE_ANON) +
76 global_page_state(NR_ACTIVE_FILE) +
77 global_page_state(NR_INACTIVE_ANON) +
78 global_page_state(NR_INACTIVE_FILE);
79}
80
81static unsigned long lowmem_scan(struct shrinker *s, struct shrink_control *sc)
82{
83 struct task_struct *tsk;
84 struct task_struct *selected = NULL;
85 unsigned long rem = 0;
86 int tasksize;
87 int i;
88 short min_score_adj = OOM_SCORE_ADJ_MAX + 1;
89 int minfree = 0;
90 int selected_tasksize = 0;
91 short selected_oom_score_adj;
92 int array_size = ARRAY_SIZE(lowmem_adj);
93 int other_free = global_page_state(NR_FREE_PAGES) - totalreserve_pages;
94 int other_file = global_page_state(NR_FILE_PAGES) -
95 global_page_state(NR_SHMEM) -
96 total_swapcache_pages();
97
98 if (lowmem_adj_size < array_size)
99 array_size = lowmem_adj_size;
100 if (lowmem_minfree_size < array_size)
101 array_size = lowmem_minfree_size;
102 for (i = 0; i < array_size; i++) {
103 minfree = lowmem_minfree[i];
104 if (other_free < minfree && other_file < minfree) {
105 min_score_adj = lowmem_adj[i];
106 break;
107 }
108 }
109
110 lowmem_print(3, "lowmem_scan %lu, %x, ofree %d %d, ma %hd\n",
111 sc->nr_to_scan, sc->gfp_mask, other_free,
112 other_file, min_score_adj);
113
114 if (min_score_adj == OOM_SCORE_ADJ_MAX + 1) {
115 lowmem_print(5, "lowmem_scan %lu, %x, return 0\n",
116 sc->nr_to_scan, sc->gfp_mask);
117 return 0;
118 }
119
120 selected_oom_score_adj = min_score_adj;
121
122 rcu_read_lock();
123 for_each_process(tsk) {
124 struct task_struct *p;
125 short oom_score_adj;
126
127 if (tsk->flags & PF_KTHREAD)
128 continue;
129
130 p = find_lock_task_mm(tsk);
131 if (!p)
132 continue;
133
134 if (test_tsk_thread_flag(p, TIF_MEMDIE) &&
135 time_before_eq(jiffies, lowmem_deathpending_timeout)) {
136 task_unlock(p);
137 rcu_read_unlock();
138 return 0;
139 }
140 oom_score_adj = p->signal->oom_score_adj;
141 if (oom_score_adj < min_score_adj) {
142 task_unlock(p);
143 continue;
144 }
145 tasksize = get_mm_rss(p->mm);
146 task_unlock(p);
147 if (tasksize <= 0)
148 continue;
149 if (selected) {
150 if (oom_score_adj < selected_oom_score_adj)
151 continue;
152 if (oom_score_adj == selected_oom_score_adj &&
153 tasksize <= selected_tasksize)
154 continue;
155 }
156 selected = p;
157 selected_tasksize = tasksize;
158 selected_oom_score_adj = oom_score_adj;
159 lowmem_print(2, "select '%s' (%d), adj %hd, size %d, to kill\n",
160 p->comm, p->pid, oom_score_adj, tasksize);
161 }
162 if (selected) {
163 task_lock(selected);
164 send_sig(SIGKILL, selected, 0);
165
166
167
168
169
170 if (selected->mm)
171 mark_oom_victim(selected);
172 task_unlock(selected);
173 lowmem_print(1, "Killing '%s' (%d), adj %hd,\n"
174 " to free %ldkB on behalf of '%s' (%d) because\n"
175 " cache %ldkB is below limit %ldkB for oom_score_adj %hd\n"
176 " Free memory is %ldkB above reserved\n",
177 selected->comm, selected->pid,
178 selected_oom_score_adj,
179 selected_tasksize * (long)(PAGE_SIZE / 1024),
180 current->comm, current->pid,
181 other_file * (long)(PAGE_SIZE / 1024),
182 minfree * (long)(PAGE_SIZE / 1024),
183 min_score_adj,
184 other_free * (long)(PAGE_SIZE / 1024));
185 lowmem_deathpending_timeout = jiffies + HZ;
186 rem += selected_tasksize;
187 }
188
189 lowmem_print(4, "lowmem_scan %lu, %x, return %lu\n",
190 sc->nr_to_scan, sc->gfp_mask, rem);
191 rcu_read_unlock();
192 return rem;
193}
194
195static struct shrinker lowmem_shrinker = {
196 .scan_objects = lowmem_scan,
197 .count_objects = lowmem_count,
198 .seeks = DEFAULT_SEEKS * 16
199};
200
201static int __init lowmem_init(void)
202{
203 register_shrinker(&lowmem_shrinker);
204 return 0;
205}
206device_initcall(lowmem_init);
207
208
209
210
211
212module_param_named(cost, lowmem_shrinker.seeks, int, S_IRUGO | S_IWUSR);
213module_param_array_named(adj, lowmem_adj, short, &lowmem_adj_size,
214 S_IRUGO | S_IWUSR);
215module_param_array_named(minfree, lowmem_minfree, uint, &lowmem_minfree_size,
216 S_IRUGO | S_IWUSR);
217module_param_named(debug_level, lowmem_debug_level, uint, S_IRUGO | S_IWUSR);
218
219