/* memcontrol.h - Memory Controller
 *
 * Copyright IBM Corporation, 2007
 * Author Balbir Singh <balbir@linux.vnet.ibm.com>
 *
 * Copyright 2007 OpenVZ SWsoft Inc
 * Author: Pavel Emelianov <xemul@openvz.org>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 */

#ifndef _LINUX_MEMCONTROL_H
#define _LINUX_MEMCONTROL_H
#include <linux/cgroup.h>
#include <linux/vm_event_item.h>
#include <linux/hardirq.h>
#include <linux/jump_label.h>
#include <linux/page_counter.h>
#include <linux/vmpressure.h>
#include <linux/eventfd.h>
#include <linux/mmzone.h>
#include <linux/writeback.h>
#include <linux/page-flags.h>

struct mem_cgroup;
struct page;
struct mm_struct;
struct kmem_cache;

/*
 * The corresponding mem_cgroup_stat_names is defined in mm/memcontrol.c,
 * These two lists should keep in accord with each other.
 */
enum mem_cgroup_stat_index {
	/*
	 * For MEM_CONTAINER_TYPE_ALL, usage = pagecache + rss.
	 */
	MEM_CGROUP_STAT_CACHE,		/* # of pages charged as cache */
	MEM_CGROUP_STAT_RSS,		/* # of pages charged as anon rss */
	MEM_CGROUP_STAT_RSS_HUGE,	/* # of pages charged as anon huge */
	MEM_CGROUP_STAT_FILE_MAPPED,	/* # of pages charged as file rss */
	MEM_CGROUP_STAT_DIRTY,		/* # of dirty pages in page cache */
	MEM_CGROUP_STAT_WRITEBACK,	/* # of pages under writeback */
	MEM_CGROUP_STAT_SWAP,		/* # of pages, swapped out */
	MEM_CGROUP_STAT_NSTATS,
	/* default hierarchy stats */
	MEMCG_KERNEL_STACK_KB = MEM_CGROUP_STAT_NSTATS,
	MEMCG_SLAB_RECLAIMABLE,
	MEMCG_SLAB_UNRECLAIMABLE,
	MEMCG_SOCK,
	MEMCG_NR_STAT,
};

struct mem_cgroup_reclaim_cookie {
	pg_data_t *pgdat;
	int priority;
	unsigned int generation;
};

enum mem_cgroup_events_index {
	MEM_CGROUP_EVENTS_PGPGIN,	/* # of pages paged in */
	MEM_CGROUP_EVENTS_PGPGOUT,	/* # of pages paged out */
	MEM_CGROUP_EVENTS_PGFAULT,	/* # of page faults */
	MEM_CGROUP_EVENTS_PGMAJFAULT,	/* # of major page faults */
	MEM_CGROUP_EVENTS_NSTATS,
	/* default hierarchy events */
	MEMCG_LOW = MEM_CGROUP_EVENTS_NSTATS,
	MEMCG_HIGH,
	MEMCG_MAX,
	MEMCG_OOM,
	MEMCG_NR_EVENTS,
};

/*
 * Per memcg event counter is incremented at every pagein/pageout. With THP,
 * it will be incremented by the number of pages. This counter is used for
 * triggering some periodic events. This is straightforward and better
 * than using jiffies etc. to handle periodic memcg events.
 */
enum mem_cgroup_events_target {
	MEM_CGROUP_TARGET_THRESH,
	MEM_CGROUP_TARGET_SOFTLIMIT,
	MEM_CGROUP_TARGET_NUMAINFO,
	MEM_CGROUP_NTARGETS,
};

#ifdef CONFIG_MEMCG

#define MEM_CGROUP_ID_SHIFT	16
#define MEM_CGROUP_ID_MAX	USHRT_MAX

struct mem_cgroup_id {
	int id;
	atomic_t ref;
};

struct mem_cgroup_stat_cpu {
	long count[MEMCG_NR_STAT];
	unsigned long events[MEMCG_NR_EVENTS];
	unsigned long nr_page_events;
	unsigned long targets[MEM_CGROUP_NTARGETS];
};

struct mem_cgroup_reclaim_iter {
	struct mem_cgroup *position;
	/* scan generation, increased every round-trip */
	unsigned int generation;
};

/*
 * per-node information in memory controller.
 */
struct mem_cgroup_per_node {
	struct lruvec		lruvec;
	unsigned long		lru_zone_size[MAX_NR_ZONES][NR_LRU_LISTS];

	struct mem_cgroup_reclaim_iter	iter[DEF_PRIORITY + 1];

	struct rb_node		tree_node;	/* RB tree node */
	unsigned long		usage_in_excess;/* Set to the value by which */
						/* the soft limit is exceeded*/
	bool			on_tree;
	struct mem_cgroup	*memcg;		/* Back pointer, we cannot */
						/* use container_of	   */
};

struct mem_cgroup_threshold {
	struct eventfd_ctx *eventfd;
	unsigned long threshold;
};

/* For threshold */
struct mem_cgroup_threshold_ary {
	/* An array index points to threshold just below or equal to usage. */
	int current_threshold;
	/* Size of entries[] */
	unsigned int size;
	/* Array of thresholds */
	struct mem_cgroup_threshold entries[0];
};

struct mem_cgroup_thresholds {
	/* Primary thresholds array */
	struct mem_cgroup_threshold_ary *primary;
	/*
	 * Spare threshold array.
	 * This is needed to make mem_cgroup_unregister_event() "never fail".
	 * It must be able to store at least primary->size - 1 entries.
	 */
	struct mem_cgroup_threshold_ary *spare;
};

enum memcg_kmem_state {
	KMEM_NONE,
	KMEM_ALLOCATED,
	KMEM_ONLINE,
};

/*
 * The memory controller data structure. The memory controller controls both
 * page cache and RSS per cgroup. We would eventually like to provide
 * statistics based on the statistics developed by Rik van Riel for clock-pro,
 * to help the administrator determine what knobs to tune.
 */
struct mem_cgroup {
	struct cgroup_subsys_state css;

	/* Private memcg ID. Used to ID objects that outlive the cgroup */
	struct mem_cgroup_id id;

	/* Accounted resources */
	struct page_counter memory;
	struct page_counter swap;

	/* Legacy consumer-oriented counters */
	struct page_counter memsw;
	struct page_counter kmem;
	struct page_counter tcpmem;

	/* Normal memory consumption range */
	unsigned long low;
	unsigned long high;

	/* Range enforcement for interrupt charges */
	struct work_struct high_work;

	unsigned long soft_limit;

	/* vmpressure notifications */
	struct vmpressure vmpressure;

	/*
	 * Should the accounting and control be hierarchical, per subtree?
	 */
	bool use_hierarchy;

	/* protected by memcg_oom_lock */
	bool		oom_lock;
	int		under_oom;

	int	swappiness;
	/* OOM-Killer disable */
	int		oom_kill_disable;

	/* handle for "memory.events" */
	struct cgroup_file events_file;

	/* protect arrays of thresholds */
	struct mutex thresholds_lock;

	/* thresholds for memory usage. RCU-protected */
	struct mem_cgroup_thresholds thresholds;

	/* thresholds for mem+swap usage. RCU-protected */
	struct mem_cgroup_thresholds memsw_thresholds;

	/* For oom notifier event fd */
	struct list_head oom_notify;

	/*
	 * Should we move charges of a task when a task is moved into this
	 * mem_cgroup? And what type of charges should we move?
	 */
	unsigned long move_charge_at_immigrate;
	/*
	 * set > 0 if pages under this cgroup are moving to other cgroup.
	 */
	atomic_t		moving_account;
	/* taken only while moving_account > 0 */
	spinlock_t		move_lock;
	struct task_struct	*move_lock_task;
	unsigned long		move_lock_flags;
	/*
	 * percpu counter.
	 */
	struct mem_cgroup_stat_cpu __percpu *stat;

	unsigned long		socket_pressure;

	/* Legacy tcp memory accounting */
	bool			tcpmem_active;
	int			tcpmem_pressure;

#ifndef CONFIG_SLOB
	/* Index in the kmem_cache->memcg_params.memcg_caches array */
	int kmemcg_id;
	enum memcg_kmem_state kmem_state;
#endif

	int last_scanned_node;
#if MAX_NUMNODES > 1
	nodemask_t	scan_nodes;
	atomic_t	numainfo_events;
	atomic_t	numainfo_updating;
#endif

#ifdef CONFIG_CGROUP_WRITEBACK
	struct list_head cgwb_list;
	struct wb_domain cgwb_domain;
#endif

	/* List of events which userspace want to receive */
	struct list_head event_list;
	spinlock_t event_list_lock;

	struct mem_cgroup_per_node *nodeinfo[0];
	/* WARNING: nodeinfo must be the last member here */
};

extern struct mem_cgroup *root_mem_cgroup;

static inline bool mem_cgroup_disabled(void)
{
	return !cgroup_subsys_enabled(memory_cgrp_subsys);
}

/**
 * mem_cgroup_events - count memory events against a cgroup
 * @memcg: the memory cgroup
 * @idx: the event index
 * @nr: the number of events to account for
 */
static inline void mem_cgroup_events(struct mem_cgroup *memcg,
				     enum mem_cgroup_events_index idx,
				     unsigned int nr)
{
	this_cpu_add(memcg->stat->events[idx], nr);
	cgroup_file_notify(&memcg->events_file);
}

bool mem_cgroup_low(struct mem_cgroup *root, struct mem_cgroup *memcg);

int mem_cgroup_try_charge(struct page *page, struct mm_struct *mm,
			  gfp_t gfp_mask, struct mem_cgroup **memcgp,
			  bool compound);
void mem_cgroup_commit_charge(struct page *page, struct mem_cgroup *memcg,
			      bool lrucare, bool compound);
void mem_cgroup_cancel_charge(struct page *page, struct mem_cgroup *memcg,
			      bool compound);
void mem_cgroup_uncharge(struct page *page);
void mem_cgroup_uncharge_list(struct list_head *page_list);

void mem_cgroup_migrate(struct page *oldpage, struct page *newpage);
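
/*
 * Typical charging sequence (a sketch; "installed" and the surrounding
 * steps are illustrative, error handling elided). A page is charged
 * speculatively with mem_cgroup_try_charge(), then the charge is either
 * committed once the page is safely installed, or cancelled on failure:
 *
 *	struct mem_cgroup *memcg;
 *
 *	if (mem_cgroup_try_charge(page, mm, GFP_KERNEL, &memcg, false))
 *		return -ENOMEM;
 *	...install the page into the page cache or page tables...
 *	if (installed)
 *		mem_cgroup_commit_charge(page, memcg, false, false);
 *	else
 *		mem_cgroup_cancel_charge(page, memcg, false);
 */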

static inline struct mem_cgroup_per_node *
mem_cgroup_nodeinfo(struct mem_cgroup *memcg, int nid)
{
	return memcg->nodeinfo[nid];
}

/**
 * mem_cgroup_lruvec - get the lru list vector for a node or a memcg
 * @pgdat: node of the wanted lruvec
 * @memcg: memcg of the wanted lruvec
 *
 * Returns the lru list vector holding pages for a given @pgdat and
 * @memcg. This can be the node lruvec, if the memory controller
 * is disabled.
 */
static inline struct lruvec *mem_cgroup_lruvec(struct pglist_data *pgdat,
					       struct mem_cgroup *memcg)
{
	struct mem_cgroup_per_node *mz;
	struct lruvec *lruvec;

	if (mem_cgroup_disabled()) {
		lruvec = node_lruvec(pgdat);
		goto out;
	}

	mz = mem_cgroup_nodeinfo(memcg, pgdat->node_id);
	lruvec = &mz->lruvec;
out:
	/*
	 * Since a node can be onlined after the mem_cgroup was created,
	 * we have to be prepared to initialize lruvec->pgdat here;
	 * and if offlined then reonlined, we need to reinitialize it.
	 */
	if (unlikely(lruvec->pgdat != pgdat))
		lruvec->pgdat = pgdat;
	return lruvec;
}

struct lruvec *mem_cgroup_page_lruvec(struct page *, struct pglist_data *);

bool task_in_mem_cgroup(struct task_struct *task, struct mem_cgroup *memcg);
struct mem_cgroup *mem_cgroup_from_task(struct task_struct *p);

static inline
struct mem_cgroup *mem_cgroup_from_css(struct cgroup_subsys_state *css)
{
	return css ? container_of(css, struct mem_cgroup, css) : NULL;
}

#define mem_cgroup_from_counter(counter, member)	\
	container_of(counter, struct mem_cgroup, member)

struct mem_cgroup *mem_cgroup_iter(struct mem_cgroup *,
				   struct mem_cgroup *,
				   struct mem_cgroup_reclaim_cookie *);
void mem_cgroup_iter_break(struct mem_cgroup *, struct mem_cgroup *);
int mem_cgroup_scan_tasks(struct mem_cgroup *,
			  int (*)(struct task_struct *, void *), void *);
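
/*
 * Example (a sketch): visit every memcg in the subtree below @root,
 * including @root itself. should_stop() is a stand-in for caller logic;
 * mem_cgroup_iter_break() drops the reference the iterator holds when
 * bailing out early:
 *
 *	struct mem_cgroup *memcg;
 *
 *	memcg = mem_cgroup_iter(root, NULL, NULL);
 *	while (memcg) {
 *		if (should_stop(memcg)) {
 *			mem_cgroup_iter_break(root, memcg);
 *			break;
 *		}
 *		memcg = mem_cgroup_iter(root, memcg, NULL);
 *	}
 */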

static inline unsigned short mem_cgroup_id(struct mem_cgroup *memcg)
{
	if (mem_cgroup_disabled())
		return 0;

	return memcg->id.id;
}
struct mem_cgroup *mem_cgroup_from_id(unsigned short id);

/**
 * parent_mem_cgroup - find the accounting parent of a memcg
 * @memcg: memcg whose parent to find
 *
 * Returns the parent memcg, or NULL if this is the root or the memory
 * controller is in legacy no-hierarchy mode.
 */
static inline struct mem_cgroup *parent_mem_cgroup(struct mem_cgroup *memcg)
{
	if (!memcg->memory.parent)
		return NULL;
	return mem_cgroup_from_counter(memcg->memory.parent, memory);
}

static inline bool mem_cgroup_is_descendant(struct mem_cgroup *memcg,
					    struct mem_cgroup *root)
{
	if (root == memcg)
		return true;
	if (!root->use_hierarchy)
		return false;
	return cgroup_is_descendant(memcg->css.cgroup, root->css.cgroup);
}

static inline bool mm_match_cgroup(struct mm_struct *mm,
				   struct mem_cgroup *memcg)
{
	struct mem_cgroup *task_memcg;
	bool match = false;

	rcu_read_lock();
	task_memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
	if (task_memcg)
		match = mem_cgroup_is_descendant(task_memcg, memcg);
	rcu_read_unlock();
	return match;
}

struct cgroup_subsys_state *mem_cgroup_css_from_page(struct page *page);
ino_t page_cgroup_ino(struct page *page);

static inline bool mem_cgroup_online(struct mem_cgroup *memcg)
{
	if (mem_cgroup_disabled())
		return true;
	return !!(memcg->css.flags & CSS_ONLINE);
}

/*
 * For memory reclaim.
 */
int mem_cgroup_select_victim_node(struct mem_cgroup *memcg);

void mem_cgroup_update_lru_size(struct lruvec *lruvec, enum lru_list lru,
				int zid, int nr_pages);

unsigned long mem_cgroup_node_nr_lru_pages(struct mem_cgroup *memcg,
					   int nid, unsigned int lru_mask);

static inline
unsigned long mem_cgroup_get_lru_size(struct lruvec *lruvec, enum lru_list lru)
{
	struct mem_cgroup_per_node *mz;
	unsigned long nr_pages = 0;
	int zid;

	mz = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
	for (zid = 0; zid < MAX_NR_ZONES; zid++)
		nr_pages += mz->lru_zone_size[zid][lru];
	return nr_pages;
}

static inline
unsigned long mem_cgroup_get_zone_lru_size(struct lruvec *lruvec,
					   enum lru_list lru, int zone_idx)
{
	struct mem_cgroup_per_node *mz;

	mz = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
	return mz->lru_zone_size[zone_idx][lru];
}

void mem_cgroup_handle_over_high(void);

unsigned long mem_cgroup_get_limit(struct mem_cgroup *memcg);

void mem_cgroup_print_oom_info(struct mem_cgroup *memcg,
			       struct task_struct *p);

static inline void mem_cgroup_oom_enable(void)
{
	WARN_ON(current->memcg_may_oom);
	current->memcg_may_oom = 1;
}

static inline void mem_cgroup_oom_disable(void)
{
	WARN_ON(!current->memcg_may_oom);
	current->memcg_may_oom = 0;
}

static inline bool task_in_memcg_oom(struct task_struct *p)
{
	return p->memcg_in_oom;
}

bool mem_cgroup_oom_synchronize(bool wait);
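
/*
 * Example (a sketch, modeled on the page fault path): charges raised
 * during a fault may defer the memcg OOM kill until the fault unwinds;
 * handle_fault() stands in for the actual fault handler:
 *
 *	mem_cgroup_oom_enable();
 *	ret = handle_fault(vma, address, flags);
 *	mem_cgroup_oom_disable();
 *	if (task_in_memcg_oom(current) && !(ret & VM_FAULT_OOM))
 *		mem_cgroup_oom_synchronize(true);
 */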

#ifdef CONFIG_MEMCG_SWAP
extern int do_swap_account;
#endif

void lock_page_memcg(struct page *page);
void unlock_page_memcg(struct page *page);

/**
 * mem_cgroup_update_page_stat - update page state statistics
 * @page: the page
 * @idx: page state item to account
 * @val: number of pages (positive or negative)
 *
 * The @page must be locked or the caller must use lock_page_memcg()
 * to prevent double accounting when the page is concurrently being
 * moved to another memcg:
 *
 *   lock_page_memcg(page);
 *   if (TestClearPageState(page))
 *     mem_cgroup_update_page_stat(page, state, -1);
 *   unlock_page_memcg(page);
 */
static inline void mem_cgroup_update_page_stat(struct page *page,
				 enum mem_cgroup_stat_index idx, int val)
{
	VM_BUG_ON(!(rcu_read_lock_held() || PageLocked(page)));

	if (page->mem_cgroup)
		this_cpu_add(page->mem_cgroup->stat->count[idx], val);
}

static inline void mem_cgroup_inc_page_stat(struct page *page,
					    enum mem_cgroup_stat_index idx)
{
	mem_cgroup_update_page_stat(page, idx, 1);
}

static inline void mem_cgroup_dec_page_stat(struct page *page,
					    enum mem_cgroup_stat_index idx)
{
	mem_cgroup_update_page_stat(page, idx, -1);
}
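
/*
 * Example (a sketch, modeled on file rmap accounting): bump the
 * file-mapped counter when a page's mapcount first goes positive,
 * with lock_page_memcg() stabilizing page->mem_cgroup:
 *
 *	lock_page_memcg(page);
 *	if (atomic_inc_and_test(&page->_mapcount))
 *		mem_cgroup_inc_page_stat(page, MEM_CGROUP_STAT_FILE_MAPPED);
 *	unlock_page_memcg(page);
 */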

unsigned long mem_cgroup_soft_limit_reclaim(pg_data_t *pgdat, int order,
					    gfp_t gfp_mask,
					    unsigned long *total_scanned);

static inline void mem_cgroup_count_vm_event(struct mm_struct *mm,
					     enum vm_event_item idx)
{
	struct mem_cgroup *memcg;

	if (mem_cgroup_disabled())
		return;

	rcu_read_lock();
	memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
	if (unlikely(!memcg))
		goto out;

	switch (idx) {
	case PGFAULT:
		this_cpu_inc(memcg->stat->events[MEM_CGROUP_EVENTS_PGFAULT]);
		break;
	case PGMAJFAULT:
		this_cpu_inc(memcg->stat->events[MEM_CGROUP_EVENTS_PGMAJFAULT]);
		break;
	default:
		BUG();
	}
out:
	rcu_read_unlock();
}
#ifdef CONFIG_TRANSPARENT_HUGEPAGE
void mem_cgroup_split_huge_fixup(struct page *head);
#endif

#else /* CONFIG_MEMCG */

#define MEM_CGROUP_ID_SHIFT	0
#define MEM_CGROUP_ID_MAX	0

struct mem_cgroup;

static inline bool mem_cgroup_disabled(void)
{
	return true;
}

static inline void mem_cgroup_events(struct mem_cgroup *memcg,
				     enum mem_cgroup_events_index idx,
				     unsigned int nr)
{
}

static inline bool mem_cgroup_low(struct mem_cgroup *root,
				  struct mem_cgroup *memcg)
{
	return false;
}

static inline int mem_cgroup_try_charge(struct page *page, struct mm_struct *mm,
					gfp_t gfp_mask,
					struct mem_cgroup **memcgp,
					bool compound)
{
	*memcgp = NULL;
	return 0;
}

static inline void mem_cgroup_commit_charge(struct page *page,
					    struct mem_cgroup *memcg,
					    bool lrucare, bool compound)
{
}

static inline void mem_cgroup_cancel_charge(struct page *page,
					    struct mem_cgroup *memcg,
					    bool compound)
{
}

static inline void mem_cgroup_uncharge(struct page *page)
{
}

static inline void mem_cgroup_uncharge_list(struct list_head *page_list)
{
}

static inline void mem_cgroup_migrate(struct page *old, struct page *new)
{
}

static inline struct lruvec *mem_cgroup_lruvec(struct pglist_data *pgdat,
					       struct mem_cgroup *memcg)
{
	return node_lruvec(pgdat);
}

static inline struct lruvec *mem_cgroup_page_lruvec(struct page *page,
						    struct pglist_data *pgdat)
{
	return &pgdat->lruvec;
}

static inline bool mm_match_cgroup(struct mm_struct *mm,
				   struct mem_cgroup *memcg)
{
	return true;
}

static inline bool task_in_mem_cgroup(struct task_struct *task,
				      const struct mem_cgroup *memcg)
{
	return true;
}

static inline struct mem_cgroup *
mem_cgroup_iter(struct mem_cgroup *root,
		struct mem_cgroup *prev,
		struct mem_cgroup_reclaim_cookie *reclaim)
{
	return NULL;
}

static inline void mem_cgroup_iter_break(struct mem_cgroup *root,
					 struct mem_cgroup *prev)
{
}

static inline int mem_cgroup_scan_tasks(struct mem_cgroup *memcg,
		int (*fn)(struct task_struct *, void *), void *arg)
{
	return 0;
}

static inline unsigned short mem_cgroup_id(struct mem_cgroup *memcg)
{
	return 0;
}

static inline struct mem_cgroup *mem_cgroup_from_id(unsigned short id)
{
	WARN_ON_ONCE(id);
	/* XXX: This should always return root_mem_cgroup */
	return NULL;
}

static inline bool mem_cgroup_online(struct mem_cgroup *memcg)
{
	return true;
}

static inline unsigned long
mem_cgroup_get_lru_size(struct lruvec *lruvec, enum lru_list lru)
{
	return 0;
}

static inline
unsigned long mem_cgroup_get_zone_lru_size(struct lruvec *lruvec,
					   enum lru_list lru, int zone_idx)
{
	return 0;
}

static inline unsigned long
mem_cgroup_node_nr_lru_pages(struct mem_cgroup *memcg,
			     int nid, unsigned int lru_mask)
{
	return 0;
}

static inline unsigned long mem_cgroup_get_limit(struct mem_cgroup *memcg)
{
	return 0;
}

static inline void
mem_cgroup_print_oom_info(struct mem_cgroup *memcg, struct task_struct *p)
{
}

static inline void lock_page_memcg(struct page *page)
{
}

static inline void unlock_page_memcg(struct page *page)
{
}

static inline void mem_cgroup_handle_over_high(void)
{
}

static inline void mem_cgroup_oom_enable(void)
{
}

static inline void mem_cgroup_oom_disable(void)
{
}

static inline bool task_in_memcg_oom(struct task_struct *p)
{
	return false;
}

static inline bool mem_cgroup_oom_synchronize(bool wait)
{
	return false;
}

static inline void mem_cgroup_inc_page_stat(struct page *page,
					    enum mem_cgroup_stat_index idx)
{
}

static inline void mem_cgroup_dec_page_stat(struct page *page,
					    enum mem_cgroup_stat_index idx)
{
}

static inline
unsigned long mem_cgroup_soft_limit_reclaim(pg_data_t *pgdat, int order,
					    gfp_t gfp_mask,
					    unsigned long *total_scanned)
{
	return 0;
}

static inline void mem_cgroup_split_huge_fixup(struct page *head)
{
}

static inline
void mem_cgroup_count_vm_event(struct mm_struct *mm, enum vm_event_item idx)
{
}
#endif /* CONFIG_MEMCG */

#ifdef CONFIG_CGROUP_WRITEBACK

struct list_head *mem_cgroup_cgwb_list(struct mem_cgroup *memcg);
struct wb_domain *mem_cgroup_wb_domain(struct bdi_writeback *wb);
void mem_cgroup_wb_stats(struct bdi_writeback *wb, unsigned long *pfilepages,
			 unsigned long *pheadroom, unsigned long *pdirty,
			 unsigned long *pwriteback);

#else	/* CONFIG_CGROUP_WRITEBACK */

static inline struct wb_domain *mem_cgroup_wb_domain(struct bdi_writeback *wb)
{
	return NULL;
}

static inline void mem_cgroup_wb_stats(struct bdi_writeback *wb,
				       unsigned long *pfilepages,
				       unsigned long *pheadroom,
				       unsigned long *pdirty,
				       unsigned long *pwriteback)
{
}

#endif	/* CONFIG_CGROUP_WRITEBACK */

struct sock;
bool mem_cgroup_charge_skmem(struct mem_cgroup *memcg, unsigned int nr_pages);
void mem_cgroup_uncharge_skmem(struct mem_cgroup *memcg, unsigned int nr_pages);
#ifdef CONFIG_MEMCG
extern struct static_key_false memcg_sockets_enabled_key;
#define mem_cgroup_sockets_enabled static_branch_unlikely(&memcg_sockets_enabled_key)
void mem_cgroup_sk_alloc(struct sock *sk);
void mem_cgroup_sk_free(struct sock *sk);
static inline bool mem_cgroup_under_socket_pressure(struct mem_cgroup *memcg)
{
	if (!cgroup_subsys_on_dfl(memory_cgrp_subsys) && memcg->tcpmem_pressure)
		return true;
	do {
		if (time_before(jiffies, memcg->socket_pressure))
			return true;
	} while ((memcg = parent_mem_cgroup(memcg)));
	return false;
}
#else
#define mem_cgroup_sockets_enabled 0
static inline void mem_cgroup_sk_alloc(struct sock *sk) { }
static inline void mem_cgroup_sk_free(struct sock *sk) { }
static inline bool mem_cgroup_under_socket_pressure(struct mem_cgroup *memcg)
{
	return false;
}
#endif
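
/*
 * Example (a sketch): networking code consults this when deciding
 * whether to throttle socket memory consumption; sk->sk_memcg is
 * set up by mem_cgroup_sk_alloc():
 *
 *	if (mem_cgroup_sockets_enabled && sk->sk_memcg &&
 *	    mem_cgroup_under_socket_pressure(sk->sk_memcg))
 *		...treat the socket as under memory pressure...
 */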

struct kmem_cache *memcg_kmem_get_cache(struct kmem_cache *cachep);
void memcg_kmem_put_cache(struct kmem_cache *cachep);
int memcg_kmem_charge_memcg(struct page *page, gfp_t gfp, int order,
			    struct mem_cgroup *memcg);
int memcg_kmem_charge(struct page *page, gfp_t gfp, int order);
void memcg_kmem_uncharge(struct page *page, int order);
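
/*
 * Example (a sketch, modeled on how the page allocator treats
 * __GFP_ACCOUNT requests): charge a freshly allocated page to the
 * current task's memcg, and give the page back if the charge fails:
 *
 *	page = alloc_pages(gfp, order);
 *	if (page && memcg_kmem_enabled() &&
 *	    memcg_kmem_charge(page, gfp, order)) {
 *		__free_pages(page, order);
 *		page = NULL;
 *	}
 *	...
 *	memcg_kmem_uncharge(page, order);	(on the free path)
 */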

#if defined(CONFIG_MEMCG) && !defined(CONFIG_SLOB)
extern struct static_key_false memcg_kmem_enabled_key;

extern int memcg_nr_cache_ids;
void memcg_get_cache_ids(void);
void memcg_put_cache_ids(void);

/*
 * Helper macro to loop through all memcg-specific caches. Callers must still
 * check if the cache is valid (it is either valid or NULL).
 * The slab_mutex must be held when looping through those caches.
 */
#define for_each_memcg_cache_index(_idx)	\
	for ((_idx) = 0; (_idx) < memcg_nr_cache_ids; (_idx)++)
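
/*
 * Example (a sketch): walk the per-memcg cache index space;
 * memcg_get_cache_ids() keeps memcg_nr_cache_ids stable across
 * the loop:
 *
 *	int idx;
 *
 *	memcg_get_cache_ids();
 *	for_each_memcg_cache_index(idx) {
 *		...look up the per-memcg cache at idx, which may be NULL...
 *	}
 *	memcg_put_cache_ids();
 */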

static inline bool memcg_kmem_enabled(void)
{
	return static_branch_unlikely(&memcg_kmem_enabled_key);
}

/*
 * Helper for accessing a memcg's index. It will be used as an index in the
 * child cache array in kmem_cache, and also to derive its name. This function
 * will return -1 when this is not a kmem-limited memcg.
 */
static inline int memcg_cache_id(struct mem_cgroup *memcg)
{
	return memcg ? memcg->kmemcg_id : -1;
}

/**
 * memcg_kmem_update_page_stat - update kmem page state statistics
 * @page: the page
 * @idx: page state item to account
 * @val: number of pages (positive or negative)
 */
static inline void memcg_kmem_update_page_stat(struct page *page,
				 enum mem_cgroup_stat_index idx, int val)
{
	if (memcg_kmem_enabled() && page->mem_cgroup)
		this_cpu_add(page->mem_cgroup->stat->count[idx], val);
}

#else
#define for_each_memcg_cache_index(_idx)	\
	for (; NULL; )

static inline bool memcg_kmem_enabled(void)
{
	return false;
}

static inline int memcg_cache_id(struct mem_cgroup *memcg)
{
	return -1;
}

static inline void memcg_get_cache_ids(void)
{
}

static inline void memcg_put_cache_ids(void)
{
}

static inline void memcg_kmem_update_page_stat(struct page *page,
				enum mem_cgroup_stat_index idx, int val)
{
}
#endif /* CONFIG_MEMCG && !CONFIG_SLOB */

#endif /* _LINUX_MEMCONTROL_H */