#include <linux/mm.h>
#include <linux/slab.h>
#include <linux/string.h>
#include <linux/compiler.h>
#include <linux/export.h>
#include <linux/err.h>
#include <linux/sched.h>
#include <linux/sched/mm.h>
#include <linux/sched/task_stack.h>
#include <linux/security.h>
#include <linux/swap.h>
#include <linux/swapops.h>
#include <linux/mman.h>
#include <linux/hugetlb.h>
#include <linux/vmalloc.h>
#include <linux/userfaultfd_k.h>

#include <linux/uaccess.h>

#include "internal.h"
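
/*
 * kfree_const()/kstrdup_const() below need to know whether a pointer lies
 * in the kernel's .rodata section. A minimal sketch of that helper, assuming
 * the __start_rodata/__end_rodata section markers from <asm/sections.h>:
 */
static inline int is_kernel_rodata(unsigned long addr)
{
	return addr >= (unsigned long)__start_rodata &&
		addr < (unsigned long)__end_rodata;
}

/**
 * kfree_const - conditionally free memory
 * @x: pointer to the memory
 *
 * Function calls kfree only if @x is not in .rodata section.
 */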
void kfree_const(const void *x)
{
	if (!is_kernel_rodata((unsigned long)x))
		kfree(x);
}
EXPORT_SYMBOL(kfree_const);
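
/**
 * kstrdup - allocate space for and copy an existing string
 * @s: the string to duplicate
 * @gfp: the GFP mask used in the kmalloc() call when allocating memory
 *
 * Return: newly allocated copy of @s or %NULL in case of error
 */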
char *kstrdup(const char *s, gfp_t gfp)
{
	size_t len;
	char *buf;

	if (!s)
		return NULL;

	len = strlen(s) + 1;
	buf = kmalloc_track_caller(len, gfp);
	if (buf)
		memcpy(buf, s, len);
	return buf;
}
EXPORT_SYMBOL(kstrdup);
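
/**
 * kstrdup_const - conditionally duplicate an existing const string
 * @s: the string to duplicate
 * @gfp: the GFP mask used in the kmalloc() call when allocating memory
 *
 * Note: Strings allocated by kstrdup_const should be freed by kfree_const.
 *
 * Return: source string if it is in .rodata section, otherwise fall back
 * to kstrdup.
 */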
const char *kstrdup_const(const char *s, gfp_t gfp)
{
	if (is_kernel_rodata((unsigned long)s))
		return s;

	return kstrdup(s, gfp);
}
EXPORT_SYMBOL(kstrdup_const);
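
/**
 * kstrndup - allocate space for and copy an existing string
 * @s: the string to duplicate
 * @max: read at most @max chars from @s
 * @gfp: the GFP mask used in the kmalloc() call when allocating memory
 *
 * Note: Use kmemdup_nul() instead if the size is known exactly.
 */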
char *kstrndup(const char *s, size_t max, gfp_t gfp)
{
	size_t len;
	char *buf;

	if (!s)
		return NULL;

	len = strnlen(s, max);
	buf = kmalloc_track_caller(len + 1, gfp);
	if (buf) {
		memcpy(buf, s, len);
		buf[len] = '\0';
	}
	return buf;
}
EXPORT_SYMBOL(kstrndup);
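
/**
 * kmemdup - duplicate region of memory
 *
 * @src: memory region to duplicate
 * @len: memory region length
 * @gfp: GFP mask to use
 */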
void *kmemdup(const void *src, size_t len, gfp_t gfp)
{
	void *p;

	p = kmalloc_track_caller(len, gfp);
	if (p)
		memcpy(p, src, len);
	return p;
}
EXPORT_SYMBOL(kmemdup);
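
/**
 * kmemdup_nul - Create a NUL-terminated string from unterminated data
 * @s: The data to stringify
 * @len: The size of the data
 * @gfp: the GFP mask used in the kmalloc() call when allocating memory
 */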
char *kmemdup_nul(const char *s, size_t len, gfp_t gfp)
{
	char *buf;

	if (!s)
		return NULL;

	buf = kmalloc_track_caller(len + 1, gfp);
	if (buf) {
		memcpy(buf, s, len);
		buf[len] = '\0';
	}
	return buf;
}
EXPORT_SYMBOL(kmemdup_nul);
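
/**
 * memdup_user - duplicate memory region from user space
 *
 * @src: source address in user space
 * @len: number of bytes to copy
 *
 * Return: an ERR_PTR() on failure. The result is physically contiguous,
 * to be freed by kfree().
 */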
void *memdup_user(const void __user *src, size_t len)
{
	void *p;

	p = kmalloc_track_caller(len, GFP_USER);
	if (!p)
		return ERR_PTR(-ENOMEM);

	if (copy_from_user(p, src, len)) {
		kfree(p);
		return ERR_PTR(-EFAULT);
	}

	return p;
}
EXPORT_SYMBOL(memdup_user);
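
/**
 * vmemdup_user - duplicate memory region from user space
 *
 * @src: source address in user space
 * @len: number of bytes to copy
 *
 * Return: an ERR_PTR() on failure. The result may not be physically
 * contiguous; use kvfree() to free it.
 */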
void *vmemdup_user(const void __user *src, size_t len)
{
	void *p;

	p = kvmalloc(len, GFP_USER);
	if (!p)
		return ERR_PTR(-ENOMEM);

	if (copy_from_user(p, src, len)) {
		kvfree(p);
		return ERR_PTR(-EFAULT);
	}

	return p;
}
EXPORT_SYMBOL(vmemdup_user);
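
/**
 * strndup_user - duplicate an existing string from user space
 * @s: The string to duplicate
 * @n: Maximum number of bytes to copy, including the trailing NUL
 */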
char *strndup_user(const char __user *s, long n)
{
	char *p;
	long length;

	length = strnlen_user(s, n);

	if (!length)
		return ERR_PTR(-EFAULT);

	if (length > n)
		return ERR_PTR(-EINVAL);

	p = memdup_user(s, length);

	if (IS_ERR(p))
		return p;

	p[length - 1] = '\0';

	return p;
}
EXPORT_SYMBOL(strndup_user);
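
/**
 * memdup_user_nul - duplicate memory region from user space and NUL-terminate
 *
 * @src: source address in user space
 * @len: number of bytes to copy
 *
 * Return: an ERR_PTR() on failure.
 */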
void *memdup_user_nul(const void __user *src, size_t len)
{
	char *p;

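	/*
	 * Always use GFP_KERNEL, since copy_from_user() can sleep and
	 * cause pagefault, which makes it pointless to use GFP_NOFS
	 * or GFP_ATOMIC.
	 */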
	p = kmalloc_track_caller(len + 1, GFP_KERNEL);
	if (!p)
		return ERR_PTR(-ENOMEM);

	if (copy_from_user(p, src, len)) {
		kfree(p);
		return ERR_PTR(-EFAULT);
	}
	p[len] = '\0';

	return p;
}
EXPORT_SYMBOL(memdup_user_nul);

void __vma_link_list(struct mm_struct *mm, struct vm_area_struct *vma,
		struct vm_area_struct *prev, struct rb_node *rb_parent)
{
	struct vm_area_struct *next;

	vma->vm_prev = prev;
	if (prev) {
		next = prev->vm_next;
		prev->vm_next = vma;
	} else {
		mm->mmap = vma;
		if (rb_parent)
			next = rb_entry(rb_parent,
					struct vm_area_struct, vm_rb);
		else
			next = NULL;
	}
	vma->vm_next = next;
	if (next)
		next->vm_prev = vma;
}
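
/* Check if the vma is being used as a stack by this task */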
int vma_is_stack_for_current(struct vm_area_struct *vma)
{
	struct task_struct * __maybe_unused t = current;

	return (vma->vm_start <= KSTK_ESP(t) && vma->vm_end >= KSTK_ESP(t));
}

#if defined(CONFIG_MMU) && !defined(HAVE_ARCH_PICK_MMAP_LAYOUT)
void arch_pick_mmap_layout(struct mm_struct *mm, struct rlimit *rlim_stack)
{
	mm->mmap_base = TASK_UNMAPPED_BASE;
	mm->get_unmapped_area = arch_get_unmapped_area;
}
#endif
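
/*
 * Like get_user_pages_fast() except it is IRQ-safe in that it won't fall
 * back to the regular GUP.
 * Note a difference with get_user_pages_fast: this always returns the
 * number of pages pinned, 0 if no pages were pinned.
 * If the architecture does not support this function, simply return with no
 * pages pinned.
 */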
int __weak __get_user_pages_fast(unsigned long start,
				 int nr_pages, int write, struct page **pages)
{
	return 0;
}
EXPORT_SYMBOL_GPL(__get_user_pages_fast);
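
/**
 * get_user_pages_fast() - pin user pages in memory
 * @start:	starting user address
 * @nr_pages:	number of pages from start to pin
 * @write:	whether pages will be written to
 * @pages:	array that receives pointers to the pages pinned.
 *		Should be at least nr_pages long.
 *
 * get_user_pages_fast provides equivalent functionality to get_user_pages,
 * operating on current and current->mm, with force=0 and vma=NULL as though
 * by get_user_pages(current, current->mm, ...).
 *
 * Returns number of pages pinned. This may be fewer than the number
 * requested. If nr_pages is 0 or negative, returns 0. If no pages
 * were pinned, returns -errno.
 *
 * get_user_pages_fast may take mmap_sem and page table locks, so no
 * assumptions can be made about lack of locking. get_user_pages_fast is to
 * be implemented in a way that is advantageous (vs get_user_pages()) when
 * the user memory area is already faulted in and present in ptes. However
 * if the pages have to be faulted in, it may turn out to be slightly
 * slower.
 */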
int __weak get_user_pages_fast(unsigned long start,
			       int nr_pages, int write, struct page **pages)
{
	return get_user_pages_unlocked(start, nr_pages, pages,
				       write ? FOLL_WRITE : 0);
}
EXPORT_SYMBOL_GPL(get_user_pages_fast);

unsigned long vm_mmap_pgoff(struct file *file, unsigned long addr,
	unsigned long len, unsigned long prot,
	unsigned long flag, unsigned long pgoff)
{
	unsigned long ret;
	struct mm_struct *mm = current->mm;
	unsigned long populate;
	LIST_HEAD(uf);

	ret = security_mmap_file(file, prot, flag);
	if (!ret) {
		if (down_write_killable(&mm->mmap_sem))
			return -EINTR;
		ret = do_mmap_pgoff(file, addr, len, prot, flag, pgoff,
				    &populate, &uf);
		up_write(&mm->mmap_sem);
		userfaultfd_unmap_complete(mm, &uf);
		if (populate)
			mm_populate(ret, populate);
	}
	return ret;
}

unsigned long vm_mmap(struct file *file, unsigned long addr,
	unsigned long len, unsigned long prot,
	unsigned long flag, unsigned long offset)
{
	if (unlikely(offset + PAGE_ALIGN(len) < offset))
		return -EINVAL;
	if (unlikely(offset_in_page(offset)))
		return -EINVAL;

	return vm_mmap_pgoff(file, addr, len, prot, flag, offset >> PAGE_SHIFT);
}
EXPORT_SYMBOL(vm_mmap);
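
/**
 * kvmalloc_node - attempt to allocate physically contiguous memory, but upon
 * failure, fall back to non-contiguous (vmalloc) allocation.
 * @size: size of the request.
 * @flags: gfp mask for the allocation - must be compatible (superset) with GFP_KERNEL.
 * @node: numa node to allocate from
 *
 * Uses kmalloc to get the memory but if the allocation fails then falls back
 * to the vmalloc allocator. Use kvfree for freeing the memory.
 *
 * Reclaim modifiers - __GFP_NORETRY and __GFP_NOFAIL are not supported.
 * __GFP_RETRY_MAYFAIL is supported, and it should be used only if kmalloc is
 * preferable to the vmalloc fallback, due to visible performance drawbacks.
 *
 * Any use of gfp flags outside of GFP_KERNEL should be consulted with mm
 * people.
 */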
void *kvmalloc_node(size_t size, gfp_t flags, int node)
{
	gfp_t kmalloc_flags = flags;
	void *ret;

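	/*
	 * vmalloc uses GFP_KERNEL for some internal allocations (e.g page tables)
	 * so the given set of flags has to be compatible.
	 */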
	if ((flags & GFP_KERNEL) != GFP_KERNEL)
		return kmalloc_node(size, flags, node);

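	/*
	 * We want to attempt a large physically contiguous block first because
	 * it is less likely to fragment multiple larger blocks and therefore
	 * contribute to a long term fragmentation less than vmalloc fallback.
	 * However make sure that larger requests are not too disruptive - no
	 * OOM killer and no allocation failure warnings as we have a fallback.
	 */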
	if (size > PAGE_SIZE) {
		kmalloc_flags |= __GFP_NOWARN;

		if (!(kmalloc_flags & __GFP_RETRY_MAYFAIL))
			kmalloc_flags |= __GFP_NORETRY;
	}

	ret = kmalloc_node(size, kmalloc_flags, node);

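	/*
	 * It doesn't really make sense to fallback to vmalloc for sub page
	 * requests
	 */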
	if (ret || size <= PAGE_SIZE)
		return ret;

	return __vmalloc_node_flags_caller(size, node, flags,
			__builtin_return_address(0));
}
EXPORT_SYMBOL(kvmalloc_node);
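
/**
 * kvfree() - Free memory.
 * @addr: Pointer to allocated memory.
 *
 * kvfree frees memory allocated by any of vmalloc(), kmalloc() or kvmalloc().
 * It is slightly more efficient to use kfree() or vfree() if you are certain
 * that you know which one to use.
 *
 * Context: Either preemptible task context or not-NMI interrupt.
 */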
void kvfree(const void *addr)
{
	if (is_vmalloc_addr(addr))
		vfree(addr);
	else
		kfree(addr);
}
EXPORT_SYMBOL(kvfree);

static inline void *__page_rmapping(struct page *page)
{
	unsigned long mapping;

	mapping = (unsigned long)page->mapping;
	mapping &= ~PAGE_MAPPING_FLAGS;

	return (void *)mapping;
}
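
/* Neutral page->mapping pointer to address_space or anon_vma or other */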
void *page_rmapping(struct page *page)
{
	page = compound_head(page);
	return __page_rmapping(page);
}
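
/*
 * Return true if this page is mapped into pagetables.
 * For compound page it returns true if any subpage of compound page is mapped.
 */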
bool page_mapped(struct page *page)
{
	int i;

	if (likely(!PageCompound(page)))
		return atomic_read(&page->_mapcount) >= 0;
	page = compound_head(page);
	if (atomic_read(compound_mapcount_ptr(page)) >= 0)
		return true;
	if (PageHuge(page))
		return false;
	for (i = 0; i < hpage_nr_pages(page); i++) {
		if (atomic_read(&page[i]._mapcount) >= 0)
			return true;
	}
	return false;
}
EXPORT_SYMBOL(page_mapped);

struct anon_vma *page_anon_vma(struct page *page)
{
	unsigned long mapping;

	page = compound_head(page);
	mapping = (unsigned long)page->mapping;
	if ((mapping & PAGE_MAPPING_FLAGS) != PAGE_MAPPING_ANON)
		return NULL;
	return __page_rmapping(page);
}

struct address_space *page_mapping(struct page *page)
{
	struct address_space *mapping;

	page = compound_head(page);

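	/* This happens if someone calls flush_dcache_page on slab page */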
	if (unlikely(PageSlab(page)))
		return NULL;

	if (unlikely(PageSwapCache(page))) {
		swp_entry_t entry;

		entry.val = page_private(page);
		return swap_address_space(entry);
	}

	mapping = page->mapping;
	if ((unsigned long)mapping & PAGE_MAPPING_ANON)
		return NULL;

	return (void *)((unsigned long)mapping & ~PAGE_MAPPING_FLAGS);
}
EXPORT_SYMBOL(page_mapping);
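
/*
 * For file cache pages, return the address_space, otherwise return NULL
 */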
struct address_space *page_mapping_file(struct page *page)
{
	if (unlikely(PageSwapCache(page)))
		return NULL;
	return page_mapping(page);
}
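
/* Slow path of page_mapcount() for compound pages */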
int __page_mapcount(struct page *page)
{
	int ret;

	ret = atomic_read(&page->_mapcount) + 1;
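	/*
	 * For file THP page->_mapcount contains total number of mapping
	 * of the page: no need to look into compound_mapcount.
	 */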
	if (!PageAnon(page) && !PageHuge(page))
		return ret;
	page = compound_head(page);
	ret += atomic_read(compound_mapcount_ptr(page)) + 1;
	if (PageDoubleMap(page))
		ret--;
	return ret;
}
EXPORT_SYMBOL_GPL(__page_mapcount);

int sysctl_overcommit_memory __read_mostly = OVERCOMMIT_GUESS;
int sysctl_overcommit_ratio __read_mostly = 50;
unsigned long sysctl_overcommit_kbytes __read_mostly;
int sysctl_max_map_count __read_mostly = DEFAULT_MAX_MAP_COUNT;
unsigned long sysctl_user_reserve_kbytes __read_mostly = 1UL << 17;
unsigned long sysctl_admin_reserve_kbytes __read_mostly = 1UL << 13;

int overcommit_ratio_handler(struct ctl_table *table, int write,
			     void __user *buffer, size_t *lenp,
			     loff_t *ppos)
{
	int ret;

	ret = proc_dointvec(table, write, buffer, lenp, ppos);
	if (ret == 0 && write)
		sysctl_overcommit_kbytes = 0;
	return ret;
}

int overcommit_kbytes_handler(struct ctl_table *table, int write,
			      void __user *buffer, size_t *lenp,
			      loff_t *ppos)
{
	int ret;

	ret = proc_doulongvec_minmax(table, write, buffer, lenp, ppos);
	if (ret == 0 && write)
		sysctl_overcommit_ratio = 0;
	return ret;
}
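
/*
 * Committed memory limit enforced when OVERCOMMIT_NEVER policy is used
 */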
unsigned long vm_commit_limit(void)
{
	unsigned long allowed;

	if (sysctl_overcommit_kbytes)
		allowed = sysctl_overcommit_kbytes >> (PAGE_SHIFT - 10);
	else
		allowed = ((totalram_pages - hugetlb_total_pages())
			   * sysctl_overcommit_ratio / 100);
	allowed += total_swap_pages;

	return allowed;
}
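
/*
 * Make sure vm_committed_as in one cacheline and not cacheline shared between
 * vm_committed_as and other data.
 */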
struct percpu_counter vm_committed_as ____cacheline_aligned_in_smp;
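
/*
 * The global memory commitment made in the system can be a metric
 * that can be used to drive ratios between the commit limit and the
 * amount of memory in use: vm_memory_committed() returns the current
 * (non-negative) read-out of the vm_committed_as counter.
 */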
unsigned long vm_memory_committed(void)
{
	return percpu_counter_read_positive(&vm_committed_as);
}
EXPORT_SYMBOL_GPL(vm_memory_committed);
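
/*
 * Check that a process has enough memory to allocate a new virtual
 * mapping. 0 means there is enough memory for the allocation to
 * succeed and -ENOMEM implies there is not.
 *
 * We currently support three overcommit policies, which are set via the
 * vm.overcommit_memory sysctl.  See Documentation/vm/overcommit-accounting.rst
 *
 * Strict overcommit modes added 2002 Feb 26 by Alan Cox.
 * Additional code 2002 Jul 20 by Robert Love.
 *
 * cap_sys_admin is 1 if the process has admin privileges, 0 otherwise.
 *
 * Note this is a helper function intended to be used by LSMs which
 * wish to use this logic.
 */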
int __vm_enough_memory(struct mm_struct *mm, long pages, int cap_sys_admin)
{
	long free, allowed, reserve;

	VM_WARN_ONCE(percpu_counter_read(&vm_committed_as) <
			-(s64)vm_committed_as_batch * num_online_cpus(),
			"memory commitment underflow");

	vm_acct_memory(pages);

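	/*
	 * Sometimes we want to use more memory than we have
	 */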
	if (sysctl_overcommit_memory == OVERCOMMIT_ALWAYS)
		return 0;

	if (sysctl_overcommit_memory == OVERCOMMIT_GUESS) {
		free = global_zone_page_state(NR_FREE_PAGES);
		free += global_node_page_state(NR_FILE_PAGES);

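		/*
		 * shmem pages shouldn't be counted as free in this
		 * case, they can't be purged, only swapped out, and
		 * that won't affect the overall amount of available
		 * memory in the system.
		 */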
		free -= global_node_page_state(NR_SHMEM);

		free += get_nr_swap_pages();

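		/*
		 * Any slabs which are created with the
		 * SLAB_RECLAIM_ACCOUNT flag claim to have contents
		 * which are reclaimable, under pressure.  The dentry
		 * cache and most inode caches should fall into this.
		 */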
		free += global_node_page_state(NR_SLAB_RECLAIMABLE);

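		/*
		 * Part of the kernel memory, which can be released
		 * under memory pressure.
		 */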
		free += global_node_page_state(NR_KERNEL_MISC_RECLAIMABLE);

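		/*
		 * Leave reserved pages. The pages are not for anonymous pages.
		 */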
		if (free <= totalreserve_pages)
			goto error;
		else
			free -= totalreserve_pages;

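		/*
		 * Reserve some for root
		 */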
		if (!cap_sys_admin)
			free -= sysctl_admin_reserve_kbytes >> (PAGE_SHIFT - 10);

		if (free > pages)
			return 0;

		goto error;
	}

	allowed = vm_commit_limit();
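	/*
	 * Reserve some for root
	 */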
	if (!cap_sys_admin)
		allowed -= sysctl_admin_reserve_kbytes >> (PAGE_SHIFT - 10);

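	/*
	 * Don't let a single process grow so big a user can't recover
	 */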
	if (mm) {
		reserve = sysctl_user_reserve_kbytes >> (PAGE_SHIFT - 10);
		allowed -= min_t(long, mm->total_vm / 32, reserve);
	}

	if (percpu_counter_read_positive(&vm_committed_as) < allowed)
		return 0;
error:
	vm_unacct_memory(pages);

	return -ENOMEM;
}
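
/**
 * get_cmdline() - copy the cmdline value to a buffer.
 * @task:   the task whose cmdline value to copy.
 * @buffer: the buffer to copy to.
 * @buflen: the length of the buffer. Larger cmdline values are truncated
 *          to this length.
 *
 * Return: the size of the cmdline field copied. Note that the copy does
 * not guarantee an ending NUL byte.
 */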
int get_cmdline(struct task_struct *task, char *buffer, int buflen)
{
	int res = 0;
	unsigned int len;
	struct mm_struct *mm = get_task_mm(task);
	unsigned long arg_start, arg_end, env_start, env_end;

	if (!mm)
		goto out;
	if (!mm->arg_end)
		goto out_mm;

	down_read(&mm->mmap_sem);
	arg_start = mm->arg_start;
	arg_end = mm->arg_end;
	env_start = mm->env_start;
	env_end = mm->env_end;
	up_read(&mm->mmap_sem);

	len = arg_end - arg_start;

	if (len > buflen)
		len = buflen;

	res = access_process_vm(task, arg_start, buffer, len, FOLL_FORCE);

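	/*
	 * If the nul at the end of args has been overwritten, then
	 * assume application is using setproctitle(3).
	 */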
	if (res > 0 && buffer[res-1] != '\0' && len < buflen) {
		len = strnlen(buffer, res);
		if (len < res) {
			res = len;
		} else {
			len = env_end - env_start;
			if (len > buflen - res)
				len = buflen - res;
			res += access_process_vm(task, env_start,
						 buffer+res, len,
						 FOLL_FORCE);
			res = strnlen(buffer, res);
		}
	}
out_mm:
	mmput(mm);
out:
	return res;
}