1
2
3
4#include <linux/lockdep.h>
5#include <linux/mm.h>
6#include <linux/mman.h>
7#include <linux/shmem_fs.h>
8#include <linux/suspend.h>
9#include <linux/sched/mm.h>
10#include <asm/sgx.h>
11#include "encl.h"
12#include "encls.h"
13#include "sgx.h"
14
15
16
17
18
19static int __sgx_encl_eldu(struct sgx_encl_page *encl_page,
20 struct sgx_epc_page *epc_page,
21 struct sgx_epc_page *secs_page)
22{
23 unsigned long va_offset = encl_page->desc & SGX_ENCL_PAGE_VA_OFFSET_MASK;
24 struct sgx_encl *encl = encl_page->encl;
25 struct sgx_pageinfo pginfo;
26 struct sgx_backing b;
27 pgoff_t page_index;
28 int ret;
29
30 if (secs_page)
31 page_index = PFN_DOWN(encl_page->desc - encl_page->encl->base);
32 else
33 page_index = PFN_DOWN(encl->size);
34
35 ret = sgx_encl_get_backing(encl, page_index, &b);
36 if (ret)
37 return ret;
38
39 pginfo.addr = encl_page->desc & PAGE_MASK;
40 pginfo.contents = (unsigned long)kmap_atomic(b.contents);
41 pginfo.metadata = (unsigned long)kmap_atomic(b.pcmd) +
42 b.pcmd_offset;
43
44 if (secs_page)
45 pginfo.secs = (u64)sgx_get_epc_virt_addr(secs_page);
46 else
47 pginfo.secs = 0;
48
49 ret = __eldu(&pginfo, sgx_get_epc_virt_addr(epc_page),
50 sgx_get_epc_virt_addr(encl_page->va_page->epc_page) + va_offset);
51 if (ret) {
52 if (encls_failed(ret))
53 ENCLS_WARN(ret, "ELDU");
54
55 ret = -EFAULT;
56 }
57
58 kunmap_atomic((void *)(unsigned long)(pginfo.metadata - b.pcmd_offset));
59 kunmap_atomic((void *)(unsigned long)pginfo.contents);
60
61 sgx_encl_put_backing(&b, false);
62
63 return ret;
64}
65
66static struct sgx_epc_page *sgx_encl_eldu(struct sgx_encl_page *encl_page,
67 struct sgx_epc_page *secs_page)
68{
69
70 unsigned long va_offset = encl_page->desc & SGX_ENCL_PAGE_VA_OFFSET_MASK;
71 struct sgx_encl *encl = encl_page->encl;
72 struct sgx_epc_page *epc_page;
73 int ret;
74
75 epc_page = sgx_alloc_epc_page(encl_page, false);
76 if (IS_ERR(epc_page))
77 return epc_page;
78
79 ret = __sgx_encl_eldu(encl_page, epc_page, secs_page);
80 if (ret) {
81 sgx_encl_free_epc_page(epc_page);
82 return ERR_PTR(ret);
83 }
84
85 sgx_free_va_slot(encl_page->va_page, va_offset);
86 list_move(&encl_page->va_page->list, &encl->va_pages);
87 encl_page->desc &= ~SGX_ENCL_PAGE_VA_OFFSET_MASK;
88 encl_page->epc_page = epc_page;
89
90 return epc_page;
91}
92
93static struct sgx_encl_page *sgx_encl_load_page(struct sgx_encl *encl,
94 unsigned long addr,
95 unsigned long vm_flags)
96{
97 unsigned long vm_prot_bits = vm_flags & (VM_READ | VM_WRITE | VM_EXEC);
98 struct sgx_epc_page *epc_page;
99 struct sgx_encl_page *entry;
100
101 entry = xa_load(&encl->page_array, PFN_DOWN(addr));
102 if (!entry)
103 return ERR_PTR(-EFAULT);
104
105
106
107
108
109
110 if ((entry->vm_max_prot_bits & vm_prot_bits) != vm_prot_bits)
111 return ERR_PTR(-EFAULT);
112
113
114 if (entry->epc_page) {
115 if (entry->desc & SGX_ENCL_PAGE_BEING_RECLAIMED)
116 return ERR_PTR(-EBUSY);
117
118 return entry;
119 }
120
121 if (!(encl->secs.epc_page)) {
122 epc_page = sgx_encl_eldu(&encl->secs, NULL);
123 if (IS_ERR(epc_page))
124 return ERR_CAST(epc_page);
125 }
126
127 epc_page = sgx_encl_eldu(entry, encl->secs.epc_page);
128 if (IS_ERR(epc_page))
129 return ERR_CAST(epc_page);
130
131 encl->secs_child_cnt++;
132 sgx_mark_page_reclaimable(entry->epc_page);
133
134 return entry;
135}
136
137static vm_fault_t sgx_vma_fault(struct vm_fault *vmf)
138{
139 unsigned long addr = (unsigned long)vmf->address;
140 struct vm_area_struct *vma = vmf->vma;
141 struct sgx_encl_page *entry;
142 unsigned long phys_addr;
143 struct sgx_encl *encl;
144 vm_fault_t ret;
145
146 encl = vma->vm_private_data;
147
148
149
150
151
152
153 if (unlikely(!encl))
154 return VM_FAULT_SIGBUS;
155
156 mutex_lock(&encl->lock);
157
158 entry = sgx_encl_load_page(encl, addr, vma->vm_flags);
159 if (IS_ERR(entry)) {
160 mutex_unlock(&encl->lock);
161
162 if (PTR_ERR(entry) == -EBUSY)
163 return VM_FAULT_NOPAGE;
164
165 return VM_FAULT_SIGBUS;
166 }
167
168 phys_addr = sgx_get_epc_phys_addr(entry->epc_page);
169
170 ret = vmf_insert_pfn(vma, addr, PFN_DOWN(phys_addr));
171 if (ret != VM_FAULT_NOPAGE) {
172 mutex_unlock(&encl->lock);
173
174 return VM_FAULT_SIGBUS;
175 }
176
177 sgx_encl_test_and_clear_young(vma->vm_mm, entry);
178 mutex_unlock(&encl->lock);
179
180 return VM_FAULT_NOPAGE;
181}
182
183static void sgx_vma_open(struct vm_area_struct *vma)
184{
185 struct sgx_encl *encl = vma->vm_private_data;
186
187
188
189
190
191
192 if (unlikely(!encl))
193 return;
194
195 if (sgx_encl_mm_add(encl, vma->vm_mm))
196 vma->vm_private_data = NULL;
197}
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218int sgx_encl_may_map(struct sgx_encl *encl, unsigned long start,
219 unsigned long end, unsigned long vm_flags)
220{
221 unsigned long vm_prot_bits = vm_flags & (VM_READ | VM_WRITE | VM_EXEC);
222 struct sgx_encl_page *page;
223 unsigned long count = 0;
224 int ret = 0;
225
226 XA_STATE(xas, &encl->page_array, PFN_DOWN(start));
227
228
229
230
231
232 if (current->personality & READ_IMPLIES_EXEC)
233 return -EACCES;
234
235 mutex_lock(&encl->lock);
236 xas_lock(&xas);
237 xas_for_each(&xas, page, PFN_DOWN(end - 1)) {
238 if (~page->vm_max_prot_bits & vm_prot_bits) {
239 ret = -EACCES;
240 break;
241 }
242
243
244 if (!(++count % XA_CHECK_SCHED)) {
245 xas_pause(&xas);
246 xas_unlock(&xas);
247 mutex_unlock(&encl->lock);
248
249 cond_resched();
250
251 mutex_lock(&encl->lock);
252 xas_lock(&xas);
253 }
254 }
255 xas_unlock(&xas);
256 mutex_unlock(&encl->lock);
257
258 return ret;
259}
260
261static int sgx_vma_mprotect(struct vm_area_struct *vma, unsigned long start,
262 unsigned long end, unsigned long newflags)
263{
264 return sgx_encl_may_map(vma->vm_private_data, start, end, newflags);
265}
266
267static int sgx_encl_debug_read(struct sgx_encl *encl, struct sgx_encl_page *page,
268 unsigned long addr, void *data)
269{
270 unsigned long offset = addr & ~PAGE_MASK;
271 int ret;
272
273
274 ret = __edbgrd(sgx_get_epc_virt_addr(page->epc_page) + offset, data);
275 if (ret)
276 return -EIO;
277
278 return 0;
279}
280
281static int sgx_encl_debug_write(struct sgx_encl *encl, struct sgx_encl_page *page,
282 unsigned long addr, void *data)
283{
284 unsigned long offset = addr & ~PAGE_MASK;
285 int ret;
286
287 ret = __edbgwr(sgx_get_epc_virt_addr(page->epc_page) + offset, data);
288 if (ret)
289 return -EIO;
290
291 return 0;
292}
293
294
295
296
297static struct sgx_encl_page *sgx_encl_reserve_page(struct sgx_encl *encl,
298 unsigned long addr,
299 unsigned long vm_flags)
300{
301 struct sgx_encl_page *entry;
302
303 for ( ; ; ) {
304 mutex_lock(&encl->lock);
305
306 entry = sgx_encl_load_page(encl, addr, vm_flags);
307 if (PTR_ERR(entry) != -EBUSY)
308 break;
309
310 mutex_unlock(&encl->lock);
311 }
312
313 if (IS_ERR(entry))
314 mutex_unlock(&encl->lock);
315
316 return entry;
317}
318
319static int sgx_vma_access(struct vm_area_struct *vma, unsigned long addr,
320 void *buf, int len, int write)
321{
322 struct sgx_encl *encl = vma->vm_private_data;
323 struct sgx_encl_page *entry = NULL;
324 char data[sizeof(unsigned long)];
325 unsigned long align;
326 int offset;
327 int cnt;
328 int ret = 0;
329 int i;
330
331
332
333
334
335 if (!encl)
336 return -EFAULT;
337
338 if (!test_bit(SGX_ENCL_DEBUG, &encl->flags))
339 return -EFAULT;
340
341 for (i = 0; i < len; i += cnt) {
342 entry = sgx_encl_reserve_page(encl, (addr + i) & PAGE_MASK,
343 vma->vm_flags);
344 if (IS_ERR(entry)) {
345 ret = PTR_ERR(entry);
346 break;
347 }
348
349 align = ALIGN_DOWN(addr + i, sizeof(unsigned long));
350 offset = (addr + i) & (sizeof(unsigned long) - 1);
351 cnt = sizeof(unsigned long) - offset;
352 cnt = min(cnt, len - i);
353
354 ret = sgx_encl_debug_read(encl, entry, align, data);
355 if (ret)
356 goto out;
357
358 if (write) {
359 memcpy(data + offset, buf + i, cnt);
360 ret = sgx_encl_debug_write(encl, entry, align, data);
361 if (ret)
362 goto out;
363 } else {
364 memcpy(buf + i, data + offset, cnt);
365 }
366
367out:
368 mutex_unlock(&encl->lock);
369
370 if (ret)
371 break;
372 }
373
374 return ret < 0 ? ret : i;
375}
376
377const struct vm_operations_struct sgx_vm_ops = {
378 .fault = sgx_vma_fault,
379 .mprotect = sgx_vma_mprotect,
380 .open = sgx_vma_open,
381 .access = sgx_vma_access,
382};
383
384
385
386
387
388
389
390
391void sgx_encl_release(struct kref *ref)
392{
393 struct sgx_encl *encl = container_of(ref, struct sgx_encl, refcount);
394 struct sgx_va_page *va_page;
395 struct sgx_encl_page *entry;
396 unsigned long index;
397
398 xa_for_each(&encl->page_array, index, entry) {
399 if (entry->epc_page) {
400
401
402
403
404 if (sgx_unmark_page_reclaimable(entry->epc_page))
405 continue;
406
407 sgx_encl_free_epc_page(entry->epc_page);
408 encl->secs_child_cnt--;
409 entry->epc_page = NULL;
410 }
411
412 kfree(entry);
413 }
414
415 xa_destroy(&encl->page_array);
416
417 if (!encl->secs_child_cnt && encl->secs.epc_page) {
418 sgx_encl_free_epc_page(encl->secs.epc_page);
419 encl->secs.epc_page = NULL;
420 }
421
422 while (!list_empty(&encl->va_pages)) {
423 va_page = list_first_entry(&encl->va_pages, struct sgx_va_page,
424 list);
425 list_del(&va_page->list);
426 sgx_encl_free_epc_page(va_page->epc_page);
427 kfree(va_page);
428 }
429
430 if (encl->backing)
431 fput(encl->backing);
432
433 cleanup_srcu_struct(&encl->srcu);
434
435 WARN_ON_ONCE(!list_empty(&encl->mm_list));
436
437
438 WARN_ON_ONCE(encl->secs_child_cnt);
439 WARN_ON_ONCE(encl->secs.epc_page);
440
441 kfree(encl);
442}
443
444
445
446
447static void sgx_mmu_notifier_release(struct mmu_notifier *mn,
448 struct mm_struct *mm)
449{
450 struct sgx_encl_mm *encl_mm = container_of(mn, struct sgx_encl_mm, mmu_notifier);
451 struct sgx_encl_mm *tmp = NULL;
452
453
454
455
456
457 spin_lock(&encl_mm->encl->mm_lock);
458 list_for_each_entry(tmp, &encl_mm->encl->mm_list, list) {
459 if (tmp == encl_mm) {
460 list_del_rcu(&encl_mm->list);
461 break;
462 }
463 }
464 spin_unlock(&encl_mm->encl->mm_lock);
465
466 if (tmp == encl_mm) {
467 synchronize_srcu(&encl_mm->encl->srcu);
468 mmu_notifier_put(mn);
469 }
470}
471
472static void sgx_mmu_notifier_free(struct mmu_notifier *mn)
473{
474 struct sgx_encl_mm *encl_mm = container_of(mn, struct sgx_encl_mm, mmu_notifier);
475
476
477 kref_put(&encl_mm->encl->refcount, sgx_encl_release);
478
479 kfree(encl_mm);
480}
481
482static const struct mmu_notifier_ops sgx_mmu_notifier_ops = {
483 .release = sgx_mmu_notifier_release,
484 .free_notifier = sgx_mmu_notifier_free,
485};
486
487static struct sgx_encl_mm *sgx_encl_find_mm(struct sgx_encl *encl,
488 struct mm_struct *mm)
489{
490 struct sgx_encl_mm *encl_mm = NULL;
491 struct sgx_encl_mm *tmp;
492 int idx;
493
494 idx = srcu_read_lock(&encl->srcu);
495
496 list_for_each_entry_rcu(tmp, &encl->mm_list, list) {
497 if (tmp->mm == mm) {
498 encl_mm = tmp;
499 break;
500 }
501 }
502
503 srcu_read_unlock(&encl->srcu, idx);
504
505 return encl_mm;
506}
507
508int sgx_encl_mm_add(struct sgx_encl *encl, struct mm_struct *mm)
509{
510 struct sgx_encl_mm *encl_mm;
511 int ret;
512
513
514
515
516
517
518
519 mmap_assert_write_locked(mm);
520
521
522
523
524
525 if (sgx_encl_find_mm(encl, mm))
526 return 0;
527
528 encl_mm = kzalloc(sizeof(*encl_mm), GFP_KERNEL);
529 if (!encl_mm)
530 return -ENOMEM;
531
532
533 kref_get(&encl->refcount);
534 encl_mm->encl = encl;
535 encl_mm->mm = mm;
536 encl_mm->mmu_notifier.ops = &sgx_mmu_notifier_ops;
537
538 ret = __mmu_notifier_register(&encl_mm->mmu_notifier, mm);
539 if (ret) {
540 kfree(encl_mm);
541 return ret;
542 }
543
544 spin_lock(&encl->mm_lock);
545 list_add_rcu(&encl_mm->list, &encl->mm_list);
546
547 smp_wmb();
548 encl->mm_list_version++;
549 spin_unlock(&encl->mm_lock);
550
551 return 0;
552}
553
554static struct page *sgx_encl_get_backing_page(struct sgx_encl *encl,
555 pgoff_t index)
556{
557 struct inode *inode = encl->backing->f_path.dentry->d_inode;
558 struct address_space *mapping = inode->i_mapping;
559 gfp_t gfpmask = mapping_gfp_mask(mapping);
560
561 return shmem_read_mapping_page_gfp(mapping, index, gfpmask);
562}
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577int sgx_encl_get_backing(struct sgx_encl *encl, unsigned long page_index,
578 struct sgx_backing *backing)
579{
580 pgoff_t pcmd_index = PFN_DOWN(encl->size) + 1 + (page_index >> 5);
581 struct page *contents;
582 struct page *pcmd;
583
584 contents = sgx_encl_get_backing_page(encl, page_index);
585 if (IS_ERR(contents))
586 return PTR_ERR(contents);
587
588 pcmd = sgx_encl_get_backing_page(encl, pcmd_index);
589 if (IS_ERR(pcmd)) {
590 put_page(contents);
591 return PTR_ERR(pcmd);
592 }
593
594 backing->page_index = page_index;
595 backing->contents = contents;
596 backing->pcmd = pcmd;
597 backing->pcmd_offset =
598 (page_index & (PAGE_SIZE / sizeof(struct sgx_pcmd) - 1)) *
599 sizeof(struct sgx_pcmd);
600
601 return 0;
602}
603
604
605
606
607
608
609void sgx_encl_put_backing(struct sgx_backing *backing, bool do_write)
610{
611 if (do_write) {
612 set_page_dirty(backing->pcmd);
613 set_page_dirty(backing->contents);
614 }
615
616 put_page(backing->pcmd);
617 put_page(backing->contents);
618}
619
620static int sgx_encl_test_and_clear_young_cb(pte_t *ptep, unsigned long addr,
621 void *data)
622{
623 pte_t pte;
624 int ret;
625
626 ret = pte_young(*ptep);
627 if (ret) {
628 pte = pte_mkold(*ptep);
629 set_pte_at((struct mm_struct *)data, addr, ptep, pte);
630 }
631
632 return ret;
633}
634
635
636
637
638
639
640
641
642
643
644
645int sgx_encl_test_and_clear_young(struct mm_struct *mm,
646 struct sgx_encl_page *page)
647{
648 unsigned long addr = page->desc & PAGE_MASK;
649 struct sgx_encl *encl = page->encl;
650 struct vm_area_struct *vma;
651 int ret;
652
653 ret = sgx_encl_find(mm, addr, &vma);
654 if (ret)
655 return 0;
656
657 if (encl != vma->vm_private_data)
658 return 0;
659
660 ret = apply_to_page_range(vma->vm_mm, addr, PAGE_SIZE,
661 sgx_encl_test_and_clear_young_cb, vma->vm_mm);
662 if (ret < 0)
663 return 0;
664
665 return ret;
666}
667
668
669
670
671
672
673
674
675
676
677struct sgx_epc_page *sgx_alloc_va_page(void)
678{
679 struct sgx_epc_page *epc_page;
680 int ret;
681
682 epc_page = sgx_alloc_epc_page(NULL, true);
683 if (IS_ERR(epc_page))
684 return ERR_CAST(epc_page);
685
686 ret = __epa(sgx_get_epc_virt_addr(epc_page));
687 if (ret) {
688 WARN_ONCE(1, "EPA returned %d (0x%x)", ret, ret);
689 sgx_encl_free_epc_page(epc_page);
690 return ERR_PTR(-EFAULT);
691 }
692
693 return epc_page;
694}
695
696
697
698
699
700
701
702
703
704unsigned int sgx_alloc_va_slot(struct sgx_va_page *va_page)
705{
706 int slot = find_first_zero_bit(va_page->slots, SGX_VA_SLOT_COUNT);
707
708 if (slot < SGX_VA_SLOT_COUNT)
709 set_bit(slot, va_page->slots);
710
711 return slot << 3;
712}
713
714
715
716
717
718
719
720
721void sgx_free_va_slot(struct sgx_va_page *va_page, unsigned int offset)
722{
723 clear_bit(offset >> 3, va_page->slots);
724}
725
726
727
728
729
730
731
732bool sgx_va_page_full(struct sgx_va_page *va_page)
733{
734 int slot = find_first_zero_bit(va_page->slots, SGX_VA_SLOT_COUNT);
735
736 return slot == SGX_VA_SLOT_COUNT;
737}
738
739
740
741
742
743
744
745
746
747void sgx_encl_free_epc_page(struct sgx_epc_page *page)
748{
749 int ret;
750
751 WARN_ON_ONCE(page->flags & SGX_EPC_PAGE_RECLAIMER_TRACKED);
752
753 ret = __eremove(sgx_get_epc_virt_addr(page));
754 if (WARN_ONCE(ret, EREMOVE_ERROR_MESSAGE, ret, ret))
755 return;
756
757 sgx_free_epc_page(page);
758}
759