1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32#include <linux/atomic.h>
33#include <linux/firmware.h>
34#include <linux/kref.h>
35#include <linux/sched/signal.h>
36#include <linux/seq_file.h>
37#include <linux/slab.h>
38#include <linux/wait.h>
39
40#include <drm/drm_device.h>
41#include <drm/drm_file.h>
42
43#include "radeon.h"
44#include "radeon_reg.h"
45#include "radeon_trace.h"
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67static void radeon_fence_write(struct radeon_device *rdev, u32 seq, int ring)
68{
69 struct radeon_fence_driver *drv = &rdev->fence_drv[ring];
70 if (likely(rdev->wb.enabled || !drv->scratch_reg)) {
71 if (drv->cpu_addr) {
72 *drv->cpu_addr = cpu_to_le32(seq);
73 }
74 } else {
75 WREG32(drv->scratch_reg, seq);
76 }
77}
78
79
80
81
82
83
84
85
86
87
88static u32 radeon_fence_read(struct radeon_device *rdev, int ring)
89{
90 struct radeon_fence_driver *drv = &rdev->fence_drv[ring];
91 u32 seq = 0;
92
93 if (likely(rdev->wb.enabled || !drv->scratch_reg)) {
94 if (drv->cpu_addr) {
95 seq = le32_to_cpu(*drv->cpu_addr);
96 } else {
97 seq = lower_32_bits(atomic64_read(&drv->last_seq));
98 }
99 } else {
100 seq = RREG32(drv->scratch_reg);
101 }
102 return seq;
103}
104
105
106
107
108
109
110
111
112
113static void radeon_fence_schedule_check(struct radeon_device *rdev, int ring)
114{
115
116
117
118
119 queue_delayed_work(system_power_efficient_wq,
120 &rdev->fence_drv[ring].lockup_work,
121 RADEON_FENCE_JIFFIES_TIMEOUT);
122}
123
124
125
126
127
128
129
130
131
132
133
134int radeon_fence_emit(struct radeon_device *rdev,
135 struct radeon_fence **fence,
136 int ring)
137{
138 u64 seq;
139
140
141 *fence = kmalloc(sizeof(struct radeon_fence), GFP_KERNEL);
142 if ((*fence) == NULL) {
143 return -ENOMEM;
144 }
145 (*fence)->rdev = rdev;
146 (*fence)->seq = seq = ++rdev->fence_drv[ring].sync_seq[ring];
147 (*fence)->ring = ring;
148 (*fence)->is_vm_update = false;
149 dma_fence_init(&(*fence)->base, &radeon_fence_ops,
150 &rdev->fence_queue.lock,
151 rdev->fence_context + ring,
152 seq);
153 radeon_fence_ring_emit(rdev, ring, *fence);
154 trace_radeon_fence_emit(rdev->ddev, ring, (*fence)->seq);
155 radeon_fence_schedule_check(rdev, ring);
156 return 0;
157}
158
159
160
161
162
163
164
165
166static int radeon_fence_check_signaled(wait_queue_entry_t *wait, unsigned mode, int flags, void *key)
167{
168 struct radeon_fence *fence;
169 u64 seq;
170
171 fence = container_of(wait, struct radeon_fence, fence_wake);
172
173
174
175
176
177 seq = atomic64_read(&fence->rdev->fence_drv[fence->ring].last_seq);
178 if (seq >= fence->seq) {
179 int ret = dma_fence_signal_locked(&fence->base);
180
181 if (!ret)
182 DMA_FENCE_TRACE(&fence->base, "signaled from irq context\n");
183 else
184 DMA_FENCE_TRACE(&fence->base, "was already signaled\n");
185
186 radeon_irq_kms_sw_irq_put(fence->rdev, fence->ring);
187 __remove_wait_queue(&fence->rdev->fence_queue, &fence->fence_wake);
188 dma_fence_put(&fence->base);
189 } else
190 DMA_FENCE_TRACE(&fence->base, "pending\n");
191 return 0;
192}
193
194
195
196
197
198
199
200
201
202
203
204static bool radeon_fence_activity(struct radeon_device *rdev, int ring)
205{
206 uint64_t seq, last_seq, last_emitted;
207 unsigned count_loop = 0;
208 bool wake = false;
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231 last_seq = atomic64_read(&rdev->fence_drv[ring].last_seq);
232 do {
233 last_emitted = rdev->fence_drv[ring].sync_seq[ring];
234 seq = radeon_fence_read(rdev, ring);
235 seq |= last_seq & 0xffffffff00000000LL;
236 if (seq < last_seq) {
237 seq &= 0xffffffff;
238 seq |= last_emitted & 0xffffffff00000000LL;
239 }
240
241 if (seq <= last_seq || seq > last_emitted) {
242 break;
243 }
244
245
246
247
248 wake = true;
249 last_seq = seq;
250 if ((count_loop++) > 10) {
251
252
253
254
255
256 break;
257 }
258 } while (atomic64_xchg(&rdev->fence_drv[ring].last_seq, seq) > seq);
259
260 if (seq < last_emitted)
261 radeon_fence_schedule_check(rdev, ring);
262
263 return wake;
264}
265
266
267
268
269
270
271
272
273
274static void radeon_fence_check_lockup(struct work_struct *work)
275{
276 struct radeon_fence_driver *fence_drv;
277 struct radeon_device *rdev;
278 int ring;
279
280 fence_drv = container_of(work, struct radeon_fence_driver,
281 lockup_work.work);
282 rdev = fence_drv->rdev;
283 ring = fence_drv - &rdev->fence_drv[0];
284
285 if (!down_read_trylock(&rdev->exclusive_lock)) {
286
287 radeon_fence_schedule_check(rdev, ring);
288 return;
289 }
290
291 if (fence_drv->delayed_irq && rdev->irq.installed) {
292 unsigned long irqflags;
293
294 fence_drv->delayed_irq = false;
295 spin_lock_irqsave(&rdev->irq.lock, irqflags);
296 radeon_irq_set(rdev);
297 spin_unlock_irqrestore(&rdev->irq.lock, irqflags);
298 }
299
300 if (radeon_fence_activity(rdev, ring))
301 wake_up_all(&rdev->fence_queue);
302
303 else if (radeon_ring_is_lockup(rdev, ring, &rdev->ring[ring])) {
304
305
306 dev_warn(rdev->dev, "GPU lockup (current fence id "
307 "0x%016llx last fence id 0x%016llx on ring %d)\n",
308 (uint64_t)atomic64_read(&fence_drv->last_seq),
309 fence_drv->sync_seq[ring], ring);
310
311
312 rdev->needs_reset = true;
313 wake_up_all(&rdev->fence_queue);
314 }
315 up_read(&rdev->exclusive_lock);
316}
317
318
319
320
321
322
323
324
325
326
327void radeon_fence_process(struct radeon_device *rdev, int ring)
328{
329 if (radeon_fence_activity(rdev, ring))
330 wake_up_all(&rdev->fence_queue);
331}
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347static bool radeon_fence_seq_signaled(struct radeon_device *rdev,
348 u64 seq, unsigned ring)
349{
350 if (atomic64_read(&rdev->fence_drv[ring].last_seq) >= seq) {
351 return true;
352 }
353
354 radeon_fence_process(rdev, ring);
355 if (atomic64_read(&rdev->fence_drv[ring].last_seq) >= seq) {
356 return true;
357 }
358 return false;
359}
360
361static bool radeon_fence_is_signaled(struct dma_fence *f)
362{
363 struct radeon_fence *fence = to_radeon_fence(f);
364 struct radeon_device *rdev = fence->rdev;
365 unsigned ring = fence->ring;
366 u64 seq = fence->seq;
367
368 if (atomic64_read(&rdev->fence_drv[ring].last_seq) >= seq) {
369 return true;
370 }
371
372 if (down_read_trylock(&rdev->exclusive_lock)) {
373 radeon_fence_process(rdev, ring);
374 up_read(&rdev->exclusive_lock);
375
376 if (atomic64_read(&rdev->fence_drv[ring].last_seq) >= seq) {
377 return true;
378 }
379 }
380 return false;
381}
382
383
384
385
386
387
388
389
390
391static bool radeon_fence_enable_signaling(struct dma_fence *f)
392{
393 struct radeon_fence *fence = to_radeon_fence(f);
394 struct radeon_device *rdev = fence->rdev;
395
396 if (atomic64_read(&rdev->fence_drv[fence->ring].last_seq) >= fence->seq)
397 return false;
398
399 if (down_read_trylock(&rdev->exclusive_lock)) {
400 radeon_irq_kms_sw_irq_get(rdev, fence->ring);
401
402 if (radeon_fence_activity(rdev, fence->ring))
403 wake_up_all_locked(&rdev->fence_queue);
404
405
406 if (atomic64_read(&rdev->fence_drv[fence->ring].last_seq) >= fence->seq) {
407 radeon_irq_kms_sw_irq_put(rdev, fence->ring);
408 up_read(&rdev->exclusive_lock);
409 return false;
410 }
411
412 up_read(&rdev->exclusive_lock);
413 } else {
414
415 if (radeon_irq_kms_sw_irq_get_delayed(rdev, fence->ring))
416 rdev->fence_drv[fence->ring].delayed_irq = true;
417 radeon_fence_schedule_check(rdev, fence->ring);
418 }
419
420 fence->fence_wake.flags = 0;
421 fence->fence_wake.private = NULL;
422 fence->fence_wake.func = radeon_fence_check_signaled;
423 __add_wait_queue(&rdev->fence_queue, &fence->fence_wake);
424 dma_fence_get(f);
425
426 DMA_FENCE_TRACE(&fence->base, "armed on ring %i!\n", fence->ring);
427 return true;
428}
429
430
431
432
433
434
435
436
437
438bool radeon_fence_signaled(struct radeon_fence *fence)
439{
440 if (!fence)
441 return true;
442
443 if (radeon_fence_seq_signaled(fence->rdev, fence->seq, fence->ring)) {
444 int ret;
445
446 ret = dma_fence_signal(&fence->base);
447 if (!ret)
448 DMA_FENCE_TRACE(&fence->base, "signaled from radeon_fence_signaled\n");
449 return true;
450 }
451 return false;
452}
453
454
455
456
457
458
459
460
461
462
463
464
465static bool radeon_fence_any_seq_signaled(struct radeon_device *rdev, u64 *seq)
466{
467 unsigned i;
468
469 for (i = 0; i < RADEON_NUM_RINGS; ++i) {
470 if (seq[i] && radeon_fence_seq_signaled(rdev, seq[i], i))
471 return true;
472 }
473 return false;
474}
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493static long radeon_fence_wait_seq_timeout(struct radeon_device *rdev,
494 u64 *target_seq, bool intr,
495 long timeout)
496{
497 long r;
498 int i;
499
500 if (radeon_fence_any_seq_signaled(rdev, target_seq))
501 return timeout;
502
503
504 for (i = 0; i < RADEON_NUM_RINGS; ++i) {
505 if (!target_seq[i])
506 continue;
507
508 trace_radeon_fence_wait_begin(rdev->ddev, i, target_seq[i]);
509 radeon_irq_kms_sw_irq_get(rdev, i);
510 }
511
512 if (intr) {
513 r = wait_event_interruptible_timeout(rdev->fence_queue, (
514 radeon_fence_any_seq_signaled(rdev, target_seq)
515 || rdev->needs_reset), timeout);
516 } else {
517 r = wait_event_timeout(rdev->fence_queue, (
518 radeon_fence_any_seq_signaled(rdev, target_seq)
519 || rdev->needs_reset), timeout);
520 }
521
522 if (rdev->needs_reset)
523 r = -EDEADLK;
524
525 for (i = 0; i < RADEON_NUM_RINGS; ++i) {
526 if (!target_seq[i])
527 continue;
528
529 radeon_irq_kms_sw_irq_put(rdev, i);
530 trace_radeon_fence_wait_end(rdev->ddev, i, target_seq[i]);
531 }
532
533 return r;
534}
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549long radeon_fence_wait_timeout(struct radeon_fence *fence, bool intr, long timeout)
550{
551 uint64_t seq[RADEON_NUM_RINGS] = {};
552 long r;
553 int r_sig;
554
555
556
557
558
559
560
561 if (WARN_ON_ONCE(!to_radeon_fence(&fence->base)))
562 return dma_fence_wait(&fence->base, intr);
563
564 seq[fence->ring] = fence->seq;
565 r = radeon_fence_wait_seq_timeout(fence->rdev, seq, intr, timeout);
566 if (r <= 0) {
567 return r;
568 }
569
570 r_sig = dma_fence_signal(&fence->base);
571 if (!r_sig)
572 DMA_FENCE_TRACE(&fence->base, "signaled from fence_wait\n");
573 return r;
574}
575
576
577
578
579
580
581
582
583
584
585
586
587int radeon_fence_wait(struct radeon_fence *fence, bool intr)
588{
589 long r = radeon_fence_wait_timeout(fence, intr, MAX_SCHEDULE_TIMEOUT);
590 if (r > 0) {
591 return 0;
592 } else {
593 return r;
594 }
595}
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610int radeon_fence_wait_any(struct radeon_device *rdev,
611 struct radeon_fence **fences,
612 bool intr)
613{
614 uint64_t seq[RADEON_NUM_RINGS];
615 unsigned i, num_rings = 0;
616 long r;
617
618 for (i = 0; i < RADEON_NUM_RINGS; ++i) {
619 seq[i] = 0;
620
621 if (!fences[i]) {
622 continue;
623 }
624
625 seq[i] = fences[i]->seq;
626 ++num_rings;
627 }
628
629
630 if (num_rings == 0)
631 return -ENOENT;
632
633 r = radeon_fence_wait_seq_timeout(rdev, seq, intr, MAX_SCHEDULE_TIMEOUT);
634 if (r < 0) {
635 return r;
636 }
637 return 0;
638}
639
640
641
642
643
644
645
646
647
648
649
650int radeon_fence_wait_next(struct radeon_device *rdev, int ring)
651{
652 uint64_t seq[RADEON_NUM_RINGS] = {};
653 long r;
654
655 seq[ring] = atomic64_read(&rdev->fence_drv[ring].last_seq) + 1ULL;
656 if (seq[ring] >= rdev->fence_drv[ring].sync_seq[ring]) {
657
658
659 return -ENOENT;
660 }
661 r = radeon_fence_wait_seq_timeout(rdev, seq, false, MAX_SCHEDULE_TIMEOUT);
662 if (r < 0)
663 return r;
664 return 0;
665}
666
667
668
669
670
671
672
673
674
675
676
677int radeon_fence_wait_empty(struct radeon_device *rdev, int ring)
678{
679 uint64_t seq[RADEON_NUM_RINGS] = {};
680 long r;
681
682 seq[ring] = rdev->fence_drv[ring].sync_seq[ring];
683 if (!seq[ring])
684 return 0;
685
686 r = radeon_fence_wait_seq_timeout(rdev, seq, false, MAX_SCHEDULE_TIMEOUT);
687 if (r < 0) {
688 if (r == -EDEADLK)
689 return -EDEADLK;
690
691 dev_err(rdev->dev, "error waiting for ring[%d] to become idle (%ld)\n",
692 ring, r);
693 }
694 return 0;
695}
696
697
698
699
700
701
702
703
704
705struct radeon_fence *radeon_fence_ref(struct radeon_fence *fence)
706{
707 dma_fence_get(&fence->base);
708 return fence;
709}
710
711
712
713
714
715
716
717
718void radeon_fence_unref(struct radeon_fence **fence)
719{
720 struct radeon_fence *tmp = *fence;
721
722 *fence = NULL;
723 if (tmp) {
724 dma_fence_put(&tmp->base);
725 }
726}
727
728
729
730
731
732
733
734
735
736
737
738unsigned radeon_fence_count_emitted(struct radeon_device *rdev, int ring)
739{
740 uint64_t emitted;
741
742
743
744
745 radeon_fence_process(rdev, ring);
746 emitted = rdev->fence_drv[ring].sync_seq[ring]
747 - atomic64_read(&rdev->fence_drv[ring].last_seq);
748
749 if (emitted > 0x10000000) {
750 emitted = 0x10000000;
751 }
752 return (unsigned)emitted;
753}
754
755
756
757
758
759
760
761
762
763
764
765
766bool radeon_fence_need_sync(struct radeon_fence *fence, int dst_ring)
767{
768 struct radeon_fence_driver *fdrv;
769
770 if (!fence) {
771 return false;
772 }
773
774 if (fence->ring == dst_ring) {
775 return false;
776 }
777
778
779 fdrv = &fence->rdev->fence_drv[dst_ring];
780 if (fence->seq <= fdrv->sync_seq[fence->ring]) {
781 return false;
782 }
783
784 return true;
785}
786
787
788
789
790
791
792
793
794
795
796void radeon_fence_note_sync(struct radeon_fence *fence, int dst_ring)
797{
798 struct radeon_fence_driver *dst, *src;
799 unsigned i;
800
801 if (!fence) {
802 return;
803 }
804
805 if (fence->ring == dst_ring) {
806 return;
807 }
808
809
810 src = &fence->rdev->fence_drv[fence->ring];
811 dst = &fence->rdev->fence_drv[dst_ring];
812 for (i = 0; i < RADEON_NUM_RINGS; ++i) {
813 if (i == dst_ring) {
814 continue;
815 }
816 dst->sync_seq[i] = max(dst->sync_seq[i], src->sync_seq[i]);
817 }
818}
819
820
821
822
823
824
825
826
827
828
829
830
831
832int radeon_fence_driver_start_ring(struct radeon_device *rdev, int ring)
833{
834 uint64_t index;
835 int r;
836
837 radeon_scratch_free(rdev, rdev->fence_drv[ring].scratch_reg);
838 if (rdev->wb.use_event || !radeon_ring_supports_scratch_reg(rdev, &rdev->ring[ring])) {
839 rdev->fence_drv[ring].scratch_reg = 0;
840 if (ring != R600_RING_TYPE_UVD_INDEX) {
841 index = R600_WB_EVENT_OFFSET + ring * 4;
842 rdev->fence_drv[ring].cpu_addr = &rdev->wb.wb[index/4];
843 rdev->fence_drv[ring].gpu_addr = rdev->wb.gpu_addr +
844 index;
845
846 } else {
847
848 index = ALIGN(rdev->uvd_fw->size, 8);
849 rdev->fence_drv[ring].cpu_addr = rdev->uvd.cpu_addr + index;
850 rdev->fence_drv[ring].gpu_addr = rdev->uvd.gpu_addr + index;
851 }
852
853 } else {
854 r = radeon_scratch_get(rdev, &rdev->fence_drv[ring].scratch_reg);
855 if (r) {
856 dev_err(rdev->dev, "fence failed to get scratch register\n");
857 return r;
858 }
859 index = RADEON_WB_SCRATCH_OFFSET +
860 rdev->fence_drv[ring].scratch_reg -
861 rdev->scratch.reg_base;
862 rdev->fence_drv[ring].cpu_addr = &rdev->wb.wb[index/4];
863 rdev->fence_drv[ring].gpu_addr = rdev->wb.gpu_addr + index;
864 }
865 radeon_fence_write(rdev, atomic64_read(&rdev->fence_drv[ring].last_seq), ring);
866 rdev->fence_drv[ring].initialized = true;
867 dev_info(rdev->dev, "fence driver on ring %d use gpu addr 0x%016llx\n",
868 ring, rdev->fence_drv[ring].gpu_addr);
869 return 0;
870}
871
872
873
874
875
876
877
878
879
880
881
882static void radeon_fence_driver_init_ring(struct radeon_device *rdev, int ring)
883{
884 int i;
885
886 rdev->fence_drv[ring].scratch_reg = -1;
887 rdev->fence_drv[ring].cpu_addr = NULL;
888 rdev->fence_drv[ring].gpu_addr = 0;
889 for (i = 0; i < RADEON_NUM_RINGS; ++i)
890 rdev->fence_drv[ring].sync_seq[i] = 0;
891 atomic64_set(&rdev->fence_drv[ring].last_seq, 0);
892 rdev->fence_drv[ring].initialized = false;
893 INIT_DELAYED_WORK(&rdev->fence_drv[ring].lockup_work,
894 radeon_fence_check_lockup);
895 rdev->fence_drv[ring].rdev = rdev;
896}
897
898
899
900
901
902
903
904
905
906
907
908
909void radeon_fence_driver_init(struct radeon_device *rdev)
910{
911 int ring;
912
913 init_waitqueue_head(&rdev->fence_queue);
914 for (ring = 0; ring < RADEON_NUM_RINGS; ring++) {
915 radeon_fence_driver_init_ring(rdev, ring);
916 }
917
918 radeon_debugfs_fence_init(rdev);
919}
920
921
922
923
924
925
926
927
928
929void radeon_fence_driver_fini(struct radeon_device *rdev)
930{
931 int ring, r;
932
933 mutex_lock(&rdev->ring_lock);
934 for (ring = 0; ring < RADEON_NUM_RINGS; ring++) {
935 if (!rdev->fence_drv[ring].initialized)
936 continue;
937 r = radeon_fence_wait_empty(rdev, ring);
938 if (r) {
939
940 radeon_fence_driver_force_completion(rdev, ring);
941 }
942 cancel_delayed_work_sync(&rdev->fence_drv[ring].lockup_work);
943 wake_up_all(&rdev->fence_queue);
944 radeon_scratch_free(rdev, rdev->fence_drv[ring].scratch_reg);
945 rdev->fence_drv[ring].initialized = false;
946 }
947 mutex_unlock(&rdev->ring_lock);
948}
949
950
951
952
953
954
955
956
957
958
959void radeon_fence_driver_force_completion(struct radeon_device *rdev, int ring)
960{
961 if (rdev->fence_drv[ring].initialized) {
962 radeon_fence_write(rdev, rdev->fence_drv[ring].sync_seq[ring], ring);
963 cancel_delayed_work_sync(&rdev->fence_drv[ring].lockup_work);
964 }
965}
966
967
968
969
970
971#if defined(CONFIG_DEBUG_FS)
972static int radeon_debugfs_fence_info_show(struct seq_file *m, void *data)
973{
974 struct radeon_device *rdev = (struct radeon_device *)m->private;
975 int i, j;
976
977 for (i = 0; i < RADEON_NUM_RINGS; ++i) {
978 if (!rdev->fence_drv[i].initialized)
979 continue;
980
981 radeon_fence_process(rdev, i);
982
983 seq_printf(m, "--- ring %d ---\n", i);
984 seq_printf(m, "Last signaled fence 0x%016llx\n",
985 (unsigned long long)atomic64_read(&rdev->fence_drv[i].last_seq));
986 seq_printf(m, "Last emitted 0x%016llx\n",
987 rdev->fence_drv[i].sync_seq[i]);
988
989 for (j = 0; j < RADEON_NUM_RINGS; ++j) {
990 if (i != j && rdev->fence_drv[j].initialized)
991 seq_printf(m, "Last sync to ring %d 0x%016llx\n",
992 j, rdev->fence_drv[i].sync_seq[j]);
993 }
994 }
995 return 0;
996}
997
998
999
1000
1001
1002
1003static int radeon_debugfs_gpu_reset(void *data, u64 *val)
1004{
1005 struct radeon_device *rdev = (struct radeon_device *)data;
1006
1007 down_read(&rdev->exclusive_lock);
1008 *val = rdev->needs_reset;
1009 rdev->needs_reset = true;
1010 wake_up_all(&rdev->fence_queue);
1011 up_read(&rdev->exclusive_lock);
1012
1013 return 0;
1014}
1015DEFINE_SHOW_ATTRIBUTE(radeon_debugfs_fence_info);
1016DEFINE_DEBUGFS_ATTRIBUTE(radeon_debugfs_gpu_reset_fops,
1017 radeon_debugfs_gpu_reset, NULL, "%lld\n");
1018#endif
1019
1020void radeon_debugfs_fence_init(struct radeon_device *rdev)
1021{
1022#if defined(CONFIG_DEBUG_FS)
1023 struct dentry *root = rdev->ddev->primary->debugfs_root;
1024
1025 debugfs_create_file("radeon_gpu_reset", 0444, root, rdev,
1026 &radeon_debugfs_gpu_reset_fops);
1027 debugfs_create_file("radeon_fence_info", 0444, root, rdev,
1028 &radeon_debugfs_fence_info_fops);
1029
1030
1031#endif
1032}
1033
1034static const char *radeon_fence_get_driver_name(struct dma_fence *fence)
1035{
1036 return "radeon";
1037}
1038
1039static const char *radeon_fence_get_timeline_name(struct dma_fence *f)
1040{
1041 struct radeon_fence *fence = to_radeon_fence(f);
1042 switch (fence->ring) {
1043 case RADEON_RING_TYPE_GFX_INDEX: return "radeon.gfx";
1044 case CAYMAN_RING_TYPE_CP1_INDEX: return "radeon.cp1";
1045 case CAYMAN_RING_TYPE_CP2_INDEX: return "radeon.cp2";
1046 case R600_RING_TYPE_DMA_INDEX: return "radeon.dma";
1047 case CAYMAN_RING_TYPE_DMA1_INDEX: return "radeon.dma1";
1048 case R600_RING_TYPE_UVD_INDEX: return "radeon.uvd";
1049 case TN_RING_TYPE_VCE1_INDEX: return "radeon.vce1";
1050 case TN_RING_TYPE_VCE2_INDEX: return "radeon.vce2";
1051 default: WARN_ON_ONCE(1); return "radeon.unk";
1052 }
1053}
1054
1055static inline bool radeon_test_signaled(struct radeon_fence *fence)
1056{
1057 return test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &fence->base.flags);
1058}
1059
1060struct radeon_wait_cb {
1061 struct dma_fence_cb base;
1062 struct task_struct *task;
1063};
1064
1065static void
1066radeon_fence_wait_cb(struct dma_fence *fence, struct dma_fence_cb *cb)
1067{
1068 struct radeon_wait_cb *wait =
1069 container_of(cb, struct radeon_wait_cb, base);
1070
1071 wake_up_process(wait->task);
1072}
1073
1074static signed long radeon_fence_default_wait(struct dma_fence *f, bool intr,
1075 signed long t)
1076{
1077 struct radeon_fence *fence = to_radeon_fence(f);
1078 struct radeon_device *rdev = fence->rdev;
1079 struct radeon_wait_cb cb;
1080
1081 cb.task = current;
1082
1083 if (dma_fence_add_callback(f, &cb.base, radeon_fence_wait_cb))
1084 return t;
1085
1086 while (t > 0) {
1087 if (intr)
1088 set_current_state(TASK_INTERRUPTIBLE);
1089 else
1090 set_current_state(TASK_UNINTERRUPTIBLE);
1091
1092
1093
1094
1095
1096 if (radeon_test_signaled(fence))
1097 break;
1098
1099 if (rdev->needs_reset) {
1100 t = -EDEADLK;
1101 break;
1102 }
1103
1104 t = schedule_timeout(t);
1105
1106 if (t > 0 && intr && signal_pending(current))
1107 t = -ERESTARTSYS;
1108 }
1109
1110 __set_current_state(TASK_RUNNING);
1111 dma_fence_remove_callback(f, &cb.base);
1112
1113 return t;
1114}
1115
1116const struct dma_fence_ops radeon_fence_ops = {
1117 .get_driver_name = radeon_fence_get_driver_name,
1118 .get_timeline_name = radeon_fence_get_timeline_name,
1119 .enable_signaling = radeon_fence_enable_signaling,
1120 .signaled = radeon_fence_is_signaled,
1121 .wait = radeon_fence_default_wait,
1122 .release = NULL,
1123};
1124