#include <drm/drm_auth.h>
#include "amdgpu.h"
#include "amdgpu_sched.h"
#include "amdgpu_ras.h"
#include <linux/nospec.h>

#define to_amdgpu_ctx_entity(e)	\
	container_of((e), struct amdgpu_ctx_entity, entity)

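/* Number of scheduler entities (rings visible to user space) per HW IP type */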
const unsigned int amdgpu_ctx_num_entities[AMDGPU_HW_IP_NUM] = {
	[AMDGPU_HW_IP_GFX]	= 1,
	[AMDGPU_HW_IP_COMPUTE]	= 4,
	[AMDGPU_HW_IP_DMA]	= 2,
	[AMDGPU_HW_IP_UVD]	= 1,
	[AMDGPU_HW_IP_VCE]	= 1,
	[AMDGPU_HW_IP_UVD_ENC]	= 1,
	[AMDGPU_HW_IP_VCN_DEC]	= 1,
	[AMDGPU_HW_IP_VCN_ENC]	= 1,
	[AMDGPU_HW_IP_VCN_JPEG]	= 1,
};

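/*
 * Check whether the caller is allowed to create a context with the
 * requested scheduler priority. Priorities above NORMAL require
 * CAP_SYS_NICE or DRM master status.
 */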
static int amdgpu_ctx_priority_permit(struct drm_file *filp,
				      enum drm_sched_priority priority)
{
	if (priority < 0 || priority >= DRM_SCHED_PRIORITY_COUNT)
		return -EINVAL;

	/* NORMAL and below are accessible by everyone */
	if (priority <= DRM_SCHED_PRIORITY_NORMAL)
		return 0;

	if (capable(CAP_SYS_NICE))
		return 0;

	if (drm_is_current_master(filp))
		return 0;

	return -EACCES;
}

static enum gfx_pipe_priority amdgpu_ctx_sched_prio_to_compute_prio(enum drm_sched_priority prio)
{
	switch (prio) {
	case DRM_SCHED_PRIORITY_HIGH:
	case DRM_SCHED_PRIORITY_KERNEL:
		return AMDGPU_GFX_PIPE_PRIO_HIGH;
	default:
		return AMDGPU_GFX_PIPE_PRIO_NORMAL;
	}
}

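/*
 * Map a drm_sched priority to a hardware ring priority for the given HW IP.
 * Falls back to AMDGPU_RING_PRIO_DEFAULT when no scheduler is registered
 * for the selected priority level.
 */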
static unsigned int amdgpu_ctx_prio_sched_to_hw(struct amdgpu_device *adev,
						enum drm_sched_priority prio,
						u32 hw_ip)
{
	unsigned int hw_prio;

	hw_prio = (hw_ip == AMDGPU_HW_IP_COMPUTE) ?
			amdgpu_ctx_sched_prio_to_compute_prio(prio) :
			AMDGPU_RING_PRIO_DEFAULT;
	hw_ip = array_index_nospec(hw_ip, AMDGPU_HW_IP_NUM);
	if (adev->gpu_sched[hw_ip][hw_prio].num_scheds == 0)
		hw_prio = AMDGPU_RING_PRIO_DEFAULT;

	return hw_prio;
}

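/*
 * Allocate and initialize the scheduler entity for one ring of a context
 * and store it in ctx->entities[hw_ip][ring].
 */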
static int amdgpu_ctx_init_entity(struct amdgpu_ctx *ctx, u32 hw_ip,
				  const u32 ring)
{
	struct amdgpu_device *adev = ctx->adev;
	struct amdgpu_ctx_entity *entity;
	struct drm_gpu_scheduler **scheds = NULL, *sched = NULL;
	unsigned num_scheds = 0;
	unsigned int hw_prio;
	enum drm_sched_priority priority;
	int r;

	entity = kzalloc(struct_size(entity, fences, amdgpu_sched_jobs),
			 GFP_KERNEL);
	if (!entity)
		return -ENOMEM;

	entity->sequence = 1;
	priority = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
			ctx->init_priority : ctx->override_priority;
	hw_prio = amdgpu_ctx_prio_sched_to_hw(adev, priority, hw_ip);

	hw_ip = array_index_nospec(hw_ip, AMDGPU_HW_IP_NUM);
	scheds = adev->gpu_sched[hw_ip][hw_prio].sched;
	num_scheds = adev->gpu_sched[hw_ip][hw_prio].num_scheds;

	/* disable load balancing if the hw engine retains context among dependent jobs */
	if (hw_ip == AMDGPU_HW_IP_VCN_ENC ||
	    hw_ip == AMDGPU_HW_IP_VCN_DEC ||
	    hw_ip == AMDGPU_HW_IP_UVD_ENC ||
	    hw_ip == AMDGPU_HW_IP_UVD) {
		sched = drm_sched_pick_best(scheds, num_scheds);
		scheds = &sched;
		num_scheds = 1;
	}

	r = drm_sched_entity_init(&entity->entity, priority, scheds, num_scheds,
				  &ctx->guilty);
	if (r)
		goto error_free_entity;

	ctx->entities[hw_ip][ring] = entity;
	return 0;

error_free_entity:
	kfree(entity);

	return r;
}

static int amdgpu_ctx_init(struct amdgpu_device *adev,
			   enum drm_sched_priority priority,
			   struct drm_file *filp,
			   struct amdgpu_ctx *ctx)
{
	int r;

	r = amdgpu_ctx_priority_permit(filp, priority);
	if (r)
		return r;

	memset(ctx, 0, sizeof(*ctx));

	ctx->adev = adev;

	kref_init(&ctx->refcount);
	spin_lock_init(&ctx->ring_lock);
	mutex_init(&ctx->lock);

	ctx->reset_counter = atomic_read(&adev->gpu_reset_counter);
	ctx->reset_counter_query = ctx->reset_counter;
	ctx->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
	ctx->init_priority = priority;
	ctx->override_priority = DRM_SCHED_PRIORITY_UNSET;

	return 0;
}

static void amdgpu_ctx_fini_entity(struct amdgpu_ctx_entity *entity)
{
	int i;

	if (!entity)
		return;

	for (i = 0; i < amdgpu_sched_jobs; ++i)
		dma_fence_put(entity->fences[i]);

	kfree(entity);
}

static void amdgpu_ctx_fini(struct kref *ref)
{
	struct amdgpu_ctx *ctx = container_of(ref, struct amdgpu_ctx, refcount);
	struct amdgpu_device *adev = ctx->adev;
	unsigned i, j;

	if (!adev)
		return;

	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
		for (j = 0; j < AMDGPU_MAX_ENTITY_NUM; ++j) {
			amdgpu_ctx_fini_entity(ctx->entities[i][j]);
			ctx->entities[i][j] = NULL;
		}
	}

	mutex_destroy(&ctx->lock);
	kfree(ctx);
}

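/*
 * Look up the scheduler entity for a (hw_ip, instance, ring) triple,
 * creating it on first use. Returns -EINVAL for out-of-range parameters.
 */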
int amdgpu_ctx_get_entity(struct amdgpu_ctx *ctx, u32 hw_ip, u32 instance,
			  u32 ring, struct drm_sched_entity **entity)
{
	int r;

	if (hw_ip >= AMDGPU_HW_IP_NUM) {
		DRM_ERROR("unknown HW IP type: %d\n", hw_ip);
		return -EINVAL;
	}

	/* Right now all IPs have only one instance - multiple rings. */
	if (instance != 0) {
		DRM_DEBUG("invalid ip instance: %d\n", instance);
		return -EINVAL;
	}

	if (ring >= amdgpu_ctx_num_entities[hw_ip]) {
		DRM_DEBUG("invalid ring: %d %d\n", hw_ip, ring);
		return -EINVAL;
	}

	if (ctx->entities[hw_ip][ring] == NULL) {
		r = amdgpu_ctx_init_entity(ctx, hw_ip, ring);
		if (r)
			return r;
	}

	*entity = &ctx->entities[hw_ip][ring]->entity;
	return 0;
}

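/*
 * Allocate a new context, insert it into the per-file handle IDR and
 * return the handle through @id.
 */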
static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
			    struct amdgpu_fpriv *fpriv,
			    struct drm_file *filp,
			    enum drm_sched_priority priority,
			    uint32_t *id)
{
	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
	struct amdgpu_ctx *ctx;
	int r;

	ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
	if (!ctx)
		return -ENOMEM;

	mutex_lock(&mgr->lock);
	r = idr_alloc(&mgr->ctx_handles, ctx, 1, AMDGPU_VM_MAX_NUM_CTX, GFP_KERNEL);
	if (r < 0) {
		mutex_unlock(&mgr->lock);
		kfree(ctx);
		return r;
	}

	*id = (uint32_t)r;
	r = amdgpu_ctx_init(adev, priority, filp, ctx);
	if (r) {
		idr_remove(&mgr->ctx_handles, *id);
		*id = 0;
		kfree(ctx);
	}
	mutex_unlock(&mgr->lock);
	return r;
}

static void amdgpu_ctx_do_release(struct kref *ref)
{
	struct amdgpu_ctx *ctx;
	u32 i, j;

	ctx = container_of(ref, struct amdgpu_ctx, refcount);
	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
		for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
			if (!ctx->entities[i][j])
				continue;

			drm_sched_entity_destroy(&ctx->entities[i][j]->entity);
		}
	}

	amdgpu_ctx_fini(ref);
}

static int amdgpu_ctx_free(struct amdgpu_fpriv *fpriv, uint32_t id)
{
	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
	struct amdgpu_ctx *ctx;

	mutex_lock(&mgr->lock);
	ctx = idr_remove(&mgr->ctx_handles, id);
	if (ctx)
		kref_put(&ctx->refcount, amdgpu_ctx_do_release);
	mutex_unlock(&mgr->lock);
	return ctx ? 0 : -EINVAL;
}

static int amdgpu_ctx_query(struct amdgpu_device *adev,
			    struct amdgpu_fpriv *fpriv, uint32_t id,
			    union drm_amdgpu_ctx_out *out)
{
	struct amdgpu_ctx *ctx;
	struct amdgpu_ctx_mgr *mgr;
	unsigned reset_counter;

	if (!fpriv)
		return -EINVAL;

	mgr = &fpriv->ctx_mgr;
	mutex_lock(&mgr->lock);
	ctx = idr_find(&mgr->ctx_handles, id);
	if (!ctx) {
		mutex_unlock(&mgr->lock);
		return -EINVAL;
	}

	/* TODO: these two are always zero */
	out->state.flags = 0x0;
	out->state.hangs = 0x0;

	/* determine if a GPU reset has occurred since the last call */
	reset_counter = atomic_read(&adev->gpu_reset_counter);
	if (ctx->reset_counter_query == reset_counter)
		out->state.reset_status = AMDGPU_CTX_NO_RESET;
	else
		out->state.reset_status = AMDGPU_CTX_UNKNOWN_RESET;
	ctx->reset_counter_query = reset_counter;

	mutex_unlock(&mgr->lock);
	return 0;
}

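/*
 * Extended context state query: reports reset, VRAM loss, guilty status and
 * RAS correctable/uncorrectable error activity as flag bits.
 */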
static int amdgpu_ctx_query2(struct amdgpu_device *adev,
			     struct amdgpu_fpriv *fpriv, uint32_t id,
			     union drm_amdgpu_ctx_out *out)
{
	struct amdgpu_ctx *ctx;
	struct amdgpu_ctx_mgr *mgr;
	unsigned long ras_counter;

	if (!fpriv)
		return -EINVAL;

	mgr = &fpriv->ctx_mgr;
	mutex_lock(&mgr->lock);
	ctx = idr_find(&mgr->ctx_handles, id);
	if (!ctx) {
		mutex_unlock(&mgr->lock);
		return -EINVAL;
	}

	out->state.flags = 0x0;
	out->state.hangs = 0x0;

	if (ctx->reset_counter != atomic_read(&adev->gpu_reset_counter))
		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RESET;

	if (ctx->vram_lost_counter != atomic_read(&adev->vram_lost_counter))
		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_VRAMLOST;

	if (atomic_read(&ctx->guilty))
		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_GUILTY;

	/* query uncorrectable (UE) error count */
	ras_counter = amdgpu_ras_query_error_count(adev, false);
	if (ras_counter != ctx->ras_counter_ue) {
		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RAS_UE;
		ctx->ras_counter_ue = ras_counter;
	}

	/* query correctable (CE) error count */
	ras_counter = amdgpu_ras_query_error_count(adev, true);
	if (ras_counter != ctx->ras_counter_ce) {
		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RAS_CE;
		ctx->ras_counter_ce = ras_counter;
	}

	mutex_unlock(&mgr->lock);
	return 0;
}

int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
		     struct drm_file *filp)
{
	int r;
	uint32_t id;
	enum drm_sched_priority priority;

	union drm_amdgpu_ctx *args = data;
	struct amdgpu_device *adev = drm_to_adev(dev);
	struct amdgpu_fpriv *fpriv = filp->driver_priv;

	id = args->in.ctx_id;
	r = amdgpu_to_sched_priority(args->in.priority, &priority);

	/* For backwards compatibility, we need to accept ioctls with garbage
	 * in the priority field and fall back to NORMAL.
	 */
	if (r == -EINVAL)
		priority = DRM_SCHED_PRIORITY_NORMAL;

	switch (args->in.op) {
	case AMDGPU_CTX_OP_ALLOC_CTX:
		r = amdgpu_ctx_alloc(adev, fpriv, filp, priority, &id);
		args->out.alloc.ctx_id = id;
		break;
	case AMDGPU_CTX_OP_FREE_CTX:
		r = amdgpu_ctx_free(fpriv, id);
		break;
	case AMDGPU_CTX_OP_QUERY_STATE:
		r = amdgpu_ctx_query(adev, fpriv, id, &args->out);
		break;
	case AMDGPU_CTX_OP_QUERY_STATE2:
		r = amdgpu_ctx_query2(adev, fpriv, id, &args->out);
		break;
	default:
		return -EINVAL;
	}

	return r;
}

struct amdgpu_ctx *amdgpu_ctx_get(struct amdgpu_fpriv *fpriv, uint32_t id)
{
	struct amdgpu_ctx *ctx;
	struct amdgpu_ctx_mgr *mgr;

	if (!fpriv)
		return NULL;

	mgr = &fpriv->ctx_mgr;

	mutex_lock(&mgr->lock);
	ctx = idr_find(&mgr->ctx_handles, id);
	if (ctx)
		kref_get(&ctx->refcount);
	mutex_unlock(&mgr->lock);
	return ctx;
}

int amdgpu_ctx_put(struct amdgpu_ctx *ctx)
{
	if (ctx == NULL)
		return -EINVAL;

	kref_put(&ctx->refcount, amdgpu_ctx_do_release);
	return 0;
}

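/*
 * Store a submitted fence in the entity's fence ring buffer and hand back
 * the sequence number used as the user-visible handle. The slot being
 * overwritten must already be signaled.
 */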
void amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx,
			  struct drm_sched_entity *entity,
			  struct dma_fence *fence, uint64_t *handle)
{
	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
	uint64_t seq = centity->sequence;
	struct dma_fence *other = NULL;
	unsigned idx = 0;

	idx = seq & (amdgpu_sched_jobs - 1);
	other = centity->fences[idx];
	if (other)
		BUG_ON(!dma_fence_is_signaled(other));

	dma_fence_get(fence);

	spin_lock(&ctx->ring_lock);
	centity->fences[idx] = fence;
	centity->sequence++;
	spin_unlock(&ctx->ring_lock);

	dma_fence_put(other);
	if (handle)
		*handle = seq;
}

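/*
 * Look up the fence for a given sequence number. A seq of ~0 means the most
 * recent submission. Returns ERR_PTR(-EINVAL) for sequence numbers that have
 * not been submitted yet and NULL if the fence has already left the ring
 * buffer.
 */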
struct dma_fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
				       struct drm_sched_entity *entity,
				       uint64_t seq)
{
	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
	struct dma_fence *fence;

	spin_lock(&ctx->ring_lock);

	if (seq == ~0ull)
		seq = centity->sequence - 1;

	if (seq >= centity->sequence) {
		spin_unlock(&ctx->ring_lock);
		return ERR_PTR(-EINVAL);
	}

	if (seq + amdgpu_sched_jobs < centity->sequence) {
		spin_unlock(&ctx->ring_lock);
		return NULL;
	}

	fence = dma_fence_get(centity->fences[seq & (amdgpu_sched_jobs - 1)]);
	spin_unlock(&ctx->ring_lock);

	return fence;
}

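/*
 * Apply a new priority to a single entity: update the software scheduler
 * priority and, for compute rings, move the entity to the scheduler list
 * matching the new hardware priority.
 */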
static void amdgpu_ctx_set_entity_priority(struct amdgpu_ctx *ctx,
					   struct amdgpu_ctx_entity *aentity,
					   int hw_ip,
					   enum drm_sched_priority priority)
{
	struct amdgpu_device *adev = ctx->adev;
	unsigned int hw_prio;
	struct drm_gpu_scheduler **scheds = NULL;
	unsigned num_scheds;

	/* set sw priority */
	drm_sched_entity_set_priority(&aentity->entity, priority);

	/* set hw priority */
	if (hw_ip == AMDGPU_HW_IP_COMPUTE) {
		hw_prio = amdgpu_ctx_prio_sched_to_hw(adev, priority,
						      AMDGPU_HW_IP_COMPUTE);
		hw_prio = array_index_nospec(hw_prio, AMDGPU_RING_PRIO_MAX);
		scheds = adev->gpu_sched[hw_ip][hw_prio].sched;
		num_scheds = adev->gpu_sched[hw_ip][hw_prio].num_scheds;
		drm_sched_entity_modify_sched(&aentity->entity, scheds,
					      num_scheds);
	}
}

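/*
 * Override the priority of every entity in a context;
 * DRM_SCHED_PRIORITY_UNSET falls back to the context's init priority.
 */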
void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx,
				  enum drm_sched_priority priority)
{
	enum drm_sched_priority ctx_prio;
	unsigned i, j;

	ctx->override_priority = priority;

	ctx_prio = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
			ctx->init_priority : ctx->override_priority;
	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
		for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
			if (!ctx->entities[i][j])
				continue;

			amdgpu_ctx_set_entity_priority(ctx, ctx->entities[i][j],
						       i, ctx_prio);
		}
	}
}

int amdgpu_ctx_wait_prev_fence(struct amdgpu_ctx *ctx,
			       struct drm_sched_entity *entity)
{
	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
	struct dma_fence *other;
	unsigned idx;
	long r;

	spin_lock(&ctx->ring_lock);
	idx = centity->sequence & (amdgpu_sched_jobs - 1);
	other = dma_fence_get(centity->fences[idx]);
	spin_unlock(&ctx->ring_lock);

	if (!other)
		return 0;

	r = dma_fence_wait(other, true);
	if (r < 0 && r != -ERESTARTSYS)
		DRM_ERROR("Error (%ld) waiting for fence!\n", r);

	dma_fence_put(other);
	return r;
}

void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr)
{
	mutex_init(&mgr->lock);
	idr_init(&mgr->ctx_handles);
}

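/*
 * Flush all entities of all contexts owned by this file, giving queued jobs
 * up to @timeout to drain. Returns the remaining timeout.
 */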
long amdgpu_ctx_mgr_entity_flush(struct amdgpu_ctx_mgr *mgr, long timeout)
{
	struct amdgpu_ctx *ctx;
	struct idr *idp;
	uint32_t id, i, j;

	idp = &mgr->ctx_handles;

	mutex_lock(&mgr->lock);
	idr_for_each_entry(idp, ctx, id) {
		for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
			for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
				struct drm_sched_entity *entity;

				if (!ctx->entities[i][j])
					continue;

				entity = &ctx->entities[i][j]->entity;
				timeout = drm_sched_entity_flush(entity, timeout);
			}
		}
	}
	mutex_unlock(&mgr->lock);
	return timeout;
}

void amdgpu_ctx_mgr_entity_fini(struct amdgpu_ctx_mgr *mgr)
{
	struct amdgpu_ctx *ctx;
	struct idr *idp;
	uint32_t id, i, j;

	idp = &mgr->ctx_handles;

	idr_for_each_entry(idp, ctx, id) {
		if (kref_read(&ctx->refcount) != 1) {
			DRM_ERROR("ctx %p is still alive\n", ctx);
			continue;
		}

		for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
			for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
				struct drm_sched_entity *entity;

				if (!ctx->entities[i][j])
					continue;

				entity = &ctx->entities[i][j]->entity;
				drm_sched_entity_fini(entity);
			}
		}
	}
}

void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr)
{
	struct amdgpu_ctx *ctx;
	struct idr *idp;
	uint32_t id;

	amdgpu_ctx_mgr_entity_fini(mgr);

	idp = &mgr->ctx_handles;

	idr_for_each_entry(idp, ctx, id) {
		if (kref_put(&ctx->refcount, amdgpu_ctx_fini) != 1)
			DRM_ERROR("ctx %p is still alive\n", ctx);
	}

	idr_destroy(&mgr->ctx_handles);
	mutex_destroy(&mgr->lock);
}