linux/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c
/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: monk liu <monk.liu@amd.com>
 */

#include <drm/drmP.h>
#include <drm/drm_auth.h>
#include "amdgpu.h"
#include "amdgpu_sched.h"

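/**
 * amdgpu_ctx_priority_permit - check whether a context priority is allowed
 * @filp: DRM file the request comes from
 * @priority: requested scheduler priority
 *
 * Priorities at or below NORMAL are available to everyone; anything higher
 * additionally requires CAP_SYS_NICE or DRM master status.
 *
 * Return: 0 if the priority may be used, -EACCES otherwise.
 */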
static int amdgpu_ctx_priority_permit(struct drm_file *filp,
                                      enum drm_sched_priority priority)
{
        /* NORMAL and below are accessible by everyone */
        if (priority <= DRM_SCHED_PRIORITY_NORMAL)
                return 0;

        if (capable(CAP_SYS_NICE))
                return 0;

        if (drm_is_current_master(filp))
                return 0;

        return -EACCES;
}

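/**
 * amdgpu_ctx_init - initialize a freshly allocated context
 * @adev: amdgpu device the context lives on
 * @priority: scheduler priority for the context's entities
 * @filp: DRM file used for the priority permission check
 * @ctx: context structure to initialize
 *
 * Validates the priority, allocates the per-ring fence slots
 * (amdgpu_sched_jobs entries per ring) and creates one scheduler entity
 * per ring, skipping the kernel-internal KIQ ring.
 *
 * Return: 0 on success, negative error code on failure.
 */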
static int amdgpu_ctx_init(struct amdgpu_device *adev,
                           enum drm_sched_priority priority,
                           struct drm_file *filp,
                           struct amdgpu_ctx *ctx)
{
        unsigned i, j;
        int r;

        if (priority < 0 || priority >= DRM_SCHED_PRIORITY_MAX)
                return -EINVAL;

        r = amdgpu_ctx_priority_permit(filp, priority);
        if (r)
                return r;

        memset(ctx, 0, sizeof(*ctx));
        ctx->adev = adev;
        kref_init(&ctx->refcount);
        spin_lock_init(&ctx->ring_lock);
        ctx->fences = kcalloc(amdgpu_sched_jobs * AMDGPU_MAX_RINGS,
                              sizeof(struct dma_fence *), GFP_KERNEL);
        if (!ctx->fences)
                return -ENOMEM;

        mutex_init(&ctx->lock);

        for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
                ctx->rings[i].sequence = 1;
                ctx->rings[i].fences = &ctx->fences[amdgpu_sched_jobs * i];
        }

        ctx->reset_counter = atomic_read(&adev->gpu_reset_counter);
        ctx->reset_counter_query = ctx->reset_counter;
        ctx->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
        ctx->init_priority = priority;
        ctx->override_priority = DRM_SCHED_PRIORITY_UNSET;

        /* create context entity for each ring */
        for (i = 0; i < adev->num_rings; i++) {
                struct amdgpu_ring *ring = adev->rings[i];
                struct drm_sched_rq *rq;

                rq = &ring->sched.sched_rq[priority];

                if (ring == &adev->gfx.kiq.ring)
                        continue;

                r = drm_sched_entity_init(&ctx->rings[i].entity,
                                          &rq, 1, &ctx->guilty);
                if (r)
                        goto failed;
        }

        r = amdgpu_queue_mgr_init(adev, &ctx->queue_mgr);
        if (r)
                goto failed;

        return 0;

failed:
        for (j = 0; j < i; j++)
                drm_sched_entity_destroy(&ctx->rings[j].entity);
        kfree(ctx->fences);
        ctx->fences = NULL;
        return r;
}

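/**
 * amdgpu_ctx_fini - final kref release of a context
 * @ref: refcount embedded in the context
 *
 * Drops all cached per-ring fences, tears down the queue manager and
 * frees the context memory.
 */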
static void amdgpu_ctx_fini(struct kref *ref)
{
        struct amdgpu_ctx *ctx = container_of(ref, struct amdgpu_ctx, refcount);
        struct amdgpu_device *adev = ctx->adev;
        unsigned i, j;

        if (!adev)
                return;

        for (i = 0; i < AMDGPU_MAX_RINGS; ++i)
                for (j = 0; j < amdgpu_sched_jobs; ++j)
                        dma_fence_put(ctx->rings[i].fences[j]);
        kfree(ctx->fences);
        ctx->fences = NULL;

        amdgpu_queue_mgr_fini(adev, &ctx->queue_mgr);

        mutex_destroy(&ctx->lock);

        kfree(ctx);
}

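/**
 * amdgpu_ctx_alloc - allocate a context and publish its handle
 * @adev: amdgpu device
 * @fpriv: per-file private data holding the context manager
 * @filp: DRM file requesting the allocation
 * @priority: scheduler priority for the new context
 * @id: returned context handle
 *
 * Reserves an IDR handle under the manager lock first and only then
 * initializes the context, so a failed init can simply drop the handle
 * again.
 *
 * Return: 0 on success, negative error code on failure.
 */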
static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
                            struct amdgpu_fpriv *fpriv,
                            struct drm_file *filp,
                            enum drm_sched_priority priority,
                            uint32_t *id)
{
        struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
        struct amdgpu_ctx *ctx;
        int r;

        ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
        if (!ctx)
                return -ENOMEM;

        mutex_lock(&mgr->lock);
        r = idr_alloc(&mgr->ctx_handles, ctx, 1, 0, GFP_KERNEL);
        if (r < 0) {
                mutex_unlock(&mgr->lock);
                kfree(ctx);
                return r;
        }

        *id = (uint32_t)r;
        r = amdgpu_ctx_init(adev, priority, filp, ctx);
        if (r) {
                idr_remove(&mgr->ctx_handles, *id);
                *id = 0;
                kfree(ctx);
        }
        mutex_unlock(&mgr->lock);
        return r;
}

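/**
 * amdgpu_ctx_do_release - kref release callback for live contexts
 * @ref: refcount embedded in the context
 *
 * Destroys the scheduler entity of every ring except KIQ and then hands
 * over to amdgpu_ctx_fini() to free the remaining resources.
 */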
static void amdgpu_ctx_do_release(struct kref *ref)
{
        struct amdgpu_ctx *ctx;
        u32 i;

        ctx = container_of(ref, struct amdgpu_ctx, refcount);

        for (i = 0; i < ctx->adev->num_rings; i++) {

                if (ctx->adev->rings[i] == &ctx->adev->gfx.kiq.ring)
                        continue;

                drm_sched_entity_destroy(&ctx->rings[i].entity);
        }

        amdgpu_ctx_fini(ref);
}

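/**
 * amdgpu_ctx_free - drop a context handle on behalf of userspace
 * @fpriv: per-file private data holding the context manager
 * @id: context handle to remove
 *
 * Return: 0 if the handle existed and the reference was dropped,
 * -EINVAL otherwise.
 */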
static int amdgpu_ctx_free(struct amdgpu_fpriv *fpriv, uint32_t id)
{
        struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
        struct amdgpu_ctx *ctx;

        mutex_lock(&mgr->lock);
        ctx = idr_remove(&mgr->ctx_handles, id);
        if (ctx)
                kref_put(&ctx->refcount, amdgpu_ctx_do_release);
        mutex_unlock(&mgr->lock);
        return ctx ? 0 : -EINVAL;
}

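/**
 * amdgpu_ctx_query - legacy context state query
 * @adev: amdgpu device
 * @fpriv: per-file private data holding the context manager
 * @id: context handle to query
 * @out: ioctl result structure
 *
 * Reports whether a GPU reset happened since the previous query by
 * comparing the saved reset counter with the current one; the snapshot
 * is refreshed on every call.
 *
 * Return: 0 on success, -EINVAL if the context does not exist.
 */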
static int amdgpu_ctx_query(struct amdgpu_device *adev,
                            struct amdgpu_fpriv *fpriv, uint32_t id,
                            union drm_amdgpu_ctx_out *out)
{
        struct amdgpu_ctx *ctx;
        struct amdgpu_ctx_mgr *mgr;
        unsigned reset_counter;

        if (!fpriv)
                return -EINVAL;

        mgr = &fpriv->ctx_mgr;
        mutex_lock(&mgr->lock);
        ctx = idr_find(&mgr->ctx_handles, id);
        if (!ctx) {
                mutex_unlock(&mgr->lock);
                return -EINVAL;
        }

        /* TODO: these two are always zero */
        out->state.flags = 0x0;
        out->state.hangs = 0x0;

        /* determine if a GPU reset has occurred since the last call */
        reset_counter = atomic_read(&adev->gpu_reset_counter);
        /* TODO: this should ideally return NO, GUILTY, or INNOCENT. */
        if (ctx->reset_counter_query == reset_counter)
                out->state.reset_status = AMDGPU_CTX_NO_RESET;
        else
                out->state.reset_status = AMDGPU_CTX_UNKNOWN_RESET;
        ctx->reset_counter_query = reset_counter;

        mutex_unlock(&mgr->lock);
        return 0;
}

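/**
 * amdgpu_ctx_query2 - extended context state query
 * @adev: amdgpu device
 * @fpriv: per-file private data holding the context manager
 * @id: context handle to query
 * @out: ioctl result structure
 *
 * Reports reset, VRAM-lost and guilty status as individual flags,
 * without consuming the counters the way amdgpu_ctx_query() does.
 *
 * Return: 0 on success, -EINVAL if the context does not exist.
 */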
static int amdgpu_ctx_query2(struct amdgpu_device *adev,
        struct amdgpu_fpriv *fpriv, uint32_t id,
        union drm_amdgpu_ctx_out *out)
{
        struct amdgpu_ctx *ctx;
        struct amdgpu_ctx_mgr *mgr;

        if (!fpriv)
                return -EINVAL;

        mgr = &fpriv->ctx_mgr;
        mutex_lock(&mgr->lock);
        ctx = idr_find(&mgr->ctx_handles, id);
        if (!ctx) {
                mutex_unlock(&mgr->lock);
                return -EINVAL;
        }

        out->state.flags = 0x0;
        out->state.hangs = 0x0;

        if (ctx->reset_counter != atomic_read(&adev->gpu_reset_counter))
                out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RESET;

        if (ctx->vram_lost_counter != atomic_read(&adev->vram_lost_counter))
                out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_VRAMLOST;

        if (atomic_read(&ctx->guilty))
                out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_GUILTY;

        mutex_unlock(&mgr->lock);
        return 0;
}

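/**
 * amdgpu_ctx_ioctl - dispatch the AMDGPU_CTX ioctl
 * @dev: DRM device
 * @data: ioctl payload, a union drm_amdgpu_ctx
 * @filp: DRM file issuing the ioctl
 *
 * Handles context allocation, destruction and the two state queries.
 * For backwards compatibility an invalid priority value is treated as
 * NORMAL rather than rejected.
 *
 * Return: 0 on success, negative error code on failure.
 */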
int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
                     struct drm_file *filp)
{
        int r;
        uint32_t id;
        enum drm_sched_priority priority;

        union drm_amdgpu_ctx *args = data;
        struct amdgpu_device *adev = dev->dev_private;
        struct amdgpu_fpriv *fpriv = filp->driver_priv;

        r = 0;
        id = args->in.ctx_id;
        priority = amdgpu_to_sched_priority(args->in.priority);

        /* For backwards compatibility reasons, we need to accept
         * ioctls with garbage in the priority field.
         */
        if (priority == DRM_SCHED_PRIORITY_INVALID)
                priority = DRM_SCHED_PRIORITY_NORMAL;

        switch (args->in.op) {
        case AMDGPU_CTX_OP_ALLOC_CTX:
                r = amdgpu_ctx_alloc(adev, fpriv, filp, priority, &id);
                args->out.alloc.ctx_id = id;
                break;
        case AMDGPU_CTX_OP_FREE_CTX:
                r = amdgpu_ctx_free(fpriv, id);
                break;
        case AMDGPU_CTX_OP_QUERY_STATE:
                r = amdgpu_ctx_query(adev, fpriv, id, &args->out);
                break;
        case AMDGPU_CTX_OP_QUERY_STATE2:
                r = amdgpu_ctx_query2(adev, fpriv, id, &args->out);
                break;
        default:
                return -EINVAL;
        }

        return r;
}

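/*
 * Rough userspace view of the ioctl above (an illustrative sketch only,
 * not part of the driver; it assumes a DRM fd opened elsewhere, the uapi
 * names from drm/amdgpu_drm.h and drmIoctl() from libdrm):
 *
 *        union drm_amdgpu_ctx args;
 *        uint32_t ctx_id = 0;
 *
 *        memset(&args, 0, sizeof(args));
 *        args.in.op = AMDGPU_CTX_OP_ALLOC_CTX;
 *        args.in.priority = AMDGPU_CTX_PRIORITY_NORMAL;
 *        if (drmIoctl(fd, DRM_IOCTL_AMDGPU_CTX, &args) == 0)
 *                ctx_id = args.out.alloc.ctx_id;
 *
 *        args.in.op = AMDGPU_CTX_OP_FREE_CTX;
 *        args.in.ctx_id = ctx_id;
 *        drmIoctl(fd, DRM_IOCTL_AMDGPU_CTX, &args);
 */

/**
 * amdgpu_ctx_get - look up a context and take a reference
 * @fpriv: per-file private data holding the context manager
 * @id: context handle
 *
 * Return: the context with its refcount raised, or NULL if the handle is
 * unknown. The caller must balance this with amdgpu_ctx_put().
 */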
struct amdgpu_ctx *amdgpu_ctx_get(struct amdgpu_fpriv *fpriv, uint32_t id)
{
        struct amdgpu_ctx *ctx;
        struct amdgpu_ctx_mgr *mgr;

        if (!fpriv)
                return NULL;

        mgr = &fpriv->ctx_mgr;

        mutex_lock(&mgr->lock);
        ctx = idr_find(&mgr->ctx_handles, id);
        if (ctx)
                kref_get(&ctx->refcount);
        mutex_unlock(&mgr->lock);
        return ctx;
}

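/**
 * amdgpu_ctx_put - drop a reference obtained with amdgpu_ctx_get()
 * @ctx: context to release
 *
 * Return: 0 on success, -EINVAL if @ctx is NULL.
 */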
int amdgpu_ctx_put(struct amdgpu_ctx *ctx)
{
        if (ctx == NULL)
                return -EINVAL;

        kref_put(&ctx->refcount, amdgpu_ctx_do_release);
        return 0;
}

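/*
 * Typical use of the two helpers above (an illustrative sketch, not
 * lifted from a real caller; "fpriv" and "ctx_id" stand for whatever the
 * surrounding code provides):
 *
 *        struct amdgpu_ctx *ctx = amdgpu_ctx_get(fpriv, ctx_id);
 *
 *        if (!ctx)
 *                return -EINVAL;
 *        ... use the context, e.g. ctx->rings[ring->idx] ...
 *        amdgpu_ctx_put(ctx);
 */

/**
 * amdgpu_ctx_add_fence - remember the fence of a new submission
 * @ctx: context the submission was made on
 * @ring: ring the job was pushed to
 * @fence: fence of the submitted job
 * @handler: optional location for the sequence number assigned to @fence
 *
 * The per-ring fence array is used as a ring buffer of amdgpu_sched_jobs
 * slots; the entry being overwritten must already be signaled. A reference
 * to @fence is taken and the reference to the evicted fence is dropped.
 *
 * Return: always 0.
 */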
int amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx, struct amdgpu_ring *ring,
                         struct dma_fence *fence, uint64_t *handler)
{
        struct amdgpu_ctx_ring *cring = &ctx->rings[ring->idx];
        uint64_t seq = cring->sequence;
        unsigned idx = 0;
        struct dma_fence *other = NULL;

        idx = seq & (amdgpu_sched_jobs - 1);
        other = cring->fences[idx];
        if (other)
                BUG_ON(!dma_fence_is_signaled(other));

        dma_fence_get(fence);

        spin_lock(&ctx->ring_lock);
        cring->fences[idx] = fence;
        cring->sequence++;
        spin_unlock(&ctx->ring_lock);

        dma_fence_put(other);
        if (handler)
                *handler = seq;

        return 0;
}

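/**
 * amdgpu_ctx_get_fence - look up the fence of an earlier submission
 * @ctx: context the submission was made on
 * @ring: ring the job was pushed to
 * @seq: sequence number returned at submission time, or ~0ull for the
 *       most recent submission
 *
 * Only the last amdgpu_sched_jobs submissions are kept. For example,
 * with amdgpu_sched_jobs == 32 (the masking assumes a power of two) and
 * a current sequence of 100, seq 70 maps to slot 70 & 31 = 6, while
 * seq 60 has already been overwritten and NULL is returned because that
 * fence is guaranteed to have signaled.
 *
 * Return: the fence with a reference held, NULL if the fence has aged
 * out of the window, or ERR_PTR(-EINVAL) for a sequence number that was
 * never emitted.
 */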
struct dma_fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
                                       struct amdgpu_ring *ring, uint64_t seq)
{
        struct amdgpu_ctx_ring *cring = &ctx->rings[ring->idx];
        struct dma_fence *fence;

        spin_lock(&ctx->ring_lock);

        if (seq == ~0ull)
                seq = ctx->rings[ring->idx].sequence - 1;

        if (seq >= cring->sequence) {
                spin_unlock(&ctx->ring_lock);
                return ERR_PTR(-EINVAL);
        }

        if (seq + amdgpu_sched_jobs < cring->sequence) {
                spin_unlock(&ctx->ring_lock);
                return NULL;
        }

        fence = dma_fence_get(cring->fences[seq & (amdgpu_sched_jobs - 1)]);
        spin_unlock(&ctx->ring_lock);

        return fence;
}

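/**
 * amdgpu_ctx_priority_override - change the effective context priority
 * @ctx: context to modify
 * @priority: new override priority, or DRM_SCHED_PRIORITY_UNSET to fall
 *            back to the priority the context was created with
 *
 * Moves every non-KIQ scheduler entity of the context to the run queue
 * matching the effective priority.
 */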
void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx,
                                  enum drm_sched_priority priority)
{
        int i;
        struct amdgpu_device *adev = ctx->adev;
        struct drm_sched_rq *rq;
        struct drm_sched_entity *entity;
        struct amdgpu_ring *ring;
        enum drm_sched_priority ctx_prio;

        ctx->override_priority = priority;

        ctx_prio = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
                        ctx->init_priority : ctx->override_priority;

        for (i = 0; i < adev->num_rings; i++) {
                ring = adev->rings[i];
                entity = &ctx->rings[i].entity;
                rq = &ring->sched.sched_rq[ctx_prio];

                if (ring->funcs->type == AMDGPU_RING_TYPE_KIQ)
                        continue;

                drm_sched_entity_set_rq(entity, rq);
        }
}

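/**
 * amdgpu_ctx_wait_prev_fence - throttle submissions on one ring
 * @ctx: context to throttle
 * @ring_id: index of the ring within the context
 *
 * Waits (interruptibly) for the fence occupying the slot the next
 * submission would reuse, so that at most amdgpu_sched_jobs jobs are
 * outstanding per ring.
 *
 * Return: 0 on success or if there is nothing to wait for, negative
 * error code if the wait failed.
 */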
int amdgpu_ctx_wait_prev_fence(struct amdgpu_ctx *ctx, unsigned ring_id)
{
        struct amdgpu_ctx_ring *cring = &ctx->rings[ring_id];
        unsigned idx = cring->sequence & (amdgpu_sched_jobs - 1);
        struct dma_fence *other = cring->fences[idx];

        if (other) {
                signed long r;
                r = dma_fence_wait(other, true);
                if (r < 0) {
                        if (r != -ERESTARTSYS)
                                DRM_ERROR("Error (%ld) waiting for fence!\n", r);

                        return r;
                }
        }

        return 0;
}

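/**
 * amdgpu_ctx_mgr_init - set up a per-file context manager
 * @mgr: manager to initialize
 */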
void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr)
{
        mutex_init(&mgr->lock);
        idr_init(&mgr->ctx_handles);
}

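/**
 * amdgpu_ctx_mgr_entity_flush - flush all scheduler entities of a manager
 * @mgr: manager whose contexts are flushed
 *
 * Gives every non-KIQ entity of every context a chance to drain its
 * queued jobs, sharing a single MAX_WAIT_SCHED_ENTITY_Q_EMPTY budget
 * across all of them.
 */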
void amdgpu_ctx_mgr_entity_flush(struct amdgpu_ctx_mgr *mgr)
{
        struct amdgpu_ctx *ctx;
        struct idr *idp;
        uint32_t id, i;
        long max_wait = MAX_WAIT_SCHED_ENTITY_Q_EMPTY;

        idp = &mgr->ctx_handles;

        mutex_lock(&mgr->lock);
        idr_for_each_entry(idp, ctx, id) {

                if (!ctx->adev) {
                        mutex_unlock(&mgr->lock);
                        return;
                }

                for (i = 0; i < ctx->adev->num_rings; i++) {

                        if (ctx->adev->rings[i] == &ctx->adev->gfx.kiq.ring)
                                continue;

                        max_wait = drm_sched_entity_flush(&ctx->rings[i].entity,
                                                          max_wait);
                }
        }
        mutex_unlock(&mgr->lock);
}

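/**
 * amdgpu_ctx_mgr_entity_fini - tear down the scheduler entities
 * @mgr: manager whose contexts are torn down
 *
 * Expects every context to hold exactly one remaining reference;
 * entities of contexts that are still referenced elsewhere are left
 * alone and an error is logged.
 */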
void amdgpu_ctx_mgr_entity_fini(struct amdgpu_ctx_mgr *mgr)
{
        struct amdgpu_ctx *ctx;
        struct idr *idp;
        uint32_t id, i;

        idp = &mgr->ctx_handles;

        idr_for_each_entry(idp, ctx, id) {

                if (!ctx->adev)
                        return;

                for (i = 0; i < ctx->adev->num_rings; i++) {

                        if (ctx->adev->rings[i] == &ctx->adev->gfx.kiq.ring)
                                continue;

                        if (kref_read(&ctx->refcount) == 1)
                                drm_sched_entity_fini(&ctx->rings[i].entity);
                        else
                                DRM_ERROR("ctx %p is still alive\n", ctx);
                }
        }
}

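/**
 * amdgpu_ctx_mgr_fini - free a per-file context manager
 * @mgr: manager to destroy
 *
 * Finishes the scheduler entities, drops the final reference of every
 * remaining context and releases the IDR and the lock.
 */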
void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr)
{
        struct amdgpu_ctx *ctx;
        struct idr *idp;
        uint32_t id;

        amdgpu_ctx_mgr_entity_fini(mgr);

        idp = &mgr->ctx_handles;

        idr_for_each_entry(idp, ctx, id) {
                if (kref_put(&ctx->refcount, amdgpu_ctx_fini) != 1)
                        DRM_ERROR("ctx %p is still alive\n", ctx);
        }

        idr_destroy(&mgr->ctx_handles);
        mutex_destroy(&mgr->lock);
}