linux/drivers/gpu/drm/amd/amdgpu/amdgpu_amdkfd_fence.c
<<
>>
Prefs
   1/*
   2 * Copyright 2016-2018 Advanced Micro Devices, Inc.
   3 *
   4 * Permission is hereby granted, free of charge, to any person obtaining a
   5 * copy of this software and associated documentation files (the "Software"),
   6 * to deal in the Software without restriction, including without limitation
   7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8 * and/or sell copies of the Software, and to permit persons to whom the
   9 * Software is furnished to do so, subject to the following conditions:
  10 *
  11 * The above copyright notice and this permission notice shall be included in
  12 * all copies or substantial portions of the Software.
  13 *
  14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20 * OTHER DEALINGS IN THE SOFTWARE.
  21 */
  22
  23#include <linux/dma-fence.h>
  24#include <linux/spinlock.h>
  25#include <linux/atomic.h>
  26#include <linux/stacktrace.h>
  27#include <linux/sched.h>
  28#include <linux/slab.h>
  29#include <linux/sched/mm.h>
  30#include "amdgpu_amdkfd.h"
  31#include "kfd_svm.h"
  32
  33static const struct dma_fence_ops amdkfd_fence_ops;
  34static atomic_t fence_seq = ATOMIC_INIT(0);
  35
  36/* Eviction Fence
  37 * Fence helper functions to deal with KFD memory eviction.
  38 * Big Idea - Since KFD submissions are done by user queues, a BO cannot be
  39 *  evicted unless all the user queues for that process are evicted.
  40 *
  41 * All the BOs in a process share an eviction fence. When process X wants
  42 * to map VRAM memory but TTM can't find enough space, TTM will attempt to
  43 * evict BOs from its LRU list. TTM checks if the BO is valuable to evict
  44 * by calling ttm_device_funcs->eviction_valuable().
  45 *
  46 * ttm_device_funcs->eviction_valuable() - will return false if the BO belongs
  47 *  to process X. Otherwise, it will return true to indicate BO can be
  48 *  evicted by TTM.
  49 *
  50 * If ttm_device_funcs->eviction_valuable returns true, then TTM will continue
  51 * the eviction process for that BO by calling ttm_bo_evict --> amdgpu_bo_move
  52 * --> amdgpu_copy_buffer(). This sets up job in GPU scheduler.
  53 *
  54 * GPU Scheduler (amd_sched_main) - sets up a cb (fence_add_callback) to
  55 *  notify when the BO is free to move. fence_add_callback --> enable_signaling
  56 *  --> amdgpu_amdkfd_fence.enable_signaling
  57 *
  58 * amdgpu_amdkfd_fence.enable_signaling - Start a work item that will quiesce
  59 * user queues and signal fence. The work item will also start another delayed
  60 * work item to restore BOs
  61 */
  62
  63struct amdgpu_amdkfd_fence *amdgpu_amdkfd_fence_create(u64 context,
  64                                struct mm_struct *mm,
  65                                struct svm_range_bo *svm_bo)
  66{
  67        struct amdgpu_amdkfd_fence *fence;
  68
  69        fence = kzalloc(sizeof(*fence), GFP_KERNEL);
  70        if (fence == NULL)
  71                return NULL;
  72
  73        /* This reference gets released in amdkfd_fence_release */
  74        mmgrab(mm);
  75        fence->mm = mm;
  76        get_task_comm(fence->timeline_name, current);
  77        spin_lock_init(&fence->lock);
  78        fence->svm_bo = svm_bo;
  79        dma_fence_init(&fence->base, &amdkfd_fence_ops, &fence->lock,
  80                   context, atomic_inc_return(&fence_seq));
  81
  82        return fence;
  83}
  84
  85struct amdgpu_amdkfd_fence *to_amdgpu_amdkfd_fence(struct dma_fence *f)
  86{
  87        struct amdgpu_amdkfd_fence *fence;
  88
  89        if (!f)
  90                return NULL;
  91
  92        fence = container_of(f, struct amdgpu_amdkfd_fence, base);
  93        if (fence && f->ops == &amdkfd_fence_ops)
  94                return fence;
  95
  96        return NULL;
  97}
  98
  99static const char *amdkfd_fence_get_driver_name(struct dma_fence *f)
 100{
 101        return "amdgpu_amdkfd_fence";
 102}
 103
 104static const char *amdkfd_fence_get_timeline_name(struct dma_fence *f)
 105{
 106        struct amdgpu_amdkfd_fence *fence = to_amdgpu_amdkfd_fence(f);
 107
 108        return fence->timeline_name;
 109}
 110
 111/**
 112 * amdkfd_fence_enable_signaling - This gets called when TTM wants to evict
 113 *  a KFD BO and schedules a job to move the BO.
 114 *  If fence is already signaled return true.
 115 *  If fence is not signaled schedule a evict KFD process work item.
 116 *
 117 *  @f: dma_fence
 118 */
 119static bool amdkfd_fence_enable_signaling(struct dma_fence *f)
 120{
 121        struct amdgpu_amdkfd_fence *fence = to_amdgpu_amdkfd_fence(f);
 122
 123        if (!fence)
 124                return false;
 125
 126        if (dma_fence_is_signaled(f))
 127                return true;
 128
 129        if (!fence->svm_bo) {
 130                if (!kgd2kfd_schedule_evict_and_restore_process(fence->mm, f))
 131                        return true;
 132        } else {
 133                if (!svm_range_schedule_evict_svm_bo(fence))
 134                        return true;
 135        }
 136        return false;
 137}
 138
 139/**
 140 * amdkfd_fence_release - callback that fence can be freed
 141 *
 142 * @f: dma_fence
 143 *
 144 * This function is called when the reference count becomes zero.
 145 * Drops the mm_struct reference and RCU schedules freeing up the fence.
 146 */
 147static void amdkfd_fence_release(struct dma_fence *f)
 148{
 149        struct amdgpu_amdkfd_fence *fence = to_amdgpu_amdkfd_fence(f);
 150
 151        /* Unconditionally signal the fence. The process is getting
 152         * terminated.
 153         */
 154        if (WARN_ON(!fence))
 155                return; /* Not an amdgpu_amdkfd_fence */
 156
 157        mmdrop(fence->mm);
 158        kfree_rcu(f, rcu);
 159}
 160
 161/**
 162 * amdkfd_fence_check_mm - Check if @mm is same as that of the fence @f
 163 *  if same return TRUE else return FALSE.
 164 *
 165 * @f: [IN] fence
 166 * @mm: [IN] mm that needs to be verified
 167 */
 168bool amdkfd_fence_check_mm(struct dma_fence *f, struct mm_struct *mm)
 169{
 170        struct amdgpu_amdkfd_fence *fence = to_amdgpu_amdkfd_fence(f);
 171
 172        if (!fence)
 173                return false;
 174        else if (fence->mm == mm)
 175                return true;
 176
 177        return false;
 178}
 179
 180static const struct dma_fence_ops amdkfd_fence_ops = {
 181        .get_driver_name = amdkfd_fence_get_driver_name,
 182        .get_timeline_name = amdkfd_fence_get_timeline_name,
 183        .enable_signaling = amdkfd_fence_enable_signaling,
 184        .release = amdkfd_fence_release,
 185};
 186