linux/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
/*
 * Copyright 2008 Advanced Micro Devices, Inc.
 * Copyright 2008 Red Hat Inc.
 * Copyright 2009 Jerome Glisse.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Dave Airlie
 *          Alex Deucher
 *          Jerome Glisse
 */
#include <linux/power_supply.h>
#include <linux/kthread.h>
#include <linux/module.h>
#include <linux/console.h>
#include <linux/slab.h>
#include <linux/iommu.h>
#include <linux/pci.h>

#include <drm/drm_atomic_helper.h>
#include <drm/drm_probe_helper.h>
#include <drm/amdgpu_drm.h>
#include <linux/vgaarb.h>
#include <linux/vga_switcheroo.h>
#include <linux/efi.h>
#include "amdgpu.h"
#include "amdgpu_trace.h"
#include "amdgpu_i2c.h"
#include "atom.h"
#include "amdgpu_atombios.h"
#include "amdgpu_atomfirmware.h"
#include "amd_pcie.h"
#ifdef CONFIG_DRM_AMDGPU_SI
#include "si.h"
#endif
#ifdef CONFIG_DRM_AMDGPU_CIK
#include "cik.h"
#endif
#include "vi.h"
#include "soc15.h"
#include "nv.h"
#include "bif/bif_4_1_d.h"
#include <linux/firmware.h>
#include "amdgpu_vf_error.h"

#include "amdgpu_amdkfd.h"
#include "amdgpu_pm.h"

#include "amdgpu_xgmi.h"
#include "amdgpu_ras.h"
#include "amdgpu_pmu.h"
#include "amdgpu_fru_eeprom.h"
#include "amdgpu_reset.h"

#include <linux/suspend.h>
#include <drm/task_barrier.h>
#include <linux/pm_runtime.h>

#include <drm/drm_drv.h>

MODULE_FIRMWARE("amdgpu/vega10_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/vega12_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/raven_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/picasso_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/raven2_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/arcturus_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/navi12_gpu_info.bin");

#define AMDGPU_RESUME_MS                2000
#define AMDGPU_MAX_RETRY_LIMIT          2
#define AMDGPU_RETRY_SRIOV_RESET(r) ((r) == -EBUSY || (r) == -ETIMEDOUT || (r) == -EINVAL)

const char *amdgpu_asic_name[] = {
        "TAHITI",
        "PITCAIRN",
        "VERDE",
        "OLAND",
        "HAINAN",
        "BONAIRE",
        "KAVERI",
        "KABINI",
        "HAWAII",
        "MULLINS",
        "TOPAZ",
        "TONGA",
        "FIJI",
        "CARRIZO",
        "STONEY",
        "POLARIS10",
        "POLARIS11",
        "POLARIS12",
        "VEGAM",
        "VEGA10",
        "VEGA12",
        "VEGA20",
        "RAVEN",
        "ARCTURUS",
        "RENOIR",
        "ALDEBARAN",
        "NAVI10",
        "CYAN_SKILLFISH",
        "NAVI14",
        "NAVI12",
        "SIENNA_CICHLID",
        "NAVY_FLOUNDER",
        "VANGOGH",
        "DIMGREY_CAVEFISH",
        "BEIGE_GOBY",
        "YELLOW_CARP",
        "IP DISCOVERY",
        "LAST",
};

/**
 * DOC: pcie_replay_count
 *
 * The amdgpu driver provides a sysfs API for reporting the total number
 * of PCIe replays (NAKs).
 * The file pcie_replay_count is used for this and returns the total
 * number of replays as a sum of the NAKs generated and NAKs received.
 */
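
/*
 * Example (illustrative only; the card index in the sysfs path varies
 * per system):
 *
 *   $ cat /sys/class/drm/card0/device/pcie_replay_count
 */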

static ssize_t amdgpu_device_get_pcie_replay_count(struct device *dev,
                struct device_attribute *attr, char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);
        uint64_t cnt = amdgpu_asic_get_pcie_replay_count(adev);

        return sysfs_emit(buf, "%llu\n", cnt);
}

static DEVICE_ATTR(pcie_replay_count, S_IRUGO,
                amdgpu_device_get_pcie_replay_count, NULL);

static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev);

/**
 * DOC: product_name
 *
 * The amdgpu driver provides a sysfs API for reporting the product name
 * for the device.
 * The file product_name is used for this and returns the product name
 * as returned from the FRU.
 * NOTE: This is only available for certain server cards
 */

static ssize_t amdgpu_device_get_product_name(struct device *dev,
                struct device_attribute *attr, char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);

        return sysfs_emit(buf, "%s\n", adev->product_name);
}

static DEVICE_ATTR(product_name, S_IRUGO,
                amdgpu_device_get_product_name, NULL);

/**
 * DOC: product_number
 *
 * The amdgpu driver provides a sysfs API for reporting the part number
 * for the device.
 * The file product_number is used for this and returns the part number
 * as returned from the FRU.
 * NOTE: This is only available for certain server cards
 */

static ssize_t amdgpu_device_get_product_number(struct device *dev,
                struct device_attribute *attr, char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);

        return sysfs_emit(buf, "%s\n", adev->product_number);
}

static DEVICE_ATTR(product_number, S_IRUGO,
                amdgpu_device_get_product_number, NULL);

/**
 * DOC: serial_number
 *
 * The amdgpu driver provides a sysfs API for reporting the serial number
 * for the device.
 * The file serial_number is used for this and returns the serial number
 * as returned from the FRU.
 * NOTE: This is only available for certain server cards
 */

static ssize_t amdgpu_device_get_serial_number(struct device *dev,
                struct device_attribute *attr, char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);

        return sysfs_emit(buf, "%s\n", adev->serial);
}

static DEVICE_ATTR(serial_number, S_IRUGO,
                amdgpu_device_get_serial_number, NULL);
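
/*
 * Example (illustrative; these attributes are only populated on certain
 * server cards with a FRU EEPROM, and the card index varies per system):
 *
 *   $ cat /sys/class/drm/card0/device/product_name
 *   $ cat /sys/class/drm/card0/device/product_number
 *   $ cat /sys/class/drm/card0/device/serial_number
 */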

/**
 * amdgpu_device_supports_px - Is the device a dGPU with ATPX power control
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with ATPX power control,
 * otherwise returns false.
 */
bool amdgpu_device_supports_px(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        if ((adev->flags & AMD_IS_PX) && !amdgpu_is_atpx_hybrid())
                return true;
        return false;
}

/**
 * amdgpu_device_supports_boco - Is the device a dGPU with ACPI power resources
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with ACPI power control,
 * otherwise returns false.
 */
bool amdgpu_device_supports_boco(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        if (adev->has_pr3 ||
            ((adev->flags & AMD_IS_PX) && amdgpu_is_atpx_hybrid()))
                return true;
        return false;
}

/**
 * amdgpu_device_supports_baco - Does the device support BACO
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device supports BACO,
 * otherwise returns false.
 */
bool amdgpu_device_supports_baco(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        return amdgpu_asic_supports_baco(adev);
}

/**
 * amdgpu_device_supports_smart_shift - Is the device a dGPU with
 * Smart Shift support
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with Smart Shift support,
 * otherwise returns false.
 */
bool amdgpu_device_supports_smart_shift(struct drm_device *dev)
{
        return (amdgpu_device_supports_boco(dev) &&
                amdgpu_acpi_is_power_shift_control_supported());
}

/*
 * VRAM access helper functions
 */

/**
 * amdgpu_device_mm_access - access vram by MM_INDEX/MM_DATA
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; the buffer at @buf must hold at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 */
void amdgpu_device_mm_access(struct amdgpu_device *adev, loff_t pos,
                             void *buf, size_t size, bool write)
{
        unsigned long flags;
        uint32_t hi = ~0, tmp = 0;
        uint32_t *data = buf;
        uint64_t last;
        int idx;

        if (!drm_dev_enter(adev_to_drm(adev), &idx))
                return;

        BUG_ON(!IS_ALIGNED(pos, 4) || !IS_ALIGNED(size, 4));

        spin_lock_irqsave(&adev->mmio_idx_lock, flags);
        for (last = pos + size; pos < last; pos += 4) {
                tmp = pos >> 31;

                WREG32_NO_KIQ(mmMM_INDEX, ((uint32_t)pos) | 0x80000000);
                if (tmp != hi) {
                        WREG32_NO_KIQ(mmMM_INDEX_HI, tmp);
                        hi = tmp;
                }
                if (write)
                        WREG32_NO_KIQ(mmMM_DATA, *data++);
                else
                        *data++ = RREG32_NO_KIQ(mmMM_DATA);
        }

        spin_unlock_irqrestore(&adev->mmio_idx_lock, flags);
        drm_dev_exit(idx);
}

/**
 * amdgpu_device_aper_access - access vram via the vram aperture
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; the buffer at @buf must hold at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 *
 * The return value means how many bytes have been transferred.
 */
size_t amdgpu_device_aper_access(struct amdgpu_device *adev, loff_t pos,
                                 void *buf, size_t size, bool write)
{
#ifdef CONFIG_64BIT
        void __iomem *addr;
        size_t count = 0;
        uint64_t last;

        if (!adev->mman.aper_base_kaddr)
                return 0;

        last = min(pos + size, adev->gmc.visible_vram_size);
        if (last > pos) {
                addr = adev->mman.aper_base_kaddr + pos;
                count = last - pos;

                if (write) {
                        memcpy_toio(addr, buf, count);
                        mb();
                        amdgpu_device_flush_hdp(adev, NULL);
                } else {
                        amdgpu_device_invalidate_hdp(adev, NULL);
                        mb();
                        memcpy_fromio(buf, addr, count);
                }

        }

        return count;
#else
        return 0;
#endif
}

/**
 * amdgpu_device_vram_access - read/write a buffer in vram
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; the buffer at @buf must hold at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 */
void amdgpu_device_vram_access(struct amdgpu_device *adev, loff_t pos,
                               void *buf, size_t size, bool write)
{
        size_t count;

        /* try using the vram aperture to access vram first */
        count = amdgpu_device_aper_access(adev, pos, buf, size, write);
        size -= count;
        if (size) {
                /* use MM_INDEX/MM_DATA to access the rest of vram */
                pos += count;
                buf += count;
                amdgpu_device_mm_access(adev, pos, buf, size, write);
        }
}
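
/*
 * Usage sketch (illustrative, not a call site from this file): read one
 * dword back from a known VRAM offset. The helper transparently falls
 * back to MM_INDEX/MM_DATA for anything outside the CPU-visible
 * aperture. vram_offset below is a placeholder:
 *
 *   uint32_t val;
 *
 *   amdgpu_device_vram_access(adev, vram_offset, &val, sizeof(val), false);
 */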

/*
 * register access helper functions.
 */

/* Check if hw access should be skipped because of hotplug or device error */
bool amdgpu_device_skip_hw_access(struct amdgpu_device *adev)
{
        if (adev->no_hw_access)
                return true;

#ifdef CONFIG_LOCKDEP
        /*
         * This is a bit complicated to understand, so worth a comment. What we assert
         * here is that the GPU reset is not running on another thread in parallel.
         *
         * For this we trylock the read side of the reset semaphore, if that succeeds
         * we know that the reset is not running in parallel.
         *
         * If the trylock fails we assert that we are either already holding the read
         * side of the lock or are the reset thread itself and hold the write side of
         * the lock.
         */
        if (in_task()) {
                if (down_read_trylock(&adev->reset_domain->sem))
                        up_read(&adev->reset_domain->sem);
                else
                        lockdep_assert_held(&adev->reset_domain->sem);
        }
#endif
        return false;
}

/**
 * amdgpu_device_rreg - read a memory mapped IO or indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @acc_flags: access flags which require special behavior
 *
 * Returns the 32 bit value from the offset specified.
 */
uint32_t amdgpu_device_rreg(struct amdgpu_device *adev,
                            uint32_t reg, uint32_t acc_flags)
{
        uint32_t ret;

        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if ((reg * 4) < adev->rmmio_size) {
                if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        ret = amdgpu_kiq_rreg(adev, reg);
                        up_read(&adev->reset_domain->sem);
                } else {
                        ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                ret = adev->pcie_rreg(adev, reg * 4);
        }

        trace_amdgpu_device_rreg(adev->pdev->device, reg, ret);

        return ret;
}

/*
 * MMIO register read with byte helper functions
 * @offset: byte offset from MMIO start
 */

/**
 * amdgpu_mm_rreg8 - read a memory mapped IO register
 *
 * @adev: amdgpu_device pointer
 * @offset: byte aligned register offset
 *
 * Returns the 8 bit value from the offset specified.
 */
uint8_t amdgpu_mm_rreg8(struct amdgpu_device *adev, uint32_t offset)
{
        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if (offset < adev->rmmio_size)
                return (readb(adev->rmmio + offset));
        BUG();
}

/*
 * MMIO register write with byte helper functions
 * @offset: byte offset from MMIO start
 * @value: the value to be written to the register
 */
/**
 * amdgpu_mm_wreg8 - write a memory mapped IO register
 *
 * @adev: amdgpu_device pointer
 * @offset: byte aligned register offset
 * @value: 8 bit value to write
 *
 * Writes the value specified to the offset specified.
 */
void amdgpu_mm_wreg8(struct amdgpu_device *adev, uint32_t offset, uint8_t value)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if (offset < adev->rmmio_size)
                writeb(value, adev->rmmio + offset);
        else
                BUG();
}

/**
 * amdgpu_device_wreg - write to a memory mapped IO or indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @v: 32 bit value to write to the register
 * @acc_flags: access flags which require special behavior
 *
 * Writes the value specified to the offset specified.
 */
void amdgpu_device_wreg(struct amdgpu_device *adev,
                        uint32_t reg, uint32_t v,
                        uint32_t acc_flags)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if ((reg * 4) < adev->rmmio_size) {
                if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        amdgpu_kiq_wreg(adev, reg, v);
                        up_read(&adev->reset_domain->sem);
                } else {
                        writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                adev->pcie_wreg(adev, reg * 4, v);
        }

        trace_amdgpu_device_wreg(adev->pdev->device, reg, v);
}
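
/*
 * Usage sketch (illustrative): most callers do not use these helpers
 * directly but go through the RREG32()/WREG32() macros from amdgpu.h,
 * which expand to amdgpu_device_rreg()/amdgpu_device_wreg(). reg_offset
 * and SOME_BIT_MASK are placeholders:
 *
 *   uint32_t tmp = RREG32(reg_offset);
 *
 *   tmp |= SOME_BIT_MASK;
 *   WREG32(reg_offset, tmp);
 */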

/**
 * amdgpu_mm_wreg_mmio_rlc -  write register either with direct/indirect mmio or with RLC path if in range
 *
 * @adev: amdgpu_device pointer
 * @reg: mmio/rlc register
 * @v: value to write
 *
 * This function is invoked only for the debugfs register access
 */
void amdgpu_mm_wreg_mmio_rlc(struct amdgpu_device *adev,
                             uint32_t reg, uint32_t v)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if (amdgpu_sriov_fullaccess(adev) &&
            adev->gfx.rlc.funcs &&
            adev->gfx.rlc.funcs->is_rlcg_access_range) {
                if (adev->gfx.rlc.funcs->is_rlcg_access_range(adev, reg))
                        return amdgpu_sriov_wreg(adev, reg, v, 0, 0);
        } else if ((reg * 4) >= adev->rmmio_size) {
                adev->pcie_wreg(adev, reg * 4, v);
        } else {
                writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
        }
}

/**
 * amdgpu_mm_rdoorbell - read a doorbell dword
 *
 * @adev: amdgpu_device pointer
 * @index: doorbell index
 *
 * Returns the value in the doorbell aperture at the
 * requested doorbell index (CIK).
 */
u32 amdgpu_mm_rdoorbell(struct amdgpu_device *adev, u32 index)
{
        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if (index < adev->doorbell.num_doorbells) {
                return readl(adev->doorbell.ptr + index);
        } else {
                DRM_ERROR("reading beyond doorbell aperture: 0x%08x!\n", index);
                return 0;
        }
}

/**
 * amdgpu_mm_wdoorbell - write a doorbell dword
 *
 * @adev: amdgpu_device pointer
 * @index: doorbell index
 * @v: value to write
 *
 * Writes @v to the doorbell aperture at the
 * requested doorbell index (CIK).
 */
void amdgpu_mm_wdoorbell(struct amdgpu_device *adev, u32 index, u32 v)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if (index < adev->doorbell.num_doorbells) {
                writel(v, adev->doorbell.ptr + index);
        } else {
                DRM_ERROR("writing beyond doorbell aperture: 0x%08x!\n", index);
        }
}

/**
 * amdgpu_mm_rdoorbell64 - read a doorbell Qword
 *
 * @adev: amdgpu_device pointer
 * @index: doorbell index
 *
 * Returns the value in the doorbell aperture at the
 * requested doorbell index (VEGA10+).
 */
u64 amdgpu_mm_rdoorbell64(struct amdgpu_device *adev, u32 index)
{
        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if (index < adev->doorbell.num_doorbells) {
                return atomic64_read((atomic64_t *)(adev->doorbell.ptr + index));
        } else {
                DRM_ERROR("reading beyond doorbell aperture: 0x%08x!\n", index);
                return 0;
        }
}

/**
 * amdgpu_mm_wdoorbell64 - write a doorbell Qword
 *
 * @adev: amdgpu_device pointer
 * @index: doorbell index
 * @v: value to write
 *
 * Writes @v to the doorbell aperture at the
 * requested doorbell index (VEGA10+).
 */
void amdgpu_mm_wdoorbell64(struct amdgpu_device *adev, u32 index, u64 v)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if (index < adev->doorbell.num_doorbells) {
                atomic64_set((atomic64_t *)(adev->doorbell.ptr + index), v);
        } else {
                DRM_ERROR("writing beyond doorbell aperture: 0x%08x!\n", index);
        }
}
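
/*
 * Usage sketch (illustrative): ring code typically kicks the engine by
 * writing its new write pointer through the WDOORBELL64() wrapper from
 * amdgpu.h, which expands to amdgpu_mm_wdoorbell64():
 *
 *   if (ring->use_doorbell)
 *           WDOORBELL64(ring->doorbell_index, ring->wptr);
 */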

/**
 * amdgpu_device_indirect_rreg - read an indirect register
 *
 * @adev: amdgpu_device pointer
 * @pcie_index: mmio register offset
 * @pcie_data: mmio register offset
 * @reg_addr: indirect register address to read from
 *
 * Returns the value of indirect register @reg_addr
 */
u32 amdgpu_device_indirect_rreg(struct amdgpu_device *adev,
                                u32 pcie_index, u32 pcie_data,
                                u32 reg_addr)
{
        unsigned long flags;
        u32 r;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        r = readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

/**
 * amdgpu_device_indirect_rreg64 - read a 64 bit indirect register
 *
 * @adev: amdgpu_device pointer
 * @pcie_index: mmio register offset
 * @pcie_data: mmio register offset
 * @reg_addr: indirect register address to read from
 *
 * Returns the value of indirect register @reg_addr
 */
u64 amdgpu_device_indirect_rreg64(struct amdgpu_device *adev,
                                  u32 pcie_index, u32 pcie_data,
                                  u32 reg_addr)
{
        unsigned long flags;
        u64 r;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        /* read low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        r = readl(pcie_data_offset);
        /* read high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        r |= ((u64)readl(pcie_data_offset) << 32);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

/**
 * amdgpu_device_indirect_wreg - write to an indirect register
 *
 * @adev: amdgpu_device pointer
 * @pcie_index: mmio register offset
 * @pcie_data: mmio register offset
 * @reg_addr: indirect register offset
 * @reg_data: indirect register data
 *
 */
void amdgpu_device_indirect_wreg(struct amdgpu_device *adev,
                                 u32 pcie_index, u32 pcie_data,
                                 u32 reg_addr, u32 reg_data)
{
        unsigned long flags;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        writel(reg_data, pcie_data_offset);
        readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}

/**
 * amdgpu_device_indirect_wreg64 - write to a 64 bit indirect register
 *
 * @adev: amdgpu_device pointer
 * @pcie_index: mmio register offset
 * @pcie_data: mmio register offset
 * @reg_addr: indirect register offset
 * @reg_data: indirect register data
 *
 */
void amdgpu_device_indirect_wreg64(struct amdgpu_device *adev,
                                   u32 pcie_index, u32 pcie_data,
                                   u32 reg_addr, u64 reg_data)
{
        unsigned long flags;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        /* write low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
        readl(pcie_data_offset);
        /* write high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        writel((u32)(reg_data >> 32), pcie_data_offset);
        readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}
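
/*
 * Usage sketch (illustrative of the pattern in the SOC files, e.g.
 * soc15.c): ASIC code wires these helpers up as the adev->pcie_rreg /
 * adev->pcie_wreg callbacks, using the NBIO block's index/data register
 * pair. soc_pcie_rreg is a placeholder name:
 *
 *   static u32 soc_pcie_rreg(struct amdgpu_device *adev, u32 reg)
 *   {
 *           unsigned long address, data;
 *
 *           address = adev->nbio.funcs->get_pcie_index_offset(adev);
 *           data = adev->nbio.funcs->get_pcie_data_offset(adev);
 *
 *           return amdgpu_device_indirect_rreg(adev, address, data, reg);
 *   }
 */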

/**
 * amdgpu_invalid_rreg - dummy reg read function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint32_t amdgpu_invalid_rreg(struct amdgpu_device *adev, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%04X\n", reg);
        BUG();
        return 0;
}

/**
 * amdgpu_invalid_wreg - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_invalid_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
{
        DRM_ERROR("Invalid callback to write register 0x%04X with 0x%08X\n",
                  reg, v);
        BUG();
}

/**
 * amdgpu_invalid_rreg64 - dummy 64 bit reg read function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint64_t amdgpu_invalid_rreg64(struct amdgpu_device *adev, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read 64 bit register 0x%04X\n", reg);
        BUG();
        return 0;
}

/**
 * amdgpu_invalid_wreg64 - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_invalid_wreg64(struct amdgpu_device *adev, uint32_t reg, uint64_t v)
{
        DRM_ERROR("Invalid callback to write 64 bit register 0x%04X with 0x%08llX\n",
                  reg, v);
        BUG();
}

/**
 * amdgpu_block_invalid_rreg - dummy reg read function
 *
 * @adev: amdgpu_device pointer
 * @block: offset of instance
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint32_t amdgpu_block_invalid_rreg(struct amdgpu_device *adev,
                                          uint32_t block, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%04X in block 0x%04X\n",
                  reg, block);
        BUG();
        return 0;
}

/**
 * amdgpu_block_invalid_wreg - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @block: offset of instance
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_block_invalid_wreg(struct amdgpu_device *adev,
                                      uint32_t block,
                                      uint32_t reg, uint32_t v)
{
        DRM_ERROR("Invalid block callback to write register 0x%04X in block 0x%04X with 0x%08X\n",
                  reg, block, v);
        BUG();
}

/**
 * amdgpu_device_asic_init - Wrapper for atom asic_init
 *
 * @adev: amdgpu_device pointer
 *
 * Does any asic specific work and then calls atom asic init.
 */
static int amdgpu_device_asic_init(struct amdgpu_device *adev)
{
        amdgpu_asic_pre_asic_init(adev);

        if (adev->ip_versions[GC_HWIP][0] >= IP_VERSION(11, 0, 0))
                return amdgpu_atomfirmware_asic_init(adev, true);
        else
                return amdgpu_atom_asic_init(adev->mode_info.atom_context);
}

/**
 * amdgpu_device_vram_scratch_init - allocate the VRAM scratch page
 *
 * @adev: amdgpu_device pointer
 *
 * Allocates a scratch page of VRAM for use by various things in the
 * driver.
 */
static int amdgpu_device_vram_scratch_init(struct amdgpu_device *adev)
{
        return amdgpu_bo_create_kernel(adev, AMDGPU_GPU_PAGE_SIZE,
                                       PAGE_SIZE, AMDGPU_GEM_DOMAIN_VRAM,
                                       &adev->vram_scratch.robj,
                                       &adev->vram_scratch.gpu_addr,
                                       (void **)&adev->vram_scratch.ptr);
}

/**
 * amdgpu_device_vram_scratch_fini - Free the VRAM scratch page
 *
 * @adev: amdgpu_device pointer
 *
 * Frees the VRAM scratch page.
 */
static void amdgpu_device_vram_scratch_fini(struct amdgpu_device *adev)
{
        amdgpu_bo_free_kernel(&adev->vram_scratch.robj, NULL, NULL);
}

/**
 * amdgpu_device_program_register_sequence - program an array of registers.
 *
 * @adev: amdgpu_device pointer
 * @registers: pointer to the register array
 * @array_size: size of the register array
 *
 * Programs an array of registers with AND and OR masks.
 * This is a helper for setting golden registers.
 */
void amdgpu_device_program_register_sequence(struct amdgpu_device *adev,
                                             const u32 *registers,
                                             const u32 array_size)
{
        u32 tmp, reg, and_mask, or_mask;
        int i;

        if (array_size % 3)
                return;

        for (i = 0; i < array_size; i += 3) {
                reg = registers[i + 0];
                and_mask = registers[i + 1];
                or_mask = registers[i + 2];

                if (and_mask == 0xffffffff) {
                        tmp = or_mask;
                } else {
                        tmp = RREG32(reg);
                        tmp &= ~and_mask;
                        if (adev->family >= AMDGPU_FAMILY_AI)
                                tmp |= (or_mask & and_mask);
                        else
                                tmp |= or_mask;
                }
                WREG32(reg, tmp);
        }
}
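
/*
 * Example (illustrative): a golden-register table is a flat array of
 * {offset, and_mask, or_mask} triplets. The names below are placeholders,
 * not real registers:
 *
 *   static const u32 fake_golden_settings[] = {
 *           mmFAKE_REG_A, 0xffffffff, 0x00000100,  // overwrite whole reg
 *           mmFAKE_REG_B, 0x0000000f, 0x00000002,  // rmw low nibble only
 *   };
 *
 *   amdgpu_device_program_register_sequence(adev, fake_golden_settings,
 *                                           ARRAY_SIZE(fake_golden_settings));
 */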

/**
 * amdgpu_device_pci_config_reset - reset the GPU
 *
 * @adev: amdgpu_device pointer
 *
 * Resets the GPU using the pci config reset sequence.
 * Only applicable to asics prior to vega10.
 */
void amdgpu_device_pci_config_reset(struct amdgpu_device *adev)
{
        pci_write_config_dword(adev->pdev, 0x7c, AMDGPU_ASIC_RESET_DATA);
}

/**
 * amdgpu_device_pci_reset - reset the GPU using generic PCI means
 *
 * @adev: amdgpu_device pointer
 *
 * Resets the GPU using generic pci reset interfaces (FLR, SBR, etc.).
 */
int amdgpu_device_pci_reset(struct amdgpu_device *adev)
{
        return pci_reset_function(adev->pdev);
}

/*
 * GPU doorbell aperture helper functions.
 */
/**
 * amdgpu_device_doorbell_init - Init doorbell driver information.
 *
 * @adev: amdgpu_device pointer
 *
 * Init doorbell driver information (CIK)
 * Returns 0 on success, error on failure.
 */
static int amdgpu_device_doorbell_init(struct amdgpu_device *adev)
{

        /* No doorbell on SI hardware generation */
        if (adev->asic_type < CHIP_BONAIRE) {
                adev->doorbell.base = 0;
                adev->doorbell.size = 0;
                adev->doorbell.num_doorbells = 0;
                adev->doorbell.ptr = NULL;
                return 0;
        }

        if (pci_resource_flags(adev->pdev, 2) & IORESOURCE_UNSET)
                return -EINVAL;

        amdgpu_asic_init_doorbell_index(adev);

        /* doorbell bar mapping */
        adev->doorbell.base = pci_resource_start(adev->pdev, 2);
        adev->doorbell.size = pci_resource_len(adev->pdev, 2);

        if (adev->enable_mes) {
                adev->doorbell.num_doorbells =
                        adev->doorbell.size / sizeof(u32);
        } else {
                adev->doorbell.num_doorbells =
                        min_t(u32, adev->doorbell.size / sizeof(u32),
                              adev->doorbell_index.max_assignment + 1);
                if (adev->doorbell.num_doorbells == 0)
                        return -EINVAL;

                /* For Vega, reserve and map two pages on the doorbell BAR
                 * since the SDMA paging queue doorbell uses the second page.
                 * The AMDGPU_DOORBELL64_MAX_ASSIGNMENT definition assumes all
                 * the doorbells are in the first page, so with the paging
                 * queue enabled, num_doorbells grows by one extra page
                 * (0x400 dwords).
                 */
                if (adev->asic_type >= CHIP_VEGA10)
                        adev->doorbell.num_doorbells += 0x400;
        }

        adev->doorbell.ptr = ioremap(adev->doorbell.base,
                                     adev->doorbell.num_doorbells *
                                     sizeof(u32));
        if (adev->doorbell.ptr == NULL)
                return -ENOMEM;

        return 0;
}

/**
 * amdgpu_device_doorbell_fini - Tear down doorbell driver information.
 *
 * @adev: amdgpu_device pointer
 *
 * Tear down doorbell driver information (CIK)
 */
static void amdgpu_device_doorbell_fini(struct amdgpu_device *adev)
{
        iounmap(adev->doorbell.ptr);
        adev->doorbell.ptr = NULL;
}


/*
 * amdgpu_device_wb_*()
 * Writeback is the method by which the GPU updates special pages in memory
 * with the status of certain GPU events (fences, ring pointers, etc.).
 */

/**
 * amdgpu_device_wb_fini - Disable Writeback and free memory
 *
 * @adev: amdgpu_device pointer
 *
 * Disables Writeback and frees the Writeback memory (all asics).
 * Used at driver shutdown.
 */
static void amdgpu_device_wb_fini(struct amdgpu_device *adev)
{
        if (adev->wb.wb_obj) {
                amdgpu_bo_free_kernel(&adev->wb.wb_obj,
                                      &adev->wb.gpu_addr,
                                      (void **)&adev->wb.wb);
                adev->wb.wb_obj = NULL;
        }
}

/**
 * amdgpu_device_wb_init - Init Writeback driver info and allocate memory
 *
 * @adev: amdgpu_device pointer
 *
 * Initializes writeback and allocates writeback memory (all asics).
 * Used at driver startup.
 * Returns 0 on success or a negative error code on failure.
 */
static int amdgpu_device_wb_init(struct amdgpu_device *adev)
{
        int r;

        if (adev->wb.wb_obj == NULL) {
                /* AMDGPU_MAX_WB * sizeof(uint32_t) * 8 = AMDGPU_MAX_WB 256bit slots */
                r = amdgpu_bo_create_kernel(adev, AMDGPU_MAX_WB * sizeof(uint32_t) * 8,
                                            PAGE_SIZE, AMDGPU_GEM_DOMAIN_GTT,
                                            &adev->wb.wb_obj, &adev->wb.gpu_addr,
                                            (void **)&adev->wb.wb);
                if (r) {
                        dev_warn(adev->dev, "(%d) create WB bo failed\n", r);
                        return r;
                }

                adev->wb.num_wb = AMDGPU_MAX_WB;
                memset(&adev->wb.used, 0, sizeof(adev->wb.used));

                /* clear wb memory */
                memset((char *)adev->wb.wb, 0, AMDGPU_MAX_WB * sizeof(uint32_t) * 8);
        }

        return 0;
}

/**
 * amdgpu_device_wb_get - Allocate a wb entry
 *
 * @adev: amdgpu_device pointer
 * @wb: wb index
 *
 * Allocate a wb slot for use by the driver (all asics).
 * Returns 0 on success or -EINVAL on failure.
 */
int amdgpu_device_wb_get(struct amdgpu_device *adev, u32 *wb)
{
        unsigned long offset = find_first_zero_bit(adev->wb.used, adev->wb.num_wb);

        if (offset < adev->wb.num_wb) {
                __set_bit(offset, adev->wb.used);
                *wb = offset << 3; /* convert to dw offset */
                return 0;
        } else {
                return -EINVAL;
        }
}

/**
 * amdgpu_device_wb_free - Free a wb entry
 *
 * @adev: amdgpu_device pointer
 * @wb: wb index
 *
 * Free a wb slot allocated for use by the driver (all asics)
 */
void amdgpu_device_wb_free(struct amdgpu_device *adev, u32 wb)
{
        wb >>= 3;
        if (wb < adev->wb.num_wb)
                __clear_bit(wb, adev->wb.used);
}
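
/*
 * Usage sketch (illustrative): a caller allocates a writeback slot,
 * derives the CPU and GPU addresses of its dword, and frees the slot on
 * teardown. This mirrors how rings use their fence/wptr offsets:
 *
 *   u32 wb;
 *
 *   if (!amdgpu_device_wb_get(adev, &wb)) {
 *           u64 gpu_addr = adev->wb.gpu_addr + (wb * 4);
 *           volatile u32 *cpu_ptr = &adev->wb.wb[wb];
 *
 *           // ... hand gpu_addr to the engine, poll *cpu_ptr ...
 *           amdgpu_device_wb_free(adev, wb);
 *   }
 */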

/**
 * amdgpu_device_resize_fb_bar - try to resize FB BAR
 *
 * @adev: amdgpu_device pointer
 *
 * Try to resize FB BAR to make all VRAM CPU accessible. We try very hard not
 * to fail, but if any of the BARs is not accessible after the resize we abort
 * driver loading by returning -ENODEV.
 */
int amdgpu_device_resize_fb_bar(struct amdgpu_device *adev)
{
        int rbar_size = pci_rebar_bytes_to_size(adev->gmc.real_vram_size);
        struct pci_bus *root;
        struct resource *res;
        unsigned i;
        u16 cmd;
        int r;

        /* Bypass for VF */
        if (amdgpu_sriov_vf(adev))
                return 0;

        /* skip if the bios has already enabled large BAR */
        if (adev->gmc.real_vram_size &&
            (pci_resource_len(adev->pdev, 0) >= adev->gmc.real_vram_size))
                return 0;

        /* Check if the root BUS has 64bit memory resources */
        root = adev->pdev->bus;
        while (root->parent)
                root = root->parent;

        pci_bus_for_each_resource(root, res, i) {
                if (res && res->flags & (IORESOURCE_MEM | IORESOURCE_MEM_64) &&
                    res->start > 0x100000000ull)
                        break;
        }

        /* Trying to resize is pointless without a root hub window above 4GB */
        if (!res)
                return 0;

        /* Limit the BAR size to what is available */
        rbar_size = min(fls(pci_rebar_get_possible_sizes(adev->pdev, 0)) - 1,
                        rbar_size);

        /* Disable memory decoding while we change the BAR addresses and size */
        pci_read_config_word(adev->pdev, PCI_COMMAND, &cmd);
        pci_write_config_word(adev->pdev, PCI_COMMAND,
                              cmd & ~PCI_COMMAND_MEMORY);

        /* Free the VRAM and doorbell BAR, we most likely need to move both. */
        amdgpu_device_doorbell_fini(adev);
        if (adev->asic_type >= CHIP_BONAIRE)
                pci_release_resource(adev->pdev, 2);

        pci_release_resource(adev->pdev, 0);

        r = pci_resize_resource(adev->pdev, 0, rbar_size);
        if (r == -ENOSPC)
                DRM_INFO("Not enough PCI address space for a large BAR.");
        else if (r && r != -ENOTSUPP)
                DRM_ERROR("Problem resizing BAR0 (%d).", r);

        pci_assign_unassigned_bus_resources(adev->pdev->bus);

        /* When the doorbell or fb BAR isn't available we have no chance of
         * using the device.
         */
        r = amdgpu_device_doorbell_init(adev);
        if (r || (pci_resource_flags(adev->pdev, 0) & IORESOURCE_UNSET))
                return -ENODEV;

        pci_write_config_word(adev->pdev, PCI_COMMAND, cmd);

        return 0;
}

/*
 * GPU helper functions.
 */
/**
 * amdgpu_device_need_post - check if the hw needs post or not
 *
 * @adev: amdgpu_device pointer
 *
 * Check if the asic has been initialized (all asics) at driver startup
 * or post is needed if hw reset is performed.
 * Returns true if post is needed or false if not.
 */
bool amdgpu_device_need_post(struct amdgpu_device *adev)
{
        uint32_t reg;

        if (amdgpu_sriov_vf(adev))
                return false;

        if (amdgpu_passthrough(adev)) {
                /* for FIJI: In whole GPU pass-through virtualization case, after VM reboot
                 * some old smc fw still needs the driver to do a vPost, otherwise the gpu
                 * hangs. smc fw versions above 22.15 don't have this flaw, so we force
                 * vPost to be executed for smc versions below 22.15
                 */
                if (adev->asic_type == CHIP_FIJI) {
                        int err;
                        uint32_t fw_ver;

                        err = request_firmware(&adev->pm.fw, "amdgpu/fiji_smc.bin", adev->dev);
                        /* force vPost if an error occurred */
                        if (err)
                                return true;

                        fw_ver = *((uint32_t *)adev->pm.fw->data + 69);
                        if (fw_ver < 0x00160e00)
                                return true;
                }
        }

        /* Don't post if we need to reset whole hive on init */
        if (adev->gmc.xgmi.pending_reset)
                return false;

        if (adev->has_hw_reset) {
                adev->has_hw_reset = false;
                return true;
        }

        /* bios scratch used on CIK+ */
        if (adev->asic_type >= CHIP_BONAIRE)
                return amdgpu_atombios_scratch_need_asic_init(adev);

        /* check MEM_SIZE for older asics */
        reg = amdgpu_asic_get_config_memsize(adev);

        if ((reg != 0) && (reg != 0xffffffff))
                return false;

        return true;
}

/**
 * amdgpu_device_should_use_aspm - check if the device should program ASPM
 *
 * @adev: amdgpu_device pointer
 *
 * Confirm whether the module parameter and pcie bridge agree that ASPM should
 * be set for this device.
 *
 * Returns true if it should be used or false if not.
 */
bool amdgpu_device_should_use_aspm(struct amdgpu_device *adev)
{
        switch (amdgpu_aspm) {
        case -1:
                break;
        case 0:
                return false;
        case 1:
                return true;
        default:
                return false;
        }
        return pcie_aspm_enabled(adev->pdev);
}

/* if we get transitioned to only one device, take VGA back */
/**
 * amdgpu_device_vga_set_decode - enable/disable vga decode
 *
 * @pdev: PCI device pointer
 * @state: enable/disable vga decode
 *
 * Enable/disable vga decode (all asics).
 * Returns VGA resource flags.
 */
static unsigned int amdgpu_device_vga_set_decode(struct pci_dev *pdev,
                bool state)
{
        struct amdgpu_device *adev = drm_to_adev(pci_get_drvdata(pdev));

        amdgpu_asic_set_vga_state(adev, state);
        if (state)
                return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
                       VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
        else
                return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
}

/**
 * amdgpu_device_check_block_size - validate the vm block size
 *
 * @adev: amdgpu_device pointer
 *
 * Validates the vm block size specified via module parameter.
 * The vm block size defines number of bits in page table versus page directory,
 * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
 * page table and the remaining bits are in the page directory.
 */
static void amdgpu_device_check_block_size(struct amdgpu_device *adev)
{
        /* defines number of bits in page table versus page directory,
         * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
         * page table and the remaining bits are in the page directory */
        if (amdgpu_vm_block_size == -1)
                return;

        if (amdgpu_vm_block_size < 9) {
                dev_warn(adev->dev, "VM page table size (%d) too small\n",
                         amdgpu_vm_block_size);
                amdgpu_vm_block_size = -1;
        }
}

/**
 * amdgpu_device_check_vm_size - validate the vm size
 *
 * @adev: amdgpu_device pointer
 *
 * Validates the vm size in GB specified via module parameter.
 * The VM size is the size of the GPU virtual memory space in GB.
 */
static void amdgpu_device_check_vm_size(struct amdgpu_device *adev)
{
        /* no need to check the default value */
        if (amdgpu_vm_size == -1)
                return;

        if (amdgpu_vm_size < 1) {
                dev_warn(adev->dev, "VM size (%d) too small, min is 1GB\n",
                         amdgpu_vm_size);
                amdgpu_vm_size = -1;
        }
}

static void amdgpu_device_check_smu_prv_buffer_size(struct amdgpu_device *adev)
{
        struct sysinfo si;
        bool is_os_64 = (sizeof(void *) == 8);
        uint64_t total_memory;
        uint64_t dram_size_seven_GB = 0x1B8000000;
        uint64_t dram_size_three_GB = 0xB8000000;

        if (amdgpu_smu_memory_pool_size == 0)
                return;

        if (!is_os_64) {
                DRM_WARN("Not 64-bit OS, feature not supported\n");
                goto def_value;
        }
        si_meminfo(&si);
        total_memory = (uint64_t)si.totalram * si.mem_unit;

        if ((amdgpu_smu_memory_pool_size == 1) ||
                (amdgpu_smu_memory_pool_size == 2)) {
                if (total_memory < dram_size_three_GB)
                        goto def_value1;
        } else if ((amdgpu_smu_memory_pool_size == 4) ||
                (amdgpu_smu_memory_pool_size == 8)) {
                if (total_memory < dram_size_seven_GB)
                        goto def_value1;
        } else {
                DRM_WARN("Smu memory pool size not supported\n");
                goto def_value;
        }
        adev->pm.smu_prv_buffer_size = amdgpu_smu_memory_pool_size << 28;

        return;

def_value1:
        DRM_WARN("Not enough system memory\n");
def_value:
        adev->pm.smu_prv_buffer_size = 0;
}

static int amdgpu_device_init_apu_flags(struct amdgpu_device *adev)
{
        if (!(adev->flags & AMD_IS_APU) ||
            adev->asic_type < CHIP_RAVEN)
                return 0;

        switch (adev->asic_type) {
        case CHIP_RAVEN:
                if (adev->pdev->device == 0x15dd)
                        adev->apu_flags |= AMD_APU_IS_RAVEN;
                if (adev->pdev->device == 0x15d8)
                        adev->apu_flags |= AMD_APU_IS_PICASSO;
                break;
        case CHIP_RENOIR:
                if ((adev->pdev->device == 0x1636) ||
                    (adev->pdev->device == 0x164c))
                        adev->apu_flags |= AMD_APU_IS_RENOIR;
                else
                        adev->apu_flags |= AMD_APU_IS_GREEN_SARDINE;
                break;
        case CHIP_VANGOGH:
                adev->apu_flags |= AMD_APU_IS_VANGOGH;
                break;
        case CHIP_YELLOW_CARP:
                break;
        case CHIP_CYAN_SKILLFISH:
                if ((adev->pdev->device == 0x13FE) ||
                    (adev->pdev->device == 0x143F))
                        adev->apu_flags |= AMD_APU_IS_CYAN_SKILLFISH2;
                break;
        default:
                break;
        }

        return 0;
}

/**
 * amdgpu_device_check_arguments - validate module params
 *
 * @adev: amdgpu_device pointer
 *
 * Validates certain module parameters and updates
 * the associated values used by the driver (all asics).
 */
static int amdgpu_device_check_arguments(struct amdgpu_device *adev)
{
        if (amdgpu_sched_jobs < 4) {
                dev_warn(adev->dev, "sched jobs (%d) must be at least 4\n",
                         amdgpu_sched_jobs);
                amdgpu_sched_jobs = 4;
        } else if (!is_power_of_2(amdgpu_sched_jobs)) {
                dev_warn(adev->dev, "sched jobs (%d) must be a power of 2\n",
                         amdgpu_sched_jobs);
                amdgpu_sched_jobs = roundup_pow_of_two(amdgpu_sched_jobs);
        }

        if (amdgpu_gart_size != -1 && amdgpu_gart_size < 32) {
                /* gart size must be greater than or equal to 32M */
                dev_warn(adev->dev, "gart size (%d) too small\n",
                         amdgpu_gart_size);
                amdgpu_gart_size = -1;
        }

        if (amdgpu_gtt_size != -1 && amdgpu_gtt_size < 32) {
                /* gtt size must be greater than or equal to 32M */
                dev_warn(adev->dev, "gtt size (%d) too small\n",
                         amdgpu_gtt_size);
                amdgpu_gtt_size = -1;
        }

        /* valid range is between 4 and 9 inclusive */
        if (amdgpu_vm_fragment_size != -1 &&
            (amdgpu_vm_fragment_size > 9 || amdgpu_vm_fragment_size < 4)) {
                dev_warn(adev->dev, "valid range is between 4 and 9\n");
                amdgpu_vm_fragment_size = -1;
        }

        if (amdgpu_sched_hw_submission < 2) {
                dev_warn(adev->dev, "sched hw submission jobs (%d) must be at least 2\n",
                         amdgpu_sched_hw_submission);
                amdgpu_sched_hw_submission = 2;
        } else if (!is_power_of_2(amdgpu_sched_hw_submission)) {
                dev_warn(adev->dev, "sched hw submission jobs (%d) must be a power of 2\n",
                         amdgpu_sched_hw_submission);
                amdgpu_sched_hw_submission = roundup_pow_of_two(amdgpu_sched_hw_submission);
        }

        if (amdgpu_reset_method < -1 || amdgpu_reset_method > 4) {
                dev_warn(adev->dev, "invalid option for reset method, reverting to default\n");
                amdgpu_reset_method = -1;
        }

        amdgpu_device_check_smu_prv_buffer_size(adev);

        amdgpu_device_check_vm_size(adev);

        amdgpu_device_check_block_size(adev);

        adev->firmware.load_type = amdgpu_ucode_get_load_type(adev, amdgpu_fw_load_type);

        return 0;
}

/**
 * amdgpu_switcheroo_set_state - set switcheroo state
 *
 * @pdev: pci dev pointer
 * @state: vga_switcheroo state
 *
 * Callback for the switcheroo driver.  Suspends or resumes
 * the asics before or after it is powered up using ACPI methods.
 */
static void amdgpu_switcheroo_set_state(struct pci_dev *pdev,
                                        enum vga_switcheroo_state state)
{
        struct drm_device *dev = pci_get_drvdata(pdev);
        int r;

        if (amdgpu_device_supports_px(dev) && state == VGA_SWITCHEROO_OFF)
                return;

        if (state == VGA_SWITCHEROO_ON) {
                pr_info("switched on\n");
                /* don't suspend or resume card normally */
                dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;

                pci_set_power_state(pdev, PCI_D0);
                amdgpu_device_load_pci_state(pdev);
                r = pci_enable_device(pdev);
                if (r)
                        DRM_WARN("pci_enable_device failed (%d)\n", r);
                amdgpu_device_resume(dev, true);

                dev->switch_power_state = DRM_SWITCH_POWER_ON;
        } else {
                pr_info("switched off\n");
                dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
                amdgpu_device_suspend(dev, true);
                amdgpu_device_cache_pci_state(pdev);
                /* Shut down the device */
                pci_disable_device(pdev);
                pci_set_power_state(pdev, PCI_D3cold);
                dev->switch_power_state = DRM_SWITCH_POWER_OFF;
        }
}
1604
1605/**
1606 * amdgpu_switcheroo_can_switch - see if switcheroo state can change
1607 *
1608 * @pdev: pci dev pointer
1609 *
1610 * Callback for the switcheroo driver.  Checks if the switcheroo
1611 * state can be changed.
1612 * Returns true if the state can be changed, false if not.
1613 */
1614static bool amdgpu_switcheroo_can_switch(struct pci_dev *pdev)
1615{
1616        struct drm_device *dev = pci_get_drvdata(pdev);
1617
1618        /*
1619         * FIXME: open_count is protected by drm_global_mutex but that would lead to
1620         * locking inversion with the driver load path. And the access here is
1621         * completely racy anyway. So don't bother with locking for now.
1622         */
1623        return atomic_read(&dev->open_count) == 0;
1624}
1625
1626static const struct vga_switcheroo_client_ops amdgpu_switcheroo_ops = {
1627        .set_gpu_state = amdgpu_switcheroo_set_state,
1628        .reprobe = NULL,
1629        .can_switch = amdgpu_switcheroo_can_switch,
1630};
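
/*
 * Illustrative sketch (an assumption about usage, mirroring how this file
 * registers the ops during device init; px indicates PX platform support):
 *
 *	bool px = amdgpu_device_supports_px(adev_to_drm(adev));
 *
 *	vga_switcheroo_register_client(adev->pdev, &amdgpu_switcheroo_ops, px);
 */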
1631
1632/**
1633 * amdgpu_device_ip_set_clockgating_state - set the CG state
1634 *
1635 * @dev: amdgpu_device pointer
1636 * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1637 * @state: clockgating state (gate or ungate)
1638 *
1639 * Sets the requested clockgating state for all instances of
1640 * the hardware IP specified.
1641 * Returns the error code from the last instance.
1642 */
1643int amdgpu_device_ip_set_clockgating_state(void *dev,
1644                                           enum amd_ip_block_type block_type,
1645                                           enum amd_clockgating_state state)
1646{
1647        struct amdgpu_device *adev = dev;
1648        int i, r = 0;
1649
1650        for (i = 0; i < adev->num_ip_blocks; i++) {
1651                if (!adev->ip_blocks[i].status.valid)
1652                        continue;
1653                if (adev->ip_blocks[i].version->type != block_type)
1654                        continue;
1655                if (!adev->ip_blocks[i].version->funcs->set_clockgating_state)
1656                        continue;
1657                r = adev->ip_blocks[i].version->funcs->set_clockgating_state(
1658                        (void *)adev, state);
1659                if (r)
1660                        DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
1661                                  adev->ip_blocks[i].version->funcs->name, r);
1662        }
1663        return r;
1664}
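
/*
 * Example (illustrative only): gate clocks for all GFX instances and warn
 * on failure.  amdgpu_device_ip_set_powergating_state() below is used the
 * same way with AMD_PG_STATE_GATE/UNGATE.
 *
 *	r = amdgpu_device_ip_set_clockgating_state(adev,
 *						   AMD_IP_BLOCK_TYPE_GFX,
 *						   AMD_CG_STATE_GATE);
 *	if (r)
 *		dev_warn(adev->dev, "failed to gate GFX clocks (%d)\n", r);
 */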
1665
1666/**
1667 * amdgpu_device_ip_set_powergating_state - set the PG state
1668 *
1669 * @dev: amdgpu_device pointer
1670 * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1671 * @state: powergating state (gate or ungate)
1672 *
1673 * Sets the requested powergating state for all instances of
1674 * the hardware IP specified.
1675 * Returns the error code from the last instance.
1676 */
1677int amdgpu_device_ip_set_powergating_state(void *dev,
1678                                           enum amd_ip_block_type block_type,
1679                                           enum amd_powergating_state state)
1680{
1681        struct amdgpu_device *adev = dev;
1682        int i, r = 0;
1683
1684        for (i = 0; i < adev->num_ip_blocks; i++) {
1685                if (!adev->ip_blocks[i].status.valid)
1686                        continue;
1687                if (adev->ip_blocks[i].version->type != block_type)
1688                        continue;
1689                if (!adev->ip_blocks[i].version->funcs->set_powergating_state)
1690                        continue;
1691                r = adev->ip_blocks[i].version->funcs->set_powergating_state(
1692                        (void *)adev, state);
1693                if (r)
1694                        DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
1695                                  adev->ip_blocks[i].version->funcs->name, r);
1696        }
1697        return r;
1698}
1699
1700/**
1701 * amdgpu_device_ip_get_clockgating_state - get the CG state
1702 *
1703 * @adev: amdgpu_device pointer
1704 * @flags: clockgating feature flags
1705 *
1706 * Walks the list of IPs on the device and updates the clockgating
1707 * flags for each IP.
1708 * Updates @flags with the feature flags for each hardware IP where
1709 * clockgating is enabled.
1710 */
1711void amdgpu_device_ip_get_clockgating_state(struct amdgpu_device *adev,
1712                                            u64 *flags)
1713{
1714        int i;
1715
1716        for (i = 0; i < adev->num_ip_blocks; i++) {
1717                if (!adev->ip_blocks[i].status.valid)
1718                        continue;
1719                if (adev->ip_blocks[i].version->funcs->get_clockgating_state)
1720                        adev->ip_blocks[i].version->funcs->get_clockgating_state((void *)adev, flags);
1721        }
1722}
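
/*
 * Example (illustrative only): query the active clockgating features and
 * test one of the AMD_CG_SUPPORT_* bits from amd_shared.h.
 *
 *	u64 flags = 0;
 *
 *	amdgpu_device_ip_get_clockgating_state(adev, &flags);
 *	if (flags & AMD_CG_SUPPORT_GFX_MGCG)
 *		DRM_INFO("GFX medium grain clockgating is enabled\n");
 */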
1723
1724/**
1725 * amdgpu_device_ip_wait_for_idle - wait for idle
1726 *
1727 * @adev: amdgpu_device pointer
1728 * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1729 *
1730 * Waits for the requested hardware IP to be idle.
1731 * Returns 0 for success or a negative error code on failure.
1732 */
1733int amdgpu_device_ip_wait_for_idle(struct amdgpu_device *adev,
1734                                   enum amd_ip_block_type block_type)
1735{
1736        int i, r;
1737
1738        for (i = 0; i < adev->num_ip_blocks; i++) {
1739                if (!adev->ip_blocks[i].status.valid)
1740                        continue;
1741                if (adev->ip_blocks[i].version->type == block_type) {
1742                        r = adev->ip_blocks[i].version->funcs->wait_for_idle((void *)adev);
1743                        if (r)
1744                                return r;
1745                        break;
1746                }
1747        }
1748        return 0;
1750}
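
/*
 * Example (illustrative only): wait for the GMC to go idle before touching
 * its registers.
 *
 *	r = amdgpu_device_ip_wait_for_idle(adev, AMD_IP_BLOCK_TYPE_GMC);
 *	if (r)
 *		return r;
 */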
1751
1752/**
1753 * amdgpu_device_ip_is_idle - is the hardware IP idle
1754 *
1755 * @adev: amdgpu_device pointer
1756 * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1757 *
1758 * Check if the hardware IP is idle or not.
1759 * Returns true if the IP is idle, false if not.
1760 */
1761bool amdgpu_device_ip_is_idle(struct amdgpu_device *adev,
1762                              enum amd_ip_block_type block_type)
1763{
1764        int i;
1765
1766        for (i = 0; i < adev->num_ip_blocks; i++) {
1767                if (!adev->ip_blocks[i].status.valid)
1768                        continue;
1769                if (adev->ip_blocks[i].version->type == block_type)
1770                        return adev->ip_blocks[i].version->funcs->is_idle((void *)adev);
1771        }
1772        return true;
1774}
1775
1776/**
1777 * amdgpu_device_ip_get_ip_block - get a hw IP pointer
1778 *
1779 * @adev: amdgpu_device pointer
1780 * @type: Type of hardware IP (SMU, GFX, UVD, etc.)
1781 *
1782 * Returns a pointer to the hardware IP block structure
1783 * if it exists for the asic, otherwise NULL.
1784 */
1785struct amdgpu_ip_block *
1786amdgpu_device_ip_get_ip_block(struct amdgpu_device *adev,
1787                              enum amd_ip_block_type type)
1788{
1789        int i;
1790
1791        for (i = 0; i < adev->num_ip_blocks; i++)
1792                if (adev->ip_blocks[i].version->type == type)
1793                        return &adev->ip_blocks[i];
1794
1795        return NULL;
1796}
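
/*
 * Example (illustrative only): look up the GFX IP block and report its
 * version; a NULL return means the asic has no such block.
 *
 *	struct amdgpu_ip_block *ip =
 *		amdgpu_device_ip_get_ip_block(adev, AMD_IP_BLOCK_TYPE_GFX);
 *
 *	if (ip)
 *		DRM_INFO("GFX IP v%u.%u\n", ip->version->major,
 *			 ip->version->minor);
 */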
1797
1798/**
1799 * amdgpu_device_ip_block_version_cmp
1800 *
1801 * @adev: amdgpu_device pointer
1802 * @type: enum amd_ip_block_type
1803 * @major: major version
1804 * @minor: minor version
1805 *
1806 * Returns 0 if the IP block version is equal to or greater than the
1807 * requested major/minor version, 1 if it is smaller or the ip_block doesn't exist.
1808 */
1809int amdgpu_device_ip_block_version_cmp(struct amdgpu_device *adev,
1810                                       enum amd_ip_block_type type,
1811                                       u32 major, u32 minor)
1812{
1813        struct amdgpu_ip_block *ip_block = amdgpu_device_ip_get_ip_block(adev, type);
1814
1815        if (ip_block && ((ip_block->version->major > major) ||
1816                        ((ip_block->version->major == major) &&
1817                        (ip_block->version->minor >= minor))))
1818                return 0;
1819
1820        return 1;
1821}
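
/*
 * Example (illustrative only): branch on whether the SMC block is at least
 * version 11.0 (a return of 0 means equal or greater).
 *
 *	if (!amdgpu_device_ip_block_version_cmp(adev, AMD_IP_BLOCK_TYPE_SMC,
 *						11, 0))
 *		DRM_INFO("SMU 11.0+ detected\n");
 */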
1822
1823/**
1824 * amdgpu_device_ip_block_add
1825 *
1826 * @adev: amdgpu_device pointer
1827 * @ip_block_version: pointer to the IP to add
1828 *
1829 * Adds the IP block driver information to the collection of IPs
1830 * on the asic.
1831 */
1832int amdgpu_device_ip_block_add(struct amdgpu_device *adev,
1833                               const struct amdgpu_ip_block_version *ip_block_version)
1834{
1835        if (!ip_block_version)
1836                return -EINVAL;
1837
1838        switch (ip_block_version->type) {
1839        case AMD_IP_BLOCK_TYPE_VCN:
1840                if (adev->harvest_ip_mask & AMD_HARVEST_IP_VCN_MASK)
1841                        return 0;
1842                break;
1843        case AMD_IP_BLOCK_TYPE_JPEG:
1844                if (adev->harvest_ip_mask & AMD_HARVEST_IP_JPEG_MASK)
1845                        return 0;
1846                break;
1847        default:
1848                break;
1849        }
1850
1851        DRM_INFO("add ip block number %d <%s>\n", adev->num_ip_blocks,
1852                  ip_block_version->funcs->name);
1853
1854        adev->ip_blocks[adev->num_ip_blocks++].version = ip_block_version;
1855
1856        return 0;
1857}
1858
1859/**
1860 * amdgpu_device_enable_virtual_display - enable virtual display feature
1861 *
1862 * @adev: amdgpu_device pointer
1863 *
1864 * Enables the virtual display feature if the user has enabled it via
1865 * the module parameter virtual_display.  This feature provides a virtual
1866 * display hardware on headless boards or in virtualized environments.
1867 * This function parses and validates the configuration string specified by
1868 * the user and configures the virtual display configuration (number of
1869 * virtual connectors, crtcs, etc.) specified.
1870 */
1871static void amdgpu_device_enable_virtual_display(struct amdgpu_device *adev)
1872{
1873        adev->enable_virtual_display = false;
1874
1875        if (amdgpu_virtual_display) {
1876                const char *pci_address_name = pci_name(adev->pdev);
1877                char *pciaddstr, *pciaddstr_tmp, *pciaddname_tmp, *pciaddname;
1878
1879                pciaddstr = kstrdup(amdgpu_virtual_display, GFP_KERNEL);
1880                pciaddstr_tmp = pciaddstr;
1881                while ((pciaddname_tmp = strsep(&pciaddstr_tmp, ";"))) {
1882                        pciaddname = strsep(&pciaddname_tmp, ",");
1883                        if (!strcmp("all", pciaddname) ||
1884                            !strcmp(pci_address_name, pciaddname)) {
1885                                long num_crtc;
1886                                int res = -1;
1887
1888                                adev->enable_virtual_display = true;
1889
1890                                if (pciaddname_tmp)
1891                                        res = kstrtol(pciaddname_tmp, 10,
1892                                                      &num_crtc);
1893
1894                                if (!res) {
1895                                        if (num_crtc < 1)
1896                                                num_crtc = 1;
1897                                        if (num_crtc > 6)
1898                                                num_crtc = 6;
1899                                        adev->mode_info.num_crtc = num_crtc;
1900                                } else {
1901                                        adev->mode_info.num_crtc = 1;
1902                                }
1903                                break;
1904                        }
1905                }
1906
1907                DRM_INFO("virtual display string:%s, %s:virtual_display:%d, num_crtc:%d\n",
1908                         amdgpu_virtual_display, pci_address_name,
1909                         adev->enable_virtual_display, adev->mode_info.num_crtc);
1910
1911                kfree(pciaddstr);
1912        }
1913}
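
/*
 * Example (illustrative; the PCI address below is hypothetical): enable two
 * virtual crtcs on one device, or one crtc on every device, from the kernel
 * command line:
 *
 *	amdgpu.virtual_display=0000:01:00.0,2
 *	amdgpu.virtual_display=all,1
 */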
1914
1915/**
1916 * amdgpu_device_parse_gpu_info_fw - parse gpu info firmware
1917 *
1918 * @adev: amdgpu_device pointer
1919 *
1920 * Parses the asic configuration parameters specified in the gpu info
1921 * firmware and makes them available to the driver for use in configuring
1922 * the asic.
1923 * Returns 0 on success, -EINVAL on failure.
1924 */
1925static int amdgpu_device_parse_gpu_info_fw(struct amdgpu_device *adev)
1926{
1927        const char *chip_name;
1928        char fw_name[40];
1929        int err;
1930        const struct gpu_info_firmware_header_v1_0 *hdr;
1931
1932        adev->firmware.gpu_info_fw = NULL;
1933
1934        if (adev->mman.discovery_bin) {
1935                /*
1936                 * FIXME: The bounding box is still needed by Navi12, so
1937                 * temporarily read it from gpu_info firmware. Should be dropped
1938                 * when DAL no longer needs it.
1939                 */
1940                if (adev->asic_type != CHIP_NAVI12)
1941                        return 0;
1942        }
1943
1944        switch (adev->asic_type) {
1945#ifdef CONFIG_DRM_AMDGPU_SI
1946        case CHIP_VERDE:
1947        case CHIP_TAHITI:
1948        case CHIP_PITCAIRN:
1949        case CHIP_OLAND:
1950        case CHIP_HAINAN:
1951#endif
1952#ifdef CONFIG_DRM_AMDGPU_CIK
1953        case CHIP_BONAIRE:
1954        case CHIP_HAWAII:
1955        case CHIP_KAVERI:
1956        case CHIP_KABINI:
1957        case CHIP_MULLINS:
1958#endif
1959        case CHIP_TOPAZ:
1960        case CHIP_TONGA:
1961        case CHIP_FIJI:
1962        case CHIP_POLARIS10:
1963        case CHIP_POLARIS11:
1964        case CHIP_POLARIS12:
1965        case CHIP_VEGAM:
1966        case CHIP_CARRIZO:
1967        case CHIP_STONEY:
1968        case CHIP_VEGA20:
1969        case CHIP_ALDEBARAN:
1970        case CHIP_SIENNA_CICHLID:
1971        case CHIP_NAVY_FLOUNDER:
1972        case CHIP_DIMGREY_CAVEFISH:
1973        case CHIP_BEIGE_GOBY:
1974        default:
1975                return 0;
1976        case CHIP_VEGA10:
1977                chip_name = "vega10";
1978                break;
1979        case CHIP_VEGA12:
1980                chip_name = "vega12";
1981                break;
1982        case CHIP_RAVEN:
1983                if (adev->apu_flags & AMD_APU_IS_RAVEN2)
1984                        chip_name = "raven2";
1985                else if (adev->apu_flags & AMD_APU_IS_PICASSO)
1986                        chip_name = "picasso";
1987                else
1988                        chip_name = "raven";
1989                break;
1990        case CHIP_ARCTURUS:
1991                chip_name = "arcturus";
1992                break;
1993        case CHIP_NAVI12:
1994                chip_name = "navi12";
1995                break;
1996        }
1997
1998        snprintf(fw_name, sizeof(fw_name), "amdgpu/%s_gpu_info.bin", chip_name);
1999        err = request_firmware(&adev->firmware.gpu_info_fw, fw_name, adev->dev);
2000        if (err) {
2001                dev_err(adev->dev,
2002                        "Failed to load gpu_info firmware \"%s\"\n",
2003                        fw_name);
2004                goto out;
2005        }
2006        err = amdgpu_ucode_validate(adev->firmware.gpu_info_fw);
2007        if (err) {
2008                dev_err(adev->dev,
2009                        "Failed to validate gpu_info firmware \"%s\"\n",
2010                        fw_name);
2011                goto out;
2012        }
2013
2014        hdr = (const struct gpu_info_firmware_header_v1_0 *)adev->firmware.gpu_info_fw->data;
2015        amdgpu_ucode_print_gpu_info_hdr(&hdr->header);
2016
2017        switch (hdr->version_major) {
2018        case 1:
2019        {
2020                const struct gpu_info_firmware_v1_0 *gpu_info_fw =
2021                        (const struct gpu_info_firmware_v1_0 *)(adev->firmware.gpu_info_fw->data +
2022                                                                le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2023
2024                /*
2025                 * Should be dropped when DAL no longer needs it.
2026                 */
2027                if (adev->asic_type == CHIP_NAVI12)
2028                        goto parse_soc_bounding_box;
2029
2030                adev->gfx.config.max_shader_engines = le32_to_cpu(gpu_info_fw->gc_num_se);
2031                adev->gfx.config.max_cu_per_sh = le32_to_cpu(gpu_info_fw->gc_num_cu_per_sh);
2032                adev->gfx.config.max_sh_per_se = le32_to_cpu(gpu_info_fw->gc_num_sh_per_se);
2033                adev->gfx.config.max_backends_per_se = le32_to_cpu(gpu_info_fw->gc_num_rb_per_se);
2034                adev->gfx.config.max_texture_channel_caches =
2035                        le32_to_cpu(gpu_info_fw->gc_num_tccs);
2036                adev->gfx.config.max_gprs = le32_to_cpu(gpu_info_fw->gc_num_gprs);
2037                adev->gfx.config.max_gs_threads = le32_to_cpu(gpu_info_fw->gc_num_max_gs_thds);
2038                adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gpu_info_fw->gc_gs_table_depth);
2039                adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gpu_info_fw->gc_gsprim_buff_depth);
2040                adev->gfx.config.double_offchip_lds_buf =
2041                        le32_to_cpu(gpu_info_fw->gc_double_offchip_lds_buffer);
2042                adev->gfx.cu_info.wave_front_size = le32_to_cpu(gpu_info_fw->gc_wave_size);
2043                adev->gfx.cu_info.max_waves_per_simd =
2044                        le32_to_cpu(gpu_info_fw->gc_max_waves_per_simd);
2045                adev->gfx.cu_info.max_scratch_slots_per_cu =
2046                        le32_to_cpu(gpu_info_fw->gc_max_scratch_slots_per_cu);
2047                adev->gfx.cu_info.lds_size = le32_to_cpu(gpu_info_fw->gc_lds_size);
2048                if (hdr->version_minor >= 1) {
2049                        const struct gpu_info_firmware_v1_1 *gpu_info_fw =
2050                                (const struct gpu_info_firmware_v1_1 *)(adev->firmware.gpu_info_fw->data +
2051                                                                        le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2052                        adev->gfx.config.num_sc_per_sh =
2053                                le32_to_cpu(gpu_info_fw->num_sc_per_sh);
2054                        adev->gfx.config.num_packer_per_sc =
2055                                le32_to_cpu(gpu_info_fw->num_packer_per_sc);
2056                }
2057
2058parse_soc_bounding_box:
2059                /*
2060                 * SOC bounding box info is not integrated into the discovery table,
2061                 * so we always need to parse it from the gpu info firmware when needed.
2062                 */
2063                if (hdr->version_minor == 2) {
2064                        const struct gpu_info_firmware_v1_2 *gpu_info_fw =
2065                                (const struct gpu_info_firmware_v1_2 *)(adev->firmware.gpu_info_fw->data +
2066                                                                        le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2067                        adev->dm.soc_bounding_box = &gpu_info_fw->soc_bounding_box;
2068                }
2069                break;
2070        }
2071        default:
2072                dev_err(adev->dev,
2073                        "Unsupported gpu_info table %d\n", hdr->header.ucode_version);
2074                err = -EINVAL;
2075                goto out;
2076        }
2077out:
2078        return err;
2079}
2080
2081/**
2082 * amdgpu_device_ip_early_init - run early init for hardware IPs
2083 *
2084 * @adev: amdgpu_device pointer
2085 *
2086 * Early initialization pass for hardware IPs.  The hardware IPs that make
2087 * up each asic are discovered and each IP's early_init callback is run.  This
2088 * is the first stage in initializing the asic.
2089 * Returns 0 on success, negative error code on failure.
2090 */
2091static int amdgpu_device_ip_early_init(struct amdgpu_device *adev)
2092{
2093        struct drm_device *dev = adev_to_drm(adev);
2094        struct pci_dev *parent;
2095        int i, r;
2096
2097        amdgpu_device_enable_virtual_display(adev);
2098
2099        if (amdgpu_sriov_vf(adev)) {
2100                r = amdgpu_virt_request_full_gpu(adev, true);
2101                if (r)
2102                        return r;
2103        }
2104
2105        switch (adev->asic_type) {
2106#ifdef CONFIG_DRM_AMDGPU_SI
2107        case CHIP_VERDE:
2108        case CHIP_TAHITI:
2109        case CHIP_PITCAIRN:
2110        case CHIP_OLAND:
2111        case CHIP_HAINAN:
2112                adev->family = AMDGPU_FAMILY_SI;
2113                r = si_set_ip_blocks(adev);
2114                if (r)
2115                        return r;
2116                break;
2117#endif
2118#ifdef CONFIG_DRM_AMDGPU_CIK
2119        case CHIP_BONAIRE:
2120        case CHIP_HAWAII:
2121        case CHIP_KAVERI:
2122        case CHIP_KABINI:
2123        case CHIP_MULLINS:
2124                if (adev->flags & AMD_IS_APU)
2125                        adev->family = AMDGPU_FAMILY_KV;
2126                else
2127                        adev->family = AMDGPU_FAMILY_CI;
2128
2129                r = cik_set_ip_blocks(adev);
2130                if (r)
2131                        return r;
2132                break;
2133#endif
2134        case CHIP_TOPAZ:
2135        case CHIP_TONGA:
2136        case CHIP_FIJI:
2137        case CHIP_POLARIS10:
2138        case CHIP_POLARIS11:
2139        case CHIP_POLARIS12:
2140        case CHIP_VEGAM:
2141        case CHIP_CARRIZO:
2142        case CHIP_STONEY:
2143                if (adev->flags & AMD_IS_APU)
2144                        adev->family = AMDGPU_FAMILY_CZ;
2145                else
2146                        adev->family = AMDGPU_FAMILY_VI;
2147
2148                r = vi_set_ip_blocks(adev);
2149                if (r)
2150                        return r;
2151                break;
2152        default:
2153                r = amdgpu_discovery_set_ip_blocks(adev);
2154                if (r)
2155                        return r;
2156                break;
2157        }
2158
2159        if (amdgpu_has_atpx() &&
2160            (amdgpu_is_atpx_hybrid() ||
2161             amdgpu_has_atpx_dgpu_power_cntl()) &&
2162            ((adev->flags & AMD_IS_APU) == 0) &&
2163            !pci_is_thunderbolt_attached(to_pci_dev(dev->dev)))
2164                adev->flags |= AMD_IS_PX;
2165
2166        if (!(adev->flags & AMD_IS_APU)) {
2167                parent = pci_upstream_bridge(adev->pdev);
2168                adev->has_pr3 = parent ? pci_pr3_present(parent) : false;
2169        }
2170
2171        amdgpu_amdkfd_device_probe(adev);
2172
2173        adev->pm.pp_feature = amdgpu_pp_feature_mask;
2174        if (amdgpu_sriov_vf(adev) || sched_policy == KFD_SCHED_POLICY_NO_HWS)
2175                adev->pm.pp_feature &= ~PP_GFXOFF_MASK;
2176        if (amdgpu_sriov_vf(adev) && adev->asic_type == CHIP_SIENNA_CICHLID)
2177                adev->pm.pp_feature &= ~PP_OVERDRIVE_MASK;
2178
2179        for (i = 0; i < adev->num_ip_blocks; i++) {
2180                if ((amdgpu_ip_block_mask & (1 << i)) == 0) {
2181                        DRM_ERROR("disabled ip block: %d <%s>\n",
2182                                  i, adev->ip_blocks[i].version->funcs->name);
2183                        adev->ip_blocks[i].status.valid = false;
2184                } else {
2185                        if (adev->ip_blocks[i].version->funcs->early_init) {
2186                                r = adev->ip_blocks[i].version->funcs->early_init((void *)adev);
2187                                if (r == -ENOENT) {
2188                                        adev->ip_blocks[i].status.valid = false;
2189                                } else if (r) {
2190                                        DRM_ERROR("early_init of IP block <%s> failed %d\n",
2191                                                  adev->ip_blocks[i].version->funcs->name, r);
2192                                        return r;
2193                                } else {
2194                                        adev->ip_blocks[i].status.valid = true;
2195                                }
2196                        } else {
2197                                adev->ip_blocks[i].status.valid = true;
2198                        }
2199                }
2200                /* get the vbios after the asic_funcs are set up */
2201                if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2202                        r = amdgpu_device_parse_gpu_info_fw(adev);
2203                        if (r)
2204                                return r;
2205
2206                        /* Read BIOS */
2207                        if (!amdgpu_get_bios(adev))
2208                                return -EINVAL;
2209
2210                        r = amdgpu_atombios_init(adev);
2211                        if (r) {
2212                                dev_err(adev->dev, "amdgpu_atombios_init failed\n");
2213                                amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_INIT_FAIL, 0, 0);
2214                                return r;
2215                        }
2216
2217                        /* get pf2vf msg info at the earliest possible time */
2218                        if (amdgpu_sriov_vf(adev))
2219                                amdgpu_virt_init_data_exchange(adev);
2220
2221                }
2222        }
2223
2224        adev->cg_flags &= amdgpu_cg_mask;
2225        adev->pg_flags &= amdgpu_pg_mask;
2226
2227        return 0;
2228}
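
/*
 * Editor's note (worked example of the ip_block_mask test above): bit i of
 * amdgpu.ip_block_mask enables IP block i, so e.g. a mask of 0xfffffffd
 * clears bit 1 and disables the second IP block discovered for the asic.
 */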
2229
2230static int amdgpu_device_ip_hw_init_phase1(struct amdgpu_device *adev)
2231{
2232        int i, r;
2233
2234        for (i = 0; i < adev->num_ip_blocks; i++) {
2235                if (!adev->ip_blocks[i].status.sw)
2236                        continue;
2237                if (adev->ip_blocks[i].status.hw)
2238                        continue;
2239                if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
2240                    (amdgpu_sriov_vf(adev) && (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)) ||
2241                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH) {
2242                        r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2243                        if (r) {
2244                                DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2245                                          adev->ip_blocks[i].version->funcs->name, r);
2246                                return r;
2247                        }
2248                        adev->ip_blocks[i].status.hw = true;
2249                }
2250        }
2251
2252        return 0;
2253}
2254
2255static int amdgpu_device_ip_hw_init_phase2(struct amdgpu_device *adev)
2256{
2257        int i, r;
2258
2259        for (i = 0; i < adev->num_ip_blocks; i++) {
2260                if (!adev->ip_blocks[i].status.sw)
2261                        continue;
2262                if (adev->ip_blocks[i].status.hw)
2263                        continue;
2264                r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2265                if (r) {
2266                        DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2267                                  adev->ip_blocks[i].version->funcs->name, r);
2268                        return r;
2269                }
2270                adev->ip_blocks[i].status.hw = true;
2271        }
2272
2273        return 0;
2274}
2275
2276static int amdgpu_device_fw_loading(struct amdgpu_device *adev)
2277{
2278        int r = 0;
2279        int i;
2280        uint32_t smu_version;
2281
2282        if (adev->asic_type >= CHIP_VEGA10) {
2283                for (i = 0; i < adev->num_ip_blocks; i++) {
2284                        if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_PSP)
2285                                continue;
2286
2287                        if (!adev->ip_blocks[i].status.sw)
2288                                continue;
2289
2290                        /* no need to do the fw loading again if already done */
2291                        if (adev->ip_blocks[i].status.hw)
2292                                break;
2293
2294                        if (amdgpu_in_reset(adev) || adev->in_suspend) {
2295                                r = adev->ip_blocks[i].version->funcs->resume(adev);
2296                                if (r) {
2297                                        DRM_ERROR("resume of IP block <%s> failed %d\n",
2298                                                          adev->ip_blocks[i].version->funcs->name, r);
2299                                        return r;
2300                                }
2301                        } else {
2302                                r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2303                                if (r) {
2304                                        DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2305                                                          adev->ip_blocks[i].version->funcs->name, r);
2306                                        return r;
2307                                }
2308                        }
2309
2310                        adev->ip_blocks[i].status.hw = true;
2311                        break;
2312                }
2313        }
2314
2315        if (!amdgpu_sriov_vf(adev) || adev->asic_type == CHIP_TONGA)
2316                r = amdgpu_pm_load_smu_firmware(adev, &smu_version);
2317
2318        return r;
2319}
2320
2321static int amdgpu_device_init_schedulers(struct amdgpu_device *adev)
2322{
2323        long timeout;
2324        int r, i;
2325
2326        for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2327                struct amdgpu_ring *ring = adev->rings[i];
2328
2329                /* No need to set up the GPU scheduler for rings that don't need it */
2330                if (!ring || ring->no_scheduler)
2331                        continue;
2332
2333                switch (ring->funcs->type) {
2334                case AMDGPU_RING_TYPE_GFX:
2335                        timeout = adev->gfx_timeout;
2336                        break;
2337                case AMDGPU_RING_TYPE_COMPUTE:
2338                        timeout = adev->compute_timeout;
2339                        break;
2340                case AMDGPU_RING_TYPE_SDMA:
2341                        timeout = adev->sdma_timeout;
2342                        break;
2343                default:
2344                        timeout = adev->video_timeout;
2345                        break;
2346                }
2347
2348                r = drm_sched_init(&ring->sched, &amdgpu_sched_ops,
2349                                   ring->num_hw_submission, amdgpu_job_hang_limit,
2350                                   timeout, adev->reset_domain->wq,
2351                                   ring->sched_score, ring->name,
2352                                   adev->dev);
2353                if (r) {
2354                        DRM_ERROR("Failed to create scheduler on ring %s.\n",
2355                                  ring->name);
2356                        return r;
2357                }
2358        }
2359
2360        return 0;
2361}
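
/*
 * Editor's note: the per-ring timeouts selected above (gfx_timeout,
 * compute_timeout, sdma_timeout, video_timeout) are derived from the
 * amdgpu.lockup_timeout module parameter, e.g.:
 *
 *	amdgpu.lockup_timeout=10000,60000,10000,10000
 *
 * for gfx, compute, sdma and video rings respectively (values in ms).
 */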
2362
2363
2364/**
2365 * amdgpu_device_ip_init - run init for hardware IPs
2366 *
2367 * @adev: amdgpu_device pointer
2368 *
2369 * Main initialization pass for hardware IPs.  The list of all the hardware
2370 * IPs that make up the asic is walked and the sw_init and hw_init callbacks
2371 * are run.  sw_init initializes the software state associated with each IP
2372 * and hw_init initializes the hardware associated with each IP.
2373 * Returns 0 on success, negative error code on failure.
2374 */
2375static int amdgpu_device_ip_init(struct amdgpu_device *adev)
2376{
2377        int i, r;
2378
2379        r = amdgpu_ras_init(adev);
2380        if (r)
2381                return r;
2382
2383        for (i = 0; i < adev->num_ip_blocks; i++) {
2384                if (!adev->ip_blocks[i].status.valid)
2385                        continue;
2386                r = adev->ip_blocks[i].version->funcs->sw_init((void *)adev);
2387                if (r) {
2388                        DRM_ERROR("sw_init of IP block <%s> failed %d\n",
2389                                  adev->ip_blocks[i].version->funcs->name, r);
2390                        goto init_failed;
2391                }
2392                adev->ip_blocks[i].status.sw = true;
2393
2394                /* need to do gmc hw init early so we can allocate gpu mem */
2395                if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2396                        /* Try to reserve bad pages early */
2397                        if (amdgpu_sriov_vf(adev))
2398                                amdgpu_virt_exchange_data(adev);
2399
2400                        r = amdgpu_device_vram_scratch_init(adev);
2401                        if (r) {
2402                                DRM_ERROR("amdgpu_vram_scratch_init failed %d\n", r);
2403                                goto init_failed;
2404                        }
2405                        r = adev->ip_blocks[i].version->funcs->hw_init((void *)adev);
2406                        if (r) {
2407                                DRM_ERROR("hw_init %d failed %d\n", i, r);
2408                                goto init_failed;
2409                        }
2410                        r = amdgpu_device_wb_init(adev);
2411                        if (r) {
2412                                DRM_ERROR("amdgpu_device_wb_init failed %d\n", r);
2413                                goto init_failed;
2414                        }
2415                        adev->ip_blocks[i].status.hw = true;
2416
2417                        /* right after GMC hw init, we create CSA */
2418                        if (amdgpu_mcbp || amdgpu_sriov_vf(adev)) {
2419                                r = amdgpu_allocate_static_csa(adev, &adev->virt.csa_obj,
2420                                                                AMDGPU_GEM_DOMAIN_VRAM,
2421                                                                AMDGPU_CSA_SIZE);
2422                                if (r) {
2423                                        DRM_ERROR("allocate CSA failed %d\n", r);
2424                                        goto init_failed;
2425                                }
2426                        }
2427                }
2428        }
2429
2430        if (amdgpu_sriov_vf(adev))
2431                amdgpu_virt_init_data_exchange(adev);
2432
2433        r = amdgpu_ib_pool_init(adev);
2434        if (r) {
2435                dev_err(adev->dev, "IB initialization failed (%d).\n", r);
2436                amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_IB_INIT_FAIL, 0, r);
2437                goto init_failed;
2438        }
2439
2440        r = amdgpu_ucode_create_bo(adev); /* create ucode bo when sw_init complete */
2441        if (r)
2442                goto init_failed;
2443
2444        r = amdgpu_device_ip_hw_init_phase1(adev);
2445        if (r)
2446                goto init_failed;
2447
2448        r = amdgpu_device_fw_loading(adev);
2449        if (r)
2450                goto init_failed;
2451
2452        r = amdgpu_device_ip_hw_init_phase2(adev);
2453        if (r)
2454                goto init_failed;
2455
2456        /*
2457         * Retired pages will be loaded from eeprom and reserved here.
2458         * This must be called after amdgpu_device_ip_hw_init_phase2, since
2459         * on some ASICs the RAS EEPROM code relies on the SMU being fully
2460         * functional for I2C communication, which is only true at this point.
2461         *
2462         * amdgpu_ras_recovery_init may fail, but the caller only cares about
2463         * failures caused by a bad gpu state, and stops the amdgpu init
2464         * process accordingly. In all other failure cases it still releases
2465         * all the resources and prints an error message, rather than
2466         * returning a negative value to the upper level.
2467         *
2468         * Note: theoretically, this should be called before all vram
2469         * allocations to protect retired pages from abuse.
2470         */
2471        r = amdgpu_ras_recovery_init(adev);
2472        if (r)
2473                goto init_failed;
2474
2475        /*
2476         * In case of XGMI, grab an extra reference on the reset domain for this device
2477         */
2478        if (adev->gmc.xgmi.num_physical_nodes > 1) {
2479                if (amdgpu_xgmi_add_device(adev) == 0) {
2480                        struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
2481
2482                        if (!hive->reset_domain ||
2483                            !amdgpu_reset_get_reset_domain(hive->reset_domain)) {
2484                                r = -ENOENT;
2485                                goto init_failed;
2486                        }
2487
2488                        /* Drop the early temporary reset domain we created for device */
2489                        amdgpu_reset_put_reset_domain(adev->reset_domain);
2490                        adev->reset_domain = hive->reset_domain;
2491                }
2492        }
2493
2494        r = amdgpu_device_init_schedulers(adev);
2495        if (r)
2496                goto init_failed;
2497
2498        /* Don't init kfd if the whole hive needs to be reset during init */
2499        if (!adev->gmc.xgmi.pending_reset)
2500                amdgpu_amdkfd_device_init(adev);
2501
2502        amdgpu_fru_get_product_info(adev);
2503
2504init_failed:
2505        if (amdgpu_sriov_vf(adev))
2506                amdgpu_virt_release_full_gpu(adev, true);
2507
2508        return r;
2509}
2510
2511/**
2512 * amdgpu_device_fill_reset_magic - writes reset magic to gart pointer
2513 *
2514 * @adev: amdgpu_device pointer
2515 *
2516 * Writes a reset magic value to the gart pointer in VRAM.  The driver calls
2517 * this function before a GPU reset.  If the value is retained after a
2518 * GPU reset, VRAM has not been lost.  Some GPU resets may destroy VRAM contents.
2519 */
2520static void amdgpu_device_fill_reset_magic(struct amdgpu_device *adev)
2521{
2522        memcpy(adev->reset_magic, adev->gart.ptr, AMDGPU_RESET_MAGIC_NUM);
2523}
2524
2525/**
2526 * amdgpu_device_check_vram_lost - check if vram is valid
2527 *
2528 * @adev: amdgpu_device pointer
2529 *
2530 * Checks the reset magic value written to the gart pointer in VRAM.
2531 * The driver calls this after a GPU reset to see if the contents of
2532 * VRAM have been lost or not.
2533 * Returns true if vram is lost, false if not.
2534 */
2535static bool amdgpu_device_check_vram_lost(struct amdgpu_device *adev)
2536{
2537        if (memcmp(adev->gart.ptr, adev->reset_magic,
2538                        AMDGPU_RESET_MAGIC_NUM))
2539                return true;
2540
2541        if (!amdgpu_in_reset(adev))
2542                return false;
2543
2544        /*
2545         * For all ASICs with baco/mode1 reset, the VRAM is
2546         * always assumed to be lost.
2547         */
2548        switch (amdgpu_asic_reset_method(adev)) {
2549        case AMD_RESET_METHOD_BACO:
2550        case AMD_RESET_METHOD_MODE1:
2551                return true;
2552        default:
2553                return false;
2554        }
2555}
2556
2557/**
2558 * amdgpu_device_set_cg_state - set clockgating for amdgpu device
2559 *
2560 * @adev: amdgpu_device pointer
2561 * @state: clockgating state (gate or ungate)
2562 *
2563 * The list of all the hardware IPs that make up the asic is walked and the
2564 * set_clockgating_state callbacks are run.
2565 * On late init, this pass enables clockgating for hardware IPs;
2566 * on fini or suspend, it disables clockgating for hardware IPs.
2567 * Returns 0 on success, negative error code on failure.
2568 */
2570int amdgpu_device_set_cg_state(struct amdgpu_device *adev,
2571                               enum amd_clockgating_state state)
2572{
2573        int i, j, r;
2574
2575        if (amdgpu_emu_mode == 1)
2576                return 0;
2577
2578        for (j = 0; j < adev->num_ip_blocks; j++) {
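                /* walk the IP list forward when gating, in reverse when ungating */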
2579                i = state == AMD_CG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
2580                if (!adev->ip_blocks[i].status.late_initialized)
2581                        continue;
2582                /* skip CG for GFX on S0ix */
2583                if (adev->in_s0ix &&
2584                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX)
2585                        continue;
2586                /* skip CG for VCE/UVD, it's handled specially */
2587                if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
2588                    adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
2589                    adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
2590                    adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
2591                    adev->ip_blocks[i].version->funcs->set_clockgating_state) {
2592                        /* enable clockgating to save power */
2593                        r = adev->ip_blocks[i].version->funcs->set_clockgating_state((void *)adev,
2594                                                                                     state);
2595                        if (r) {
2596                                DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
2597                                          adev->ip_blocks[i].version->funcs->name, r);
2598                                return r;
2599                        }
2600                }
2601        }
2602
2603        return 0;
2604}
2605
2606int amdgpu_device_set_pg_state(struct amdgpu_device *adev,
2607                               enum amd_powergating_state state)
2608{
2609        int i, j, r;
2610
2611        if (amdgpu_emu_mode == 1)
2612                return 0;
2613
2614        for (j = 0; j < adev->num_ip_blocks; j++) {
2615                i = state == AMD_PG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
2616                if (!adev->ip_blocks[i].status.late_initialized)
2617                        continue;
2618                /* skip PG for GFX on S0ix */
2619                if (adev->in_s0ix &&
2620                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX)
2621                        continue;
2622                /* skip PG for VCE/UVD, it's handled specially */
2623                if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
2624                    adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
2625                    adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
2626                    adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
2627                    adev->ip_blocks[i].version->funcs->set_powergating_state) {
2628                        /* enable powergating to save power */
2629                        r = adev->ip_blocks[i].version->funcs->set_powergating_state((void *)adev,
2630                                                                                        state);
2631                        if (r) {
2632                                DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
2633                                          adev->ip_blocks[i].version->funcs->name, r);
2634                                return r;
2635                        }
2636                }
2637        }
2638        return 0;
2639}
2640
2641static int amdgpu_device_enable_mgpu_fan_boost(void)
2642{
2643        struct amdgpu_gpu_instance *gpu_ins;
2644        struct amdgpu_device *adev;
2645        int i, ret = 0;
2646
2647        mutex_lock(&mgpu_info.mutex);
2648
2649        /*
2650         * MGPU fan boost feature should be enabled
2651         * only when there are two or more dGPUs in
2652         * the system
2653         */
2654        if (mgpu_info.num_dgpu < 2)
2655                goto out;
2656
2657        for (i = 0; i < mgpu_info.num_dgpu; i++) {
2658                gpu_ins = &(mgpu_info.gpu_ins[i]);
2659                adev = gpu_ins->adev;
2660                if (!(adev->flags & AMD_IS_APU) &&
2661                    !gpu_ins->mgpu_fan_enabled) {
2662                        ret = amdgpu_dpm_enable_mgpu_fan_boost(adev);
2663                        if (ret)
2664                                break;
2665
2666                        gpu_ins->mgpu_fan_enabled = 1;
2667                }
2668        }
2669
2670out:
2671        mutex_unlock(&mgpu_info.mutex);
2672
2673        return ret;
2674}
2675
2676/**
2677 * amdgpu_device_ip_late_init - run late init for hardware IPs
2678 *
2679 * @adev: amdgpu_device pointer
2680 *
2681 * Late initialization pass for hardware IPs.  The list of all the hardware
2682 * IPs that make up the asic is walked and the late_init callbacks are run.
2683 * late_init covers any special initialization that an IP requires
2684 * after all of the IPs have been initialized or something that needs to happen
2685 * late in the init process.
2686 * Returns 0 on success, negative error code on failure.
2687 */
2688static int amdgpu_device_ip_late_init(struct amdgpu_device *adev)
2689{
2690        struct amdgpu_gpu_instance *gpu_instance;
2691        int i = 0, r;
2692
2693        for (i = 0; i < adev->num_ip_blocks; i++) {
2694                if (!adev->ip_blocks[i].status.hw)
2695                        continue;
2696                if (adev->ip_blocks[i].version->funcs->late_init) {
2697                        r = adev->ip_blocks[i].version->funcs->late_init((void *)adev);
2698                        if (r) {
2699                                DRM_ERROR("late_init of IP block <%s> failed %d\n",
2700                                          adev->ip_blocks[i].version->funcs->name, r);
2701                                return r;
2702                        }
2703                }
2704                adev->ip_blocks[i].status.late_initialized = true;
2705        }
2706
2707        r = amdgpu_ras_late_init(adev);
2708        if (r) {
2709                DRM_ERROR("amdgpu_ras_late_init failed %d", r);
2710                return r;
2711        }
2712
2713        amdgpu_ras_set_error_query_ready(adev, true);
2714
2715        amdgpu_device_set_cg_state(adev, AMD_CG_STATE_GATE);
2716        amdgpu_device_set_pg_state(adev, AMD_PG_STATE_GATE);
2717
2718        amdgpu_device_fill_reset_magic(adev);
2719
2720        r = amdgpu_device_enable_mgpu_fan_boost();
2721        if (r)
2722                DRM_ERROR("enable mgpu fan boost failed (%d).\n", r);
2723
2724        /* For passthrough configurations on arcturus and aldebaran, enable special SBR handling */
2725        if (amdgpu_passthrough(adev) && ((adev->asic_type == CHIP_ARCTURUS && adev->gmc.xgmi.num_physical_nodes > 1) ||
2726                               adev->asic_type == CHIP_ALDEBARAN))
2727                amdgpu_dpm_handle_passthrough_sbr(adev, true);
2728
2729        if (adev->gmc.xgmi.num_physical_nodes > 1) {
2730                mutex_lock(&mgpu_info.mutex);
2731
2732                /*
2733                 * Reset device p-state to low as this was booted with high.
2734                 *
2735                 * This should be performed only after all devices from the same
2736                 * hive get initialized.
2737                 *
2738         * However, the number of devices in a hive is not known in advance,
2739         * as it is counted one by one during device initialization.
2740                 *
2741                 * So, we wait for all XGMI interlinked devices initialized.
2742                 * This may bring some delays as those devices may come from
2743                 * different hives. But that should be OK.
2744                 */
2745                if (mgpu_info.num_dgpu == adev->gmc.xgmi.num_physical_nodes) {
2746                        for (i = 0; i < mgpu_info.num_gpu; i++) {
2747                                gpu_instance = &(mgpu_info.gpu_ins[i]);
2748                                if (gpu_instance->adev->flags & AMD_IS_APU)
2749                                        continue;
2750
2751                                r = amdgpu_xgmi_set_pstate(gpu_instance->adev,
2752                                                AMDGPU_XGMI_PSTATE_MIN);
2753                                if (r) {
2754                                        DRM_ERROR("pstate setting failed (%d).\n", r);
2755                                        break;
2756                                }
2757                        }
2758                }
2759
2760                mutex_unlock(&mgpu_info.mutex);
2761        }
2762
2763        return 0;
2764}
2765
2766/**
2767 * amdgpu_device_smu_fini_early - smu hw_fini wrapper
2768 *
2769 * @adev: amdgpu_device pointer
2770 *
2771 * For ASICs that need to disable the SMC first
2772 */
2773static void amdgpu_device_smu_fini_early(struct amdgpu_device *adev)
2774{
2775        int i, r;
2776
2777        if (adev->ip_versions[GC_HWIP][0] > IP_VERSION(9, 0, 0))
2778                return;
2779
2780        for (i = 0; i < adev->num_ip_blocks; i++) {
2781                if (!adev->ip_blocks[i].status.hw)
2782                        continue;
2783                if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
2784                        r = adev->ip_blocks[i].version->funcs->hw_fini((void *)adev);
2785                        /* XXX handle errors */
2786                        if (r) {
2787                                DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
2788                                          adev->ip_blocks[i].version->funcs->name, r);
2789                        }
2790                        adev->ip_blocks[i].status.hw = false;
2791                        break;
2792                }
2793        }
2794}
2795
2796static int amdgpu_device_ip_fini_early(struct amdgpu_device *adev)
2797{
2798        int i, r;
2799
2800        for (i = 0; i < adev->num_ip_blocks; i++) {
2801                if (!adev->ip_blocks[i].version->funcs->early_fini)
2802                        continue;
2803
2804                r = adev->ip_blocks[i].version->funcs->early_fini((void *)adev);
2805                if (r) {
2806                        DRM_DEBUG("early_fini of IP block <%s> failed %d\n",
2807                                  adev->ip_blocks[i].version->funcs->name, r);
2808                }
2809        }
2810
2811        amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
2812        amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
2813
2814        amdgpu_amdkfd_suspend(adev, false);
2815
2816        /* Workaround for ASICs that need to disable the SMC first */
2817        amdgpu_device_smu_fini_early(adev);
2818
2819        for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2820                if (!adev->ip_blocks[i].status.hw)
2821                        continue;
2822
2823                r = adev->ip_blocks[i].version->funcs->hw_fini((void *)adev);
2824                /* XXX handle errors */
2825                if (r) {
2826                        DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
2827                                  adev->ip_blocks[i].version->funcs->name, r);
2828                }
2829
2830                adev->ip_blocks[i].status.hw = false;
2831        }
2832
2833        if (amdgpu_sriov_vf(adev)) {
2834                if (amdgpu_virt_release_full_gpu(adev, false))
2835                        DRM_ERROR("failed to release exclusive mode on fini\n");
2836        }
2837
2838        return 0;
2839}
2840
2841/**
2842 * amdgpu_device_ip_fini - run fini for hardware IPs
2843 *
2844 * @adev: amdgpu_device pointer
2845 *
2846 * Main teardown pass for hardware IPs.  The list of all the hardware
2847 * IPs that make up the asic is walked and the hw_fini and sw_fini callbacks
2848 * are run.  hw_fini tears down the hardware associated with each IP
2849 * and sw_fini tears down any software state associated with each IP.
2850 * Returns 0 on success, negative error code on failure.
2851 */
2852static int amdgpu_device_ip_fini(struct amdgpu_device *adev)
2853{
2854        int i, r;
2855
2856        if (amdgpu_sriov_vf(adev) && adev->virt.ras_init_done)
2857                amdgpu_virt_release_ras_err_handler_data(adev);
2858
2859        if (adev->gmc.xgmi.num_physical_nodes > 1)
2860                amdgpu_xgmi_remove_device(adev);
2861
2862        amdgpu_amdkfd_device_fini_sw(adev);
2863
2864        for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2865                if (!adev->ip_blocks[i].status.sw)
2866                        continue;
2867
2868                if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2869                        amdgpu_ucode_free_bo(adev);
2870                        amdgpu_free_static_csa(&adev->virt.csa_obj);
2871                        amdgpu_device_wb_fini(adev);
2872                        amdgpu_device_vram_scratch_fini(adev);
2873                        amdgpu_ib_pool_fini(adev);
2874                }
2875
2876                r = adev->ip_blocks[i].version->funcs->sw_fini((void *)adev);
2877                /* XXX handle errors */
2878                if (r) {
2879                        DRM_DEBUG("sw_fini of IP block <%s> failed %d\n",
2880                                  adev->ip_blocks[i].version->funcs->name, r);
2881                }
2882                adev->ip_blocks[i].status.sw = false;
2883                adev->ip_blocks[i].status.valid = false;
2884        }
2885
2886        for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2887                if (!adev->ip_blocks[i].status.late_initialized)
2888                        continue;
2889                if (adev->ip_blocks[i].version->funcs->late_fini)
2890                        adev->ip_blocks[i].version->funcs->late_fini((void *)adev);
2891                adev->ip_blocks[i].status.late_initialized = false;
2892        }
2893
2894        amdgpu_ras_fini(adev);
2895
2896        return 0;
2897}
2898
2899/**
2900 * amdgpu_device_delayed_init_work_handler - work handler for IB tests
2901 *
2902 * @work: work_struct.
2903 */
2904static void amdgpu_device_delayed_init_work_handler(struct work_struct *work)
2905{
2906        struct amdgpu_device *adev =
2907                container_of(work, struct amdgpu_device, delayed_init_work.work);
2908        int r;
2909
2910        r = amdgpu_ib_ring_tests(adev);
2911        if (r)
2912                DRM_ERROR("ib ring test failed (%d).\n", r);
2913}
2914
2915static void amdgpu_device_delay_enable_gfx_off(struct work_struct *work)
2916{
2917        struct amdgpu_device *adev =
2918                container_of(work, struct amdgpu_device, gfx.gfx_off_delay_work.work);
2919
2920        WARN_ON_ONCE(adev->gfx.gfx_off_state);
2921        WARN_ON_ONCE(adev->gfx.gfx_off_req_count);
2922
2923        if (!amdgpu_dpm_set_powergating_by_smu(adev, AMD_IP_BLOCK_TYPE_GFX, true))
2924                adev->gfx.gfx_off_state = true;
2925}
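
/*
 * Editor's note: amdgpu_gfx_off_ctrl() (defined elsewhere in the driver)
 * increments/decrements gfx_off_req_count and schedules this delayed work;
 * GFXOFF is only actually entered here once the request count has dropped
 * to zero and the delay has expired.  Illustrative usage:
 *
 *	amdgpu_gfx_off_ctrl(adev, false);	// disallow GFXOFF
 *	... program GFX registers ...
 *	amdgpu_gfx_off_ctrl(adev, true);	// allow GFXOFF again
 */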
2926
2927/**
2928 * amdgpu_device_ip_suspend_phase1 - run suspend for hardware IPs (phase 1)
2929 *
2930 * @adev: amdgpu_device pointer
2931 *
2932 * Main suspend function for hardware IPs.  The list of all the hardware
2933 * IPs that make up the asic is walked, clockgating is disabled and the
2934 * suspend callbacks are run.  suspend puts the hardware and software state
2935 * in each IP into a state suitable for suspend.
2936 * Returns 0 on success, negative error code on failure.
2937 */
2938static int amdgpu_device_ip_suspend_phase1(struct amdgpu_device *adev)
2939{
2940        int i, r;
2941
2942        amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
2943        amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
2944
2945        for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2946                if (!adev->ip_blocks[i].status.valid)
2947                        continue;
2948
2949                /* displays are handled separately */
2950                if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_DCE)
2951                        continue;
2952
2954                r = adev->ip_blocks[i].version->funcs->suspend(adev);
2955                /* XXX handle errors */
2956                if (r) {
2957                        DRM_ERROR("suspend of IP block <%s> failed %d\n",
2958                                  adev->ip_blocks[i].version->funcs->name, r);
2959                        return r;
2960                }
2961
2962                adev->ip_blocks[i].status.hw = false;
2963        }
2964
2965        return 0;
2966}
2967
2968/**
2969 * amdgpu_device_ip_suspend_phase2 - run suspend for hardware IPs (phase 2)
2970 *
2971 * @adev: amdgpu_device pointer
2972 *
2973 * Second suspend function for hardware IPs.  The list of all the hardware
2974 * IPs that make up the asic is walked and the suspend callbacks are run
2975 * for every block except the display (DCE) blocks handled in phase 1.
2976 * suspend puts each IP into a state suitable for suspend.
2977 * Returns 0 on success, negative error code on failure.
2978 */
2979static int amdgpu_device_ip_suspend_phase2(struct amdgpu_device *adev)
2980{
2981        int i, r;
2982
2983        if (adev->in_s0ix)
2984                amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D3Entry);
2985
2986        for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2987                if (!adev->ip_blocks[i].status.valid)
2988                        continue;
2989                /* displays are handled in phase1 */
2990                if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE)
2991                        continue;
2992                /* PSP lost connection when err_event_athub occurs */
2993                if (amdgpu_ras_intr_triggered() &&
2994                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
2995                        adev->ip_blocks[i].status.hw = false;
2996                        continue;
2997                }
2998
2999                /* skip unnecessary suspend for blocks we have not initialized yet */
3000                if (adev->gmc.xgmi.pending_reset &&
3001                    !(adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3002                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC ||
3003                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3004                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH)) {
3005                        adev->ip_blocks[i].status.hw = false;
3006                        continue;
3007                }
3008
3009                /* skip suspend of gfx and psp for S0ix
3010                 * gfx is in gfxoff state, so on resume it will exit gfxoff just
3011                 * like at runtime. PSP is also part of the always on hardware
3012                 * so no need to suspend it.
3013                 */
3014                if (adev->in_s0ix &&
3015                    (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP ||
3016                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX))
3017                        continue;
3018
3019                /* XXX handle errors */
3020                r = adev->ip_blocks[i].version->funcs->suspend(adev);
3022                if (r) {
3023                        DRM_ERROR("suspend of IP block <%s> failed %d\n",
3024                                  adev->ip_blocks[i].version->funcs->name, r);
3025                }
3026                adev->ip_blocks[i].status.hw = false;
3027                /* handle putting the SMC in the appropriate state */
3028                if (!amdgpu_sriov_vf(adev)) {
3029                        if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3030                                r = amdgpu_dpm_set_mp1_state(adev, adev->mp1_state);
3031                                if (r) {
3032                                        DRM_ERROR("SMC failed to set mp1 state %d, %d\n",
3033                                                        adev->mp1_state, r);
3034                                        return r;
3035                                }
3036                        }
3037                }
3038        }
3039
3040        return 0;
3041}
3042
3043/**
3044 * amdgpu_device_ip_suspend - run suspend for hardware IPs
3045 *
3046 * @adev: amdgpu_device pointer
3047 *
3048 * Main suspend function for hardware IPs.  The list of all the hardware
3049 * IPs that make up the asic is walked, clockgating is disabled and the
3050 * suspend callbacks are run.  suspend puts the hardware and software state
3051 * in each IP into a state suitable for suspend.
3052 * Returns 0 on success, negative error code on failure.
3053 */
3054int amdgpu_device_ip_suspend(struct amdgpu_device *adev)
3055{
3056        int r;
3057
3058        if (amdgpu_sriov_vf(adev)) {
3059                amdgpu_virt_fini_data_exchange(adev);
3060                amdgpu_virt_request_full_gpu(adev, false);
3061        }
3062
3063        r = amdgpu_device_ip_suspend_phase1(adev);
3064        if (r)
3065                return r;
3066        r = amdgpu_device_ip_suspend_phase2(adev);
3067
3068        if (amdgpu_sriov_vf(adev))
3069                amdgpu_virt_release_full_gpu(adev, false);
3070
3071        return r;
3072}
3073
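/**
 * amdgpu_device_ip_reinit_early_sriov - reinit early hardware IPs after VF FLR
 *
 * @adev: amdgpu_device pointer
 *
 * Re-runs hw_init for the minimal set of IP blocks (GMC, COMMON, PSP
 * and IH) that must come back up before the rest of the IP blocks can
 * be reinitialized.
 * Returns 0 on success, negative error code on failure.
 */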
3074static int amdgpu_device_ip_reinit_early_sriov(struct amdgpu_device *adev)
3075{
3076        int i, r;
3077
3078        static enum amd_ip_block_type ip_order[] = {
3079                AMD_IP_BLOCK_TYPE_GMC,
3080                AMD_IP_BLOCK_TYPE_COMMON,
3081                AMD_IP_BLOCK_TYPE_PSP,
3082                AMD_IP_BLOCK_TYPE_IH,
3083        };
3084
3085        for (i = 0; i < adev->num_ip_blocks; i++) {
3086                int j;
3087                struct amdgpu_ip_block *block;
3088
3089                block = &adev->ip_blocks[i];
3090                block->status.hw = false;
3091
3092                for (j = 0; j < ARRAY_SIZE(ip_order); j++) {
3093
3094                        if (block->version->type != ip_order[j] ||
3095                                !block->status.valid)
3096                                continue;
3097
3098                        r = block->version->funcs->hw_init(adev);
3099                        DRM_INFO("RE-INIT-early: %s %s\n", block->version->funcs->name, r ? "failed" : "succeeded");
3100                        if (r)
3101                                return r;
3102                        block->status.hw = true;
3103                }
3104        }
3105
3106        return 0;
3107}
3108
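/**
 * amdgpu_device_ip_reinit_late_sriov - reinit remaining hardware IPs after VF FLR
 *
 * @adev: amdgpu_device pointer
 *
 * Reinitializes the remaining IP blocks (SMC, DCE, GFX, SDMA, UVD, VCE
 * and VCN) in that order.  SMC is brought back through its resume
 * callback, all other blocks through hw_init.
 * Returns 0 on success, negative error code on failure.
 */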
3109static int amdgpu_device_ip_reinit_late_sriov(struct amdgpu_device *adev)
3110{
3111        int i, r;
3112
3113        static enum amd_ip_block_type ip_order[] = {
3114                AMD_IP_BLOCK_TYPE_SMC,
3115                AMD_IP_BLOCK_TYPE_DCE,
3116                AMD_IP_BLOCK_TYPE_GFX,
3117                AMD_IP_BLOCK_TYPE_SDMA,
3118                AMD_IP_BLOCK_TYPE_UVD,
3119                AMD_IP_BLOCK_TYPE_VCE,
3120                AMD_IP_BLOCK_TYPE_VCN
3121        };
3122
3123        for (i = 0; i < ARRAY_SIZE(ip_order); i++) {
3124                int j;
3125                struct amdgpu_ip_block *block;
3126
3127                for (j = 0; j < adev->num_ip_blocks; j++) {
3128                        block = &adev->ip_blocks[j];
3129
3130                        if (block->version->type != ip_order[i] ||
3131                                !block->status.valid ||
3132                                block->status.hw)
3133                                continue;
3134
3135                        if (block->version->type == AMD_IP_BLOCK_TYPE_SMC)
3136                                r = block->version->funcs->resume(adev);
3137                        else
3138                                r = block->version->funcs->hw_init(adev);
3139
3140                        DRM_INFO("RE-INIT-late: %s %s\n", block->version->funcs->name, r ? "failed" : "succeeded");
3141                        if (r)
3142                                return r;
3143                        block->status.hw = true;
3144                }
3145        }
3146
3147        return 0;
3148}
3149
3150/**
3151 * amdgpu_device_ip_resume_phase1 - run resume for hardware IPs
3152 *
3153 * @adev: amdgpu_device pointer
3154 *
3155 * First resume function for hardware IPs.  The list of all the hardware
3156 * IPs that make up the asic is walked and the resume callbacks are run for
3157 * COMMON, GMC, and IH.  resume puts the hardware into a functional state
3158 * after a suspend and updates the software state as necessary.  This
3159 * function is also used for restoring the GPU after a GPU reset.
3160 * Returns 0 on success, negative error code on failure.
3161 */
3162static int amdgpu_device_ip_resume_phase1(struct amdgpu_device *adev)
3163{
3164        int i, r;
3165
3166        for (i = 0; i < adev->num_ip_blocks; i++) {
3167                if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3168                        continue;
3169                if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3170                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3171                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH) {
3172
3173                        r = adev->ip_blocks[i].version->funcs->resume(adev);
3174                        if (r) {
3175                                DRM_ERROR("resume of IP block <%s> failed %d\n",
3176                                          adev->ip_blocks[i].version->funcs->name, r);
3177                                return r;
3178                        }
3179                        adev->ip_blocks[i].status.hw = true;
3180                }
3181        }
3182
3183        return 0;
3184}
3185
3186/**
3187 * amdgpu_device_ip_resume_phase2 - run resume for hardware IPs
3188 *
3189 * @adev: amdgpu_device pointer
3190 *
3191 * Second resume function for hardware IPs.  The list of all the hardware
3192 * IPs that make up the asic is walked and the resume callbacks are run for
3193 * all blocks except COMMON, GMC, and IH.  resume puts the hardware into a
3194 * functional state after a suspend and updates the software state as
3195 * necessary.  This function is also used for restoring the GPU after a GPU
3196 * reset.
3197 * Returns 0 on success, negative error code on failure.
3198 */
3199static int amdgpu_device_ip_resume_phase2(struct amdgpu_device *adev)
3200{
3201        int i, r;
3202
3203        for (i = 0; i < adev->num_ip_blocks; i++) {
3204                if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3205                        continue;
3206                if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3207                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3208                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3209                    adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3210                        continue;
3211                r = adev->ip_blocks[i].version->funcs->resume(adev);
3212                if (r) {
3213                        DRM_ERROR("resume of IP block <%s> failed %d\n",
3214                                  adev->ip_blocks[i].version->funcs->name, r);
3215                        return r;
3216                }
3217                adev->ip_blocks[i].status.hw = true;
3218        }
3219
3220        return 0;
3221}
3222
3223/**
3224 * amdgpu_device_ip_resume - run resume for hardware IPs
3225 *
3226 * @adev: amdgpu_device pointer
3227 *
3228 * Main resume function for hardware IPs.  The hardware IPs
3229 * are split into two resume functions because they are
3230 * also used in recovering from a GPU reset, and some additional
3231 * steps need to be taken between them.  In this case (S3/S4) they are
3232 * run sequentially.
3233 * Returns 0 on success, negative error code on failure.
3234 */
3235static int amdgpu_device_ip_resume(struct amdgpu_device *adev)
3236{
3237        int r;
3238
3239        r = amdgpu_amdkfd_resume_iommu(adev);
3240        if (r)
3241                return r;
3242
3243        r = amdgpu_device_ip_resume_phase1(adev);
3244        if (r)
3245                return r;
3246
3247        r = amdgpu_device_fw_loading(adev);
3248        if (r)
3249                return r;
3250
3251        r = amdgpu_device_ip_resume_phase2(adev);
3252
3253        return r;
3254}
3255
3256/**
3257 * amdgpu_device_detect_sriov_bios - determine if the board supports SR-IOV
3258 *
3259 * @adev: amdgpu_device pointer
3260 *
3261 * Query the VBIOS data tables to determine if the board supports SR-IOV.
3262 */
3263static void amdgpu_device_detect_sriov_bios(struct amdgpu_device *adev)
3264{
3265        if (amdgpu_sriov_vf(adev)) {
3266                if (adev->is_atom_fw) {
3267                        if (amdgpu_atomfirmware_gpu_virtualization_supported(adev))
3268                                adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3269                } else {
3270                        if (amdgpu_atombios_has_gpu_virtualization_table(adev))
3271                                adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3272                }
3273
3274                if (!(adev->virt.caps & AMDGPU_SRIOV_CAPS_SRIOV_VBIOS))
3275                        amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_NO_VBIOS, 0, 0);
3276        }
3277}
3278
3279/**
3280 * amdgpu_device_asic_has_dc_support - determine if DC supports the asic
3281 *
3282 * @asic_type: AMD asic type
3283 *
3284 * Check if there is DC (new modesetting infrastructure) support for an asic.
3285 * returns true if DC has support, false if not.
3286 */
3287bool amdgpu_device_asic_has_dc_support(enum amd_asic_type asic_type)
3288{
3289        switch (asic_type) {
3290#ifdef CONFIG_DRM_AMDGPU_SI
3291        case CHIP_HAINAN:
3292#endif
3293        case CHIP_TOPAZ:
3294                /* chips with no display hardware */
3295                return false;
3296#if defined(CONFIG_DRM_AMD_DC)
3297        case CHIP_TAHITI:
3298        case CHIP_PITCAIRN:
3299        case CHIP_VERDE:
3300        case CHIP_OLAND:
3301                /*
3302                 * We have systems in the wild with these ASICs that require
3303                 * LVDS and VGA support which is not supported with DC.
3304                 *
3305                 * Fallback to the non-DC driver here by default so as not to
3306                 * cause regressions.
3307                 */
3308#if defined(CONFIG_DRM_AMD_DC_SI)
3309                return amdgpu_dc > 0;
3310#else
3311                return false;
3312#endif
3313        case CHIP_BONAIRE:
3314        case CHIP_KAVERI:
3315        case CHIP_KABINI:
3316        case CHIP_MULLINS:
3317                /*
3318                 * We have systems in the wild with these ASICs that require
3319                 * LVDS and VGA support which is not supported with DC.
3320                 *
3321                 * Fallback to the non-DC driver here by default so as not to
3322                 * cause regressions.
3323                 */
3324                return amdgpu_dc > 0;
3325        case CHIP_HAWAII:
3326        case CHIP_CARRIZO:
3327        case CHIP_STONEY:
3328        case CHIP_POLARIS10:
3329        case CHIP_POLARIS11:
3330        case CHIP_POLARIS12:
3331        case CHIP_VEGAM:
3332        case CHIP_TONGA:
3333        case CHIP_FIJI:
3334        case CHIP_VEGA10:
3335        case CHIP_VEGA12:
3336        case CHIP_VEGA20:
3337#if defined(CONFIG_DRM_AMD_DC_DCN)
3338        case CHIP_RAVEN:
3339        case CHIP_NAVI10:
3340        case CHIP_NAVI14:
3341        case CHIP_NAVI12:
3342        case CHIP_RENOIR:
3343        case CHIP_CYAN_SKILLFISH:
3344        case CHIP_SIENNA_CICHLID:
3345        case CHIP_NAVY_FLOUNDER:
3346        case CHIP_DIMGREY_CAVEFISH:
3347        case CHIP_BEIGE_GOBY:
3348        case CHIP_VANGOGH:
3349        case CHIP_YELLOW_CARP:
3350#endif
3351        default:
3352                return amdgpu_dc != 0;
3353#else
3354        default:
3355                if (amdgpu_dc > 0)
3356                        DRM_INFO_ONCE("Display Core has been requested via kernel parameter "
3357                                         "but isn't supported by ASIC, ignoring\n");
3358                return false;
3359#endif
3360        }
3361}
3362
3363/**
3364 * amdgpu_device_has_dc_support - check if dc is supported
3365 *
3366 * @adev: amdgpu_device pointer
3367 *
3368 * Returns true for supported, false for not supported
3369 */
3370bool amdgpu_device_has_dc_support(struct amdgpu_device *adev)
3371{
3372        if (amdgpu_sriov_vf(adev) ||
3373            adev->enable_virtual_display ||
3374            (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
3375                return false;
3376
3377        return amdgpu_device_asic_has_dc_support(adev->asic_type);
3378}
3379
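/**
 * amdgpu_device_xgmi_reset_func - reset worker for a device in an XGMI hive
 *
 * @__work: work_struct.
 *
 * Resets the device as part of a hive-wide reset, using task barriers to
 * keep the BACO enter/exit (or the full ASIC reset) in lockstep with the
 * other devices in the hive.
 */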
3380static void amdgpu_device_xgmi_reset_func(struct work_struct *__work)
3381{
3382        struct amdgpu_device *adev =
3383                container_of(__work, struct amdgpu_device, xgmi_reset_work);
3384        struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
3385
3386        /* It's a bug to not have a hive within this function */
3387        if (WARN_ON(!hive))
3388                return;
3389
3390        /*
3391         * Use task barrier to synchronize all xgmi reset works across the
3392         * hive. task_barrier_enter and task_barrier_exit will block
3393         * until all the threads running the xgmi reset works reach
3394         * those points. task_barrier_full will do both blocks.
3395         */
3396        if (amdgpu_asic_reset_method(adev) == AMD_RESET_METHOD_BACO) {
3397
3398                task_barrier_enter(&hive->tb);
3399                adev->asic_reset_res = amdgpu_device_baco_enter(adev_to_drm(adev));
3400
3401                if (adev->asic_reset_res)
3402                        goto fail;
3403
3404                task_barrier_exit(&hive->tb);
3405                adev->asic_reset_res = amdgpu_device_baco_exit(adev_to_drm(adev));
3406
3407                if (adev->asic_reset_res)
3408                        goto fail;
3409
3410                if (adev->mmhub.ras && adev->mmhub.ras->ras_block.hw_ops &&
3411                    adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count)
3412                        adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count(adev);
3413        } else {
3414
3415                task_barrier_full(&hive->tb);
3416                adev->asic_reset_res = amdgpu_asic_reset(adev);
3417        }
3418
3419fail:
3420        if (adev->asic_reset_res)
3421                DRM_WARN("ASIC reset failed with error %d for drm dev %s",
3422                         adev->asic_reset_res, adev_to_drm(adev)->unique);
3423        amdgpu_put_xgmi_hive(hive);
3424}
3425
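/**
 * amdgpu_device_get_job_timeout_settings - parse the lockup timeout parameter
 *
 * @adev: amdgpu_device pointer
 *
 * Applies the default gfx, compute, sdma and video job timeouts and then
 * overrides them with the values given in the amdgpu_lockup_timeout
 * module parameter.
 * Returns 0 on success, negative error code on a malformed parameter.
 */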
3426static int amdgpu_device_get_job_timeout_settings(struct amdgpu_device *adev)
3427{
3428        char *input = amdgpu_lockup_timeout;
3429        char *timeout_setting = NULL;
3430        int index = 0;
3431        long timeout;
3432        int ret = 0;
3433
3434        /*
3435         * By default the timeout for non-compute jobs is 10000 ms
3436         * and 60000 ms for compute jobs.
3437         * In SR-IOV mode compute jobs keep the 60000 ms default only
3438         * with pp_one_vf enabled; otherwise they use 10000 ms as well.
3439         */
3440        adev->gfx_timeout = msecs_to_jiffies(10000);
3441        adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
3442        if (amdgpu_sriov_vf(adev))
3443                adev->compute_timeout = amdgpu_sriov_is_pp_one_vf(adev) ?
3444                                        msecs_to_jiffies(60000) : msecs_to_jiffies(10000);
3445        else
3446                adev->compute_timeout = msecs_to_jiffies(60000);
3447
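        /*
         * The parameter is a comma-separated list applied in the order
         * gfx, compute, sdma, video; 0 keeps the default set above and
         * a negative value disables the lockup timeout entirely.
         */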
3448        if (strnlen(input, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
3449                while ((timeout_setting = strsep(&input, ",")) &&
3450                                strnlen(timeout_setting, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
3451                        ret = kstrtol(timeout_setting, 0, &timeout);
3452                        if (ret)
3453                                return ret;
3454
3455                        if (timeout == 0) {
3456                                index++;
3457                                continue;
3458                        } else if (timeout < 0) {
3459                                timeout = MAX_SCHEDULE_TIMEOUT;
3460                                dev_warn(adev->dev, "lockup timeout disabled");
3461                                add_taint(TAINT_SOFTLOCKUP, LOCKDEP_STILL_OK);
3462                        } else {
3463                                timeout = msecs_to_jiffies(timeout);
3464                        }
3465
3466                        switch (index++) {
3467                        case 0:
3468                                adev->gfx_timeout = timeout;
3469                                break;
3470                        case 1:
3471                                adev->compute_timeout = timeout;
3472                                break;
3473                        case 2:
3474                                adev->sdma_timeout = timeout;
3475                                break;
3476                        case 3:
3477                                adev->video_timeout = timeout;
3478                                break;
3479                        default:
3480                                break;
3481                        }
3482                }
3483                /*
3484                 * There is only one value specified and
3485                 * it should apply to all non-compute jobs.
3486                 */
3487                if (index == 1) {
3488                        adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
3489                        if (amdgpu_sriov_vf(adev) || amdgpu_passthrough(adev))
3490                                adev->compute_timeout = adev->gfx_timeout;
3491                }
3492        }
3493
3494        return ret;
3495}
3496
3497/**
3498 * amdgpu_device_check_iommu_direct_map - check if RAM direct mapped to GPU
3499 *
3500 * @adev: amdgpu_device pointer
3501 *
3502 * RAM is direct mapped to the GPU if the IOMMU is disabled or in passthrough mode
3503 */
3504static void amdgpu_device_check_iommu_direct_map(struct amdgpu_device *adev)
3505{
3506        struct iommu_domain *domain;
3507
3508        domain = iommu_get_domain_for_dev(adev->dev);
3509        if (!domain || domain->type == IOMMU_DOMAIN_IDENTITY)
3510                adev->ram_is_direct_mapped = true;
3511}
3512
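/* device attributes exposed to userspace via sysfs */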
3513static const struct attribute *amdgpu_dev_attributes[] = {
3514        &dev_attr_product_name.attr,
3515        &dev_attr_product_number.attr,
3516        &dev_attr_serial_number.attr,
3517        &dev_attr_pcie_replay_count.attr,
3518        NULL
3519};
3520
3521/**
3522 * amdgpu_device_init - initialize the driver
3523 *
3524 * @adev: amdgpu_device pointer
3525 * @flags: driver flags
3526 *
3527 * Initializes the driver info and hw (all asics).
3528 * Returns 0 for success or an error on failure.
3529 * Called at driver startup.
3530 */
3531int amdgpu_device_init(struct amdgpu_device *adev,
3532                       uint32_t flags)
3533{
3534        struct drm_device *ddev = adev_to_drm(adev);
3535        struct pci_dev *pdev = adev->pdev;
3536        int r, i;
3537        bool px = false;
3538        u32 max_MBps;
3539
3540        adev->shutdown = false;
3541        adev->flags = flags;
3542
3543        if (amdgpu_force_asic_type >= 0 && amdgpu_force_asic_type < CHIP_LAST)
3544                adev->asic_type = amdgpu_force_asic_type;
3545        else
3546                adev->asic_type = flags & AMD_ASIC_MASK;
3547
3548        adev->usec_timeout = AMDGPU_MAX_USEC_TIMEOUT;
3549        if (amdgpu_emu_mode == 1)
3550                adev->usec_timeout *= 10;
3551        adev->gmc.gart_size = 512 * 1024 * 1024;
3552        adev->accel_working = false;
3553        adev->num_rings = 0;
3554        adev->mman.buffer_funcs = NULL;
3555        adev->mman.buffer_funcs_ring = NULL;
3556        adev->vm_manager.vm_pte_funcs = NULL;
3557        adev->vm_manager.vm_pte_num_scheds = 0;
3558        adev->gmc.gmc_funcs = NULL;
3559        adev->harvest_ip_mask = 0x0;
3560        adev->fence_context = dma_fence_context_alloc(AMDGPU_MAX_RINGS);
3561        bitmap_zero(adev->gfx.pipe_reserve_bitmap, AMDGPU_MAX_COMPUTE_QUEUES);
3562
3563        adev->smc_rreg = &amdgpu_invalid_rreg;
3564        adev->smc_wreg = &amdgpu_invalid_wreg;
3565        adev->pcie_rreg = &amdgpu_invalid_rreg;
3566        adev->pcie_wreg = &amdgpu_invalid_wreg;
3567        adev->pciep_rreg = &amdgpu_invalid_rreg;
3568        adev->pciep_wreg = &amdgpu_invalid_wreg;
3569        adev->pcie_rreg64 = &amdgpu_invalid_rreg64;
3570        adev->pcie_wreg64 = &amdgpu_invalid_wreg64;
3571        adev->uvd_ctx_rreg = &amdgpu_invalid_rreg;
3572        adev->uvd_ctx_wreg = &amdgpu_invalid_wreg;
3573        adev->didt_rreg = &amdgpu_invalid_rreg;
3574        adev->didt_wreg = &amdgpu_invalid_wreg;
3575        adev->gc_cac_rreg = &amdgpu_invalid_rreg;
3576        adev->gc_cac_wreg = &amdgpu_invalid_wreg;
3577        adev->audio_endpt_rreg = &amdgpu_block_invalid_rreg;
3578        adev->audio_endpt_wreg = &amdgpu_block_invalid_wreg;
3579
3580        DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X 0x%02X).\n",
3581                 amdgpu_asic_name[adev->asic_type], pdev->vendor, pdev->device,
3582                 pdev->subsystem_vendor, pdev->subsystem_device, pdev->revision);
3583
3584        /* mutex initialization is all done here so we
3585         * can recall functions without locking issues */
3586        mutex_init(&adev->firmware.mutex);
3587        mutex_init(&adev->pm.mutex);
3588        mutex_init(&adev->gfx.gpu_clock_mutex);
3589        mutex_init(&adev->srbm_mutex);
3590        mutex_init(&adev->gfx.pipe_reserve_mutex);
3591        mutex_init(&adev->gfx.gfx_off_mutex);
3592        mutex_init(&adev->grbm_idx_mutex);
3593        mutex_init(&adev->mn_lock);
3594        mutex_init(&adev->virt.vf_errors.lock);
3595        hash_init(adev->mn_hash);
3596        mutex_init(&adev->psp.mutex);
3597        mutex_init(&adev->notifier_lock);
3598        mutex_init(&adev->pm.stable_pstate_ctx_lock);
3599        mutex_init(&adev->benchmark_mutex);
3600
3601        amdgpu_device_init_apu_flags(adev);
3602
3603        r = amdgpu_device_check_arguments(adev);
3604        if (r)
3605                return r;
3606
3607        spin_lock_init(&adev->mmio_idx_lock);
3608        spin_lock_init(&adev->smc_idx_lock);
3609        spin_lock_init(&adev->pcie_idx_lock);
3610        spin_lock_init(&adev->uvd_ctx_idx_lock);
3611        spin_lock_init(&adev->didt_idx_lock);
3612        spin_lock_init(&adev->gc_cac_idx_lock);
3613        spin_lock_init(&adev->se_cac_idx_lock);
3614        spin_lock_init(&adev->audio_endpt_idx_lock);
3615        spin_lock_init(&adev->mm_stats.lock);
3616
3617        INIT_LIST_HEAD(&adev->shadow_list);
3618        mutex_init(&adev->shadow_list_lock);
3619
3620        INIT_LIST_HEAD(&adev->reset_list);
3621
3622        INIT_LIST_HEAD(&adev->ras_list);
3623
3624        INIT_DELAYED_WORK(&adev->delayed_init_work,
3625                          amdgpu_device_delayed_init_work_handler);
3626        INIT_DELAYED_WORK(&adev->gfx.gfx_off_delay_work,
3627                          amdgpu_device_delay_enable_gfx_off);
3628
3629        INIT_WORK(&adev->xgmi_reset_work, amdgpu_device_xgmi_reset_func);
3630
3631        adev->gfx.gfx_off_req_count = 1;
3632        adev->pm.ac_power = power_supply_is_system_supplied() > 0;
3633
3634        atomic_set(&adev->throttling_logging_enabled, 1);
3635        /*
3636         * If throttling continues, logging will be performed every minute
3637         * to avoid log flooding. "-1" is subtracted since the thermal
3638         * throttling interrupt comes every second. Thus, the total logging
3639         * interval is 59 seconds (ratelimited printk interval) + 1 (waiting
3640         * for throttling interrupt) = 60 seconds.
3641         */
3642        ratelimit_state_init(&adev->throttling_logging_rs, (60 - 1) * HZ, 1);
3643        ratelimit_set_flags(&adev->throttling_logging_rs, RATELIMIT_MSG_ON_RELEASE);
3644
3645        /* Registers mapping */
3646        /* TODO: block userspace mapping of io register */
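        /* ASICs from BONAIRE onward expose the register BAR at index 5,
         * older ones at index 2.
         */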
3647        if (adev->asic_type >= CHIP_BONAIRE) {
3648                adev->rmmio_base = pci_resource_start(adev->pdev, 5);
3649                adev->rmmio_size = pci_resource_len(adev->pdev, 5);
3650        } else {
3651                adev->rmmio_base = pci_resource_start(adev->pdev, 2);
3652                adev->rmmio_size = pci_resource_len(adev->pdev, 2);
3653        }
3654
3655        for (i = 0; i < AMD_IP_BLOCK_TYPE_NUM; i++)
3656                atomic_set(&adev->pm.pwr_state[i], POWER_STATE_UNKNOWN);
3657
3658        adev->rmmio = ioremap(adev->rmmio_base, adev->rmmio_size);
3659        if (!adev->rmmio)
3660                return -ENOMEM;
3662        DRM_INFO("register mmio base: 0x%08X\n", (uint32_t)adev->rmmio_base);
3663        DRM_INFO("register mmio size: %u\n", (unsigned)adev->rmmio_size);
3664
3665        amdgpu_device_get_pcie_info(adev);
3666
3667        if (amdgpu_mcbp)
3668                DRM_INFO("MCBP is enabled\n");
3669
3670        if (adev->asic_type >= CHIP_NAVI10) {
3671                if (amdgpu_mes || amdgpu_mes_kiq)
3672                        adev->enable_mes = true;
3673
3674                if (amdgpu_mes_kiq)
3675                        adev->enable_mes_kiq = true;
3676        }
3677
3678        /*
3679         * The reset domain needs to be present early, before the XGMI hive is
3680         * discovered (if any) and initialized, since the reset sem and
3681         * in_gpu_reset flag are used early on during init, before calling RREG32.
3682         */
3683        adev->reset_domain = amdgpu_reset_create_reset_domain(SINGLE_DEVICE, "amdgpu-reset-dev");
3684        if (!adev->reset_domain)
3685                return -ENOMEM;
3686
3687        /* detect hw virtualization here */
3688        amdgpu_detect_virtualization(adev);
3689
3690        r = amdgpu_device_get_job_timeout_settings(adev);
3691        if (r) {
3692                dev_err(adev->dev, "invalid lockup_timeout parameter syntax\n");
3693                return r;
3694        }
3695
3696        /* early init functions */
3697        r = amdgpu_device_ip_early_init(adev);
3698        if (r)
3699                return r;
3700
3701        /* Enable TMZ based on IP_VERSION */
3702        amdgpu_gmc_tmz_set(adev);
3703
3704        amdgpu_gmc_noretry_set(adev);
3705        /* Need to get xgmi info early to decide the reset behavior */
3706        if (adev->gmc.xgmi.supported) {
3707                r = adev->gfxhub.funcs->get_xgmi_info(adev);
3708                if (r)
3709                        return r;
3710        }
3711
3712        /* enable PCIE atomic ops */
3713        if (amdgpu_sriov_vf(adev))
3714                adev->have_atomics_support = ((struct amd_sriov_msg_pf2vf_info *)
3715                        adev->virt.fw_reserve.p_pf2vf)->pcie_atomic_ops_support_flags ==
3716                        (PCI_EXP_DEVCAP2_ATOMIC_COMP32 | PCI_EXP_DEVCAP2_ATOMIC_COMP64);
3717        else
3718                adev->have_atomics_support =
3719                        !pci_enable_atomic_ops_to_root(adev->pdev,
3720                                          PCI_EXP_DEVCAP2_ATOMIC_COMP32 |
3721                                          PCI_EXP_DEVCAP2_ATOMIC_COMP64);
3722        if (!adev->have_atomics_support)
3723                dev_info(adev->dev, "PCIE atomic ops are not supported\n");
3724
3725        /* doorbell bar mapping and doorbell index init */
3726        amdgpu_device_doorbell_init(adev);
3727
3728        if (amdgpu_emu_mode == 1) {
3729                /* post the asic on emulation mode */
3730                emu_soc_asic_init(adev);
3731                goto fence_driver_init;
3732        }
3733
3734        amdgpu_reset_init(adev);
3735
3736        /* detect if we are with an SRIOV vbios */
3737        amdgpu_device_detect_sriov_bios(adev);
3738
3739        /* check if we need to reset the asic
3740         *  E.g., driver was not cleanly unloaded previously, etc.
3741         */
3742        if (!amdgpu_sriov_vf(adev) && amdgpu_asic_need_reset_on_init(adev)) {
3743                if (adev->gmc.xgmi.num_physical_nodes) {
3744                        dev_info(adev->dev, "Pending hive reset.\n");
3745                        adev->gmc.xgmi.pending_reset = true;
3746                        /* Only need to init the blocks necessary for SMU to handle the reset */
3747                        for (i = 0; i < adev->num_ip_blocks; i++) {
3748                                if (!adev->ip_blocks[i].status.valid)
3749                                        continue;
3750                                if (!(adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3751                                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3752                                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3753                                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC)) {
3754                                        DRM_DEBUG("IP %s disabled for hw_init.\n",
3755                                                adev->ip_blocks[i].version->funcs->name);
3756                                        adev->ip_blocks[i].status.hw = true;
3757                                }
3758                        }
3759                } else {
3760                        r = amdgpu_asic_reset(adev);
3761                        if (r) {
3762                                dev_err(adev->dev, "asic reset on init failed\n");
3763                                goto failed;
3764                        }
3765                }
3766        }
3767
3768        pci_enable_pcie_error_reporting(adev->pdev);
3769
3770        /* Post card if necessary */
3771        if (amdgpu_device_need_post(adev)) {
3772                if (!adev->bios) {
3773                        dev_err(adev->dev, "no vBIOS found\n");
3774                        r = -EINVAL;
3775                        goto failed;
3776                }
3777                DRM_INFO("GPU posting now...\n");
3778                r = amdgpu_device_asic_init(adev);
3779                if (r) {
3780                        dev_err(adev->dev, "gpu post error!\n");
3781                        goto failed;
3782                }
3783        }
3784
3785        if (adev->is_atom_fw) {
3786                /* Initialize clocks */
3787                r = amdgpu_atomfirmware_get_clock_info(adev);
3788                if (r) {
3789                        dev_err(adev->dev, "amdgpu_atomfirmware_get_clock_info failed\n");
3790                        amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
3791                        goto failed;
3792                }
3793        } else {
3794                /* Initialize clocks */
3795                r = amdgpu_atombios_get_clock_info(adev);
3796                if (r) {
3797                        dev_err(adev->dev, "amdgpu_atombios_get_clock_info failed\n");
3798                        amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
3799                        goto failed;
3800                }
3801                /* init i2c buses */
3802                if (!amdgpu_device_has_dc_support(adev))
3803                        amdgpu_atombios_i2c_init(adev);
3804        }
3805
3806fence_driver_init:
3807        /* Fence driver */
3808        r = amdgpu_fence_driver_sw_init(adev);
3809        if (r) {
3810                dev_err(adev->dev, "amdgpu_fence_driver_sw_init failed\n");
3811                amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_FENCE_INIT_FAIL, 0, 0);
3812                goto failed;
3813        }
3814
3815        /* init the mode config */
3816        drm_mode_config_init(adev_to_drm(adev));
3817
3818        r = amdgpu_device_ip_init(adev);
3819        if (r) {
3820                /* failed in exclusive mode due to timeout */
3821                if (amdgpu_sriov_vf(adev) &&
3822                    !amdgpu_sriov_runtime(adev) &&
3823                    amdgpu_virt_mmio_blocked(adev) &&
3824                    !amdgpu_virt_wait_reset(adev)) {
3825                        dev_err(adev->dev, "VF exclusive mode timeout\n");
3826                        /* Don't send request since VF is inactive. */
3827                        adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
3828                        adev->virt.ops = NULL;
3829                        r = -EAGAIN;
3830                        goto release_ras_con;
3831                }
3832                dev_err(adev->dev, "amdgpu_device_ip_init failed\n");
3833                amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_INIT_FAIL, 0, 0);
3834                goto release_ras_con;
3835        }
3836
3837        amdgpu_fence_driver_hw_init(adev);
3838
3839        dev_info(adev->dev,
3840                "SE %d, SH per SE %d, CU per SH %d, active_cu_number %d\n",
3841                        adev->gfx.config.max_shader_engines,
3842                        adev->gfx.config.max_sh_per_se,
3843                        adev->gfx.config.max_cu_per_sh,
3844                        adev->gfx.cu_info.number);
3845
3846        adev->accel_working = true;
3847
3848        amdgpu_vm_check_compute_bug(adev);
3849
3850        /* Initialize the buffer migration limit. */
3851        if (amdgpu_moverate >= 0)
3852                max_MBps = amdgpu_moverate;
3853        else
3854                max_MBps = 8; /* Allow 8 MB/s. */
3855        /* Get a log2 for easy divisions. */
3856        adev->mm_stats.log2_max_MBps = ilog2(max(1u, max_MBps));
3857
3858        r = amdgpu_pm_sysfs_init(adev);
3859        if (r) {
3860                adev->pm_sysfs_en = false;
3861                DRM_ERROR("registering pm sysfs failed (%d).\n", r);
3862        } else
3863                adev->pm_sysfs_en = true;
3864
3865        r = amdgpu_ucode_sysfs_init(adev);
3866        if (r) {
3867                adev->ucode_sysfs_en = false;
3868                DRM_ERROR("Creating firmware sysfs failed (%d).\n", r);
3869        } else
3870                adev->ucode_sysfs_en = true;
3871
3872        r = amdgpu_psp_sysfs_init(adev);
3873        if (r) {
3874                adev->psp_sysfs_en = false;
3875                if (!amdgpu_sriov_vf(adev))
3876                        DRM_ERROR("Creating psp sysfs failed\n");
3877        } else
3878                adev->psp_sysfs_en = true;
3879
3880        /*
3881         * Register gpu instance before amdgpu_device_enable_mgpu_fan_boost.
3882         * Otherwise the mgpu fan boost feature will be skipped because the
3883         * gpu instance count would be too low.
3884         */
3885        amdgpu_register_gpu_instance(adev);
3886
3887        /* enable clockgating, etc. after ib tests, etc. since some blocks require
3888         * explicit gating rather than handling it automatically.
3889         */
3890        if (!adev->gmc.xgmi.pending_reset) {
3891                r = amdgpu_device_ip_late_init(adev);
3892                if (r) {
3893                        dev_err(adev->dev, "amdgpu_device_ip_late_init failed\n");
3894                        amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_LATE_INIT_FAIL, 0, r);
3895                        goto release_ras_con;
3896                }
3897                /* must succeed. */
3898                amdgpu_ras_resume(adev);
3899                queue_delayed_work(system_wq, &adev->delayed_init_work,
3900                                   msecs_to_jiffies(AMDGPU_RESUME_MS));
3901        }
3902
3903        if (amdgpu_sriov_vf(adev))
3904                flush_delayed_work(&adev->delayed_init_work);
3905
3906        r = sysfs_create_files(&adev->dev->kobj, amdgpu_dev_attributes);
3907        if (r)
3908                dev_err(adev->dev, "Could not create amdgpu device attr\n");
3909
3910        if (IS_ENABLED(CONFIG_PERF_EVENTS)) {
3911                r = amdgpu_pmu_init(adev);
3912                if (r)
3913                        dev_err(adev->dev, "amdgpu_pmu_init failed\n");
3914        }

3915        /* Keep the cached PCI config space at hand for restore after a sudden PCI error */
3916        if (amdgpu_device_cache_pci_state(adev->pdev))
3917                pci_restore_state(pdev);
3918
3919        /* if we have more than one VGA card, then disable the amdgpu VGA resources */
3920        /* this will fail for cards that aren't VGA class devices, just
3921         * ignore it */
3922        if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
3923                vga_client_register(adev->pdev, amdgpu_device_vga_set_decode);
3924
3925        if (amdgpu_device_supports_px(ddev)) {
3926                px = true;
3927                vga_switcheroo_register_client(adev->pdev,
3928                                               &amdgpu_switcheroo_ops, px);
3929                vga_switcheroo_init_domain_pm_ops(adev->dev, &adev->vga_pm_domain);
3930        }
3931
3932        if (adev->gmc.xgmi.pending_reset)
3933                queue_delayed_work(system_wq, &mgpu_info.delayed_reset_work,
3934                                   msecs_to_jiffies(AMDGPU_RESUME_MS));
3935
3936        amdgpu_device_check_iommu_direct_map(adev);
3937
3938        return 0;
3939
3940release_ras_con:
3941        amdgpu_release_ras_context(adev);
3942
3943failed:
3944        amdgpu_vf_error_trans_all(adev);
3945
3946        return r;
3947}
3948
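/**
 * amdgpu_device_unmap_mmio - unmap all MMIO mappings of the device
 *
 * @adev: amdgpu_device pointer
 *
 * Clears all CPU mappings pointing to the device, unmaps the doorbell,
 * register and VRAM BARs and releases the VRAM write-combine bookkeeping
 * where applicable.  Called when the device has been unplugged.
 */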
3949static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev)
3950{
3951
3952        /* Clear all CPU mappings pointing to this device */
3953        unmap_mapping_range(adev->ddev.anon_inode->i_mapping, 0, 0, 1);
3954
3955        /* Unmap all mapped bars - Doorbell, registers and VRAM */
3956        amdgpu_device_doorbell_fini(adev);
3957
3958        iounmap(adev->rmmio);
3959        adev->rmmio = NULL;
3960        if (adev->mman.aper_base_kaddr)
3961                iounmap(adev->mman.aper_base_kaddr);
3962        adev->mman.aper_base_kaddr = NULL;
3963
3964        /* Memory manager related */
3965        if (!adev->gmc.xgmi.connected_to_cpu) {
3966                arch_phys_wc_del(adev->gmc.vram_mtrr);
3967                arch_io_free_memtype_wc(adev->gmc.aper_base, adev->gmc.aper_size);
3968        }
3969}
3970
3971/**
3972 * amdgpu_device_fini_hw - tear down the driver
3973 *
3974 * @adev: amdgpu_device pointer
3975 *
3976 * Tear down the driver info (all asics).
3977 * Called at driver shutdown.
3978 */
3979void amdgpu_device_fini_hw(struct amdgpu_device *adev)
3980{
3981        dev_info(adev->dev, "amdgpu: finishing device.\n");
3982        flush_delayed_work(&adev->delayed_init_work);
3983        adev->shutdown = true;
3984
3985        /* make sure IB test finished before entering exclusive mode
3986         * to avoid preemption on IB test
3987         */
3988        if (amdgpu_sriov_vf(adev)) {
3989                amdgpu_virt_request_full_gpu(adev, false);
3990                amdgpu_virt_fini_data_exchange(adev);
3991        }
3992
3993        /* disable all interrupts */
3994        amdgpu_irq_disable_all(adev);
3995        if (adev->mode_info.mode_config_initialized) {
3996                if (!drm_drv_uses_atomic_modeset(adev_to_drm(adev)))
3997                        drm_helper_force_disable_all(adev_to_drm(adev));
3998                else
3999                        drm_atomic_helper_shutdown(adev_to_drm(adev));
4000        }
4001        amdgpu_fence_driver_hw_fini(adev);
4002
4003        if (adev->mman.initialized) {
4004                flush_delayed_work(&adev->mman.bdev.wq);
4005                ttm_bo_lock_delayed_workqueue(&adev->mman.bdev);
4006        }
4007
4008        if (adev->pm_sysfs_en)
4009                amdgpu_pm_sysfs_fini(adev);
4010        if (adev->ucode_sysfs_en)
4011                amdgpu_ucode_sysfs_fini(adev);
4012        if (adev->psp_sysfs_en)
4013                amdgpu_psp_sysfs_fini(adev);
4014        sysfs_remove_files(&adev->dev->kobj, amdgpu_dev_attributes);
4015
4016        /* disabling the ras feature must come before hw fini */
4017        amdgpu_ras_pre_fini(adev);
4018
4019        amdgpu_device_ip_fini_early(adev);
4020
4021        amdgpu_irq_fini_hw(adev);
4022
4023        if (adev->mman.initialized)
4024                ttm_device_clear_dma_mappings(&adev->mman.bdev);
4025
4026        amdgpu_gart_dummy_page_fini(adev);
4027
4028        if (drm_dev_is_unplugged(adev_to_drm(adev)))
4029                amdgpu_device_unmap_mmio(adev);
4030
4031}
4032
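/**
 * amdgpu_device_fini_sw - tear down the driver software state
 *
 * @adev: amdgpu_device pointer
 *
 * Second tear down stage: frees the software state created in
 * amdgpu_device_init, after amdgpu_device_fini_hw has quiesced the
 * hardware.  Called at driver shutdown.
 */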
4033void amdgpu_device_fini_sw(struct amdgpu_device *adev)
4034{
4035        int idx;
4036
4037        amdgpu_fence_driver_sw_fini(adev);
4038        amdgpu_device_ip_fini(adev);
4039        release_firmware(adev->firmware.gpu_info_fw);
4040        adev->firmware.gpu_info_fw = NULL;
4041        adev->accel_working = false;
4042
4043        amdgpu_reset_fini(adev);
4044
4045        /* free i2c buses */
4046        if (!amdgpu_device_has_dc_support(adev))
4047                amdgpu_i2c_fini(adev);
4048
4049        if (amdgpu_emu_mode != 1)
4050                amdgpu_atombios_fini(adev);
4051
4052        kfree(adev->bios);
4053        adev->bios = NULL;
4054        if (amdgpu_device_supports_px(adev_to_drm(adev))) {
4055                vga_switcheroo_unregister_client(adev->pdev);
4056                vga_switcheroo_fini_domain_pm_ops(adev->dev);
4057        }
4058        if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4059                vga_client_unregister(adev->pdev);
4060
4061        if (drm_dev_enter(adev_to_drm(adev), &idx)) {
4062
4063                iounmap(adev->rmmio);
4064                adev->rmmio = NULL;
4065                amdgpu_device_doorbell_fini(adev);
4066                drm_dev_exit(idx);
4067        }
4068
4069        if (IS_ENABLED(CONFIG_PERF_EVENTS))
4070                amdgpu_pmu_fini(adev);
4071        if (adev->mman.discovery_bin)
4072                amdgpu_discovery_fini(adev);
4073
4074        amdgpu_reset_put_reset_domain(adev->reset_domain);
4075        adev->reset_domain = NULL;
4076
4077        kfree(adev->pci_state);
4078
4079}
4080
4081/**
4082 * amdgpu_device_evict_resources - evict device resources
4083 * @adev: amdgpu device object
4084 *
4085 * Evicts all ttm device resources (vram BOs, gart table) from the lru list
4086 * of the vram memory type. Mainly used for evicting device resources
4087 * at suspend time.
4088 *
4089 */
4090static void amdgpu_device_evict_resources(struct amdgpu_device *adev)
4091{
4092        /* No need to evict vram on APUs for suspend to ram or s2idle */
4093        if ((adev->in_s3 || adev->in_s0ix) && (adev->flags & AMD_IS_APU))
4094                return;
4095
4096        if (amdgpu_ttm_evict_resources(adev, TTM_PL_VRAM))
4097                DRM_WARN("evicting device resources failed\n");
4098
4099}
4100
4101/*
4102 * Suspend & resume.
4103 */
4104/**
4105 * amdgpu_device_suspend - initiate device suspend
4106 *
4107 * @dev: drm dev pointer
4108 * @fbcon: notify the fbdev of suspend
4109 *
4110 * Puts the hw in the suspend state (all asics).
4111 * Returns 0 for success or an error on failure.
4112 * Called at driver suspend.
4113 */
4114int amdgpu_device_suspend(struct drm_device *dev, bool fbcon)
4115{
4116        struct amdgpu_device *adev = drm_to_adev(dev);
4117
4118        if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4119                return 0;
4120
4121        adev->in_suspend = true;
4122
4123        if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D3))
4124                DRM_WARN("smart shift update failed\n");
4125
4126        drm_kms_helper_poll_disable(dev);
4127
4128        if (fbcon)
4129                drm_fb_helper_set_suspend_unlocked(adev_to_drm(adev)->fb_helper, true);
4130
4131        cancel_delayed_work_sync(&adev->delayed_init_work);
4132
4133        amdgpu_ras_suspend(adev);
4134
4135        amdgpu_device_ip_suspend_phase1(adev);
4136
4137        if (!adev->in_s0ix)
4138                amdgpu_amdkfd_suspend(adev, adev->in_runpm);
4139
4140        amdgpu_device_evict_resources(adev);
4141
4142        amdgpu_fence_driver_hw_fini(adev);
4143
4144        amdgpu_device_ip_suspend_phase2(adev);
4145
4146        return 0;
4147}
4148
4149/**
4150 * amdgpu_device_resume - initiate device resume
4151 *
4152 * @dev: drm dev pointer
4153 * @fbcon: notify the fbdev of resume
4154 *
4155 * Bring the hw back to operating state (all asics).
4156 * Returns 0 for success or an error on failure.
4157 * Called at driver resume.
4158 */
4159int amdgpu_device_resume(struct drm_device *dev, bool fbcon)
4160{
4161        struct amdgpu_device *adev = drm_to_adev(dev);
4162        int r = 0;
4163
4164        if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4165                return 0;
4166
4167        if (adev->in_s0ix)
4168                amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D0Entry);
4169
4170        /* post card */
4171        if (amdgpu_device_need_post(adev)) {
4172                r = amdgpu_device_asic_init(adev);
4173                if (r)
4174                        dev_err(adev->dev, "amdgpu asic init failed\n");
4175        }
4176
4177        r = amdgpu_device_ip_resume(adev);
4178        if (r) {
4179                dev_err(adev->dev, "amdgpu_device_ip_resume failed (%d).\n", r);
4180                return r;
4181        }
4182        amdgpu_fence_driver_hw_init(adev);
4183
4184        r = amdgpu_device_ip_late_init(adev);
4185        if (r)
4186                return r;
4187
4188        queue_delayed_work(system_wq, &adev->delayed_init_work,
4189                           msecs_to_jiffies(AMDGPU_RESUME_MS));
4190
4191        if (!adev->in_s0ix) {
4192                r = amdgpu_amdkfd_resume(adev, adev->in_runpm);
4193                if (r)
4194                        return r;
4195        }
4196
4197        /* Make sure IB tests flushed */
4198        flush_delayed_work(&adev->delayed_init_work);
4199
4200        if (fbcon)
4201                drm_fb_helper_set_suspend_unlocked(adev_to_drm(adev)->fb_helper, false);
4202
4203        drm_kms_helper_poll_enable(dev);
4204
4205        amdgpu_ras_resume(adev);
4206
4207        /*
4208         * Most of the connector probing functions try to acquire runtime pm
4209         * refs to ensure that the GPU is powered on when connector polling is
4210         * performed. Since we're calling this from a runtime PM callback,
4211         * trying to acquire rpm refs will cause us to deadlock.
4212         *
4213         * Since we're guaranteed to be holding the rpm lock, it's safe to
4214         * temporarily disable the rpm helpers so this doesn't deadlock us.
4215         */
4216#ifdef CONFIG_PM
4217        dev->dev->power.disable_depth++;
4218#endif
4219        if (!amdgpu_device_has_dc_support(adev))
4220                drm_helper_hpd_irq_event(dev);
4221        else
4222                drm_kms_helper_hotplug_event(dev);
4223#ifdef CONFIG_PM
4224        dev->dev->power.disable_depth--;
4225#endif
4226        adev->in_suspend = false;
4227
4228        if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D0))
4229                DRM_WARN("smart shift update failed\n");
4230
4231        return 0;
4232}
4233
4234/**
4235 * amdgpu_device_ip_check_soft_reset - did soft reset succeed
4236 *
4237 * @adev: amdgpu_device pointer
4238 *
4239 * The list of all the hardware IPs that make up the asic is walked and
4240 * the check_soft_reset callbacks are run.  check_soft_reset determines
4241 * if the asic is still hung or not.
4242 * Returns true if any of the IPs are still in a hung state, false if not.
4243 */
4244static bool amdgpu_device_ip_check_soft_reset(struct amdgpu_device *adev)
4245{
4246        int i;
4247        bool asic_hang = false;
4248
4249        if (amdgpu_sriov_vf(adev))
4250                return true;
4251
4252        if (amdgpu_asic_need_full_reset(adev))
4253                return true;
4254
4255        for (i = 0; i < adev->num_ip_blocks; i++) {
4256                if (!adev->ip_blocks[i].status.valid)
4257                        continue;
4258                if (adev->ip_blocks[i].version->funcs->check_soft_reset)
4259                        adev->ip_blocks[i].status.hang =
4260                                adev->ip_blocks[i].version->funcs->check_soft_reset(adev);
4261                if (adev->ip_blocks[i].status.hang) {
4262                        dev_info(adev->dev, "IP block:%s is hung!\n", adev->ip_blocks[i].version->funcs->name);
4263                        asic_hang = true;
4264                }
4265        }
4266        return asic_hang;
4267}
4268
4269/**
4270 * amdgpu_device_ip_pre_soft_reset - prepare for soft reset
4271 *
4272 * @adev: amdgpu_device pointer
4273 *
4274 * The list of all the hardware IPs that make up the asic is walked and the
4275 * pre_soft_reset callbacks are run if the block is hung.  pre_soft_reset
4276 * handles any IP specific hardware or software state changes that are
4277 * necessary for a soft reset to succeed.
4278 * Returns 0 on success, negative error code on failure.
4279 */
4280static int amdgpu_device_ip_pre_soft_reset(struct amdgpu_device *adev)
4281{
4282        int i, r = 0;
4283
4284        for (i = 0; i < adev->num_ip_blocks; i++) {
4285                if (!adev->ip_blocks[i].status.valid)
4286                        continue;
4287                if (adev->ip_blocks[i].status.hang &&
4288                    adev->ip_blocks[i].version->funcs->pre_soft_reset) {
4289                        r = adev->ip_blocks[i].version->funcs->pre_soft_reset(adev);
4290                        if (r)
4291                                return r;
4292                }
4293        }
4294
4295        return 0;
4296}
4297
4298/**
4299 * amdgpu_device_ip_need_full_reset - check if a full asic reset is needed
4300 *
4301 * @adev: amdgpu_device pointer
4302 *
4303 * Some hardware IPs cannot be soft reset.  If they are hung, a full gpu
4304 * reset is necessary to recover.
4305 * Returns true if a full asic reset is required, false if not.
4306 */
4307static bool amdgpu_device_ip_need_full_reset(struct amdgpu_device *adev)
4308{
4309        int i;
4310
4311        if (amdgpu_asic_need_full_reset(adev))
4312                return true;
4313
4314        for (i = 0; i < adev->num_ip_blocks; i++) {
4315                if (!adev->ip_blocks[i].status.valid)
4316                        continue;
4317                if ((adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) ||
4318                    (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) ||
4319                    (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_ACP) ||
4320                    (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE) ||
4321                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
4322                        if (adev->ip_blocks[i].status.hang) {
4323                                dev_info(adev->dev, "Some blocks need a full reset!\n");
4324                                return true;
4325                        }
4326                }
4327        }
4328        return false;
4329}
4330
4331/**
4332 * amdgpu_device_ip_soft_reset - do a soft reset
4333 *
4334 * @adev: amdgpu_device pointer
4335 *
4336 * The list of all the hardware IPs that make up the asic is walked and the
4337 * soft_reset callbacks are run if the block is hung.  soft_reset handles any
4338 * IP specific hardware or software state changes that are necessary to soft
4339 * reset the IP.
4340 * Returns 0 on success, negative error code on failure.
4341 */
4342static int amdgpu_device_ip_soft_reset(struct amdgpu_device *adev)
4343{
4344        int i, r = 0;
4345
4346        for (i = 0; i < adev->num_ip_blocks; i++) {
4347                if (!adev->ip_blocks[i].status.valid)
4348                        continue;
4349                if (adev->ip_blocks[i].status.hang &&
4350                    adev->ip_blocks[i].version->funcs->soft_reset) {
4351                        r = adev->ip_blocks[i].version->funcs->soft_reset(adev);
4352                        if (r)
4353                                return r;
4354                }
4355        }
4356
4357        return 0;
4358}
4359
4360/**
4361 * amdgpu_device_ip_post_soft_reset - clean up from soft reset
4362 *
4363 * @adev: amdgpu_device pointer
4364 *
4365 * The list of all the hardware IPs that make up the asic is walked and the
4366 * post_soft_reset callbacks are run if the asic was hung.  post_soft_reset
4367 * handles any IP specific hardware or software state changes that are
4368 * necessary after the IP has been soft reset.
4369 * Returns 0 on success, negative error code on failure.
4370 */
4371static int amdgpu_device_ip_post_soft_reset(struct amdgpu_device *adev)
4372{
4373        int i, r = 0;
4374
4375        for (i = 0; i < adev->num_ip_blocks; i++) {
4376                if (!adev->ip_blocks[i].status.valid)
4377                        continue;
4378                if (adev->ip_blocks[i].status.hang &&
4379                    adev->ip_blocks[i].version->funcs->post_soft_reset) {
4380                        r = adev->ip_blocks[i].version->funcs->post_soft_reset(adev);
4381                        if (r)
4382                                return r;
                }
4383        }
4384
4385        return 0;
4386}
4387
4388/**
4389 * amdgpu_device_recover_vram - Recover some VRAM contents
4390 *
4391 * @adev: amdgpu_device pointer
4392 *
4393 * Restores the contents of VRAM buffers from the shadows in GTT.  Used to
4394 * restore things like GPUVM page tables after a GPU reset where
4395 * the contents of VRAM might be lost.
4396 *
4397 * Returns:
4398 * 0 on success, negative error code on failure.
4399 */
4400static int amdgpu_device_recover_vram(struct amdgpu_device *adev)
4401{
4402        struct dma_fence *fence = NULL, *next = NULL;
4403        struct amdgpu_bo *shadow;
4404        struct amdgpu_bo_vm *vmbo;
4405        long r = 1, tmo;
4406
4407        if (amdgpu_sriov_runtime(adev))
4408                tmo = msecs_to_jiffies(8000);
4409        else
4410                tmo = msecs_to_jiffies(100);
4411
4412        dev_info(adev->dev, "recover vram bo from shadow start\n");
4413        mutex_lock(&adev->shadow_list_lock);
4414        list_for_each_entry(vmbo, &adev->shadow_list, shadow_list) {
4415                shadow = &vmbo->bo;
4416                /* No need to recover an evicted BO */
4417                if (shadow->tbo.resource->mem_type != TTM_PL_TT ||
4418                    shadow->tbo.resource->start == AMDGPU_BO_INVALID_OFFSET ||
4419                    shadow->parent->tbo.resource->mem_type != TTM_PL_VRAM)
4420                        continue;
4421
4422                r = amdgpu_bo_restore_shadow(shadow, &next);
4423                if (r)
4424                        break;
4425
4426                if (fence) {
4427                        tmo = dma_fence_wait_timeout(fence, false, tmo);
4428                        dma_fence_put(fence);
4429                        fence = next;
4430                        if (tmo == 0) {
4431                                r = -ETIMEDOUT;
4432                                break;
4433                        } else if (tmo < 0) {
4434                                r = tmo;
4435                                break;
4436                        }
4437                } else {
4438                        fence = next;
4439                }
4440        }
4441        mutex_unlock(&adev->shadow_list_lock);
4442
4443        if (fence)
4444                tmo = dma_fence_wait_timeout(fence, false, tmo);
4445        dma_fence_put(fence);
4446
4447        if (r < 0 || tmo <= 0) {
4448                dev_err(adev->dev, "recover vram bo from shadow failed, r is %ld, tmo is %ld\n", r, tmo);
4449                return -EIO;
4450        }
4451
4452        dev_info(adev->dev, "recover vram bo from shadow done\n");
4453        return 0;
4454}
4455
4456
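/*
 * A note on the dma_fence_wait_timeout() convention the loop above relies
 * on: it returns 0 on timeout, a negative error code on failure, and the
 * remaining timeout in jiffies otherwise, which is why the returned value
 * is fed back in as the next wait budget. A minimal sketch:
 *
 *        long tmo = msecs_to_jiffies(100);
 *
 *        tmo = dma_fence_wait_timeout(fence, false, tmo);
 *        if (tmo == 0)
 *                r = -ETIMEDOUT;   // fence never signaled in time
 *        else if (tmo < 0)
 *                r = tmo;          // the wait itself failed
 *        // else: fence signaled, tmo holds the jiffies left
 */
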
4457/**
4458 * amdgpu_device_reset_sriov - reset ASIC for SR-IOV vf
4459 *
4460 * @adev: amdgpu_device pointer
4461 * @from_hypervisor: request from hypervisor
4462 *
4463 * Do a VF FLR and reinitialize the ASIC.
4464 * Returns 0 on success, negative error code on failure.
4465 */
4466static int amdgpu_device_reset_sriov(struct amdgpu_device *adev,
4467                                     bool from_hypervisor)
4468{
4469        int r;
4470        struct amdgpu_hive_info *hive = NULL;
4471        int retry_limit = 0;
4472
4473retry:
4474        amdgpu_amdkfd_pre_reset(adev);
4477
4478        if (from_hypervisor)
4479                r = amdgpu_virt_request_full_gpu(adev, true);
4480        else
4481                r = amdgpu_virt_reset_gpu(adev);
4482        if (r)
4483                return r;
4484
4485        /* Resume IP prior to SMC */
4486        r = amdgpu_device_ip_reinit_early_sriov(adev);
4487        if (r)
4488                goto error;
4489
4490        amdgpu_virt_init_data_exchange(adev);
4491
4492        r = amdgpu_device_fw_loading(adev);
4493        if (r)
4494                return r;
4495
4496        /* now we are okay to resume SMC/CP/SDMA */
4497        r = amdgpu_device_ip_reinit_late_sriov(adev);
4498        if (r)
4499                goto error;
4500
4501        hive = amdgpu_get_xgmi_hive(adev);
4502        /* Update PSP FW topology after reset */
4503        if (hive && adev->gmc.xgmi.num_physical_nodes > 1)
4504                r = amdgpu_xgmi_update_topology(hive, adev);
4505
4506        if (hive)
4507                amdgpu_put_xgmi_hive(hive);
4508
4509        if (!r) {
4510                amdgpu_irq_gpu_reset_resume_helper(adev);
4511                r = amdgpu_ib_ring_tests(adev);
4512
4513                amdgpu_amdkfd_post_reset(adev);
4514        }
4515
4516error:
4517        if (!r && adev->virt.gim_feature & AMDGIM_FEATURE_GIM_FLR_VRAMLOST) {
4518                amdgpu_inc_vram_lost(adev);
4519                r = amdgpu_device_recover_vram(adev);
4520        }
4521        amdgpu_virt_release_full_gpu(adev, true);
4522
4523        if (AMDGPU_RETRY_SRIOV_RESET(r)) {
4524                if (retry_limit < AMDGPU_MAX_RETRY_LIMIT) {
4525                        retry_limit++;
4526                        goto retry;
4527                } else
4528                        DRM_ERROR("GPU reset retry is beyond the retry limit\n");
4529        }
4530
4531        return r;
4532}
4533
4534/**
4535 * amdgpu_device_has_job_running - check if there is any job in mirror list
4536 *
4537 * @adev: amdgpu_device pointer
4538 *
4539 * Check if there is any job in the mirror list.
4540 */
4541bool amdgpu_device_has_job_running(struct amdgpu_device *adev)
4542{
4543        int i;
4544        struct drm_sched_job *job;
4545
4546        for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
4547                struct amdgpu_ring *ring = adev->rings[i];
4548
4549                if (!ring || !ring->sched.thread)
4550                        continue;
4551
4552                spin_lock(&ring->sched.job_list_lock);
4553                job = list_first_entry_or_null(&ring->sched.pending_list,
4554                                               struct drm_sched_job, list);
4555                spin_unlock(&ring->sched.job_list_lock);
4556                if (job)
4557                        return true;
4558        }
4559        return false;
4560}
4561
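/*
 * Hedged usage sketch (hypothetical caller, not from this file): power
 * management paths can use this helper to refuse to power down while work
 * is still in flight.
 *
 *        if (amdgpu_device_has_job_running(adev))
 *                return -EBUSY;   // defer runtime suspend
 */
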
4562/**
4563 * amdgpu_device_should_recover_gpu - check if we should try GPU recovery
4564 *
4565 * @adev: amdgpu_device pointer
4566 *
4567 * Check amdgpu_gpu_recovery and SRIOV status to see if we should try to recover
4568 * a hung GPU.
4569 */
4570bool amdgpu_device_should_recover_gpu(struct amdgpu_device *adev)
4571{
4572        if (!amdgpu_device_ip_check_soft_reset(adev)) {
4573                dev_info(adev->dev, "Timeout, but no hardware hang detected.\n");
4574                return false;
4575        }
4576
4577        if (amdgpu_gpu_recovery == 0)
4578                goto disabled;
4579
4580        if (amdgpu_sriov_vf(adev))
4581                return true;
4582
4583        if (amdgpu_gpu_recovery == -1) {
4584                switch (adev->asic_type) {
4585#ifdef CONFIG_DRM_AMDGPU_SI
4586                case CHIP_VERDE:
4587                case CHIP_TAHITI:
4588                case CHIP_PITCAIRN:
4589                case CHIP_OLAND:
4590                case CHIP_HAINAN:
4591#endif
4592#ifdef CONFIG_DRM_AMDGPU_CIK
4593                case CHIP_KAVERI:
4594                case CHIP_KABINI:
4595                case CHIP_MULLINS:
4596#endif
4597                case CHIP_CARRIZO:
4598                case CHIP_STONEY:
4599                case CHIP_CYAN_SKILLFISH:
4600                        goto disabled;
4601                default:
4602                        break;
4603                }
4604        }
4605
4606        return true;
4607
4608disabled:
4609        dev_info(adev->dev, "GPU recovery disabled.\n");
4610        return false;
4611}
4612
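/*
 * Hedged usage sketch: a job timeout handler is expected to gate recovery
 * on this check before scheduling a reset (condensed, hypothetical caller):
 *
 *        if (amdgpu_device_should_recover_gpu(ring->adev))
 *                r = amdgpu_device_gpu_recover(ring->adev, job);
 */
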
4613int amdgpu_device_mode1_reset(struct amdgpu_device *adev)
4614{
4615        u32 i;
4616        int ret = 0;
4617
4618        amdgpu_atombios_scratch_regs_engine_hung(adev, true);
4619
4620        dev_info(adev->dev, "GPU mode1 reset\n");
4621
4622        /* disable BM */
4623        pci_clear_master(adev->pdev);
4624
4625        amdgpu_device_cache_pci_state(adev->pdev);
4626
4627        if (amdgpu_dpm_is_mode1_reset_supported(adev)) {
4628                dev_info(adev->dev, "GPU smu mode1 reset\n");
4629                ret = amdgpu_dpm_mode1_reset(adev);
4630        } else {
4631                dev_info(adev->dev, "GPU psp mode1 reset\n");
4632                ret = psp_gpu_reset(adev);
4633        }
4634
4635        if (ret)
4636                dev_err(adev->dev, "GPU mode1 reset failed\n");
4637
4638        amdgpu_device_load_pci_state(adev->pdev);
4639
4640        /* wait for asic to come out of reset */
4641        for (i = 0; i < adev->usec_timeout; i++) {
4642                u32 memsize = adev->nbio.funcs->get_memsize(adev);
4643
4644                if (memsize != 0xffffffff)
4645                        break;
4646                udelay(1);
4647        }
4648
4649        amdgpu_atombios_scratch_regs_engine_hung(adev, false);
4650        return ret;
4651}
4652
4653int amdgpu_device_pre_asic_reset(struct amdgpu_device *adev,
4654                                 struct amdgpu_reset_context *reset_context)
4655{
4656        int i, r = 0;
4657        struct amdgpu_job *job = NULL;
4658        bool need_full_reset =
4659                test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4660
4661        if (reset_context->reset_req_dev == adev)
4662                job = reset_context->job;
4663
4664        if (amdgpu_sriov_vf(adev)) {
4665                /* stop the data exchange thread */
4666                amdgpu_virt_fini_data_exchange(adev);
4667        }
4668
4669        /* block all schedulers and reset given job's ring */
4670        for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
4671                struct amdgpu_ring *ring = adev->rings[i];
4672
4673                if (!ring || !ring->sched.thread)
4674                        continue;
4675
4676                /* Clear job fences from the fence driver to avoid
4677                 * force_completion leaving NULL and VM flush fences in the fence driver */
4678                amdgpu_fence_driver_clear_job_fences(ring);
4679
4680                /* after all HW jobs are reset, the HW fences are meaningless, so force their completion */
4681                amdgpu_fence_driver_force_completion(ring);
4682        }
4683
4684        if (job && job->vm)
4685                drm_sched_increase_karma(&job->base);
4686
4687        r = amdgpu_reset_prepare_hwcontext(adev, reset_context);
4688        /* If reset handler not implemented, continue; otherwise return */
4689        if (r == -ENOSYS)
4690                r = 0;
4691        else
4692                return r;
4693
4694        /* Don't suspend on bare metal if we are not going to HW reset the ASIC */
4695        if (!amdgpu_sriov_vf(adev)) {
4696
4697                if (!need_full_reset)
4698                        need_full_reset = amdgpu_device_ip_need_full_reset(adev);
4699
4700                if (!need_full_reset) {
4701                        amdgpu_device_ip_pre_soft_reset(adev);
4702                        r = amdgpu_device_ip_soft_reset(adev);
4703                        amdgpu_device_ip_post_soft_reset(adev);
4704                        if (r || amdgpu_device_ip_check_soft_reset(adev)) {
4705                                dev_info(adev->dev, "soft reset failed, will fallback to full reset!\n");
4706                                need_full_reset = true;
4707                        }
4708                }
4709
4710                if (need_full_reset)
4711                        r = amdgpu_device_ip_suspend(adev);
4712                if (need_full_reset)
4713                        set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4714                else
4715                        clear_bit(AMDGPU_NEED_FULL_RESET,
4716                                  &reset_context->flags);
4717        }
4718
4719        return r;
4720}
4721
4722static int amdgpu_reset_reg_dumps(struct amdgpu_device *adev)
4723{
4724        uint32_t reg_value;
4725        int i;
4726
4727        lockdep_assert_held(&adev->reset_domain->sem);
4728        dump_stack();
4729
4730        for (i = 0; i < adev->num_regs; i++) {
4731                reg_value = RREG32(adev->reset_dump_reg_list[i]);
4732                trace_amdgpu_reset_reg_dumps(adev->reset_dump_reg_list[i], reg_value);
4733        }
4734
4735        return 0;
4736}
4737
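/*
 * The dumped values are emitted through the amdgpu_reset_reg_dumps trace
 * event rather than the kernel log; assuming standard ftrace tooling is
 * available, they could be captured with something like (illustrative
 * only, not a documented interface):
 *
 *        trace-cmd record -e amdgpu:amdgpu_reset_reg_dumps
 */
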
4738int amdgpu_do_asic_reset(struct list_head *device_list_handle,
4739                         struct amdgpu_reset_context *reset_context)
4740{
4741        struct amdgpu_device *tmp_adev = NULL;
4742        bool need_full_reset, skip_hw_reset, vram_lost = false;
4743        int r = 0;
4744
4745        /* Try reset handler method first */
4746        tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
4747                                    reset_list);
4748        amdgpu_reset_reg_dumps(tmp_adev);
4749        r = amdgpu_reset_perform_reset(tmp_adev, reset_context);
4750        /* If reset handler not implemented, continue; otherwise return */
4751        if (r == -ENOSYS)
4752                r = 0;
4753        else
4754                return r;
4755
4756        /* Reset handler not implemented, use the default method */
4757        need_full_reset =
4758                test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4759        skip_hw_reset = test_bit(AMDGPU_SKIP_HW_RESET, &reset_context->flags);
4760
4761        /*
4762         * ASIC reset has to be done on all XGMI hive nodes ASAP
4763         * to allow proper links negotiation in FW (within 1 sec)
4764         */
4765        if (!skip_hw_reset && need_full_reset) {
4766                list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4767                        /* For XGMI run all resets in parallel to speed up the process */
4768                        if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
4769                                tmp_adev->gmc.xgmi.pending_reset = false;
4770                                if (!queue_work(system_unbound_wq, &tmp_adev->xgmi_reset_work))
4771                                        r = -EALREADY;
4772                        } else
4773                                r = amdgpu_asic_reset(tmp_adev);
4774
4775                        if (r) {
4776                                dev_err(tmp_adev->dev, "ASIC reset failed with error, %d for drm dev, %s",
4777                                         r, adev_to_drm(tmp_adev)->unique);
4778                                break;
4779                        }
4780                }
4781
4782                /* For XGMI wait for all resets to complete before proceed */
4783                if (!r) {
4784                        list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4785                                if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
4786                                        flush_work(&tmp_adev->xgmi_reset_work);
4787                                        r = tmp_adev->asic_reset_res;
4788                                        if (r)
4789                                                break;
4790                                }
4791                        }
4792                }
4793        }
4794
4795        if (!r && amdgpu_ras_intr_triggered()) {
4796                list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4797                        if (tmp_adev->mmhub.ras && tmp_adev->mmhub.ras->ras_block.hw_ops &&
4798                            tmp_adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count)
4799                                tmp_adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count(tmp_adev);
4800                }
4801
4802                amdgpu_ras_intr_cleared();
4803        }
4804
4805        list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4806                if (need_full_reset) {
4807                        /* post card */
4808                        r = amdgpu_device_asic_init(tmp_adev);
4809                        if (r) {
4810                                dev_warn(tmp_adev->dev, "asic atom init failed!");
4811                        } else {
4812                                dev_info(tmp_adev->dev, "GPU reset succeeded, trying to resume\n");
4813                                r = amdgpu_amdkfd_resume_iommu(tmp_adev);
4814                                if (r)
4815                                        goto out;
4816
4817                                r = amdgpu_device_ip_resume_phase1(tmp_adev);
4818                                if (r)
4819                                        goto out;
4820
4821                                vram_lost = amdgpu_device_check_vram_lost(tmp_adev);
4822                                if (vram_lost) {
4823                                        DRM_INFO("VRAM is lost due to GPU reset!\n");
4824                                        amdgpu_inc_vram_lost(tmp_adev);
4825                                }
4826
4827                                r = amdgpu_device_fw_loading(tmp_adev);
4828                                if (r)
4829                                        return r;
4830
4831                                r = amdgpu_device_ip_resume_phase2(tmp_adev);
4832                                if (r)
4833                                        goto out;
4834
4835                                if (vram_lost)
4836                                        amdgpu_device_fill_reset_magic(tmp_adev);
4837
4838                                /*
4839                                 * Add this ASIC as tracked, since the reset
4840                                 * has already completed successfully.
4841                                 */
4842                                amdgpu_register_gpu_instance(tmp_adev);
4843
4844                                if (!reset_context->hive &&
4845                                    tmp_adev->gmc.xgmi.num_physical_nodes > 1)
4846                                        amdgpu_xgmi_add_device(tmp_adev);
4847
4848                                r = amdgpu_device_ip_late_init(tmp_adev);
4849                                if (r)
4850                                        goto out;
4851
4852                                drm_fb_helper_set_suspend_unlocked(adev_to_drm(tmp_adev)->fb_helper, false);
4853
4854                                /*
4855                                 * The GPU enters a bad state once the number
4856                                 * of faulty pages flagged by ECC reaches the
4857                                 * threshold; RAS recovery is scheduled next.
4858                                 * So check here and abort recovery if the bad
4859                                 * page threshold has indeed been exceeded, and
4860                                 * remind the user to retire this GPU or to set
4861                                 * a bigger bad_page_threshold value the next
4862                                 * time the driver is probed.
4863                                 */
4864                                if (!amdgpu_ras_eeprom_check_err_threshold(tmp_adev)) {
4865                                        /* must succeed. */
4866                                        amdgpu_ras_resume(tmp_adev);
4867                                } else {
4868                                        r = -EINVAL;
4869                                        goto out;
4870                                }
4871
4872                                /* Update PSP FW topology after reset */
4873                                if (reset_context->hive &&
4874                                    tmp_adev->gmc.xgmi.num_physical_nodes > 1)
4875                                        r = amdgpu_xgmi_update_topology(
4876                                                reset_context->hive, tmp_adev);
4877                        }
4878                }
4879
4880out:
4881                if (!r) {
4882                        amdgpu_irq_gpu_reset_resume_helper(tmp_adev);
4883                        r = amdgpu_ib_ring_tests(tmp_adev);
4884                        if (r) {
4885                                dev_err(tmp_adev->dev, "ib ring test failed (%d).\n", r);
4886                                need_full_reset = true;
4887                                r = -EAGAIN;
4888                                goto end;
4889                        }
4890                }
4891
4892                if (!r)
4893                        r = amdgpu_device_recover_vram(tmp_adev);
4894                else
4895                        tmp_adev->asic_reset_res = r;
4896        }
4897
4898end:
4899        if (need_full_reset)
4900                set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4901        else
4902                clear_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4903        return r;
4904}
4905
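/*
 * A condensed, hedged sketch of the reset_context protocol expected by
 * amdgpu_do_asic_reset(), as used by amdgpu_pci_slot_reset() later in
 * this file:
 *
 *        struct amdgpu_reset_context reset_context;
 *
 *        memset(&reset_context, 0, sizeof(reset_context));
 *        reset_context.method = AMD_RESET_METHOD_NONE;
 *        reset_context.reset_req_dev = adev;
 *        set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
 *        set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
 *        r = amdgpu_do_asic_reset(&device_list, &reset_context);
 */
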
4906static void amdgpu_device_set_mp1_state(struct amdgpu_device *adev)
4907{
4908
4909        switch (amdgpu_asic_reset_method(adev)) {
4910        case AMD_RESET_METHOD_MODE1:
4911                adev->mp1_state = PP_MP1_STATE_SHUTDOWN;
4912                break;
4913        case AMD_RESET_METHOD_MODE2:
4914                adev->mp1_state = PP_MP1_STATE_RESET;
4915                break;
4916        default:
4917                adev->mp1_state = PP_MP1_STATE_NONE;
4918                break;
4919        }
4920}
4921
4922static void amdgpu_device_unset_mp1_state(struct amdgpu_device *adev)
4923{
4924        amdgpu_vf_error_trans_all(adev);
4925        adev->mp1_state = PP_MP1_STATE_NONE;
4926}
4927
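/*
 * These two helpers are intended to bracket a reset; a condensed sketch of
 * how the recovery path below uses them:
 *
 *        amdgpu_device_set_mp1_state(tmp_adev);
 *        // ... perform the ASIC reset ...
 *        amdgpu_device_unset_mp1_state(tmp_adev);
 */
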
4928static void amdgpu_device_resume_display_audio(struct amdgpu_device *adev)
4929{
4930        struct pci_dev *p = NULL;
4931
4932        p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
4933                        adev->pdev->bus->number, 1);
4934        if (p) {
4935                pm_runtime_enable(&(p->dev));
4936                pm_runtime_resume(&(p->dev));
4937        }
4938}
4939
4940static int amdgpu_device_suspend_display_audio(struct amdgpu_device *adev)
4941{
4942        enum amd_reset_method reset_method;
4943        struct pci_dev *p = NULL;
4944        u64 expires;
4945
4946        /*
4947         * For now, only BACO and mode1 reset are confirmed to
4948         * suffer from the audio issue if not properly suspended.
4949         */
4950        reset_method = amdgpu_asic_reset_method(adev);
4951        if ((reset_method != AMD_RESET_METHOD_BACO) &&
4952             (reset_method != AMD_RESET_METHOD_MODE1))
4953                return -EINVAL;
4954
4955        p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
4956                        adev->pdev->bus->number, 1);
4957        if (!p)
4958                return -ENODEV;
4959
4960        expires = pm_runtime_autosuspend_expiration(&(p->dev));
4961        if (!expires)
4962                /*
4963                 * If we cannot get the audio device autosuspend delay,
4964                 * a fixed 4s interval is used. Since 3s is the audio
4965                 * controller's default autosuspend delay setting, the
4966                 * 4s used here is guaranteed to cover it.
4967                 */
4968                expires = ktime_get_mono_fast_ns() + NSEC_PER_SEC * 4ULL;
4969
4970        while (!pm_runtime_status_suspended(&(p->dev))) {
4971                if (!pm_runtime_suspend(&(p->dev)))
4972                        break;
4973
4974                if (expires < ktime_get_mono_fast_ns()) {
4975                        dev_warn(adev->dev, "failed to suspend display audio\n");
4976                        /* TODO: abort the succeeding gpu reset? */
4977                        return -ETIMEDOUT;
4978                }
4979        }
4980
4981        pm_runtime_disable(&(p->dev));
4982
4983        return 0;
4984}
4985
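/*
 * The audio suspend/resume pair brackets the GPU reset in
 * amdgpu_device_gpu_recover_imp() below; a condensed sketch:
 *
 *        if (!amdgpu_device_suspend_display_audio(tmp_adev))
 *                audio_suspended = true;
 *        // ... reset ...
 *        if (audio_suspended)
 *                amdgpu_device_resume_display_audio(tmp_adev);
 */
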
4986static void amdgpu_device_recheck_guilty_jobs(
4987        struct amdgpu_device *adev, struct list_head *device_list_handle,
4988        struct amdgpu_reset_context *reset_context)
4989{
4990        int i, r = 0;
4991
4992        for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
4993                struct amdgpu_ring *ring = adev->rings[i];
4994                int ret = 0;
4995                struct drm_sched_job *s_job;
4996
4997                if (!ring || !ring->sched.thread)
4998                        continue;
4999
5000                s_job = list_first_entry_or_null(&ring->sched.pending_list,
5001                                struct drm_sched_job, list);
5002                if (s_job == NULL)
5003                        continue;
5004
5005                /* clear the job's guilty flag; the following step decides the real one */
5006                drm_sched_reset_karma(s_job);
5007                /* the real bad job will be resubmitted twice, so take a dma_fence_get
5008                 * to keep the fence refcount balanced */
5009                dma_fence_get(s_job->s_fence->parent);
5010                drm_sched_resubmit_jobs_ext(&ring->sched, 1);
5011
5012                ret = dma_fence_wait_timeout(s_job->s_fence->parent, false, ring->sched.timeout);
5013                if (ret == 0) { /* timeout */
5014                        DRM_ERROR("Found the real bad job! ring:%s, job_id:%llx\n",
5015                                                ring->sched.name, s_job->id);
5016
5017                        /* set guilty */
5018                        drm_sched_increase_karma(s_job);
5019retry:
5020                        /* do hw reset */
5021                        if (amdgpu_sriov_vf(adev)) {
5022                                amdgpu_virt_fini_data_exchange(adev);
5023                                r = amdgpu_device_reset_sriov(adev, false);
5024                                if (r)
5025                                        adev->asic_reset_res = r;
5026                        } else {
5027                                clear_bit(AMDGPU_SKIP_HW_RESET,
5028                                          &reset_context->flags);
5029                                r = amdgpu_do_asic_reset(device_list_handle,
5030                                                         reset_context);
5031                                if (r == -EAGAIN)
5032                                        goto retry;
5033                        }
5034
5035                        /*
5036                         * add reset counter so that the following
5037                         * resubmitted job could flush vmid
5038                         */
5039                        atomic_inc(&adev->gpu_reset_counter);
5040                        continue;
5041                }
5042
5043                /* got the hw fence, signal finished fence */
5044                atomic_dec(ring->sched.score);
5045                dma_fence_put(s_job->s_fence->parent);
5046                dma_fence_get(&s_job->s_fence->finished);
5047                dma_fence_signal(&s_job->s_fence->finished);
5048                dma_fence_put(&s_job->s_fence->finished);
5049
5050                /* remove node from list and free the job */
5051                spin_lock(&ring->sched.job_list_lock);
5052                list_del_init(&s_job->list);
5053                spin_unlock(&ring->sched.job_list_lock);
5054                ring->sched.ops->free_job(s_job);
5055        }
5056}
5057
5058/**
5059 * amdgpu_device_gpu_recover_imp - reset the asic and recover scheduler
5060 *
5061 * @adev: amdgpu_device pointer
5062 * @job: the job which triggered the hang
5063 *
5064 * Attempt to reset the GPU if it has hung (all ASICs).
5065 * Attempt a soft reset or a full reset and reinitialize the ASIC.
5066 * Returns 0 for success or an error on failure.
5067 */
5068
5069int amdgpu_device_gpu_recover_imp(struct amdgpu_device *adev,
5070                              struct amdgpu_job *job)
5071{
5072        struct list_head device_list, *device_list_handle =  NULL;
5073        bool job_signaled = false;
5074        struct amdgpu_hive_info *hive = NULL;
5075        struct amdgpu_device *tmp_adev = NULL;
5076        int i, r = 0;
5077        bool need_emergency_restart = false;
5078        bool audio_suspended = false;
5079        int tmp_vram_lost_counter;
5080        struct amdgpu_reset_context reset_context;
5081
5082        memset(&reset_context, 0, sizeof(reset_context));
5083
5084        /*
5085         * Special case: RAS triggered and full reset isn't supported
5086         */
5087        need_emergency_restart = amdgpu_ras_need_emergency_restart(adev);
5088
5089        /*
5090         * Flush RAM to disk so that after reboot
5091         * the user can read the log and see why the system rebooted.
5092         */
5093        if (need_emergency_restart && amdgpu_ras_get_context(adev)->reboot) {
5094                DRM_WARN("Emergency reboot.");
5095
5096                ksys_sync_helper();
5097                emergency_restart();
5098        }
5099
5100        dev_info(adev->dev, "GPU %s begin!\n",
5101                need_emergency_restart ? "jobs stop":"reset");
5102
5103        if (!amdgpu_sriov_vf(adev))
5104                hive = amdgpu_get_xgmi_hive(adev);
5105        if (hive)
5106                mutex_lock(&hive->hive_lock);
5107
5108        reset_context.method = AMD_RESET_METHOD_NONE;
5109        reset_context.reset_req_dev = adev;
5110        reset_context.job = job;
5111        reset_context.hive = hive;
5112        clear_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
5113
5114        /*
5115         * Build list of devices to reset.
5116         * In case we are in XGMI hive mode, re-sort the device list
5117         * to put adev in the first position.
5118         */
5119        INIT_LIST_HEAD(&device_list);
5120        if (!amdgpu_sriov_vf(adev) && (adev->gmc.xgmi.num_physical_nodes > 1)) {
5121                list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head)
5122                        list_add_tail(&tmp_adev->reset_list, &device_list);
5123                if (!list_is_first(&adev->reset_list, &device_list))
5124                        list_rotate_to_front(&adev->reset_list, &device_list);
5125                device_list_handle = &device_list;
5126        } else {
5127                list_add_tail(&adev->reset_list, &device_list);
5128                device_list_handle = &device_list;
5129        }
5130
5131        /* We need to lock reset domain only once both for XGMI and single device */
5132        tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5133                                    reset_list);
5134        amdgpu_device_lock_reset_domain(tmp_adev->reset_domain);
5135
5136        /* block all schedulers and reset given job's ring */
5137        list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5138
5139                amdgpu_device_set_mp1_state(tmp_adev);
5140
5141                /*
5142                 * Try to put the audio codec into suspend state
5143                 * before the gpu reset starts.
5144                 *
5145                 * The power domain of the graphics device is
5146                 * shared with the AZ power domain. Without this,
5147                 * we may change the audio hardware behind the
5148                 * audio driver's back, which will trigger
5149                 * audio codec errors.
5150                 */
5151                if (!amdgpu_device_suspend_display_audio(tmp_adev))
5152                        audio_suspended = true;
5153
5154                amdgpu_ras_set_error_query_ready(tmp_adev, false);
5155
5156                cancel_delayed_work_sync(&tmp_adev->delayed_init_work);
5157
5158                if (!amdgpu_sriov_vf(tmp_adev))
5159                        amdgpu_amdkfd_pre_reset(tmp_adev);
5160
5161                /*
5162                 * Mark these ASICs to be reset as untracked first,
5163                 * and add them back after the reset completes.
5164                 */
5165                amdgpu_unregister_gpu_instance(tmp_adev);
5166
5167                drm_fb_helper_set_suspend_unlocked(adev_to_drm(tmp_adev)->fb_helper, true);
5168
5169                /* disable ras on ALL IPs */
5170                if (!need_emergency_restart &&
5171                      amdgpu_device_ip_need_full_reset(tmp_adev))
5172                        amdgpu_ras_suspend(tmp_adev);
5173
5174                for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5175                        struct amdgpu_ring *ring = tmp_adev->rings[i];
5176
5177                        if (!ring || !ring->sched.thread)
5178                                continue;
5179
5180                        drm_sched_stop(&ring->sched, job ? &job->base : NULL);
5181
5182                        if (need_emergency_restart)
5183                                amdgpu_job_stop_all_jobs_on_sched(&ring->sched);
5184                }
5185                atomic_inc(&tmp_adev->gpu_reset_counter);
5186        }
5187
5188        if (need_emergency_restart)
5189                goto skip_sched_resume;
5190
5191        /*
5192         * Must check guilty signal here since after this point all old
5193         * HW fences are force signaled.
5194         *
5195         * job->base holds a reference to parent fence
5196         */
5197        if (job && job->base.s_fence->parent &&
5198            dma_fence_is_signaled(job->base.s_fence->parent)) {
5199                job_signaled = true;
5200                dev_info(adev->dev, "Guilty job already signaled, skipping HW reset");
5201                goto skip_hw_reset;
5202        }
5203
5204retry:  /* Rest of adevs pre asic reset from XGMI hive. */
5205        list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5206                r = amdgpu_device_pre_asic_reset(tmp_adev, &reset_context);
5207                /* TODO: should we stop? */
5208                if (r) {
5209                        dev_err(tmp_adev->dev, "GPU pre asic reset failed with err, %d for drm dev, %s ",
5210                                  r, adev_to_drm(tmp_adev)->unique);
5211                        tmp_adev->asic_reset_res = r;
5212                }
5213        }
5214
5215        tmp_vram_lost_counter = atomic_read(&((adev)->vram_lost_counter));
5216        /* Actual ASIC resets if needed.*/
5217        /* Host driver will handle XGMI hive reset for SRIOV */
5218        if (amdgpu_sriov_vf(adev)) {
5219                r = amdgpu_device_reset_sriov(adev, job ? false : true);
5220                if (r)
5221                        adev->asic_reset_res = r;
5222
5223                /* Aldebaran supports RAS in SRIOV, so we need to resume RAS during reset */
5224                if (adev->ip_versions[GC_HWIP][0] == IP_VERSION(9, 4, 2))
5225                        amdgpu_ras_resume(adev);
5226        } else {
5227                r = amdgpu_do_asic_reset(device_list_handle, &reset_context);
5228                if (r == -EAGAIN)
5229                        goto retry;
5230        }
5231
5232skip_hw_reset:
5233
5234        /* Post ASIC reset for all devs .*/
5235        list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5236
5237                /*
5238                 * Sometimes a later bad compute job can block a good gfx job, as the gfx
5239                 * and compute rings share internal GC HW. We add an additional guilty-jobs
5240                 * recheck step to find the real guilty job: it synchronously resubmits the
5241                 * first pending job and waits for it to signal. If the wait times out, we
5242                 * identify that job as the real guilty one.
5243                 */
5244                if (amdgpu_gpu_recovery == 2 &&
5245                        !(tmp_vram_lost_counter < atomic_read(&adev->vram_lost_counter)))
5246                        amdgpu_device_recheck_guilty_jobs(
5247                                tmp_adev, device_list_handle, &reset_context);
5248
5249                for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5250                        struct amdgpu_ring *ring = tmp_adev->rings[i];
5251
5252                        if (!ring || !ring->sched.thread)
5253                                continue;
5254
5255                        /* No point in resubmitting jobs if we didn't HW reset */
5256                        if (!tmp_adev->asic_reset_res && !job_signaled)
5257                                drm_sched_resubmit_jobs(&ring->sched);
5258
5259                        drm_sched_start(&ring->sched, !tmp_adev->asic_reset_res);
5260                }
5261
5262                if (!drm_drv_uses_atomic_modeset(adev_to_drm(tmp_adev)) && !job_signaled) {
5263                        drm_helper_resume_force_mode(adev_to_drm(tmp_adev));
5264                }
5265
5266                if (tmp_adev->asic_reset_res)
5267                        r = tmp_adev->asic_reset_res;
5268
5269                tmp_adev->asic_reset_res = 0;
5270
5271                if (r) {
5272                        /* bad news, how do we tell userspace? */
5273                        dev_info(tmp_adev->dev, "GPU reset(%d) failed\n", atomic_read(&tmp_adev->gpu_reset_counter));
5274                        amdgpu_vf_error_put(tmp_adev, AMDGIM_ERROR_VF_GPU_RESET_FAIL, 0, r);
5275                } else {
5276                        dev_info(tmp_adev->dev, "GPU reset(%d) succeeded!\n", atomic_read(&tmp_adev->gpu_reset_counter));
5277                        if (amdgpu_acpi_smart_shift_update(adev_to_drm(tmp_adev), AMDGPU_SS_DEV_D0))
5278                                DRM_WARN("smart shift update failed\n");
5279                }
5280        }
5281
5282skip_sched_resume:
5283        list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5284                /* unlock kfd: SRIOV would do it separately */
5285                if (!need_emergency_restart && !amdgpu_sriov_vf(tmp_adev))
5286                        amdgpu_amdkfd_post_reset(tmp_adev);
5287
5288                /* kfd_post_reset will do nothing if the kfd device is not initialized;
5289                 * we need to bring up kfd here if it was not initialized before
5290                 */
5291                if (!adev->kfd.init_complete)
5292                        amdgpu_amdkfd_device_init(adev);
5293
5294                if (audio_suspended)
5295                        amdgpu_device_resume_display_audio(tmp_adev);
5296
5297                amdgpu_device_unset_mp1_state(tmp_adev);
5298        }
5299
5300        tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5301                                            reset_list);
5302        amdgpu_device_unlock_reset_domain(tmp_adev->reset_domain);
5303
5304        if (hive) {
5305                mutex_unlock(&hive->hive_lock);
5306                amdgpu_put_xgmi_hive(hive);
5307        }
5308
5309        if (r)
5310                dev_info(adev->dev, "GPU reset end with ret = %d\n", r);
5311        return r;
5312}
5313
5314struct amdgpu_recover_work_struct {
5315        struct work_struct base;
5316        struct amdgpu_device *adev;
5317        struct amdgpu_job *job;
5318        int ret;
5319};
5320
5321static void amdgpu_device_queue_gpu_recover_work(struct work_struct *work)
5322{
5323        struct amdgpu_recover_work_struct *recover_work = container_of(work, struct amdgpu_recover_work_struct, base);
5324
5325        recover_work->ret = amdgpu_device_gpu_recover_imp(recover_work->adev, recover_work->job);
5326}
5327/*
5328 * Serialize gpu recover into reset domain single threaded wq
5329 */
5330int amdgpu_device_gpu_recover(struct amdgpu_device *adev,
5331                                    struct amdgpu_job *job)
5332{
5333        struct amdgpu_recover_work_struct work = {.adev = adev, .job = job};
5334
5335        INIT_WORK(&work.base, amdgpu_device_queue_gpu_recover_work);
5336
5337        if (!amdgpu_reset_domain_schedule(adev->reset_domain, &work.base))
5338                return -EAGAIN;
5339
5340        flush_work(&work.base);
5341
5342        return work.ret;
5343}
5344
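/*
 * Hedged usage sketch (hypothetical caller): because the work item is
 * flushed before returning, the caller gets the recovery result inline
 * even though the reset itself runs on the reset domain's ordered
 * workqueue.
 *
 *        r = amdgpu_device_gpu_recover(adev, job);
 *        if (r)
 *                dev_err(adev->dev, "GPU recovery failed (%d)\n", r);
 */
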
5345/**
5346 * amdgpu_device_get_pcie_info - fetch PCIe info about the PCIe slot
5347 *
5348 * @adev: amdgpu_device pointer
5349 *
5350 * Fetches and stores in the driver the PCIe capabilities (gen speed
5351 * and lanes) of the slot the device is in. Handles APUs and
5352 * virtualized environments where PCIe config space may not be available.
5353 */
5354static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev)
5355{
5356        struct pci_dev *pdev;
5357        enum pci_bus_speed speed_cap, platform_speed_cap;
5358        enum pcie_link_width platform_link_width;
5359
5360        if (amdgpu_pcie_gen_cap)
5361                adev->pm.pcie_gen_mask = amdgpu_pcie_gen_cap;
5362
5363        if (amdgpu_pcie_lane_cap)
5364                adev->pm.pcie_mlw_mask = amdgpu_pcie_lane_cap;
5365
5366        /* covers APUs as well */
5367        if (pci_is_root_bus(adev->pdev->bus)) {
5368                if (adev->pm.pcie_gen_mask == 0)
5369                        adev->pm.pcie_gen_mask = AMDGPU_DEFAULT_PCIE_GEN_MASK;
5370                if (adev->pm.pcie_mlw_mask == 0)
5371                        adev->pm.pcie_mlw_mask = AMDGPU_DEFAULT_PCIE_MLW_MASK;
5372                return;
5373        }
5374
5375        if (adev->pm.pcie_gen_mask && adev->pm.pcie_mlw_mask)
5376                return;
5377
5378        pcie_bandwidth_available(adev->pdev, NULL,
5379                                 &platform_speed_cap, &platform_link_width);
5380
5381        if (adev->pm.pcie_gen_mask == 0) {
5382                /* asic caps */
5383                pdev = adev->pdev;
5384                speed_cap = pcie_get_speed_cap(pdev);
5385                if (speed_cap == PCI_SPEED_UNKNOWN) {
5386                        adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5387                                                  CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5388                                                  CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
5389                } else {
5390                        if (speed_cap == PCIE_SPEED_32_0GT)
5391                                adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5392                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5393                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5394                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4 |
5395                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN5);
5396                        else if (speed_cap == PCIE_SPEED_16_0GT)
5397                                adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5398                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5399                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5400                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4);
5401                        else if (speed_cap == PCIE_SPEED_8_0GT)
5402                                adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5403                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5404                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
5405                        else if (speed_cap == PCIE_SPEED_5_0GT)
5406                                adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5407                                                          CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2);
5408                        else
5409                                adev->pm.pcie_gen_mask |= CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1;
5410                }
5411                /* platform caps */
5412                if (platform_speed_cap == PCI_SPEED_UNKNOWN) {
5413                        adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5414                                                   CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
5415                } else {
5416                        if (platform_speed_cap == PCIE_SPEED_32_0GT)
5417                                adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5418                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5419                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5420                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4 |
5421                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN5);
5422                        else if (platform_speed_cap == PCIE_SPEED_16_0GT)
5423                                adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5424                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5425                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5426                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4);
5427                        else if (platform_speed_cap == PCIE_SPEED_8_0GT)
5428                                adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5429                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5430                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3);
5431                        else if (platform_speed_cap == PCIE_SPEED_5_0GT)
5432                                adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5433                                                           CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
5434                        else
5435                                adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1;
5436
5437                }
5438        }
5439        if (adev->pm.pcie_mlw_mask == 0) {
5440                if (platform_link_width == PCIE_LNK_WIDTH_UNKNOWN) {
5441                        adev->pm.pcie_mlw_mask |= AMDGPU_DEFAULT_PCIE_MLW_MASK;
5442                } else {
5443                        switch (platform_link_width) {
5444                        case PCIE_LNK_X32:
5445                                adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X32 |
5446                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
5447                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5448                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5449                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5450                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5451                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5452                                break;
5453                        case PCIE_LNK_X16:
5454                                adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
5455                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5456                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5457                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5458                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5459                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5460                                break;
5461                        case PCIE_LNK_X12:
5462                                adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5463                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5464                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5465                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5466                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5467                                break;
5468                        case PCIE_LNK_X8:
5469                                adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5470                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5471                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5472                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5473                                break;
5474                        case PCIE_LNK_X4:
5475                                adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5476                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5477                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5478                                break;
5479                        case PCIE_LNK_X2:
5480                                adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5481                                                          CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5482                                break;
5483                        case PCIE_LNK_X1:
5484                                adev->pm.pcie_mlw_mask = CAIL_PCIE_LINK_WIDTH_SUPPORT_X1;
5485                                break;
5486                        default:
5487                                break;
5488                        }
5489                }
5490        }
5491}
5492
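/*
 * Illustrative, hedged sketch (hypothetical caller) of how the computed
 * masks are meant to be consumed: test that both the platform and the
 * ASIC allow a link speed before programming it.
 *
 *        if ((adev->pm.pcie_gen_mask & CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3) &&
 *            (adev->pm.pcie_gen_mask & CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3)) {
 *                // gen3 is safe to request
 *        }
 */
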
5493int amdgpu_device_baco_enter(struct drm_device *dev)
5494{
5495        struct amdgpu_device *adev = drm_to_adev(dev);
5496        struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
5497
5498        if (!amdgpu_device_supports_baco(adev_to_drm(adev)))
5499                return -ENOTSUPP;
5500
5501        if (ras && adev->ras_enabled &&
5502            adev->nbio.funcs->enable_doorbell_interrupt)
5503                adev->nbio.funcs->enable_doorbell_interrupt(adev, false);
5504
5505        return amdgpu_dpm_baco_enter(adev);
5506}
5507
5508int amdgpu_device_baco_exit(struct drm_device *dev)
5509{
5510        struct amdgpu_device *adev = drm_to_adev(dev);
5511        struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
5512        int ret = 0;
5513
5514        if (!amdgpu_device_supports_baco(adev_to_drm(adev)))
5515                return -ENOTSUPP;
5516
5517        ret = amdgpu_dpm_baco_exit(adev);
5518        if (ret)
5519                return ret;
5520
5521        if (ras && adev->ras_enabled &&
5522            adev->nbio.funcs->enable_doorbell_interrupt)
5523                adev->nbio.funcs->enable_doorbell_interrupt(adev, true);
5524
5525        if (amdgpu_passthrough(adev) &&
5526            adev->nbio.funcs->clear_doorbell_interrupt)
5527                adev->nbio.funcs->clear_doorbell_interrupt(adev);
5528
5529        return 0;
5530}
5531
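/*
 * Hedged usage sketch (hypothetical runtime-PM caller): BACO entry and
 * exit are expected to be paired around the low-power window.
 *
 *        r = amdgpu_device_baco_enter(dev);
 *        if (r)
 *                return r;
 *        // ... device sits in BACO ...
 *        r = amdgpu_device_baco_exit(dev);
 */
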
5532/**
5533 * amdgpu_pci_error_detected - Called when a PCI error is detected.
5534 * @pdev: PCI device struct
5535 * @state: PCI channel state
5536 *
5537 * Description: Called when a PCI error is detected.
5538 *
5539 * Return: PCI_ERS_RESULT_NEED_RESET or PCI_ERS_RESULT_DISCONNECT.
5540 */
5541pci_ers_result_t amdgpu_pci_error_detected(struct pci_dev *pdev, pci_channel_state_t state)
5542{
5543        struct drm_device *dev = pci_get_drvdata(pdev);
5544        struct amdgpu_device *adev = drm_to_adev(dev);
5545        int i;
5546
5547        DRM_INFO("PCI error: detected callback, state(%d)!!\n", state);
5548
5549        if (adev->gmc.xgmi.num_physical_nodes > 1) {
5550                DRM_WARN("No support for XGMI hive yet...");
5551                return PCI_ERS_RESULT_DISCONNECT;
5552        }
5553
5554        adev->pci_channel_state = state;
5555
5556        switch (state) {
5557        case pci_channel_io_normal:
5558                return PCI_ERS_RESULT_CAN_RECOVER;
5559        /* Fatal error, prepare for slot reset */
5560        case pci_channel_io_frozen:
5561                /*
5562                 * Locking adev->reset_domain->sem will prevent any external access
5563                 * to GPU during PCI error recovery
5564                 */
5565                amdgpu_device_lock_reset_domain(adev->reset_domain);
5566                amdgpu_device_set_mp1_state(adev);
5567
5568                /*
5569                 * Block any work scheduling as we do for regular GPU reset
5570                 * for the duration of the recovery
5571                 */
5572                for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5573                        struct amdgpu_ring *ring = adev->rings[i];
5574
5575                        if (!ring || !ring->sched.thread)
5576                                continue;
5577
5578                        drm_sched_stop(&ring->sched, NULL);
5579                }
5580                atomic_inc(&adev->gpu_reset_counter);
5581                return PCI_ERS_RESULT_NEED_RESET;
5582        case pci_channel_io_perm_failure:
5583                /* Permanent error, prepare for device removal */
5584                return PCI_ERS_RESULT_DISCONNECT;
5585        }
5586
5587        return PCI_ERS_RESULT_NEED_RESET;
5588}
5589
5590/**
5591 * amdgpu_pci_mmio_enabled - Enable MMIO and dump debug registers
5592 * @pdev: pointer to PCI device
5593 */
5594pci_ers_result_t amdgpu_pci_mmio_enabled(struct pci_dev *pdev)
5595{
5596
5597        DRM_INFO("PCI error: mmio enabled callback!!\n");
5598
5599        /* TODO - dump whatever for debugging purposes */
5600
5601        /* This is called only if amdgpu_pci_error_detected returns
5602         * PCI_ERS_RESULT_CAN_RECOVER. Read/write to the device still
5603         * works, no need to reset slot.
5604         */
5605
5606        return PCI_ERS_RESULT_RECOVERED;
5607}
5608
5609/**
5610 * amdgpu_pci_slot_reset - Called when PCI slot has been reset.
5611 * @pdev: PCI device struct
5612 *
5613 * Description: This routine is called by the pci error recovery
5614 * code after the PCI slot has been reset, just before we
5615 * should resume normal operations.
5616 */
5617pci_ers_result_t amdgpu_pci_slot_reset(struct pci_dev *pdev)
5618{
5619        struct drm_device *dev = pci_get_drvdata(pdev);
5620        struct amdgpu_device *adev = drm_to_adev(dev);
5621        int r, i;
5622        struct amdgpu_reset_context reset_context;
5623        u32 memsize;
5624        struct list_head device_list;
5625
5626        DRM_INFO("PCI error: slot reset callback!!\n");
5627
5628        memset(&reset_context, 0, sizeof(reset_context));
5629
5630        INIT_LIST_HEAD(&device_list);
5631        list_add_tail(&adev->reset_list, &device_list);
5632
5633        /* wait for asic to come out of reset */
5634        msleep(500);
5635
5636        /* Restore PCI config space */
5637        amdgpu_device_load_pci_state(pdev);
5638
5639        /* confirm ASIC came out of reset */
5640        for (i = 0; i < adev->usec_timeout; i++) {
5641                memsize = amdgpu_asic_get_config_memsize(adev);
5642
5643                if (memsize != 0xffffffff)
5644                        break;
5645                udelay(1);
5646        }
5647        if (memsize == 0xffffffff) {
5648                r = -ETIME;
5649                goto out;
5650        }
5651
5652        reset_context.method = AMD_RESET_METHOD_NONE;
5653        reset_context.reset_req_dev = adev;
5654        set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
5655        set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
5656
5657        adev->no_hw_access = true;
5658        r = amdgpu_device_pre_asic_reset(adev, &reset_context);
5659        adev->no_hw_access = false;
5660        if (r)
5661                goto out;
5662
5663        r = amdgpu_do_asic_reset(&device_list, &reset_context);
5664
5665out:
5666        if (!r) {
5667                if (amdgpu_device_cache_pci_state(adev->pdev))
5668                        pci_restore_state(adev->pdev);
5669
5670                DRM_INFO("PCIe error recovery succeeded\n");
5671        } else {
5672                DRM_ERROR("PCIe error recovery failed, err:%d", r);
5673                amdgpu_device_unset_mp1_state(adev);
5674                amdgpu_device_unlock_reset_domain(adev->reset_domain);
5675        }
5676
5677        return r ? PCI_ERS_RESULT_DISCONNECT : PCI_ERS_RESULT_RECOVERED;
5678}
5679
5680/**
5681 * amdgpu_pci_resume() - resume normal ops after PCI reset
5682 * @pdev: pointer to PCI device
5683 *
5684 * Called when the error recovery driver tells us that it's
5685 * OK to resume normal operation.
5686 */
5687void amdgpu_pci_resume(struct pci_dev *pdev)
5688{
5689        struct drm_device *dev = pci_get_drvdata(pdev);
5690        struct amdgpu_device *adev = drm_to_adev(dev);
5691        int i;
5692
5693
5694        DRM_INFO("PCI error: resume callback!!\n");
5695
5696        /* Only continue execution for the case of pci_channel_io_frozen */
5697        if (adev->pci_channel_state != pci_channel_io_frozen)
5698                return;
5699
5700        for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5701                struct amdgpu_ring *ring = adev->rings[i];
5702
5703                if (!ring || !ring->sched.thread)
5704                        continue;
5705
5707                drm_sched_resubmit_jobs(&ring->sched);
5708                drm_sched_start(&ring->sched, true);
5709        }
5710
5711        amdgpu_device_unset_mp1_state(adev);
5712        amdgpu_device_unlock_reset_domain(adev->reset_domain);
5713}
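
/*
 * A minimal sketch of how the error callbacks in this file are wired
 * into the PCI core (illustrative only; the actual table lives in the
 * driver registration code, and the mmio_enabled handler name here is
 * assumed from the callback above):
 *
 *	static const struct pci_error_handlers amdgpu_pci_err_handler = {
 *		.error_detected	= amdgpu_pci_error_detected,
 *		.mmio_enabled	= amdgpu_pci_mmio_enabled,
 *		.slot_reset	= amdgpu_pci_slot_reset,
 *		.resume		= amdgpu_pci_resume,
 *	};
 *
 * The PCI core then walks error_detected -> (mmio_enabled or
 * slot_reset, depending on the returned pci_ers_result_t) -> resume.
 */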
5714
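/**
 * amdgpu_device_cache_pci_state - cache the device's PCI config space
 * @pdev: PCI device struct
 *
 * Saves the current PCI config space and keeps a kernel-allocated copy
 * in adev->pci_state so it can be re-applied after a reset clobbers it.
 *
 * Returns true on success, false otherwise.
 */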
5715bool amdgpu_device_cache_pci_state(struct pci_dev *pdev)
5716{
5717        struct drm_device *dev = pci_get_drvdata(pdev);
5718        struct amdgpu_device *adev = drm_to_adev(dev);
5719        int r;
5720
5721        r = pci_save_state(pdev);
5722        if (!r) {
5723                kfree(adev->pci_state);
5724
5725                adev->pci_state = pci_store_saved_state(pdev);
5726
5727                if (!adev->pci_state) {
5728                        DRM_ERROR("Failed to store PCI saved state\n");
5729                        return false;
5730                }
5731        } else {
5732                DRM_WARN("Failed to save PCI state, err:%d\n", r);
5733                return false;
5734        }
5735
5736        return true;
5737}
5738
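/**
 * amdgpu_device_load_pci_state - restore the cached PCI config space
 * @pdev: PCI device struct
 *
 * Loads the copy stored by amdgpu_device_cache_pci_state() back into
 * the PCI core and writes it out to the device.
 *
 * Returns true on success, false if nothing was cached or the load failed.
 */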
5739bool amdgpu_device_load_pci_state(struct pci_dev *pdev)
5740{
5741        struct drm_device *dev = pci_get_drvdata(pdev);
5742        struct amdgpu_device *adev = drm_to_adev(dev);
5743        int r;
5744
5745        if (!adev->pci_state)
5746                return false;
5747
5748        r = pci_load_saved_state(pdev, adev->pci_state);
5749
5750        if (!r) {
5751                pci_restore_state(pdev);
5752        } else {
5753                DRM_WARN("Failed to load PCI state, err:%d\n", r);
5754                return false;
5755        }
5756
5757        return true;
5758}
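
/*
 * A minimal usage sketch for the two helpers above (illustrative only;
 * it mirrors how amdgpu_pci_slot_reset() restores and then re-caches
 * the config space around a reset):
 *
 *	if (!amdgpu_device_load_pci_state(adev->pdev))
 *		... fall back to a full reinit ...
 *	... bring the device back up ...
 *	amdgpu_device_cache_pci_state(adev->pdev);
 */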
5759
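/**
 * amdgpu_device_flush_hdp - flush the HDP write cache
 * @adev: amdgpu_device pointer
 * @ring: ring to emit the flush on, or NULL for a register-based flush
 *
 * Makes CPU writes that reached VRAM through the HDP (host data path)
 * visible to the GPU. Skipped on APUs (unless passed through to a
 * guest) and on ASICs whose memory is directly connected to the CPU,
 * where no HDP cache sits in the path. If @ring can emit an HDP-flush
 * packet the flush is queued on the ring, otherwise it is performed
 * through the ASIC callback.
 */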
5760void amdgpu_device_flush_hdp(struct amdgpu_device *adev,
5761                struct amdgpu_ring *ring)
5762{
5763#ifdef CONFIG_X86_64
5764        if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
5765                return;
5766#endif
5767        if (adev->gmc.xgmi.connected_to_cpu)
5768                return;
5769
5770        if (ring && ring->funcs->emit_hdp_flush)
5771                amdgpu_ring_emit_hdp_flush(ring);
5772        else
5773                amdgpu_asic_flush_hdp(adev, ring);
5774}
5775
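/**
 * amdgpu_device_invalidate_hdp - invalidate the HDP read cache
 * @adev: amdgpu_device pointer
 * @ring: ring the invalidation is performed for, or NULL
 *
 * Drops stale data from the HDP read cache so that subsequent CPU
 * reads observe what the GPU wrote. Skipped in the same configurations
 * as amdgpu_device_flush_hdp().
 */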
5776void amdgpu_device_invalidate_hdp(struct amdgpu_device *adev,
5777                struct amdgpu_ring *ring)
5778{
5779#ifdef CONFIG_X86_64
5780        if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
5781                return;
5782#endif
5783        if (adev->gmc.xgmi.connected_to_cpu)
5784                return;
5785
5786        amdgpu_asic_invalidate_hdp(adev, ring);
5787}
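
/*
 * A minimal ordering sketch for the two HDP helpers above (buffer
 * names are hypothetical, shown for illustration only):
 *
 *	memcpy_toio(vram_cpu_ptr, src, size);      CPU writes via BAR
 *	amdgpu_device_flush_hdp(adev, NULL);       make them GPU-visible
 *	... GPU work that reads/writes the buffer ...
 *	amdgpu_device_invalidate_hdp(adev, NULL);  drop stale cached reads
 *	memcpy_fromio(dst, vram_cpu_ptr, size);    CPU reads GPU results
 */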
5788
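/**
 * amdgpu_in_reset - check whether a GPU reset is in progress
 * @adev: amdgpu_device pointer
 *
 * Returns non-zero while the device's reset domain has a reset in
 * flight, zero otherwise.
 */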
5789int amdgpu_in_reset(struct amdgpu_device *adev)
5790{
5791        return atomic_read(&adev->reset_domain->in_gpu_reset);
5792}
5793
5794/**
5795 * amdgpu_device_halt() - bring hardware to some kind of halt state
5796 *
5797 * @adev: amdgpu_device pointer
5798 *
5799 * Bring hardware to some kind of halt state so that no one can touch it
5800 * any more. It helps to preserve the error context when an error occurs.
5801 * Compared to a simple hang, the system stays stable at least for SSH
5802 * access. Then it should be trivial to inspect the hardware state and
5803 * see what's going on. Implemented as follows:
5804 *
5805 * 1. drm_dev_unplug() makes the device inaccessible to user space (IOCTLs, etc.),
5806 *    clears all CPU mappings to the device, and disallows remappings through page faults
5807 * 2. amdgpu_irq_disable_all() disables all interrupts
5808 * 3. amdgpu_fence_driver_hw_fini() signals all HW fences
5809 * 4. set adev->no_hw_access to avoid potential crashes after step 5
5810 * 5. amdgpu_device_unmap_mmio() clears all MMIO mappings
5811 * 6. pci_disable_device() and pci_wait_for_pending_transaction()
5812 *    flush any in-flight DMA operations
5813 */
5814void amdgpu_device_halt(struct amdgpu_device *adev)
5815{
5816        struct pci_dev *pdev = adev->pdev;
5817        struct drm_device *ddev = adev_to_drm(adev);
5818
5819        drm_dev_unplug(ddev);
5820
5821        amdgpu_irq_disable_all(adev);
5822
5823        amdgpu_fence_driver_hw_fini(adev);
5824
5825        adev->no_hw_access = true;
5826
5827        amdgpu_device_unmap_mmio(adev);
5828
5829        pci_disable_device(pdev);
5830        pci_wait_for_pending_transaction(pdev);
5831}
5832
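/**
 * amdgpu_device_pcie_port_rreg - read a PCIe port register
 * @adev: amdgpu_device pointer
 * @reg: dword offset of the register
 *
 * PCIe port registers are reached indirectly through an index/data
 * register pair exposed by the NBIO block: the byte address (@reg * 4)
 * is written to the index register, posted with a read-back, and the
 * value is then read from the data register, all under
 * adev->pcie_idx_lock.
 *
 * Returns the register value.
 */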
5833u32 amdgpu_device_pcie_port_rreg(struct amdgpu_device *adev,
5834                                u32 reg)
5835{
5836        unsigned long flags, address, data;
5837        u32 r;
5838
5839        address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
5840        data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
5841
5842        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
5843        WREG32(address, reg * 4);
5844        (void)RREG32(address);
5845        r = RREG32(data);
5846        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
5847        return r;
5848}
5849
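/**
 * amdgpu_device_pcie_port_wreg - write a PCIe port register
 * @adev: amdgpu_device pointer
 * @reg: dword offset of the register
 * @v: value to write
 *
 * Same indirect index/data access as amdgpu_device_pcie_port_rreg();
 * the trailing read of the data register posts the write before the
 * lock is released.
 */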
5850void amdgpu_device_pcie_port_wreg(struct amdgpu_device *adev,
5851                                u32 reg, u32 v)
5852{
5853        unsigned long flags, address, data;
5854
5855        address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
5856        data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
5857
5858        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
5859        WREG32(address, reg * 4);
5860        (void)RREG32(address);
5861        WREG32(data, v);
5862        (void)RREG32(data);
5863        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
5864}
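
/*
 * A minimal read-modify-write sketch built on the two port accessors
 * above (hypothetical helper, shown for illustration only):
 *
 *	u32 tmp;
 *
 *	tmp = amdgpu_device_pcie_port_rreg(adev, reg);
 *	tmp = (tmp & ~mask) | (val & mask);
 *	amdgpu_device_pcie_port_wreg(adev, reg, tmp);
 *
 * Note: each accessor takes pcie_idx_lock independently, so the
 * sequence is not atomic against other writers of the same register.
 */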
5865