drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
1 /*
2  * Copyright 2008 Advanced Micro Devices, Inc.
3  * Copyright 2008 Red Hat Inc.
4  * Copyright 2009 Jerome Glisse.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the "Software"),
8  * to deal in the Software without restriction, including without limitation
9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10  * and/or sell copies of the Software, and to permit persons to whom the
11  * Software is furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22  * OTHER DEALINGS IN THE SOFTWARE.
23  *
24  * Authors: Dave Airlie
25  *          Alex Deucher
26  *          Jerome Glisse
27  */
28 #include <linux/power_supply.h>
29 #include <linux/kthread.h>
30 #include <linux/module.h>
31 #include <linux/console.h>
32 #include <linux/slab.h>
33 #include <linux/iommu.h>
34 #include <linux/pci.h>
35 #include <linux/devcoredump.h>
36 #include <generated/utsrelease.h>
37 #include <linux/pci-p2pdma.h>
38
39 #include <drm/drm_atomic_helper.h>
40 #include <drm/drm_fb_helper.h>
41 #include <drm/drm_probe_helper.h>
42 #include <drm/amdgpu_drm.h>
43 #include <linux/vgaarb.h>
44 #include <linux/vga_switcheroo.h>
45 #include <linux/efi.h>
46 #include "amdgpu.h"
47 #include "amdgpu_trace.h"
48 #include "amdgpu_i2c.h"
49 #include "atom.h"
50 #include "amdgpu_atombios.h"
51 #include "amdgpu_atomfirmware.h"
52 #include "amd_pcie.h"
53 #ifdef CONFIG_DRM_AMDGPU_SI
54 #include "si.h"
55 #endif
56 #ifdef CONFIG_DRM_AMDGPU_CIK
57 #include "cik.h"
58 #endif
59 #include "vi.h"
60 #include "soc15.h"
61 #include "nv.h"
62 #include "bif/bif_4_1_d.h"
63 #include <linux/firmware.h>
64 #include "amdgpu_vf_error.h"
65
66 #include "amdgpu_amdkfd.h"
67 #include "amdgpu_pm.h"
68
69 #include "amdgpu_xgmi.h"
70 #include "amdgpu_ras.h"
71 #include "amdgpu_pmu.h"
72 #include "amdgpu_fru_eeprom.h"
73 #include "amdgpu_reset.h"
74
75 #include <linux/suspend.h>
76 #include <drm/task_barrier.h>
77 #include <linux/pm_runtime.h>
78
79 #include <drm/drm_drv.h>
80
81 MODULE_FIRMWARE("amdgpu/vega10_gpu_info.bin");
82 MODULE_FIRMWARE("amdgpu/vega12_gpu_info.bin");
83 MODULE_FIRMWARE("amdgpu/raven_gpu_info.bin");
84 MODULE_FIRMWARE("amdgpu/picasso_gpu_info.bin");
85 MODULE_FIRMWARE("amdgpu/raven2_gpu_info.bin");
86 MODULE_FIRMWARE("amdgpu/arcturus_gpu_info.bin");
87 MODULE_FIRMWARE("amdgpu/navi12_gpu_info.bin");
88
89 #define AMDGPU_RESUME_MS                2000
90 #define AMDGPU_MAX_RETRY_LIMIT          2
91 #define AMDGPU_RETRY_SRIOV_RESET(r) ((r) == -EBUSY || (r) == -ETIMEDOUT || (r) == -EINVAL)
92
93 const char *amdgpu_asic_name[] = {
94         "TAHITI",
95         "PITCAIRN",
96         "VERDE",
97         "OLAND",
98         "HAINAN",
99         "BONAIRE",
100         "KAVERI",
101         "KABINI",
102         "HAWAII",
103         "MULLINS",
104         "TOPAZ",
105         "TONGA",
106         "FIJI",
107         "CARRIZO",
108         "STONEY",
109         "POLARIS10",
110         "POLARIS11",
111         "POLARIS12",
112         "VEGAM",
113         "VEGA10",
114         "VEGA12",
115         "VEGA20",
116         "RAVEN",
117         "ARCTURUS",
118         "RENOIR",
119         "ALDEBARAN",
120         "NAVI10",
121         "CYAN_SKILLFISH",
122         "NAVI14",
123         "NAVI12",
124         "SIENNA_CICHLID",
125         "NAVY_FLOUNDER",
126         "VANGOGH",
127         "DIMGREY_CAVEFISH",
128         "BEIGE_GOBY",
129         "YELLOW_CARP",
130         "IP DISCOVERY",
131         "LAST",
132 };
133
134 /**
135  * DOC: pcie_replay_count
136  *
137  * The amdgpu driver provides a sysfs API for reporting the total number
138  * of PCIe replays (NAKs).
139  * The file pcie_replay_count is used for this and returns the total
140  * number of replays as the sum of the NAKs generated and NAKs received.
141  */
142
143 static ssize_t amdgpu_device_get_pcie_replay_count(struct device *dev,
144                 struct device_attribute *attr, char *buf)
145 {
146         struct drm_device *ddev = dev_get_drvdata(dev);
147         struct amdgpu_device *adev = drm_to_adev(ddev);
148         uint64_t cnt = amdgpu_asic_get_pcie_replay_count(adev);
149
150         return sysfs_emit(buf, "%llu\n", cnt);
151 }
152
153 static DEVICE_ATTR(pcie_replay_count, S_IRUGO,
154                 amdgpu_device_get_pcie_replay_count, NULL);
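
/*
 * Example (illustrative sketch): once the attribute is registered on the
 * PCI device, userspace can read the counter directly, e.g.
 *
 *   cat /sys/bus/pci/devices/<bdf>/pcie_replay_count
 *
 * where <bdf> is the device's bus/device/function address. The value comes
 * from the show callback above via sysfs_emit().
 */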
155
156 static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev);
157
158 /**
159  * DOC: product_name
160  *
161  * The amdgpu driver provides a sysfs API for reporting the product name
162  * for the device.
163  * The file product_name is used for this and returns the product name
164  * as returned from the FRU.
165  * NOTE: This is only available for certain server cards
166  */
167
168 static ssize_t amdgpu_device_get_product_name(struct device *dev,
169                 struct device_attribute *attr, char *buf)
170 {
171         struct drm_device *ddev = dev_get_drvdata(dev);
172         struct amdgpu_device *adev = drm_to_adev(ddev);
173
174         return sysfs_emit(buf, "%s\n", adev->product_name);
175 }
176
177 static DEVICE_ATTR(product_name, S_IRUGO,
178                 amdgpu_device_get_product_name, NULL);
179
180 /**
181  * DOC: product_number
182  *
183  * The amdgpu driver provides a sysfs API for reporting the part number
184  * for the device.
185  * The file product_number is used for this and returns the part number
186  * as returned from the FRU.
187  * NOTE: This is only available for certain server cards
188  */
189
190 static ssize_t amdgpu_device_get_product_number(struct device *dev,
191                 struct device_attribute *attr, char *buf)
192 {
193         struct drm_device *ddev = dev_get_drvdata(dev);
194         struct amdgpu_device *adev = drm_to_adev(ddev);
195
196         return sysfs_emit(buf, "%s\n", adev->product_number);
197 }
198
199 static DEVICE_ATTR(product_number, S_IRUGO,
200                 amdgpu_device_get_product_number, NULL);
201
202 /**
203  * DOC: serial_number
204  *
205  * The amdgpu driver provides a sysfs API for reporting the serial number
206  * for the device.
207  * The file serial_number is used for this and returns the serial number
208  * as returned from the FRU.
209  * NOTE: This is only available for certain server cards
210  */
211
212 static ssize_t amdgpu_device_get_serial_number(struct device *dev,
213                 struct device_attribute *attr, char *buf)
214 {
215         struct drm_device *ddev = dev_get_drvdata(dev);
216         struct amdgpu_device *adev = drm_to_adev(ddev);
217
218         return sysfs_emit(buf, "%s\n", adev->serial);
219 }
220
221 static DEVICE_ATTR(serial_number, S_IRUGO,
222                 amdgpu_device_get_serial_number, NULL);
223
224 /**
225  * amdgpu_device_supports_px - Is the device a dGPU with ATPX power control
226  *
227  * @dev: drm_device pointer
228  *
229  * Returns true if the device is a dGPU with ATPX power control,
230  * otherwise return false.
231  */
232 bool amdgpu_device_supports_px(struct drm_device *dev)
233 {
234         struct amdgpu_device *adev = drm_to_adev(dev);
235
236         if ((adev->flags & AMD_IS_PX) && !amdgpu_is_atpx_hybrid())
237                 return true;
238         return false;
239 }
240
241 /**
242  * amdgpu_device_supports_boco - Is the device a dGPU with ACPI power resources
243  *
244  * @dev: drm_device pointer
245  *
246  * Returns true if the device is a dGPU with ACPI power control,
247  * otherwise return false.
248  */
249 bool amdgpu_device_supports_boco(struct drm_device *dev)
250 {
251         struct amdgpu_device *adev = drm_to_adev(dev);
252
253         if (adev->has_pr3 ||
254             ((adev->flags & AMD_IS_PX) && amdgpu_is_atpx_hybrid()))
255                 return true;
256         return false;
257 }
258
259 /**
260  * amdgpu_device_supports_baco - Does the device support BACO
261  *
262  * @dev: drm_device pointer
263  *
264  * Returns true if the device supports BACO,
265  * otherwise return false.
266  */
267 bool amdgpu_device_supports_baco(struct drm_device *dev)
268 {
269         struct amdgpu_device *adev = drm_to_adev(dev);
270
271         return amdgpu_asic_supports_baco(adev);
272 }
273
274 /**
275  * amdgpu_device_supports_smart_shift - Is the device dGPU with
276  * smart shift support
277  *
278  * @dev: drm_device pointer
279  *
280  * Returns true if the device is a dGPU with Smart Shift support,
281  * otherwise returns false.
282  */
283 bool amdgpu_device_supports_smart_shift(struct drm_device *dev)
284 {
285         return (amdgpu_device_supports_boco(dev) &&
286                 amdgpu_acpi_is_power_shift_control_supported());
287 }
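
/*
 * A minimal sketch (hypothetical caller) of how the power-control helpers
 * above are typically consulted, in order of preference, when choosing a
 * runtime power-down strategy; the enter_*() names are placeholders:
 *
 *   if (amdgpu_device_supports_px(dev))
 *           enter_px(adev);
 *   else if (amdgpu_device_supports_boco(dev))
 *           enter_boco(adev);
 *   else if (amdgpu_device_supports_baco(dev))
 *           enter_baco(adev);
 */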
288
289 /*
290  * VRAM access helper functions
291  */
292
293 /**
294  * amdgpu_device_mm_access - access vram by MM_INDEX/MM_DATA
295  *
296  * @adev: amdgpu_device pointer
297  * @pos: offset of the buffer in vram
298  * @buf: virtual address of the buffer in system memory
299  * @size: read/write size; the buffer at @buf must be at least @size bytes
300  * @write: true - write to vram, otherwise - read from vram
301  */
302 void amdgpu_device_mm_access(struct amdgpu_device *adev, loff_t pos,
303                              void *buf, size_t size, bool write)
304 {
305         unsigned long flags;
306         uint32_t hi = ~0, tmp = 0;
307         uint32_t *data = buf;
308         uint64_t last;
309         int idx;
310
311         if (!drm_dev_enter(adev_to_drm(adev), &idx))
312                 return;
313
314         BUG_ON(!IS_ALIGNED(pos, 4) || !IS_ALIGNED(size, 4));
315
316         spin_lock_irqsave(&adev->mmio_idx_lock, flags);
317         for (last = pos + size; pos < last; pos += 4) {
318                 tmp = pos >> 31;
319
320                 WREG32_NO_KIQ(mmMM_INDEX, ((uint32_t)pos) | 0x80000000);
321                 if (tmp != hi) {
322                         WREG32_NO_KIQ(mmMM_INDEX_HI, tmp);
323                         hi = tmp;
324                 }
325                 if (write)
326                         WREG32_NO_KIQ(mmMM_DATA, *data++);
327                 else
328                         *data++ = RREG32_NO_KIQ(mmMM_DATA);
329         }
330
331         spin_unlock_irqrestore(&adev->mmio_idx_lock, flags);
332         drm_dev_exit(idx);
333 }
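
/*
 * Example (illustrative): reading a single dword from the start of VRAM
 * through the MM_INDEX/MM_DATA window; @pos and @size must be dword
 * aligned or the BUG_ON() above fires:
 *
 *   uint32_t val;
 *
 *   amdgpu_device_mm_access(adev, 0, &val, sizeof(val), false);
 */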
334
335 /**
336  * amdgpu_device_aper_access - access vram by the vram aperture
337  *
338  * @adev: amdgpu_device pointer
339  * @pos: offset of the buffer in vram
340  * @buf: virtual address of the buffer in system memory
341  * @size: read/write size; the buffer at @buf must be at least @size bytes
342  * @write: true - write to vram, otherwise - read from vram
343  *
344  * Returns the number of bytes transferred.
345  */
346 size_t amdgpu_device_aper_access(struct amdgpu_device *adev, loff_t pos,
347                                  void *buf, size_t size, bool write)
348 {
349 #ifdef CONFIG_64BIT
350         void __iomem *addr;
351         size_t count = 0;
352         uint64_t last;
353
354         if (!adev->mman.aper_base_kaddr)
355                 return 0;
356
357         last = min(pos + size, adev->gmc.visible_vram_size);
358         if (last > pos) {
359                 addr = adev->mman.aper_base_kaddr + pos;
360                 count = last - pos;
361
362                 if (write) {
363                         memcpy_toio(addr, buf, count);
364                         mb();
365                         amdgpu_device_flush_hdp(adev, NULL);
366                 } else {
367                         amdgpu_device_invalidate_hdp(adev, NULL);
368                         mb();
369                         memcpy_fromio(buf, addr, count);
370                 }
371
372         }
373
374         return count;
375 #else
376         return 0;
377 #endif
378 }
379
380 /**
381  * amdgpu_device_vram_access - read/write a buffer in vram
382  *
383  * @adev: amdgpu_device pointer
384  * @pos: offset of the buffer in vram
385  * @buf: virtual address of the buffer in system memory
386  * @size: read/write size; the buffer at @buf must be at least @size bytes
387  * @write: true - write to vram, otherwise - read from vram
388  */
389 void amdgpu_device_vram_access(struct amdgpu_device *adev, loff_t pos,
390                                void *buf, size_t size, bool write)
391 {
392         size_t count;
393
394         /* try using the vram aperture to access vram first */
395         count = amdgpu_device_aper_access(adev, pos, buf, size, write);
396         size -= count;
397         if (size) {
398                 /* use MM to access the rest of vram */
399                 pos += count;
400                 buf += count;
401                 amdgpu_device_mm_access(adev, pos, buf, size, write);
402         }
403 }
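
/*
 * Example (illustrative): writing a small dword-aligned buffer into VRAM
 * at a caller-chosen offset. The aperture path is tried first and any
 * remainder beyond visible VRAM falls back to MM_INDEX/MM_DATA:
 *
 *   uint32_t data[4] = { 0 };
 *
 *   amdgpu_device_vram_access(adev, vram_offset, data, sizeof(data), true);
 */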
404
405 /*
406  * register access helper functions.
407  */
408
409 /* Check if hw access should be skipped because of hotplug or device error */
410 bool amdgpu_device_skip_hw_access(struct amdgpu_device *adev)
411 {
412         if (adev->no_hw_access)
413                 return true;
414
415 #ifdef CONFIG_LOCKDEP
416         /*
417          * This is a bit complicated to understand, so worth a comment. What we assert
418          * here is that the GPU reset is not running on another thread in parallel.
419          *
420          * For this we trylock the read side of the reset semaphore, if that succeeds
421  * we know that the reset is not running in parallel.
422          *
423          * If the trylock fails we assert that we are either already holding the read
424          * side of the lock or are the reset thread itself and hold the write side of
425          * the lock.
426          */
427         if (in_task()) {
428                 if (down_read_trylock(&adev->reset_domain->sem))
429                         up_read(&adev->reset_domain->sem);
430                 else
431                         lockdep_assert_held(&adev->reset_domain->sem);
432         }
433 #endif
434         return false;
435 }
436
437 /**
438  * amdgpu_device_rreg - read a memory mapped IO or indirect register
439  *
440  * @adev: amdgpu_device pointer
441  * @reg: dword aligned register offset
442  * @acc_flags: access flags which require special behavior
443  *
444  * Returns the 32 bit value from the offset specified.
445  */
446 uint32_t amdgpu_device_rreg(struct amdgpu_device *adev,
447                             uint32_t reg, uint32_t acc_flags)
448 {
449         uint32_t ret;
450
451         if (amdgpu_device_skip_hw_access(adev))
452                 return 0;
453
454         if ((reg * 4) < adev->rmmio_size) {
455                 if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
456                     amdgpu_sriov_runtime(adev) &&
457                     down_read_trylock(&adev->reset_domain->sem)) {
458                         ret = amdgpu_kiq_rreg(adev, reg);
459                         up_read(&adev->reset_domain->sem);
460                 } else {
461                         ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
462                 }
463         } else {
464                 ret = adev->pcie_rreg(adev, reg * 4);
465         }
466
467         trace_amdgpu_device_rreg(adev->pdev->device, reg, ret);
468
469         return ret;
470 }
471
472 /*
473  * MMIO register read with byte offset helper function
474  * @offset: byte offset from MMIO start
475  *
476 */
477
478 /**
479  * amdgpu_mm_rreg8 - read a memory mapped IO register
480  *
481  * @adev: amdgpu_device pointer
482  * @offset: byte aligned register offset
483  *
484  * Returns the 8 bit value from the offset specified.
485  */
486 uint8_t amdgpu_mm_rreg8(struct amdgpu_device *adev, uint32_t offset)
487 {
488         if (amdgpu_device_skip_hw_access(adev))
489                 return 0;
490
491         if (offset < adev->rmmio_size)
492                 return (readb(adev->rmmio + offset));
493         BUG();
494 }
495
496 /*
497  * MMIO register write with byte offset helper function
498  * @offset: byte offset from MMIO start
499  * @value: the value to be written to the register
500  *
501 */
502 /**
503  * amdgpu_mm_wreg8 - write a memory mapped IO register
504  *
505  * @adev: amdgpu_device pointer
506  * @offset: byte aligned register offset
507  * @value: 8 bit value to write
508  *
509  * Writes the value specified to the offset specified.
510  */
511 void amdgpu_mm_wreg8(struct amdgpu_device *adev, uint32_t offset, uint8_t value)
512 {
513         if (amdgpu_device_skip_hw_access(adev))
514                 return;
515
516         if (offset < adev->rmmio_size)
517                 writeb(value, adev->rmmio + offset);
518         else
519                 BUG();
520 }
521
522 /**
523  * amdgpu_device_wreg - write to a memory mapped IO or indirect register
524  *
525  * @adev: amdgpu_device pointer
526  * @reg: dword aligned register offset
527  * @v: 32 bit value to write to the register
528  * @acc_flags: access flags which require special behavior
529  *
530  * Writes the value specified to the offset specified.
531  */
532 void amdgpu_device_wreg(struct amdgpu_device *adev,
533                         uint32_t reg, uint32_t v,
534                         uint32_t acc_flags)
535 {
536         if (amdgpu_device_skip_hw_access(adev))
537                 return;
538
539         if ((reg * 4) < adev->rmmio_size) {
540                 if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
541                     amdgpu_sriov_runtime(adev) &&
542                     down_read_trylock(&adev->reset_domain->sem)) {
543                         amdgpu_kiq_wreg(adev, reg, v);
544                         up_read(&adev->reset_domain->sem);
545                 } else {
546                         writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
547                 }
548         } else {
549                 adev->pcie_wreg(adev, reg * 4, v);
550         }
551
552         trace_amdgpu_device_wreg(adev->pdev->device, reg, v);
553 }
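
/*
 * Example (illustrative): a read-modify-write cycle built on the two
 * helpers above; REG_OFFSET and FIELD_MASK are hypothetical placeholders.
 * Most callers use the RREG32()/WREG32() macros, which expand to these
 * functions:
 *
 *   uint32_t tmp = amdgpu_device_rreg(adev, REG_OFFSET, 0);
 *
 *   tmp &= ~FIELD_MASK;
 *   tmp |= new_value & FIELD_MASK;
 *   amdgpu_device_wreg(adev, REG_OFFSET, tmp, 0);
 */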
554
555 /**
556  * amdgpu_mm_wreg_mmio_rlc - write a register either with direct/indirect mmio or with the RLC path if in range
557  *
558  * @adev: amdgpu_device pointer
559  * @reg: mmio/rlc register
560  * @v: value to write
561  *
562  * This function is invoked only for debugfs register access.
563  */
564 void amdgpu_mm_wreg_mmio_rlc(struct amdgpu_device *adev,
565                              uint32_t reg, uint32_t v)
566 {
567         if (amdgpu_device_skip_hw_access(adev))
568                 return;
569
570         if (amdgpu_sriov_fullaccess(adev) &&
571             adev->gfx.rlc.funcs &&
572             adev->gfx.rlc.funcs->is_rlcg_access_range) {
573                 if (adev->gfx.rlc.funcs->is_rlcg_access_range(adev, reg))
574                         return amdgpu_sriov_wreg(adev, reg, v, 0, 0);
575         } else if ((reg * 4) >= adev->rmmio_size) {
576                 adev->pcie_wreg(adev, reg * 4, v);
577         } else {
578                 writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
579         }
580 }
581
582 /**
583  * amdgpu_mm_rdoorbell - read a doorbell dword
584  *
585  * @adev: amdgpu_device pointer
586  * @index: doorbell index
587  *
588  * Returns the value in the doorbell aperture at the
589  * requested doorbell index (CIK).
590  */
591 u32 amdgpu_mm_rdoorbell(struct amdgpu_device *adev, u32 index)
592 {
593         if (amdgpu_device_skip_hw_access(adev))
594                 return 0;
595
596         if (index < adev->doorbell.num_doorbells) {
597                 return readl(adev->doorbell.ptr + index);
598         } else {
599                 DRM_ERROR("reading beyond doorbell aperture: 0x%08x!\n", index);
600                 return 0;
601         }
602 }
603
604 /**
605  * amdgpu_mm_wdoorbell - write a doorbell dword
606  *
607  * @adev: amdgpu_device pointer
608  * @index: doorbell index
609  * @v: value to write
610  *
611  * Writes @v to the doorbell aperture at the
612  * requested doorbell index (CIK).
613  */
614 void amdgpu_mm_wdoorbell(struct amdgpu_device *adev, u32 index, u32 v)
615 {
616         if (amdgpu_device_skip_hw_access(adev))
617                 return;
618
619         if (index < adev->doorbell.num_doorbells) {
620                 writel(v, adev->doorbell.ptr + index);
621         } else {
622                 DRM_ERROR("writing beyond doorbell aperture: 0x%08x!\n", index);
623         }
624 }
625
626 /**
627  * amdgpu_mm_rdoorbell64 - read a doorbell Qword
628  *
629  * @adev: amdgpu_device pointer
630  * @index: doorbell index
631  *
632  * Returns the value in the doorbell aperture at the
633  * requested doorbell index (VEGA10+).
634  */
635 u64 amdgpu_mm_rdoorbell64(struct amdgpu_device *adev, u32 index)
636 {
637         if (amdgpu_device_skip_hw_access(adev))
638                 return 0;
639
640         if (index < adev->doorbell.num_doorbells) {
641                 return atomic64_read((atomic64_t *)(adev->doorbell.ptr + index));
642         } else {
643                 DRM_ERROR("reading beyond doorbell aperture: 0x%08x!\n", index);
644                 return 0;
645         }
646 }
647
648 /**
649  * amdgpu_mm_wdoorbell64 - write a doorbell Qword
650  *
651  * @adev: amdgpu_device pointer
652  * @index: doorbell index
653  * @v: value to write
654  *
655  * Writes @v to the doorbell aperture at the
656  * requested doorbell index (VEGA10+).
657  */
658 void amdgpu_mm_wdoorbell64(struct amdgpu_device *adev, u32 index, u64 v)
659 {
660         if (amdgpu_device_skip_hw_access(adev))
661                 return;
662
663         if (index < adev->doorbell.num_doorbells) {
664                 atomic64_set((atomic64_t *)(adev->doorbell.ptr + index), v);
665         } else {
666                 DRM_ERROR("writing beyond doorbell aperture: 0x%08x!\n", index);
667         }
668 }
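
/*
 * Example (illustrative): a ring that uses doorbells would typically
 * publish its write pointer through these accessors, roughly:
 *
 *   if (ring->use_doorbell)
 *           amdgpu_mm_wdoorbell64(adev, ring->doorbell_index, ring->wptr);
 *
 * In practice this is spelled via the WDOORBELL64() macro and the
 * per-ring set_wptr callbacks.
 */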
669
670 /**
671  * amdgpu_device_indirect_rreg - read an indirect register
672  *
673  * @adev: amdgpu_device pointer
674  * @pcie_index: mmio register offset
675  * @pcie_data: mmio register offset
676  * @reg_addr: indirect register address to read from
677  *
678  * Returns the value of indirect register @reg_addr
679  */
680 u32 amdgpu_device_indirect_rreg(struct amdgpu_device *adev,
681                                 u32 pcie_index, u32 pcie_data,
682                                 u32 reg_addr)
683 {
684         unsigned long flags;
685         u32 r;
686         void __iomem *pcie_index_offset;
687         void __iomem *pcie_data_offset;
688
689         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
690         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
691         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
692
693         writel(reg_addr, pcie_index_offset);
694         readl(pcie_index_offset);
695         r = readl(pcie_data_offset);
696         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
697
698         return r;
699 }
700
701 /**
702  * amdgpu_device_indirect_rreg64 - read a 64bits indirect register
703  *
704  * @adev: amdgpu_device pointer
705  * @pcie_index: mmio register offset
706  * @pcie_data: mmio register offset
707  * @reg_addr: indirect register address to read from
708  *
709  * Returns the value of indirect register @reg_addr
710  */
711 u64 amdgpu_device_indirect_rreg64(struct amdgpu_device *adev,
712                                   u32 pcie_index, u32 pcie_data,
713                                   u32 reg_addr)
714 {
715         unsigned long flags;
716         u64 r;
717         void __iomem *pcie_index_offset;
718         void __iomem *pcie_data_offset;
719
720         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
721         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
722         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
723
724         /* read low 32 bits */
725         writel(reg_addr, pcie_index_offset);
726         readl(pcie_index_offset);
727         r = readl(pcie_data_offset);
728         /* read high 32 bits */
729         writel(reg_addr + 4, pcie_index_offset);
730         readl(pcie_index_offset);
731         r |= ((u64)readl(pcie_data_offset) << 32);
732         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
733
734         return r;
735 }
736
737 /**
738  * amdgpu_device_indirect_wreg - write an indirect register address
739  *
740  * @adev: amdgpu_device pointer
741  * @pcie_index: mmio register offset
742  * @pcie_data: mmio register offset
743  * @reg_addr: indirect register offset
744  * @reg_data: indirect register data
745  *
746  */
747 void amdgpu_device_indirect_wreg(struct amdgpu_device *adev,
748                                  u32 pcie_index, u32 pcie_data,
749                                  u32 reg_addr, u32 reg_data)
750 {
751         unsigned long flags;
752         void __iomem *pcie_index_offset;
753         void __iomem *pcie_data_offset;
754
755         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
756         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
757         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
758
759         writel(reg_addr, pcie_index_offset);
760         readl(pcie_index_offset);
761         writel(reg_data, pcie_data_offset);
762         readl(pcie_data_offset);
763         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
764 }
765
766 /**
767  * amdgpu_device_indirect_wreg64 - write a 64bits indirect register address
768  *
769  * @adev: amdgpu_device pointer
770  * @pcie_index: mmio register offset
771  * @pcie_data: mmio register offset
772  * @reg_addr: indirect register offset
773  * @reg_data: indirect register data
774  *
775  */
776 void amdgpu_device_indirect_wreg64(struct amdgpu_device *adev,
777                                    u32 pcie_index, u32 pcie_data,
778                                    u32 reg_addr, u64 reg_data)
779 {
780         unsigned long flags;
781         void __iomem *pcie_index_offset;
782         void __iomem *pcie_data_offset;
783
784         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
785         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
786         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
787
788         /* write low 32 bits */
789         writel(reg_addr, pcie_index_offset);
790         readl(pcie_index_offset);
791         writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
792         readl(pcie_data_offset);
793         /* write high 32 bits */
794         writel(reg_addr + 4, pcie_index_offset);
795         readl(pcie_index_offset);
796         writel((u32)(reg_data >> 32), pcie_data_offset);
797         readl(pcie_data_offset);
798         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
799 }
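
/*
 * The four indirect helpers above share one index/data protocol: the
 * target address goes into the "index" register, the payload moves
 * through the "data" register, and each write is followed by a readl()
 * to flush posted writes before the next step. A sketch of a 32-bit
 * indirect read-modify-write (PCIE_INDEX2/PCIE_DATA2 and SOME_BIT are
 * hypothetical placeholders):
 *
 *   u32 v = amdgpu_device_indirect_rreg(adev, PCIE_INDEX2, PCIE_DATA2, addr);
 *
 *   v |= SOME_BIT;
 *   amdgpu_device_indirect_wreg(adev, PCIE_INDEX2, PCIE_DATA2, addr, v);
 */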
800
801 /**
802  * amdgpu_invalid_rreg - dummy reg read function
803  *
804  * @adev: amdgpu_device pointer
805  * @reg: offset of register
806  *
807  * Dummy register read function.  Used for register blocks
808  * that certain asics don't have (all asics).
809  * Returns the value in the register.
810  */
811 static uint32_t amdgpu_invalid_rreg(struct amdgpu_device *adev, uint32_t reg)
812 {
813         DRM_ERROR("Invalid callback to read register 0x%04X\n", reg);
814         BUG();
815         return 0;
816 }
817
818 /**
819  * amdgpu_invalid_wreg - dummy reg write function
820  *
821  * @adev: amdgpu_device pointer
822  * @reg: offset of register
823  * @v: value to write to the register
824  *
825  * Dummy register write function.  Used for register blocks
826  * that certain asics don't have (all asics).
827  */
828 static void amdgpu_invalid_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
829 {
830         DRM_ERROR("Invalid callback to write register 0x%04X with 0x%08X\n",
831                   reg, v);
832         BUG();
833 }
834
835 /**
836  * amdgpu_invalid_rreg64 - dummy 64 bit reg read function
837  *
838  * @adev: amdgpu_device pointer
839  * @reg: offset of register
840  *
841  * Dummy register read function.  Used for register blocks
842  * that certain asics don't have (all asics).
843  * Returns the value in the register.
844  */
845 static uint64_t amdgpu_invalid_rreg64(struct amdgpu_device *adev, uint32_t reg)
846 {
847         DRM_ERROR("Invalid callback to read 64 bit register 0x%04X\n", reg);
848         BUG();
849         return 0;
850 }
851
852 /**
853  * amdgpu_invalid_wreg64 - dummy reg write function
854  *
855  * @adev: amdgpu_device pointer
856  * @reg: offset of register
857  * @v: value to write to the register
858  *
859  * Dummy register write function.  Used for register blocks
860  * that certain asics don't have (all asics).
861  */
862 static void amdgpu_invalid_wreg64(struct amdgpu_device *adev, uint32_t reg, uint64_t v)
863 {
864         DRM_ERROR("Invalid callback to write 64 bit register 0x%04X with 0x%08llX\n",
865                   reg, v);
866         BUG();
867 }
868
869 /**
870  * amdgpu_block_invalid_rreg - dummy reg read function
871  *
872  * @adev: amdgpu_device pointer
873  * @block: offset of instance
874  * @reg: offset of register
875  *
876  * Dummy register read function.  Used for register blocks
877  * that certain asics don't have (all asics).
878  * Returns the value in the register.
879  */
880 static uint32_t amdgpu_block_invalid_rreg(struct amdgpu_device *adev,
881                                           uint32_t block, uint32_t reg)
882 {
883         DRM_ERROR("Invalid callback to read register 0x%04X in block 0x%04X\n",
884                   reg, block);
885         BUG();
886         return 0;
887 }
888
889 /**
890  * amdgpu_block_invalid_wreg - dummy reg write function
891  *
892  * @adev: amdgpu_device pointer
893  * @block: offset of instance
894  * @reg: offset of register
895  * @v: value to write to the register
896  *
897  * Dummy register write function.  Used for register blocks
898  * that certain asics don't have (all asics).
899  */
900 static void amdgpu_block_invalid_wreg(struct amdgpu_device *adev,
901                                       uint32_t block,
902                                       uint32_t reg, uint32_t v)
903 {
904         DRM_ERROR("Invalid block callback to write register 0x%04X in block 0x%04X with 0x%08X\n",
905                   reg, block, v);
906         BUG();
907 }
908
909 /**
910  * amdgpu_device_asic_init - Wrapper for atom asic_init
911  *
912  * @adev: amdgpu_device pointer
913  *
914  * Does any asic specific work and then calls atom asic init.
915  */
916 static int amdgpu_device_asic_init(struct amdgpu_device *adev)
917 {
918         amdgpu_asic_pre_asic_init(adev);
919
920         if (adev->ip_versions[GC_HWIP][0] >= IP_VERSION(11, 0, 0))
921                 return amdgpu_atomfirmware_asic_init(adev, true);
922         else
923                 return amdgpu_atom_asic_init(adev->mode_info.atom_context);
924 }
925
926 /**
927  * amdgpu_device_vram_scratch_init - allocate the VRAM scratch page
928  *
929  * @adev: amdgpu_device pointer
930  *
931  * Allocates a scratch page of VRAM for use by various things in the
932  * driver.
933  */
934 static int amdgpu_device_vram_scratch_init(struct amdgpu_device *adev)
935 {
936         return amdgpu_bo_create_kernel(adev, AMDGPU_GPU_PAGE_SIZE,
937                                        PAGE_SIZE, AMDGPU_GEM_DOMAIN_VRAM,
938                                        &adev->vram_scratch.robj,
939                                        &adev->vram_scratch.gpu_addr,
940                                        (void **)&adev->vram_scratch.ptr);
941 }
942
943 /**
944  * amdgpu_device_vram_scratch_fini - Free the VRAM scratch page
945  *
946  * @adev: amdgpu_device pointer
947  *
948  * Frees the VRAM scratch page.
949  */
950 static void amdgpu_device_vram_scratch_fini(struct amdgpu_device *adev)
951 {
952         amdgpu_bo_free_kernel(&adev->vram_scratch.robj, NULL, NULL);
953 }
954
955 /**
956  * amdgpu_device_program_register_sequence - program an array of registers.
957  *
958  * @adev: amdgpu_device pointer
959  * @registers: pointer to the register array
960  * @array_size: size of the register array
961  *
962  * Programs an array of registers with AND and OR masks.
963  * This is a helper for setting golden registers.
964  */
965 void amdgpu_device_program_register_sequence(struct amdgpu_device *adev,
966                                              const u32 *registers,
967                                              const u32 array_size)
968 {
969         u32 tmp, reg, and_mask, or_mask;
970         int i;
971
972         if (array_size % 3)
973                 return;
974
975         for (i = 0; i < array_size; i += 3) {
976                 reg = registers[i + 0];
977                 and_mask = registers[i + 1];
978                 or_mask = registers[i + 2];
979
980                 if (and_mask == 0xffffffff) {
981                         tmp = or_mask;
982                 } else {
983                         tmp = RREG32(reg);
984                         tmp &= ~and_mask;
985                         if (adev->family >= AMDGPU_FAMILY_AI)
986                                 tmp |= (or_mask & and_mask);
987                         else
988                                 tmp |= or_mask;
989                 }
990                 WREG32(reg, tmp);
991         }
992 }
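
/*
 * Example (illustrative): golden register tables are flat {reg, and_mask,
 * or_mask} triples; an and_mask of 0xffffffff writes or_mask directly.
 * The register names and values below are hypothetical placeholders:
 *
 *   static const u32 golden_settings_example[] = {
 *           mmREG_A, 0x0000000f, 0x00000002,
 *           mmREG_B, 0xffffffff, 0x00001234,
 *   };
 *
 *   amdgpu_device_program_register_sequence(adev, golden_settings_example,
 *                                           ARRAY_SIZE(golden_settings_example));
 */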
993
994 /**
995  * amdgpu_device_pci_config_reset - reset the GPU
996  *
997  * @adev: amdgpu_device pointer
998  *
999  * Resets the GPU using the pci config reset sequence.
1000  * Only applicable to asics prior to vega10.
1001  */
1002 void amdgpu_device_pci_config_reset(struct amdgpu_device *adev)
1003 {
1004         pci_write_config_dword(adev->pdev, 0x7c, AMDGPU_ASIC_RESET_DATA);
1005 }
1006
1007 /**
1008  * amdgpu_device_pci_reset - reset the GPU using generic PCI means
1009  *
1010  * @adev: amdgpu_device pointer
1011  *
1012  * Resets the GPU using generic pci reset interfaces (FLR, SBR, etc.).
1013  */
1014 int amdgpu_device_pci_reset(struct amdgpu_device *adev)
1015 {
1016         return pci_reset_function(adev->pdev);
1017 }
1018
1019 /*
1020  * GPU doorbell aperture helper functions.
1021  */
1022 /**
1023  * amdgpu_device_doorbell_init - Init doorbell driver information.
1024  *
1025  * @adev: amdgpu_device pointer
1026  *
1027  * Init doorbell driver information (CIK)
1028  * Returns 0 on success, error on failure.
1029  */
1030 static int amdgpu_device_doorbell_init(struct amdgpu_device *adev)
1031 {
1032
1033         /* No doorbell on SI hardware generation */
1034         if (adev->asic_type < CHIP_BONAIRE) {
1035                 adev->doorbell.base = 0;
1036                 adev->doorbell.size = 0;
1037                 adev->doorbell.num_doorbells = 0;
1038                 adev->doorbell.ptr = NULL;
1039                 return 0;
1040         }
1041
1042         if (pci_resource_flags(adev->pdev, 2) & IORESOURCE_UNSET)
1043                 return -EINVAL;
1044
1045         amdgpu_asic_init_doorbell_index(adev);
1046
1047         /* doorbell bar mapping */
1048         adev->doorbell.base = pci_resource_start(adev->pdev, 2);
1049         adev->doorbell.size = pci_resource_len(adev->pdev, 2);
1050
1051         if (adev->enable_mes) {
1052                 adev->doorbell.num_doorbells =
1053                         adev->doorbell.size / sizeof(u32);
1054         } else {
1055                 adev->doorbell.num_doorbells =
1056                         min_t(u32, adev->doorbell.size / sizeof(u32),
1057                               adev->doorbell_index.max_assignment+1);
1058                 if (adev->doorbell.num_doorbells == 0)
1059                         return -EINVAL;
1060
1061                 /* For Vega, reserve and map two pages on doorbell BAR since SDMA
1062                  * paging queue doorbell uses the second page. The
1063                  * AMDGPU_DOORBELL64_MAX_ASSIGNMENT definition assumes all the
1064                  * doorbells are in the first page. So with the paging queue enabled,
1065                  * the max num_doorbells should be increased by 1 page (0x400 in dwords).
1066                  */
1067                 if (adev->asic_type >= CHIP_VEGA10)
1068                         adev->doorbell.num_doorbells += 0x400;
1069         }
1070
1071         adev->doorbell.ptr = ioremap(adev->doorbell.base,
1072                                      adev->doorbell.num_doorbells *
1073                                      sizeof(u32));
1074         if (adev->doorbell.ptr == NULL)
1075                 return -ENOMEM;
1076
1077         return 0;
1078 }
1079
1080 /**
1081  * amdgpu_device_doorbell_fini - Tear down doorbell driver information.
1082  *
1083  * @adev: amdgpu_device pointer
1084  *
1085  * Tear down doorbell driver information (CIK)
1086  */
1087 static void amdgpu_device_doorbell_fini(struct amdgpu_device *adev)
1088 {
1089         iounmap(adev->doorbell.ptr);
1090         adev->doorbell.ptr = NULL;
1091 }
1092
1093
1094
1095 /*
1096  * amdgpu_device_wb_*()
1097  * Writeback is the method by which the GPU updates special pages in memory
1098  * with the status of certain GPU events (fences, ring pointers, etc.).
1099  */
1100
1101 /**
1102  * amdgpu_device_wb_fini - Disable Writeback and free memory
1103  *
1104  * @adev: amdgpu_device pointer
1105  *
1106  * Disables Writeback and frees the Writeback memory (all asics).
1107  * Used at driver shutdown.
1108  */
1109 static void amdgpu_device_wb_fini(struct amdgpu_device *adev)
1110 {
1111         if (adev->wb.wb_obj) {
1112                 amdgpu_bo_free_kernel(&adev->wb.wb_obj,
1113                                       &adev->wb.gpu_addr,
1114                                       (void **)&adev->wb.wb);
1115                 adev->wb.wb_obj = NULL;
1116         }
1117 }
1118
1119 /**
1120  * amdgpu_device_wb_init - Init Writeback driver info and allocate memory
1121  *
1122  * @adev: amdgpu_device pointer
1123  *
1124  * Initializes writeback and allocates writeback memory (all asics).
1125  * Used at driver startup.
1126  * Returns 0 on success or a negative error code on failure.
1127  */
1128 static int amdgpu_device_wb_init(struct amdgpu_device *adev)
1129 {
1130         int r;
1131
1132         if (adev->wb.wb_obj == NULL) {
1133                 /* AMDGPU_MAX_WB * sizeof(uint32_t) * 8 = AMDGPU_MAX_WB 256bit slots */
1134                 r = amdgpu_bo_create_kernel(adev, AMDGPU_MAX_WB * sizeof(uint32_t) * 8,
1135                                             PAGE_SIZE, AMDGPU_GEM_DOMAIN_GTT,
1136                                             &adev->wb.wb_obj, &adev->wb.gpu_addr,
1137                                             (void **)&adev->wb.wb);
1138                 if (r) {
1139                         dev_warn(adev->dev, "(%d) create WB bo failed\n", r);
1140                         return r;
1141                 }
1142
1143                 adev->wb.num_wb = AMDGPU_MAX_WB;
1144                 memset(&adev->wb.used, 0, sizeof(adev->wb.used));
1145
1146                 /* clear wb memory */
1147                 memset((char *)adev->wb.wb, 0, AMDGPU_MAX_WB * sizeof(uint32_t) * 8);
1148         }
1149
1150         return 0;
1151 }
1152
1153 /**
1154  * amdgpu_device_wb_get - Allocate a wb entry
1155  *
1156  * @adev: amdgpu_device pointer
1157  * @wb: wb index
1158  *
1159  * Allocate a wb slot for use by the driver (all asics).
1160  * Returns 0 on success or -EINVAL on failure.
1161  */
1162 int amdgpu_device_wb_get(struct amdgpu_device *adev, u32 *wb)
1163 {
1164         unsigned long offset = find_first_zero_bit(adev->wb.used, adev->wb.num_wb);
1165
1166         if (offset < adev->wb.num_wb) {
1167                 __set_bit(offset, adev->wb.used);
1168                 *wb = offset << 3; /* convert to dw offset */
1169                 return 0;
1170         } else {
1171                 return -EINVAL;
1172         }
1173 }
1174
1175 /**
1176  * amdgpu_device_wb_free - Free a wb entry
1177  *
1178  * @adev: amdgpu_device pointer
1179  * @wb: wb index
1180  *
1181  * Free a wb slot allocated for use by the driver (all asics)
1182  */
1183 void amdgpu_device_wb_free(struct amdgpu_device *adev, u32 wb)
1184 {
1185         wb >>= 3;
1186         if (wb < adev->wb.num_wb)
1187                 __clear_bit(wb, adev->wb.used);
1188 }
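
/*
 * Example (illustrative): the usual writeback slot lifecycle. The index
 * returned by amdgpu_device_wb_get() is in dwords, so the CPU and GPU
 * addresses of the slot are derived as shown:
 *
 *   u32 wb;
 *
 *   if (!amdgpu_device_wb_get(adev, &wb)) {
 *           volatile uint32_t *cpu_addr = &adev->wb.wb[wb];
 *           uint64_t gpu_addr = adev->wb.gpu_addr + (wb * 4);
 *
 *           ... let the GPU write status to gpu_addr, poll *cpu_addr ...
 *           amdgpu_device_wb_free(adev, wb);
 *   }
 */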
1189
1190 /**
1191  * amdgpu_device_resize_fb_bar - try to resize FB BAR
1192  *
1193  * @adev: amdgpu_device pointer
1194  *
1195  * Try to resize FB BAR to make all VRAM CPU accessible. We try very hard not
1196  * to fail, but if any of the BARs is not accessible after the resize we abort
1197  * driver loading by returning -ENODEV.
1198  */
1199 int amdgpu_device_resize_fb_bar(struct amdgpu_device *adev)
1200 {
1201         int rbar_size = pci_rebar_bytes_to_size(adev->gmc.real_vram_size);
1202         struct pci_bus *root;
1203         struct resource *res;
1204         unsigned i;
1205         u16 cmd;
1206         int r;
1207
1208         /* Bypass for VF */
1209         if (amdgpu_sriov_vf(adev))
1210                 return 0;
1211
1212         /* skip if the bios has already enabled large BAR */
1213         if (adev->gmc.real_vram_size &&
1214             (pci_resource_len(adev->pdev, 0) >= adev->gmc.real_vram_size))
1215                 return 0;
1216
1217         /* Check if the root BUS has 64bit memory resources */
1218         root = adev->pdev->bus;
1219         while (root->parent)
1220                 root = root->parent;
1221
1222         pci_bus_for_each_resource(root, res, i) {
1223                 if (res && res->flags & (IORESOURCE_MEM | IORESOURCE_MEM_64) &&
1224                     res->start > 0x100000000ull)
1225                         break;
1226         }
1227
1228         /* Trying to resize is pointless without a root hub window above 4GB */
1229         if (!res)
1230                 return 0;
1231
1232         /* Limit the BAR size to what is available */
1233         rbar_size = min(fls(pci_rebar_get_possible_sizes(adev->pdev, 0)) - 1,
1234                         rbar_size);
1235
1236         /* Disable memory decoding while we change the BAR addresses and size */
1237         pci_read_config_word(adev->pdev, PCI_COMMAND, &cmd);
1238         pci_write_config_word(adev->pdev, PCI_COMMAND,
1239                               cmd & ~PCI_COMMAND_MEMORY);
1240
1241         /* Free the VRAM and doorbell BAR, we most likely need to move both. */
1242         amdgpu_device_doorbell_fini(adev);
1243         if (adev->asic_type >= CHIP_BONAIRE)
1244                 pci_release_resource(adev->pdev, 2);
1245
1246         pci_release_resource(adev->pdev, 0);
1247
1248         r = pci_resize_resource(adev->pdev, 0, rbar_size);
1249         if (r == -ENOSPC)
1250                 DRM_INFO("Not enough PCI address space for a large BAR.");
1251         else if (r && r != -ENOTSUPP)
1252                 DRM_ERROR("Problem resizing BAR0 (%d).", r);
1253
1254         pci_assign_unassigned_bus_resources(adev->pdev->bus);
1255
1256         /* When the doorbell or fb BAR isn't available we have no chance of
1257          * using the device.
1258          */
1259         r = amdgpu_device_doorbell_init(adev);
1260         if (r || (pci_resource_flags(adev->pdev, 0) & IORESOURCE_UNSET))
1261                 return -ENODEV;
1262
1263         pci_write_config_word(adev->pdev, PCI_COMMAND, cmd);
1264
1265         return 0;
1266 }
1267
1268 /*
1269  * GPU helper functions.
1270  */
1271 /**
1272  * amdgpu_device_need_post - check if the hw needs post or not
1273  *
1274  * @adev: amdgpu_device pointer
1275  *
1276  * Check if the asic has been initialized (all asics) at driver startup,
1277  * or if post is needed because a hw reset was performed.
1278  * Returns true if post is needed, false if not.
1279  */
1280 bool amdgpu_device_need_post(struct amdgpu_device *adev)
1281 {
1282         uint32_t reg;
1283
1284         if (amdgpu_sriov_vf(adev))
1285                 return false;
1286
1287         if (amdgpu_passthrough(adev)) {
1288                 /* for FIJI: in the whole GPU pass-through virtualization case, after a VM
1289                  * reboot some old SMC firmware still needs the driver to do a vPost,
1290                  * otherwise the GPU hangs. SMC firmware versions above 22.15 don't have
1291                  * this flaw, so force vPost for SMC versions below 22.15.
1292                  */
1293                 if (adev->asic_type == CHIP_FIJI) {
1294                         int err;
1295                         uint32_t fw_ver;
1296                         err = request_firmware(&adev->pm.fw, "amdgpu/fiji_smc.bin", adev->dev);
1297                         /* force vPost if error occurred */
1298                         if (err)
1299                                 return true;
1300
1301                         fw_ver = *((uint32_t *)adev->pm.fw->data + 69);
1302                         if (fw_ver < 0x00160e00)
1303                                 return true;
1304                 }
1305         }
1306
1307         /* Don't post if we need to reset whole hive on init */
1308         if (adev->gmc.xgmi.pending_reset)
1309                 return false;
1310
1311         if (adev->has_hw_reset) {
1312                 adev->has_hw_reset = false;
1313                 return true;
1314         }
1315
1316         /* bios scratch used on CIK+ */
1317         if (adev->asic_type >= CHIP_BONAIRE)
1318                 return amdgpu_atombios_scratch_need_asic_init(adev);
1319
1320         /* check MEM_SIZE for older asics */
1321         reg = amdgpu_asic_get_config_memsize(adev);
1322
1323         if ((reg != 0) && (reg != 0xffffffff))
1324                 return false;
1325
1326         return true;
1327 }
1328
1329 /**
1330  * amdgpu_device_should_use_aspm - check if the device should program ASPM
1331  *
1332  * @adev: amdgpu_device pointer
1333  *
1334  * Confirm whether the module parameter and pcie bridge agree that ASPM should
1335  * be set for this device.
1336  *
1337  * Returns true if it should be used or false if not.
1338  */
1339 bool amdgpu_device_should_use_aspm(struct amdgpu_device *adev)
1340 {
1341         switch (amdgpu_aspm) {
1342         case -1:
1343                 break;
1344         case 0:
1345                 return false;
1346         case 1:
1347                 return true;
1348         default:
1349                 return false;
1350         }
1351         return pcie_aspm_enabled(adev->pdev);
1352 }
1353
1354 /* if we get transitioned to only one device, take VGA back */
1355 /**
1356  * amdgpu_device_vga_set_decode - enable/disable vga decode
1357  *
1358  * @pdev: PCI device pointer
1359  * @state: enable/disable vga decode
1360  *
1361  * Enable/disable vga decode (all asics).
1362  * Returns VGA resource flags.
1363  */
1364 static unsigned int amdgpu_device_vga_set_decode(struct pci_dev *pdev,
1365                 bool state)
1366 {
1367         struct amdgpu_device *adev = drm_to_adev(pci_get_drvdata(pdev));
1368         amdgpu_asic_set_vga_state(adev, state);
1369         if (state)
1370                 return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
1371                        VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1372         else
1373                 return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1374 }
1375
1376 /**
1377  * amdgpu_device_check_block_size - validate the vm block size
1378  *
1379  * @adev: amdgpu_device pointer
1380  *
1381  * Validates the vm block size specified via module parameter.
1382  * The vm block size defines the number of bits in the page table versus the page directory;
1383  * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
1384  * page table and the remaining bits are in the page directory.
1385  */
1386 static void amdgpu_device_check_block_size(struct amdgpu_device *adev)
1387 {
1388         /* defines number of bits in page table versus page directory,
1389          * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
1390          * page table and the remaining bits are in the page directory */
1391         if (amdgpu_vm_block_size == -1)
1392                 return;
1393
1394         if (amdgpu_vm_block_size < 9) {
1395                 dev_warn(adev->dev, "VM page table size (%d) too small\n",
1396                          amdgpu_vm_block_size);
1397                 amdgpu_vm_block_size = -1;
1398         }
1399 }
1400
1401 /**
1402  * amdgpu_device_check_vm_size - validate the vm size
1403  *
1404  * @adev: amdgpu_device pointer
1405  *
1406  * Validates the vm size in GB specified via module parameter.
1407  * The VM size is the size of the GPU virtual memory space in GB.
1408  */
1409 static void amdgpu_device_check_vm_size(struct amdgpu_device *adev)
1410 {
1411         /* no need to check the default value */
1412         if (amdgpu_vm_size == -1)
1413                 return;
1414
1415         if (amdgpu_vm_size < 1) {
1416                 dev_warn(adev->dev, "VM size (%d) too small, min is 1GB\n",
1417                          amdgpu_vm_size);
1418                 amdgpu_vm_size = -1;
1419         }
1420 }
1421
1422 static void amdgpu_device_check_smu_prv_buffer_size(struct amdgpu_device *adev)
1423 {
1424         struct sysinfo si;
1425         bool is_os_64 = (sizeof(void *) == 8);
1426         uint64_t total_memory;
1427         uint64_t dram_size_seven_GB = 0x1B8000000;
1428         uint64_t dram_size_three_GB = 0xB8000000;
1429
1430         if (amdgpu_smu_memory_pool_size == 0)
1431                 return;
1432
1433         if (!is_os_64) {
1434                 DRM_WARN("Not 64-bit OS, feature not supported\n");
1435                 goto def_value;
1436         }
1437         si_meminfo(&si);
1438         total_memory = (uint64_t)si.totalram * si.mem_unit;
1439
1440         if ((amdgpu_smu_memory_pool_size == 1) ||
1441                 (amdgpu_smu_memory_pool_size == 2)) {
1442                 if (total_memory < dram_size_three_GB)
1443                         goto def_value1;
1444         } else if ((amdgpu_smu_memory_pool_size == 4) ||
1445                 (amdgpu_smu_memory_pool_size == 8)) {
1446                 if (total_memory < dram_size_seven_GB)
1447                         goto def_value1;
1448         } else {
1449                 DRM_WARN("Smu memory pool size not supported\n");
1450                 goto def_value;
1451         }
1452         adev->pm.smu_prv_buffer_size = amdgpu_smu_memory_pool_size << 28;
1453
1454         return;
1455
1456 def_value1:
1457         DRM_WARN("Not enough system memory\n");
1458 def_value:
1459         adev->pm.smu_prv_buffer_size = 0;
1460 }
1461
1462 static int amdgpu_device_init_apu_flags(struct amdgpu_device *adev)
1463 {
1464         if (!(adev->flags & AMD_IS_APU) ||
1465             adev->asic_type < CHIP_RAVEN)
1466                 return 0;
1467
1468         switch (adev->asic_type) {
1469         case CHIP_RAVEN:
1470                 if (adev->pdev->device == 0x15dd)
1471                         adev->apu_flags |= AMD_APU_IS_RAVEN;
1472                 if (adev->pdev->device == 0x15d8)
1473                         adev->apu_flags |= AMD_APU_IS_PICASSO;
1474                 break;
1475         case CHIP_RENOIR:
1476                 if ((adev->pdev->device == 0x1636) ||
1477                     (adev->pdev->device == 0x164c))
1478                         adev->apu_flags |= AMD_APU_IS_RENOIR;
1479                 else
1480                         adev->apu_flags |= AMD_APU_IS_GREEN_SARDINE;
1481                 break;
1482         case CHIP_VANGOGH:
1483                 adev->apu_flags |= AMD_APU_IS_VANGOGH;
1484                 break;
1485         case CHIP_YELLOW_CARP:
1486                 break;
1487         case CHIP_CYAN_SKILLFISH:
1488                 if ((adev->pdev->device == 0x13FE) ||
1489                     (adev->pdev->device == 0x143F))
1490                         adev->apu_flags |= AMD_APU_IS_CYAN_SKILLFISH2;
1491                 break;
1492         default:
1493                 break;
1494         }
1495
1496         return 0;
1497 }
1498
1499 /**
1500  * amdgpu_device_check_arguments - validate module params
1501  *
1502  * @adev: amdgpu_device pointer
1503  *
1504  * Validates certain module parameters and updates
1505  * the associated values used by the driver (all asics).
1506  */
1507 static int amdgpu_device_check_arguments(struct amdgpu_device *adev)
1508 {
1509         if (amdgpu_sched_jobs < 4) {
1510                 dev_warn(adev->dev, "sched jobs (%d) must be at least 4\n",
1511                          amdgpu_sched_jobs);
1512                 amdgpu_sched_jobs = 4;
1513         } else if (!is_power_of_2(amdgpu_sched_jobs)) {
1514                 dev_warn(adev->dev, "sched jobs (%d) must be a power of 2\n",
1515                          amdgpu_sched_jobs);
1516                 amdgpu_sched_jobs = roundup_pow_of_two(amdgpu_sched_jobs);
1517         }
1518
1519         if (amdgpu_gart_size != -1 && amdgpu_gart_size < 32) {
1520                 /* gart size must be greater or equal to 32M */
1521                 dev_warn(adev->dev, "gart size (%d) too small\n",
1522                          amdgpu_gart_size);
1523                 amdgpu_gart_size = -1;
1524         }
1525
1526         if (amdgpu_gtt_size != -1 && amdgpu_gtt_size < 32) {
1527                 /* gtt size must be greater or equal to 32M */
1528                 dev_warn(adev->dev, "gtt size (%d) too small\n",
1529                                  amdgpu_gtt_size);
1530                 amdgpu_gtt_size = -1;
1531         }
1532
1533         /* valid range is between 4 and 9 inclusive */
1534         if (amdgpu_vm_fragment_size != -1 &&
1535             (amdgpu_vm_fragment_size > 9 || amdgpu_vm_fragment_size < 4)) {
1536                 dev_warn(adev->dev, "valid range is between 4 and 9\n");
1537                 amdgpu_vm_fragment_size = -1;
1538         }
1539
1540         if (amdgpu_sched_hw_submission < 2) {
1541                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be at least 2\n",
1542                          amdgpu_sched_hw_submission);
1543                 amdgpu_sched_hw_submission = 2;
1544         } else if (!is_power_of_2(amdgpu_sched_hw_submission)) {
1545                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be a power of 2\n",
1546                          amdgpu_sched_hw_submission);
1547                 amdgpu_sched_hw_submission = roundup_pow_of_two(amdgpu_sched_hw_submission);
1548         }
1549
1550         if (amdgpu_reset_method < -1 || amdgpu_reset_method > 4) {
1551                 dev_warn(adev->dev, "invalid option for reset method, reverting to default\n");
1552                 amdgpu_reset_method = -1;
1553         }
1554
1555         amdgpu_device_check_smu_prv_buffer_size(adev);
1556
1557         amdgpu_device_check_vm_size(adev);
1558
1559         amdgpu_device_check_block_size(adev);
1560
1561         adev->firmware.load_type = amdgpu_ucode_get_load_type(adev, amdgpu_fw_load_type);
1562
1563         return 0;
1564 }
1565
1566 /**
1567  * amdgpu_switcheroo_set_state - set switcheroo state
1568  *
1569  * @pdev: pci dev pointer
1570  * @state: vga_switcheroo state
1571  *
1572  * Callback for the switcheroo driver.  Suspends or resumes the
1573  * asics before or after it is powered up using ACPI methods.
1574  */
1575 static void amdgpu_switcheroo_set_state(struct pci_dev *pdev,
1576                                         enum vga_switcheroo_state state)
1577 {
1578         struct drm_device *dev = pci_get_drvdata(pdev);
1579         int r;
1580
1581         if (amdgpu_device_supports_px(dev) && state == VGA_SWITCHEROO_OFF)
1582                 return;
1583
1584         if (state == VGA_SWITCHEROO_ON) {
1585                 pr_info("switched on\n");
1586                 /* don't suspend or resume card normally */
1587                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
1588
1589                 pci_set_power_state(pdev, PCI_D0);
1590                 amdgpu_device_load_pci_state(pdev);
1591                 r = pci_enable_device(pdev);
1592                 if (r)
1593                         DRM_WARN("pci_enable_device failed (%d)\n", r);
1594                 amdgpu_device_resume(dev, true);
1595
1596                 dev->switch_power_state = DRM_SWITCH_POWER_ON;
1597         } else {
1598                 pr_info("switched off\n");
1599                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
1600                 amdgpu_device_suspend(dev, true);
1601                 amdgpu_device_cache_pci_state(pdev);
1602                 /* Shut down the device */
1603                 pci_disable_device(pdev);
1604                 pci_set_power_state(pdev, PCI_D3cold);
1605                 dev->switch_power_state = DRM_SWITCH_POWER_OFF;
1606         }
1607 }
1608
1609 /**
1610  * amdgpu_switcheroo_can_switch - see if switcheroo state can change
1611  *
1612  * @pdev: pci dev pointer
1613  *
1614  * Callback for the switcheroo driver.  Checks whether the switcheroo
1615  * state can be changed.
1616  * Returns true if the state can be changed, false if not.
1617  */
1618 static bool amdgpu_switcheroo_can_switch(struct pci_dev *pdev)
1619 {
1620         struct drm_device *dev = pci_get_drvdata(pdev);
1621
1622         /*
1623          * FIXME: open_count is protected by drm_global_mutex but that would lead to
1624          * locking inversion with the driver load path. And the access here is
1625          * completely racy anyway. So don't bother with locking for now.
1626          */
1627         return atomic_read(&dev->open_count) == 0;
1628 }
1629
1630 static const struct vga_switcheroo_client_ops amdgpu_switcheroo_ops = {
1631         .set_gpu_state = amdgpu_switcheroo_set_state,
1632         .reprobe = NULL,
1633         .can_switch = amdgpu_switcheroo_can_switch,
1634 };
1635
1636 /**
1637  * amdgpu_device_ip_set_clockgating_state - set the CG state
1638  *
1639  * @dev: amdgpu_device pointer
1640  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1641  * @state: clockgating state (gate or ungate)
1642  *
1643  * Sets the requested clockgating state for all instances of
1644  * the hardware IP specified.
1645  * Returns the error code from the last instance.
1646  */
1647 int amdgpu_device_ip_set_clockgating_state(void *dev,
1648                                            enum amd_ip_block_type block_type,
1649                                            enum amd_clockgating_state state)
1650 {
1651         struct amdgpu_device *adev = dev;
1652         int i, r = 0;
1653
1654         for (i = 0; i < adev->num_ip_blocks; i++) {
1655                 if (!adev->ip_blocks[i].status.valid)
1656                         continue;
1657                 if (adev->ip_blocks[i].version->type != block_type)
1658                         continue;
1659                 if (!adev->ip_blocks[i].version->funcs->set_clockgating_state)
1660                         continue;
1661                 r = adev->ip_blocks[i].version->funcs->set_clockgating_state(
1662                         (void *)adev, state);
1663                 if (r)
1664                         DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
1665                                   adev->ip_blocks[i].version->funcs->name, r);
1666         }
1667         return r;
1668 }
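
/*
 * A typical caller toggles gating around a power-sensitive operation; a
 * minimal usage sketch (assuming @adev points at a fully initialized
 * device) might look like:
 *
 *     r = amdgpu_device_ip_set_clockgating_state(adev,
 *                                                AMD_IP_BLOCK_TYPE_UVD,
 *                                                AMD_CG_STATE_GATE);
 *     if (r)
 *             dev_warn(adev->dev, "failed to gate UVD clocks (%d)\n", r);
 *
 * As noted above, only the status of the last matching IP instance is
 * returned.
 */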
1669
1670 /**
1671  * amdgpu_device_ip_set_powergating_state - set the PG state
1672  *
1673  * @dev: amdgpu_device pointer
1674  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1675  * @state: powergating state (gate or ungate)
1676  *
1677  * Sets the requested powergating state for all instances of
1678  * the hardware IP specified.
1679  * Returns the error code from the last instance.
1680  */
1681 int amdgpu_device_ip_set_powergating_state(void *dev,
1682                                            enum amd_ip_block_type block_type,
1683                                            enum amd_powergating_state state)
1684 {
1685         struct amdgpu_device *adev = dev;
1686         int i, r = 0;
1687
1688         for (i = 0; i < adev->num_ip_blocks; i++) {
1689                 if (!adev->ip_blocks[i].status.valid)
1690                         continue;
1691                 if (adev->ip_blocks[i].version->type != block_type)
1692                         continue;
1693                 if (!adev->ip_blocks[i].version->funcs->set_powergating_state)
1694                         continue;
1695                 r = adev->ip_blocks[i].version->funcs->set_powergating_state(
1696                         (void *)adev, state);
1697                 if (r)
1698                         DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
1699                                   adev->ip_blocks[i].version->funcs->name, r);
1700         }
1701         return r;
1702 }
1703
1704 /**
1705  * amdgpu_device_ip_get_clockgating_state - get the CG state
1706  *
1707  * @adev: amdgpu_device pointer
1708  * @flags: clockgating feature flags
1709  *
1710  * Walks the list of IPs on the device and updates the clockgating
1711  * flags for each IP.
1712  * Updates @flags with the feature flags for each hardware IP where
1713  * clockgating is enabled.
1714  */
1715 void amdgpu_device_ip_get_clockgating_state(struct amdgpu_device *adev,
1716                                             u64 *flags)
1717 {
1718         int i;
1719
1720         for (i = 0; i < adev->num_ip_blocks; i++) {
1721                 if (!adev->ip_blocks[i].status.valid)
1722                         continue;
1723                 if (adev->ip_blocks[i].version->funcs->get_clockgating_state)
1724                         adev->ip_blocks[i].version->funcs->get_clockgating_state((void *)adev, flags);
1725         }
1726 }
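
/*
 * A debugfs-style consumer can query the aggregated flags; a sketch
 * (AMD_CG_SUPPORT_GFX_MGCG is one of the AMD_CG_SUPPORT_* feature bits
 * from amd_shared.h):
 *
 *     u64 flags = 0;
 *
 *     amdgpu_device_ip_get_clockgating_state(adev, &flags);
 *     if (flags & AMD_CG_SUPPORT_GFX_MGCG)
 *             drm_dbg(adev_to_drm(adev), "GFX MGCG enabled\n");
 */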
1727
1728 /**
1729  * amdgpu_device_ip_wait_for_idle - wait for idle
1730  *
1731  * @adev: amdgpu_device pointer
1732  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1733  *
1734  * Waits for the requested hardware IP to be idle.
1735  * Returns 0 for success or a negative error code on failure.
1736  */
1737 int amdgpu_device_ip_wait_for_idle(struct amdgpu_device *adev,
1738                                    enum amd_ip_block_type block_type)
1739 {
1740         int i, r;
1741
1742         for (i = 0; i < adev->num_ip_blocks; i++) {
1743                 if (!adev->ip_blocks[i].status.valid)
1744                         continue;
1745                 if (adev->ip_blocks[i].version->type == block_type) {
1746                         r = adev->ip_blocks[i].version->funcs->wait_for_idle((void *)adev);
1747                         if (r)
1748                                 return r;
1749                         break;
1750                 }
1751         }
1752         return 0;
1754 }
1755
1756 /**
1757  * amdgpu_device_ip_is_idle - is the hardware IP idle
1758  *
1759  * @adev: amdgpu_device pointer
1760  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1761  *
1762  * Checks if the hardware IP is idle or not.
1763  * Returns true if the IP is idle, false if not.
1764  */
1765 bool amdgpu_device_ip_is_idle(struct amdgpu_device *adev,
1766                               enum amd_ip_block_type block_type)
1767 {
1768         int i;
1769
1770         for (i = 0; i < adev->num_ip_blocks; i++) {
1771                 if (!adev->ip_blocks[i].status.valid)
1772                         continue;
1773                 if (adev->ip_blocks[i].version->type == block_type)
1774                         return adev->ip_blocks[i].version->funcs->is_idle((void *)adev);
1775         }
1776         return true;
1778 }
1779
1780 /**
1781  * amdgpu_device_ip_get_ip_block - get a hw IP pointer
1782  *
1783  * @adev: amdgpu_device pointer
1784  * @type: Type of hardware IP (SMU, GFX, UVD, etc.)
1785  *
1786  * Returns a pointer to the hardware IP block structure
1787  * if it exists for the asic, otherwise NULL.
1788  */
1789 struct amdgpu_ip_block *
1790 amdgpu_device_ip_get_ip_block(struct amdgpu_device *adev,
1791                               enum amd_ip_block_type type)
1792 {
1793         int i;
1794
1795         for (i = 0; i < adev->num_ip_blocks; i++)
1796                 if (adev->ip_blocks[i].version->type == type)
1797                         return &adev->ip_blocks[i];
1798
1799         return NULL;
1800 }
1801
1802 /**
1803  * amdgpu_device_ip_block_version_cmp
1804  *
1805  * @adev: amdgpu_device pointer
1806  * @type: enum amd_ip_block_type
1807  * @major: major version
1808  * @minor: minor version
1809  *
1810  * Returns 0 if the IP block version is equal to or greater than the
1811  * requested version, 1 if it is smaller or the IP block doesn't exist.
1812  */
1813 int amdgpu_device_ip_block_version_cmp(struct amdgpu_device *adev,
1814                                        enum amd_ip_block_type type,
1815                                        u32 major, u32 minor)
1816 {
1817         struct amdgpu_ip_block *ip_block = amdgpu_device_ip_get_ip_block(adev, type);
1818
1819         if (ip_block && ((ip_block->version->major > major) ||
1820                         ((ip_block->version->major == major) &&
1821                         (ip_block->version->minor >= minor))))
1822                 return 0;
1823
1824         return 1;
1825 }
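
/*
 * Together with amdgpu_device_ip_get_ip_block() this enables
 * version-gated code paths; an illustrative sketch:
 *
 *     if (amdgpu_device_ip_block_version_cmp(adev,
 *                     AMD_IP_BLOCK_TYPE_GFX, 9, 0) == 0) {
 *             ...GFX v9.0-or-newer path...
 *     }
 *
 * Note the inverted convention: 0 means the block is at least the
 * requested version.
 */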
1826
1827 /**
1828  * amdgpu_device_ip_block_add
1829  *
1830  * @adev: amdgpu_device pointer
1831  * @ip_block_version: pointer to the IP to add
1832  *
1833  * Adds the IP block driver information to the collection of IPs
1834  * on the asic.
1835  */
1836 int amdgpu_device_ip_block_add(struct amdgpu_device *adev,
1837                                const struct amdgpu_ip_block_version *ip_block_version)
1838 {
1839         if (!ip_block_version)
1840                 return -EINVAL;
1841
1842         switch (ip_block_version->type) {
1843         case AMD_IP_BLOCK_TYPE_VCN:
1844                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_VCN_MASK)
1845                         return 0;
1846                 break;
1847         case AMD_IP_BLOCK_TYPE_JPEG:
1848                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_JPEG_MASK)
1849                         return 0;
1850                 break;
1851         default:
1852                 break;
1853         }
1854
1855         DRM_INFO("add ip block number %d <%s>\n", adev->num_ip_blocks,
1856                   ip_block_version->funcs->name);
1857
1858         adev->ip_blocks[adev->num_ip_blocks++].version = ip_block_version;
1859
1860         return 0;
1861 }
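
/*
 * The per-ASIC setup code registers its IP blocks with this helper in
 * dependency order; a sketch of the pattern, using block names from the
 * VI code path (see vi_set_ip_blocks() in vi.c):
 *
 *     amdgpu_device_ip_block_add(adev, &vi_common_ip_block);
 *     amdgpu_device_ip_block_add(adev, &gmc_v8_0_ip_block);
 *     ...followed by the IH, SMU, GFX, SDMA and multimedia blocks...
 */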
1862
1863 /**
1864  * amdgpu_device_enable_virtual_display - enable virtual display feature
1865  *
1866  * @adev: amdgpu_device pointer
1867  *
1868  * Enables the virtual display feature if the user has enabled it via
1869  * the module parameter virtual_display.  This feature provides virtual
1870  * display hardware on headless boards or in virtualized environments.
1871  * This function parses and validates the configuration string specified by
1872  * the user and applies the virtual display configuration (number of
1873  * virtual connectors, crtcs, etc.) specified.
1874  */
1875 static void amdgpu_device_enable_virtual_display(struct amdgpu_device *adev)
1876 {
1877         adev->enable_virtual_display = false;
1878
1879         if (amdgpu_virtual_display) {
1880                 const char *pci_address_name = pci_name(adev->pdev);
1881                 char *pciaddstr, *pciaddstr_tmp, *pciaddname_tmp, *pciaddname;
1882
1883                 pciaddstr = kstrdup(amdgpu_virtual_display, GFP_KERNEL);
1884                 pciaddstr_tmp = pciaddstr;
1885                 while ((pciaddname_tmp = strsep(&pciaddstr_tmp, ";"))) {
1886                         pciaddname = strsep(&pciaddname_tmp, ",");
1887                         if (!strcmp("all", pciaddname) ||
1888                             !strcmp(pci_address_name, pciaddname)) {
1889                                 long num_crtc;
1890                                 int res = -1;
1891
1892                                 adev->enable_virtual_display = true;
1893
1894                                 if (pciaddname_tmp)
1895                                         res = kstrtol(pciaddname_tmp, 10,
1896                                                       &num_crtc);
1897
1898                                 if (!res) {
1899                                         if (num_crtc < 1)
1900                                                 num_crtc = 1;
1901                                         if (num_crtc > 6)
1902                                                 num_crtc = 6;
1903                                         adev->mode_info.num_crtc = num_crtc;
1904                                 } else {
1905                                         adev->mode_info.num_crtc = 1;
1906                                 }
1907                                 break;
1908                         }
1909                 }
1910
1911                 DRM_INFO("virtual display string:%s, %s:virtual_display:%d, num_crtc:%d\n",
1912                          amdgpu_virtual_display, pci_address_name,
1913                          adev->enable_virtual_display, adev->mode_info.num_crtc);
1914
1915                 kfree(pciaddstr);
1916         }
1917 }
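
/*
 * The string parsed above comes from the amdgpu.virtual_display module
 * parameter: a semicolon-separated list of PCI addresses, each with an
 * optional CRTC count (clamped to 1..6 above). For example (the address
 * is only an illustration):
 *
 *     amdgpu.virtual_display=0000:03:00.0,2
 *
 * enables two virtual CRTCs on that device, while
 *
 *     amdgpu.virtual_display=all
 *
 * enables the feature with one CRTC on every amdgpu device.
 */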
1918
1919 /**
1920  * amdgpu_device_parse_gpu_info_fw - parse gpu info firmware
1921  *
1922  * @adev: amdgpu_device pointer
1923  *
1924  * Parses the asic configuration parameters specified in the gpu info
1925  * firmware and makes them available to the driver for use in configuring
1926  * the asic.
1927  * Returns 0 on success, -EINVAL on failure.
1928  */
1929 static int amdgpu_device_parse_gpu_info_fw(struct amdgpu_device *adev)
1930 {
1931         const char *chip_name;
1932         char fw_name[40];
1933         int err;
1934         const struct gpu_info_firmware_header_v1_0 *hdr;
1935
1936         adev->firmware.gpu_info_fw = NULL;
1937
1938         if (adev->mman.discovery_bin) {
1939                 /*
1940                  * FIXME: The bounding box is still needed by Navi12, so
1941                  * temporarily read it from gpu_info firmware. Should be dropped
1942                  * when DAL no longer needs it.
1943                  */
1944                 if (adev->asic_type != CHIP_NAVI12)
1945                         return 0;
1946         }
1947
1948         switch (adev->asic_type) {
1949         default:
1950                 return 0;
1951         case CHIP_VEGA10:
1952                 chip_name = "vega10";
1953                 break;
1954         case CHIP_VEGA12:
1955                 chip_name = "vega12";
1956                 break;
1957         case CHIP_RAVEN:
1958                 if (adev->apu_flags & AMD_APU_IS_RAVEN2)
1959                         chip_name = "raven2";
1960                 else if (adev->apu_flags & AMD_APU_IS_PICASSO)
1961                         chip_name = "picasso";
1962                 else
1963                         chip_name = "raven";
1964                 break;
1965         case CHIP_ARCTURUS:
1966                 chip_name = "arcturus";
1967                 break;
1968         case CHIP_NAVI12:
1969                 chip_name = "navi12";
1970                 break;
1971         }
1972
1973         snprintf(fw_name, sizeof(fw_name), "amdgpu/%s_gpu_info.bin", chip_name);
1974         err = request_firmware(&adev->firmware.gpu_info_fw, fw_name, adev->dev);
1975         if (err) {
1976                 dev_err(adev->dev,
1977                         "Failed to load gpu_info firmware \"%s\"\n",
1978                         fw_name);
1979                 goto out;
1980         }
1981         err = amdgpu_ucode_validate(adev->firmware.gpu_info_fw);
1982         if (err) {
1983                 dev_err(adev->dev,
1984                         "Failed to validate gpu_info firmware \"%s\"\n",
1985                         fw_name);
1986                 goto out;
1987         }
1988
1989         hdr = (const struct gpu_info_firmware_header_v1_0 *)adev->firmware.gpu_info_fw->data;
1990         amdgpu_ucode_print_gpu_info_hdr(&hdr->header);
1991
1992         switch (hdr->version_major) {
1993         case 1:
1994         {
1995                 const struct gpu_info_firmware_v1_0 *gpu_info_fw =
1996                         (const struct gpu_info_firmware_v1_0 *)(adev->firmware.gpu_info_fw->data +
1997                                                                 le32_to_cpu(hdr->header.ucode_array_offset_bytes));
1998
1999                 /*
2000                  * Should be dropped when DAL no longer needs it.
2001                  */
2002                 if (adev->asic_type == CHIP_NAVI12)
2003                         goto parse_soc_bounding_box;
2004
2005                 adev->gfx.config.max_shader_engines = le32_to_cpu(gpu_info_fw->gc_num_se);
2006                 adev->gfx.config.max_cu_per_sh = le32_to_cpu(gpu_info_fw->gc_num_cu_per_sh);
2007                 adev->gfx.config.max_sh_per_se = le32_to_cpu(gpu_info_fw->gc_num_sh_per_se);
2008                 adev->gfx.config.max_backends_per_se = le32_to_cpu(gpu_info_fw->gc_num_rb_per_se);
2009                 adev->gfx.config.max_texture_channel_caches =
2010                         le32_to_cpu(gpu_info_fw->gc_num_tccs);
2011                 adev->gfx.config.max_gprs = le32_to_cpu(gpu_info_fw->gc_num_gprs);
2012                 adev->gfx.config.max_gs_threads = le32_to_cpu(gpu_info_fw->gc_num_max_gs_thds);
2013                 adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gpu_info_fw->gc_gs_table_depth);
2014                 adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gpu_info_fw->gc_gsprim_buff_depth);
2015                 adev->gfx.config.double_offchip_lds_buf =
2016                         le32_to_cpu(gpu_info_fw->gc_double_offchip_lds_buffer);
2017                 adev->gfx.cu_info.wave_front_size = le32_to_cpu(gpu_info_fw->gc_wave_size);
2018                 adev->gfx.cu_info.max_waves_per_simd =
2019                         le32_to_cpu(gpu_info_fw->gc_max_waves_per_simd);
2020                 adev->gfx.cu_info.max_scratch_slots_per_cu =
2021                         le32_to_cpu(gpu_info_fw->gc_max_scratch_slots_per_cu);
2022                 adev->gfx.cu_info.lds_size = le32_to_cpu(gpu_info_fw->gc_lds_size);
2023                 if (hdr->version_minor >= 1) {
2024                         const struct gpu_info_firmware_v1_1 *gpu_info_fw =
2025                                 (const struct gpu_info_firmware_v1_1 *)(adev->firmware.gpu_info_fw->data +
2026                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2027                         adev->gfx.config.num_sc_per_sh =
2028                                 le32_to_cpu(gpu_info_fw->num_sc_per_sh);
2029                         adev->gfx.config.num_packer_per_sc =
2030                                 le32_to_cpu(gpu_info_fw->num_packer_per_sc);
2031                 }
2032
2033 parse_soc_bounding_box:
2034                 /*
2035                  * soc bounding box info is not integrated into the discovery table,
2036                  * so it always needs to be parsed from the gpu info firmware when needed.
2037                  */
2038                 if (hdr->version_minor == 2) {
2039                         const struct gpu_info_firmware_v1_2 *gpu_info_fw =
2040                                 (const struct gpu_info_firmware_v1_2 *)(adev->firmware.gpu_info_fw->data +
2041                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2042                         adev->dm.soc_bounding_box = &gpu_info_fw->soc_bounding_box;
2043                 }
2044                 break;
2045         }
2046         default:
2047                 dev_err(adev->dev,
2048                         "Unsupported gpu_info table %d\n", hdr->header.ucode_version);
2049                 err = -EINVAL;
2050                 goto out;
2051         }
2052 out:
2053         return err;
2054 }
2055
2056 /**
2057  * amdgpu_device_ip_early_init - run early init for hardware IPs
2058  *
2059  * @adev: amdgpu_device pointer
2060  *
2061  * Early initialization pass for hardware IPs.  The hardware IPs that make
2062  * up each asic are discovered and each IP's early_init callback is run.  This
2063  * is the first stage in initializing the asic.
2064  * Returns 0 on success, negative error code on failure.
2065  */
2066 static int amdgpu_device_ip_early_init(struct amdgpu_device *adev)
2067 {
2068         struct drm_device *dev = adev_to_drm(adev);
2069         struct pci_dev *parent;
2070         int i, r;
2071
2072         amdgpu_device_enable_virtual_display(adev);
2073
2074         if (amdgpu_sriov_vf(adev)) {
2075                 r = amdgpu_virt_request_full_gpu(adev, true);
2076                 if (r)
2077                         return r;
2078         }
2079
2080         switch (adev->asic_type) {
2081 #ifdef CONFIG_DRM_AMDGPU_SI
2082         case CHIP_VERDE:
2083         case CHIP_TAHITI:
2084         case CHIP_PITCAIRN:
2085         case CHIP_OLAND:
2086         case CHIP_HAINAN:
2087                 adev->family = AMDGPU_FAMILY_SI;
2088                 r = si_set_ip_blocks(adev);
2089                 if (r)
2090                         return r;
2091                 break;
2092 #endif
2093 #ifdef CONFIG_DRM_AMDGPU_CIK
2094         case CHIP_BONAIRE:
2095         case CHIP_HAWAII:
2096         case CHIP_KAVERI:
2097         case CHIP_KABINI:
2098         case CHIP_MULLINS:
2099                 if (adev->flags & AMD_IS_APU)
2100                         adev->family = AMDGPU_FAMILY_KV;
2101                 else
2102                         adev->family = AMDGPU_FAMILY_CI;
2103
2104                 r = cik_set_ip_blocks(adev);
2105                 if (r)
2106                         return r;
2107                 break;
2108 #endif
2109         case CHIP_TOPAZ:
2110         case CHIP_TONGA:
2111         case CHIP_FIJI:
2112         case CHIP_POLARIS10:
2113         case CHIP_POLARIS11:
2114         case CHIP_POLARIS12:
2115         case CHIP_VEGAM:
2116         case CHIP_CARRIZO:
2117         case CHIP_STONEY:
2118                 if (adev->flags & AMD_IS_APU)
2119                         adev->family = AMDGPU_FAMILY_CZ;
2120                 else
2121                         adev->family = AMDGPU_FAMILY_VI;
2122
2123                 r = vi_set_ip_blocks(adev);
2124                 if (r)
2125                         return r;
2126                 break;
2127         default:
2128                 r = amdgpu_discovery_set_ip_blocks(adev);
2129                 if (r)
2130                         return r;
2131                 break;
2132         }
2133
2134         if (amdgpu_has_atpx() &&
2135             (amdgpu_is_atpx_hybrid() ||
2136              amdgpu_has_atpx_dgpu_power_cntl()) &&
2137             ((adev->flags & AMD_IS_APU) == 0) &&
2138             !pci_is_thunderbolt_attached(to_pci_dev(dev->dev)))
2139                 adev->flags |= AMD_IS_PX;
2140
2141         if (!(adev->flags & AMD_IS_APU)) {
2142                 parent = pci_upstream_bridge(adev->pdev);
2143                 adev->has_pr3 = parent ? pci_pr3_present(parent) : false;
2144         }
2145
2146         amdgpu_amdkfd_device_probe(adev);
2147
2148         adev->pm.pp_feature = amdgpu_pp_feature_mask;
2149         if (amdgpu_sriov_vf(adev) || sched_policy == KFD_SCHED_POLICY_NO_HWS)
2150                 adev->pm.pp_feature &= ~PP_GFXOFF_MASK;
2151         if (amdgpu_sriov_vf(adev) && adev->asic_type == CHIP_SIENNA_CICHLID)
2152                 adev->pm.pp_feature &= ~PP_OVERDRIVE_MASK;
2153
2154         for (i = 0; i < adev->num_ip_blocks; i++) {
2155                 if ((amdgpu_ip_block_mask & (1 << i)) == 0) {
2156                         DRM_ERROR("disabled ip block: %d <%s>\n",
2157                                   i, adev->ip_blocks[i].version->funcs->name);
2158                         adev->ip_blocks[i].status.valid = false;
2159                 } else {
2160                         if (adev->ip_blocks[i].version->funcs->early_init) {
2161                                 r = adev->ip_blocks[i].version->funcs->early_init((void *)adev);
2162                                 if (r == -ENOENT) {
2163                                         adev->ip_blocks[i].status.valid = false;
2164                                 } else if (r) {
2165                                         DRM_ERROR("early_init of IP block <%s> failed %d\n",
2166                                                   adev->ip_blocks[i].version->funcs->name, r);
2167                                         return r;
2168                                 } else {
2169                                         adev->ip_blocks[i].status.valid = true;
2170                                 }
2171                         } else {
2172                                 adev->ip_blocks[i].status.valid = true;
2173                         }
2174                 }
2175                 /* get the vbios after the asic_funcs are set up */
2176                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2177                         r = amdgpu_device_parse_gpu_info_fw(adev);
2178                         if (r)
2179                                 return r;
2180
2181                         /* Read BIOS */
2182                         if (!amdgpu_get_bios(adev))
2183                                 return -EINVAL;
2184
2185                         r = amdgpu_atombios_init(adev);
2186                         if (r) {
2187                                 dev_err(adev->dev, "amdgpu_atombios_init failed\n");
2188                                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_INIT_FAIL, 0, 0);
2189                                 return r;
2190                         }
2191
2192                         /* get pf2vf msg info at the earliest time */
2193                         if (amdgpu_sriov_vf(adev))
2194                                 amdgpu_virt_init_data_exchange(adev);
2195
2196                 }
2197         }
2198
2199         adev->cg_flags &= amdgpu_cg_mask;
2200         adev->pg_flags &= amdgpu_pg_mask;
2201
2202         return 0;
2203 }
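
/*
 * The amdgpu.ip_block_mask module parameter consulted above disables
 * individual IP blocks by index for debugging; the indices match the
 * "add ip block number" messages printed at probe time. For example,
 * clearing bit 4 (a hypothetical block index):
 *
 *     amdgpu.ip_block_mask=0xffffffef
 */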
2204
2205 static int amdgpu_device_ip_hw_init_phase1(struct amdgpu_device *adev)
2206 {
2207         int i, r;
2208
2209         for (i = 0; i < adev->num_ip_blocks; i++) {
2210                 if (!adev->ip_blocks[i].status.sw)
2211                         continue;
2212                 if (adev->ip_blocks[i].status.hw)
2213                         continue;
2214                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
2215                     (amdgpu_sriov_vf(adev) && (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)) ||
2216                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH) {
2217                         r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2218                         if (r) {
2219                                 DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2220                                           adev->ip_blocks[i].version->funcs->name, r);
2221                                 return r;
2222                         }
2223                         adev->ip_blocks[i].status.hw = true;
2224                 }
2225         }
2226
2227         return 0;
2228 }
2229
2230 static int amdgpu_device_ip_hw_init_phase2(struct amdgpu_device *adev)
2231 {
2232         int i, r;
2233
2234         for (i = 0; i < adev->num_ip_blocks; i++) {
2235                 if (!adev->ip_blocks[i].status.sw)
2236                         continue;
2237                 if (adev->ip_blocks[i].status.hw)
2238                         continue;
2239                 r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2240                 if (r) {
2241                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2242                                   adev->ip_blocks[i].version->funcs->name, r);
2243                         return r;
2244                 }
2245                 adev->ip_blocks[i].status.hw = true;
2246         }
2247
2248         return 0;
2249 }
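
/*
 * Note: hardware init is deliberately split in two phases (see
 * amdgpu_device_ip_init() below): phase 1 brings up the blocks everything
 * else depends on (COMMON and IH, plus PSP under SR-IOV), firmware is
 * then loaded via amdgpu_device_fw_loading(), and phase 2 initializes
 * the remaining blocks.
 */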
2250
2251 static int amdgpu_device_fw_loading(struct amdgpu_device *adev)
2252 {
2253         int r = 0;
2254         int i;
2255         uint32_t smu_version;
2256
2257         if (adev->asic_type >= CHIP_VEGA10) {
2258                 for (i = 0; i < adev->num_ip_blocks; i++) {
2259                         if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_PSP)
2260                                 continue;
2261
2262                         if (!adev->ip_blocks[i].status.sw)
2263                                 continue;
2264
2265                         /* no need to do the fw loading again if already done */
2266                         if (adev->ip_blocks[i].status.hw)
2267                                 break;
2268
2269                         if (amdgpu_in_reset(adev) || adev->in_suspend) {
2270                                 r = adev->ip_blocks[i].version->funcs->resume(adev);
2271                                 if (r) {
2272                                         DRM_ERROR("resume of IP block <%s> failed %d\n",
2273                                                           adev->ip_blocks[i].version->funcs->name, r);
2274                                         return r;
2275                                 }
2276                         } else {
2277                                 r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2278                                 if (r) {
2279                                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2280                                                           adev->ip_blocks[i].version->funcs->name, r);
2281                                         return r;
2282                                 }
2283                         }
2284
2285                         adev->ip_blocks[i].status.hw = true;
2286                         break;
2287                 }
2288         }
2289
2290         if (!amdgpu_sriov_vf(adev) || adev->asic_type == CHIP_TONGA)
2291                 r = amdgpu_pm_load_smu_firmware(adev, &smu_version);
2292
2293         return r;
2294 }
2295
2296 static int amdgpu_device_init_schedulers(struct amdgpu_device *adev)
2297 {
2298         long timeout;
2299         int r, i;
2300
2301         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2302                 struct amdgpu_ring *ring = adev->rings[i];
2303
2304                 /* No need to set up the GPU scheduler for rings that don't need it */
2305                 if (!ring || ring->no_scheduler)
2306                         continue;
2307
2308                 switch (ring->funcs->type) {
2309                 case AMDGPU_RING_TYPE_GFX:
2310                         timeout = adev->gfx_timeout;
2311                         break;
2312                 case AMDGPU_RING_TYPE_COMPUTE:
2313                         timeout = adev->compute_timeout;
2314                         break;
2315                 case AMDGPU_RING_TYPE_SDMA:
2316                         timeout = adev->sdma_timeout;
2317                         break;
2318                 default:
2319                         timeout = adev->video_timeout;
2320                         break;
2321                 }
2322
2323                 r = drm_sched_init(&ring->sched, &amdgpu_sched_ops,
2324                                    ring->num_hw_submission, amdgpu_job_hang_limit,
2325                                    timeout, adev->reset_domain->wq,
2326                                    ring->sched_score, ring->name,
2327                                    adev->dev);
2328                 if (r) {
2329                         DRM_ERROR("Failed to create scheduler on ring %s.\n",
2330                                   ring->name);
2331                         return r;
2332                 }
2333         }
2334
2335         return 0;
2336 }
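
/*
 * The per-ring timeouts selected above are derived from the
 * amdgpu.lockup_timeout module parameter (on bare metal, one value per
 * class in gfx,compute,sdma,video order). An illustrative setting:
 *
 *     amdgpu.lockup_timeout=10000,60000,10000,10000
 *
 * gives compute jobs 60 seconds and the other rings 10 seconds.
 */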
2337
2338
2339 /**
2340  * amdgpu_device_ip_init - run init for hardware IPs
2341  *
2342  * @adev: amdgpu_device pointer
2343  *
2344  * Main initialization pass for hardware IPs.  The list of all the hardware
2345  * IPs that make up the asic is walked and the sw_init and hw_init callbacks
2346  * are run.  sw_init initializes the software state associated with each IP
2347  * and hw_init initializes the hardware associated with each IP.
2348  * Returns 0 on success, negative error code on failure.
2349  */
2350 static int amdgpu_device_ip_init(struct amdgpu_device *adev)
2351 {
2352         int i, r;
2353
2354         r = amdgpu_ras_init(adev);
2355         if (r)
2356                 return r;
2357
2358         for (i = 0; i < adev->num_ip_blocks; i++) {
2359                 if (!adev->ip_blocks[i].status.valid)
2360                         continue;
2361                 r = adev->ip_blocks[i].version->funcs->sw_init((void *)adev);
2362                 if (r) {
2363                         DRM_ERROR("sw_init of IP block <%s> failed %d\n",
2364                                   adev->ip_blocks[i].version->funcs->name, r);
2365                         goto init_failed;
2366                 }
2367                 adev->ip_blocks[i].status.sw = true;
2368
2369                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2370                         /* need to do common hw init early so everything is set up for gmc */
2371                         r = adev->ip_blocks[i].version->funcs->hw_init((void *)adev);
2372                         if (r) {
2373                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2374                                 goto init_failed;
2375                         }
2376                         adev->ip_blocks[i].status.hw = true;
2377                 } else if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2378                         /* need to do gmc hw init early so we can allocate gpu mem */
2379                         /* Try to reserve bad pages early */
2380                         if (amdgpu_sriov_vf(adev))
2381                                 amdgpu_virt_exchange_data(adev);
2382
2383                         r = amdgpu_device_vram_scratch_init(adev);
2384                         if (r) {
2385                                 DRM_ERROR("amdgpu_vram_scratch_init failed %d\n", r);
2386                                 goto init_failed;
2387                         }
2388                         r = adev->ip_blocks[i].version->funcs->hw_init((void *)adev);
2389                         if (r) {
2390                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2391                                 goto init_failed;
2392                         }
2393                         r = amdgpu_device_wb_init(adev);
2394                         if (r) {
2395                                 DRM_ERROR("amdgpu_device_wb_init failed %d\n", r);
2396                                 goto init_failed;
2397                         }
2398                         adev->ip_blocks[i].status.hw = true;
2399
2400                         /* right after GMC hw init, we create CSA */
2401                         if (amdgpu_mcbp || amdgpu_sriov_vf(adev)) {
2402                                 r = amdgpu_allocate_static_csa(adev, &adev->virt.csa_obj,
2403                                                                 AMDGPU_GEM_DOMAIN_VRAM,
2404                                                                 AMDGPU_CSA_SIZE);
2405                                 if (r) {
2406                                         DRM_ERROR("allocate CSA failed %d\n", r);
2407                                         goto init_failed;
2408                                 }
2409                         }
2410                 }
2411         }
2412
2413         if (amdgpu_sriov_vf(adev))
2414                 amdgpu_virt_init_data_exchange(adev);
2415
2416         r = amdgpu_ib_pool_init(adev);
2417         if (r) {
2418                 dev_err(adev->dev, "IB initialization failed (%d).\n", r);
2419                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_IB_INIT_FAIL, 0, r);
2420                 goto init_failed;
2421         }
2422
2423         r = amdgpu_ucode_create_bo(adev); /* create ucode bo when sw_init completes */
2424         if (r)
2425                 goto init_failed;
2426
2427         r = amdgpu_device_ip_hw_init_phase1(adev);
2428         if (r)
2429                 goto init_failed;
2430
2431         r = amdgpu_device_fw_loading(adev);
2432         if (r)
2433                 goto init_failed;
2434
2435         r = amdgpu_device_ip_hw_init_phase2(adev);
2436         if (r)
2437                 goto init_failed;
2438
2439         /*
2440          * Retired pages will be loaded from eeprom and reserved here.
2441          * This should be called after amdgpu_device_ip_hw_init_phase2 since,
2442          * for some ASICs, the RAS EEPROM code relies on the SMU being fully
2443          * functional for I2C communication, which is only true at this point.
2444          *
2445          * amdgpu_ras_recovery_init may fail, but the upper layers only care
2446          * about failures caused by a bad gpu situation and stop the amdgpu
2447          * init process accordingly. For other failure cases, it still
2448          * releases all the resources and prints an error message, rather
2449          * than returning a negative value to the upper level.
2450          *
2451          * Note: theoretically, this should be called before all vram
2452          * allocations to protect retired pages from being abused.
2453          */
2454         r = amdgpu_ras_recovery_init(adev);
2455         if (r)
2456                 goto init_failed;
2457
2458         /*
2459          * In case of XGMI, grab an extra reference on the reset domain for this device.
2460          */
2461         if (adev->gmc.xgmi.num_physical_nodes > 1) {
2462                 if (amdgpu_xgmi_add_device(adev) == 0) {
2463                         if (!amdgpu_sriov_vf(adev)) {
2464                                 struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
2465
2466                                 if (!hive->reset_domain ||
2467                                     !amdgpu_reset_get_reset_domain(hive->reset_domain)) {
2468                                         r = -ENOENT;
2469                                         amdgpu_put_xgmi_hive(hive);
2470                                         goto init_failed;
2471                                 }
2472
2473                                 /* Drop the early temporary reset domain we created for this device */
2474                                 amdgpu_reset_put_reset_domain(adev->reset_domain);
2475                                 adev->reset_domain = hive->reset_domain;
2476                                 amdgpu_put_xgmi_hive(hive);
2477                         }
2478                 }
2479         }
2480
2481         r = amdgpu_device_init_schedulers(adev);
2482         if (r)
2483                 goto init_failed;
2484
2485         /* Don't init kfd if the whole hive needs to be reset during init */
2486         if (!adev->gmc.xgmi.pending_reset)
2487                 amdgpu_amdkfd_device_init(adev);
2488
2489         amdgpu_fru_get_product_info(adev);
2490
2491 init_failed:
2492         if (amdgpu_sriov_vf(adev))
2493                 amdgpu_virt_release_full_gpu(adev, true);
2494
2495         return r;
2496 }
2497
2498 /**
2499  * amdgpu_device_fill_reset_magic - writes reset magic to gart pointer
2500  *
2501  * @adev: amdgpu_device pointer
2502  *
2503  * Writes a reset magic value to the gart pointer in VRAM.  The driver calls
2504  * this function before a GPU reset.  If the value is retained after a
2505  * GPU reset, VRAM has not been lost.  Some GPU resets may destroy VRAM contents.
2506  */
2507 static void amdgpu_device_fill_reset_magic(struct amdgpu_device *adev)
2508 {
2509         memcpy(adev->reset_magic, adev->gart.ptr, AMDGPU_RESET_MAGIC_NUM);
2510 }
2511
2512 /**
2513  * amdgpu_device_check_vram_lost - check if vram is valid
2514  *
2515  * @adev: amdgpu_device pointer
2516  *
2517  * Checks the reset magic value written to the gart pointer in VRAM.
2518  * The driver calls this after a GPU reset to see if the contents of
2519  * VRAM have been lost or not.
2520  * Returns true if vram is lost, false if not.
2521  */
2522 static bool amdgpu_device_check_vram_lost(struct amdgpu_device *adev)
2523 {
2524         if (memcmp(adev->gart.ptr, adev->reset_magic,
2525                         AMDGPU_RESET_MAGIC_NUM))
2526                 return true;
2527
2528         if (!amdgpu_in_reset(adev))
2529                 return false;
2530
2531         /*
2532          * For all ASICs with baco/mode1 reset, the VRAM is
2533          * always assumed to be lost.
2534          */
2535         switch (amdgpu_asic_reset_method(adev)) {
2536         case AMD_RESET_METHOD_BACO:
2537         case AMD_RESET_METHOD_MODE1:
2538                 return true;
2539         default:
2540                 return false;
2541         }
2542 }
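
/*
 * Fill and check are used as a pair around a reset; a sketch of the
 * intended flow:
 *
 *     amdgpu_device_fill_reset_magic(adev);
 *     ...perform the GPU reset...
 *     if (amdgpu_device_check_vram_lost(adev))
 *             ...restore or re-validate VRAM-backed buffers...
 */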
2543
2544 /**
2545  * amdgpu_device_set_cg_state - set clockgating for amdgpu device
2546  *
2547  * @adev: amdgpu_device pointer
2548  * @state: clockgating state (gate or ungate)
2549  *
2550  * The list of all the hardware IPs that make up the asic is walked and the
2551  * set_clockgating_state callbacks are run.
2552  * The late initialization pass enables clockgating for hardware IPs;
2553  * the fini and suspend passes disable it.
2554  * Returns 0 on success, negative error code on failure.
2555  */
2557 int amdgpu_device_set_cg_state(struct amdgpu_device *adev,
2558                                enum amd_clockgating_state state)
2559 {
2560         int i, j, r;
2561
2562         if (amdgpu_emu_mode == 1)
2563                 return 0;
2564
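        /*
         * Gating walks the IP list forward while ungating walks it in
         * reverse, mirroring the init/fini ordering of the blocks.
         */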
2565         for (j = 0; j < adev->num_ip_blocks; j++) {
2566                 i = state == AMD_CG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
2567                 if (!adev->ip_blocks[i].status.late_initialized)
2568                         continue;
2569                 /* skip CG for GFX on S0ix */
2570                 if (adev->in_s0ix &&
2571                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX)
2572                         continue;
2573                 /* skip CG for VCE/UVD, it's handled specially */
2574                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
2575                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
2576                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
2577                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
2578                     adev->ip_blocks[i].version->funcs->set_clockgating_state) {
2579                         /* enable clockgating to save power */
2580                         r = adev->ip_blocks[i].version->funcs->set_clockgating_state((void *)adev,
2581                                                                                      state);
2582                         if (r) {
2583                                 DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
2584                                           adev->ip_blocks[i].version->funcs->name, r);
2585                                 return r;
2586                         }
2587                 }
2588         }
2589
2590         return 0;
2591 }
2592
2593 int amdgpu_device_set_pg_state(struct amdgpu_device *adev,
2594                                enum amd_powergating_state state)
2595 {
2596         int i, j, r;
2597
2598         if (amdgpu_emu_mode == 1)
2599                 return 0;
2600
2601         for (j = 0; j < adev->num_ip_blocks; j++) {
2602                 i = state == AMD_PG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
2603                 if (!adev->ip_blocks[i].status.late_initialized)
2604                         continue;
2605                 /* skip PG for GFX on S0ix */
2606                 if (adev->in_s0ix &&
2607                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX)
2608                         continue;
2609                 /* skip PG for VCE/UVD, it's handled specially */
2610                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
2611                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
2612                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
2613                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
2614                     adev->ip_blocks[i].version->funcs->set_powergating_state) {
2615                         /* enable powergating to save power */
2616                         r = adev->ip_blocks[i].version->funcs->set_powergating_state((void *)adev,
2617                                                                                         state);
2618                         if (r) {
2619                                 DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
2620                                           adev->ip_blocks[i].version->funcs->name, r);
2621                                 return r;
2622                         }
2623                 }
2624         }
2625         return 0;
2626 }
2627
2628 static int amdgpu_device_enable_mgpu_fan_boost(void)
2629 {
2630         struct amdgpu_gpu_instance *gpu_ins;
2631         struct amdgpu_device *adev;
2632         int i, ret = 0;
2633
2634         mutex_lock(&mgpu_info.mutex);
2635
2636         /*
2637          * MGPU fan boost feature should be enabled
2638          * only when there are two or more dGPUs in
2639          * the system
2640          */
2641         if (mgpu_info.num_dgpu < 2)
2642                 goto out;
2643
2644         for (i = 0; i < mgpu_info.num_dgpu; i++) {
2645                 gpu_ins = &(mgpu_info.gpu_ins[i]);
2646                 adev = gpu_ins->adev;
2647                 if (!(adev->flags & AMD_IS_APU) &&
2648                     !gpu_ins->mgpu_fan_enabled) {
2649                         ret = amdgpu_dpm_enable_mgpu_fan_boost(adev);
2650                         if (ret)
2651                                 break;
2652
2653                         gpu_ins->mgpu_fan_enabled = 1;
2654                 }
2655         }
2656
2657 out:
2658         mutex_unlock(&mgpu_info.mutex);
2659
2660         return ret;
2661 }
2662
2663 /**
2664  * amdgpu_device_ip_late_init - run late init for hardware IPs
2665  *
2666  * @adev: amdgpu_device pointer
2667  *
2668  * Late initialization pass for hardware IPs.  The list of all the hardware
2669  * IPs that make up the asic is walked and the late_init callbacks are run.
2670  * late_init covers any special initialization that an IP requires
2671  * after all of the IPs have been initialized or something that needs to happen
2672  * late in the init process.
2673  * Returns 0 on success, negative error code on failure.
2674  */
2675 static int amdgpu_device_ip_late_init(struct amdgpu_device *adev)
2676 {
2677         struct amdgpu_gpu_instance *gpu_instance;
2678         int i = 0, r;
2679
2680         for (i = 0; i < adev->num_ip_blocks; i++) {
2681                 if (!adev->ip_blocks[i].status.hw)
2682                         continue;
2683                 if (adev->ip_blocks[i].version->funcs->late_init) {
2684                         r = adev->ip_blocks[i].version->funcs->late_init((void *)adev);
2685                         if (r) {
2686                                 DRM_ERROR("late_init of IP block <%s> failed %d\n",
2687                                           adev->ip_blocks[i].version->funcs->name, r);
2688                                 return r;
2689                         }
2690                 }
2691                 adev->ip_blocks[i].status.late_initialized = true;
2692         }
2693
2694         r = amdgpu_ras_late_init(adev);
2695         if (r) {
2696                 DRM_ERROR("amdgpu_ras_late_init failed %d", r);
2697                 return r;
2698         }
2699
2700         amdgpu_ras_set_error_query_ready(adev, true);
2701
2702         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_GATE);
2703         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_GATE);
2704
2705         amdgpu_device_fill_reset_magic(adev);
2706
2707         r = amdgpu_device_enable_mgpu_fan_boost();
2708         if (r)
2709                 DRM_ERROR("enable mgpu fan boost failed (%d).\n", r);
2710
2711         /* For passthrough configuration on arcturus and aldebaran, enable special SBR handling */
2712         if (amdgpu_passthrough(adev) && ((adev->asic_type == CHIP_ARCTURUS && adev->gmc.xgmi.num_physical_nodes > 1) ||
2713                                adev->asic_type == CHIP_ALDEBARAN))
2714                 amdgpu_dpm_handle_passthrough_sbr(adev, true);
2715
2716         if (adev->gmc.xgmi.num_physical_nodes > 1) {
2717                 mutex_lock(&mgpu_info.mutex);
2718
2719                 /*
2720                  * Reset device p-state to low as this was booted with high.
2721                  *
2722                  * This should be performed only after all devices from the same
2723                  * hive get initialized.
2724                  *
2725                  * However, the number of devices in the hive is not known in
2726                  * advance; it is counted one by one as the devices initialize.
2727                  *
2728                  * So we wait until all XGMI interlinked devices are initialized.
2729                  * This may bring some delays as those devices may come from
2730                  * different hives. But that should be OK.
2731                  */
2732                 if (mgpu_info.num_dgpu == adev->gmc.xgmi.num_physical_nodes) {
2733                         for (i = 0; i < mgpu_info.num_gpu; i++) {
2734                                 gpu_instance = &(mgpu_info.gpu_ins[i]);
2735                                 if (gpu_instance->adev->flags & AMD_IS_APU)
2736                                         continue;
2737
2738                                 r = amdgpu_xgmi_set_pstate(gpu_instance->adev,
2739                                                 AMDGPU_XGMI_PSTATE_MIN);
2740                                 if (r) {
2741                                         DRM_ERROR("pstate setting failed (%d).\n", r);
2742                                         break;
2743                                 }
2744                         }
2745                 }
2746
2747                 mutex_unlock(&mgpu_info.mutex);
2748         }
2749
2750         return 0;
2751 }
2752
2753 /**
2754  * amdgpu_device_smu_fini_early - smu hw_fini wrapper
2755  *
2756  * @adev: amdgpu_device pointer
2757  *
2758  * For ASICs that need to disable the SMC first.
2759  */
2760 static void amdgpu_device_smu_fini_early(struct amdgpu_device *adev)
2761 {
2762         int i, r;
2763
2764         if (adev->ip_versions[GC_HWIP][0] > IP_VERSION(9, 0, 0))
2765                 return;
2766
2767         for (i = 0; i < adev->num_ip_blocks; i++) {
2768                 if (!adev->ip_blocks[i].status.hw)
2769                         continue;
2770                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
2771                         r = adev->ip_blocks[i].version->funcs->hw_fini((void *)adev);
2772                         /* XXX handle errors */
2773                         if (r) {
2774                                 DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
2775                                           adev->ip_blocks[i].version->funcs->name, r);
2776                         }
2777                         adev->ip_blocks[i].status.hw = false;
2778                         break;
2779                 }
2780         }
2781 }
2782
2783 static int amdgpu_device_ip_fini_early(struct amdgpu_device *adev)
2784 {
2785         int i, r;
2786
2787         for (i = 0; i < adev->num_ip_blocks; i++) {
2788                 if (!adev->ip_blocks[i].version->funcs->early_fini)
2789                         continue;
2790
2791                 r = adev->ip_blocks[i].version->funcs->early_fini((void *)adev);
2792                 if (r) {
2793                         DRM_DEBUG("early_fini of IP block <%s> failed %d\n",
2794                                   adev->ip_blocks[i].version->funcs->name, r);
2795                 }
2796         }
2797
2798         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
2799         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
2800
2801         amdgpu_amdkfd_suspend(adev, false);
2802
2803         /* Workaround for ASICs that need to disable the SMC first */
2804         amdgpu_device_smu_fini_early(adev);
2805
2806         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2807                 if (!adev->ip_blocks[i].status.hw)
2808                         continue;
2809
2810                 r = adev->ip_blocks[i].version->funcs->hw_fini((void *)adev);
2811                 /* XXX handle errors */
2812                 if (r) {
2813                         DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
2814                                   adev->ip_blocks[i].version->funcs->name, r);
2815                 }
2816
2817                 adev->ip_blocks[i].status.hw = false;
2818         }
2819
2820         if (amdgpu_sriov_vf(adev)) {
2821                 if (amdgpu_virt_release_full_gpu(adev, false))
2822                         DRM_ERROR("failed to release exclusive mode on fini\n");
2823         }
2824
2825         return 0;
2826 }
2827
2828 /**
2829  * amdgpu_device_ip_fini - run fini for hardware IPs
2830  *
2831  * @adev: amdgpu_device pointer
2832  *
2833  * Main teardown pass for hardware IPs.  The list of all the hardware
2834  * IPs that make up the asic is walked and the hw_fini and sw_fini callbacks
2835  * are run.  hw_fini tears down the hardware associated with each IP
2836  * and sw_fini tears down any software state associated with each IP.
2837  * Returns 0 on success, negative error code on failure.
2838  */
2839 static int amdgpu_device_ip_fini(struct amdgpu_device *adev)
2840 {
2841         int i, r;
2842
2843         if (amdgpu_sriov_vf(adev) && adev->virt.ras_init_done)
2844                 amdgpu_virt_release_ras_err_handler_data(adev);
2845
2846         if (adev->gmc.xgmi.num_physical_nodes > 1)
2847                 amdgpu_xgmi_remove_device(adev);
2848
2849         amdgpu_amdkfd_device_fini_sw(adev);
2850
2851         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2852                 if (!adev->ip_blocks[i].status.sw)
2853                         continue;
2854
2855                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2856                         amdgpu_ucode_free_bo(adev);
2857                         amdgpu_free_static_csa(&adev->virt.csa_obj);
2858                         amdgpu_device_wb_fini(adev);
2859                         amdgpu_device_vram_scratch_fini(adev);
2860                         amdgpu_ib_pool_fini(adev);
2861                 }
2862
2863                 r = adev->ip_blocks[i].version->funcs->sw_fini((void *)adev);
2864                 /* XXX handle errors */
2865                 if (r) {
2866                         DRM_DEBUG("sw_fini of IP block <%s> failed %d\n",
2867                                   adev->ip_blocks[i].version->funcs->name, r);
2868                 }
2869                 adev->ip_blocks[i].status.sw = false;
2870                 adev->ip_blocks[i].status.valid = false;
2871         }
2872
2873         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2874                 if (!adev->ip_blocks[i].status.late_initialized)
2875                         continue;
2876                 if (adev->ip_blocks[i].version->funcs->late_fini)
2877                         adev->ip_blocks[i].version->funcs->late_fini((void *)adev);
2878                 adev->ip_blocks[i].status.late_initialized = false;
2879         }
2880
2881         amdgpu_ras_fini(adev);
2882
2883         return 0;
2884 }
2885
2886 /**
2887  * amdgpu_device_delayed_init_work_handler - work handler for IB tests
2888  *
2889  * @work: work_struct.
2890  */
2891 static void amdgpu_device_delayed_init_work_handler(struct work_struct *work)
2892 {
2893         struct amdgpu_device *adev =
2894                 container_of(work, struct amdgpu_device, delayed_init_work.work);
2895         int r;
2896
2897         r = amdgpu_ib_ring_tests(adev);
2898         if (r)
2899                 DRM_ERROR("ib ring test failed (%d).\n", r);
2900 }
2901
2902 static void amdgpu_device_delay_enable_gfx_off(struct work_struct *work)
2903 {
2904         struct amdgpu_device *adev =
2905                 container_of(work, struct amdgpu_device, gfx.gfx_off_delay_work.work);
2906
2907         WARN_ON_ONCE(adev->gfx.gfx_off_state);
2908         WARN_ON_ONCE(adev->gfx.gfx_off_req_count);
2909
2910         if (!amdgpu_dpm_set_powergating_by_smu(adev, AMD_IP_BLOCK_TYPE_GFX, true))
2911                 adev->gfx.gfx_off_state = true;
2912 }
2913
2914 /**
2915  * amdgpu_device_ip_suspend_phase1 - run suspend for hardware IPs (phase 1)
2916  *
2917  * @adev: amdgpu_device pointer
2918  *
2919  * Main suspend function for hardware IPs (phase 1).  The list of all the
2920  * hardware IPs that make up the asic is walked, clockgating and powergating
2921  * are disabled, and the suspend callbacks are run for the display (DCE)
2922  * blocks; all other blocks are suspended in phase 2.
2923  * Returns 0 on success, negative error code on failure.
2924  */
2925 static int amdgpu_device_ip_suspend_phase1(struct amdgpu_device *adev)
2926 {
2927         int i, r;
2928
2929         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
2930         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
2931
2932         /*
2933          * Per the PMFW team's suggestion, the driver needs to disable the
2934          * gfxoff and df cstate features for the gpu reset (e.g. Mode1Reset)
2935          * scenario. Add the missing df cstate disablement here.
2936          */
2937         if (amdgpu_dpm_set_df_cstate(adev, DF_CSTATE_DISALLOW))
2938                 dev_warn(adev->dev, "Failed to disallow df cstate\n");
2939
2940         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2941                 if (!adev->ip_blocks[i].status.valid)
2942                         continue;
2943
2944                 /* displays are handled separately */
2945                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_DCE)
2946                         continue;
2947
2948                 /* XXX handle errors */
2949                 r = adev->ip_blocks[i].version->funcs->suspend(adev);
2951                 if (r) {
2952                         DRM_ERROR("suspend of IP block <%s> failed %d\n",
2953                                   adev->ip_blocks[i].version->funcs->name, r);
2954                         return r;
2955                 }
2956
2957                 adev->ip_blocks[i].status.hw = false;
2958         }
2959
2960         return 0;
2961 }
2962
2963 /**
2964  * amdgpu_device_ip_suspend_phase2 - run suspend for hardware IPs (phase 2)
2965  *
2966  * @adev: amdgpu_device pointer
2967  *
2968  * Main suspend function for hardware IPs (phase 2).  The list of all the
2969  * hardware IPs that make up the asic is walked and the suspend callbacks
2970  * are run for every block except the display (DCE) blocks, which were
2971  * already suspended in phase 1.
2972  * Returns 0 on success, negative error code on failure.
2973  */
2974 static int amdgpu_device_ip_suspend_phase2(struct amdgpu_device *adev)
2975 {
2976         int i, r;
2977
2978         if (adev->in_s0ix)
2979                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D3Entry);
2980
2981         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2982                 if (!adev->ip_blocks[i].status.valid)
2983                         continue;
2984                 /* displays are handled in phase1 */
2985                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE)
2986                         continue;
2987                 /* PSP lost connection when err_event_athub occurs */
2988                 if (amdgpu_ras_intr_triggered() &&
2989                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
2990                         adev->ip_blocks[i].status.hw = false;
2991                         continue;
2992                 }
2993
2994                 /* skip unnecessary suspend for IP blocks that have not been initialized yet */
2995                 if (adev->gmc.xgmi.pending_reset &&
2996                     !(adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
2997                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC ||
2998                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
2999                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH)) {
3000                         adev->ip_blocks[i].status.hw = false;
3001                         continue;
3002                 }
3003
3004                 /* skip suspend of gfx and psp for S0ix
3005                  * gfx is in gfxoff state, so on resume it will exit gfxoff just
3006                  * like at runtime. PSP is also part of the always on hardware
3007                  * so no need to suspend it.
3008                  */
3009                 if (adev->in_s0ix &&
3010                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP ||
3011                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX))
3012                         continue;
3013
3014                 /* XXX handle errors */
3015                 r = adev->ip_blocks[i].version->funcs->suspend(adev);
3017                 if (r) {
3018                         DRM_ERROR("suspend of IP block <%s> failed %d\n",
3019                                   adev->ip_blocks[i].version->funcs->name, r);
3020                 }
3021                 adev->ip_blocks[i].status.hw = false;
3022                 /* handle putting the SMC in the appropriate state */
3023                 if (!amdgpu_sriov_vf(adev)) {
3024                         if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3025                                 r = amdgpu_dpm_set_mp1_state(adev, adev->mp1_state);
3026                                 if (r) {
3027                                         DRM_ERROR("SMC failed to set mp1 state %d, %d\n",
3028                                                         adev->mp1_state, r);
3029                                         return r;
3030                                 }
3031                         }
3032                 }
3033         }
3034
3035         return 0;
3036 }
3037
3038 /**
3039  * amdgpu_device_ip_suspend - run suspend for hardware IPs
3040  *
3041  * @adev: amdgpu_device pointer
3042  *
3043  * Main suspend function for hardware IPs.  Runs the phase 1 and phase 2
3044  * suspend passes in order; on SR-IOV, full GPU access is requested from
3045  * the host for the duration of the suspend.  suspend puts the hardware
3046  * and software state in each IP into a state suitable for suspend.
3047  * Returns 0 on success, negative error code on failure.
3048  */
3049 int amdgpu_device_ip_suspend(struct amdgpu_device *adev)
3050 {
3051         int r;
3052
3053         if (amdgpu_sriov_vf(adev)) {
3054                 amdgpu_virt_fini_data_exchange(adev);
3055                 amdgpu_virt_request_full_gpu(adev, false);
3056         }
3057
3058         r = amdgpu_device_ip_suspend_phase1(adev);
3059         if (r)
3060                 return r;
3061         r = amdgpu_device_ip_suspend_phase2(adev);
3062
3063         if (amdgpu_sriov_vf(adev))
3064                 amdgpu_virt_release_full_gpu(adev, false);
3065
3066         return r;
3067 }
3068
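/*
 * amdgpu_device_ip_reinit_early_sriov - after an SR-IOV reset, re-init the
 * basic hardware blocks (COMMON, GMC, PSP, IH) in the fixed order below;
 * the remaining blocks are brought back up in
 * amdgpu_device_ip_reinit_late_sriov().
 */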
3069 static int amdgpu_device_ip_reinit_early_sriov(struct amdgpu_device *adev)
3070 {
3071         int i, r;
3072
3073         static enum amd_ip_block_type ip_order[] = {
3074                 AMD_IP_BLOCK_TYPE_COMMON,
3075                 AMD_IP_BLOCK_TYPE_GMC,
3076                 AMD_IP_BLOCK_TYPE_PSP,
3077                 AMD_IP_BLOCK_TYPE_IH,
3078         };
3079
3080         for (i = 0; i < adev->num_ip_blocks; i++) {
3081                 int j;
3082                 struct amdgpu_ip_block *block;
3083
3084                 block = &adev->ip_blocks[i];
3085                 block->status.hw = false;
3086
3087                 for (j = 0; j < ARRAY_SIZE(ip_order); j++) {
3088
3089                         if (block->version->type != ip_order[j] ||
3090                                 !block->status.valid)
3091                                 continue;
3092
3093                         r = block->version->funcs->hw_init(adev);
3094                         DRM_INFO("RE-INIT-early: %s %s\n", block->version->funcs->name, r ? "failed" : "succeeded");
3095                         if (r)
3096                                 return r;
3097                         block->status.hw = true;
3098                 }
3099         }
3100
3101         return 0;
3102 }
3103
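/*
 * amdgpu_device_ip_reinit_late_sriov - after an SR-IOV reset, re-init the
 * remaining hardware blocks in the fixed order below; the SMC block is
 * resumed rather than fully re-initialized.
 */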
3104 static int amdgpu_device_ip_reinit_late_sriov(struct amdgpu_device *adev)
3105 {
3106         int i, r;
3107
3108         static enum amd_ip_block_type ip_order[] = {
3109                 AMD_IP_BLOCK_TYPE_SMC,
3110                 AMD_IP_BLOCK_TYPE_DCE,
3111                 AMD_IP_BLOCK_TYPE_GFX,
3112                 AMD_IP_BLOCK_TYPE_SDMA,
3113                 AMD_IP_BLOCK_TYPE_UVD,
3114                 AMD_IP_BLOCK_TYPE_VCE,
3115                 AMD_IP_BLOCK_TYPE_VCN
3116         };
3117
3118         for (i = 0; i < ARRAY_SIZE(ip_order); i++) {
3119                 int j;
3120                 struct amdgpu_ip_block *block;
3121
3122                 for (j = 0; j < adev->num_ip_blocks; j++) {
3123                         block = &adev->ip_blocks[j];
3124
3125                         if (block->version->type != ip_order[i] ||
3126                                 !block->status.valid ||
3127                                 block->status.hw)
3128                                 continue;
3129
3130                         if (block->version->type == AMD_IP_BLOCK_TYPE_SMC)
3131                                 r = block->version->funcs->resume(adev);
3132                         else
3133                                 r = block->version->funcs->hw_init(adev);
3134
3135                         DRM_INFO("RE-INIT-late: %s %s\n", block->version->funcs->name, r ? "failed" : "succeeded");
3136                         if (r)
3137                                 return r;
3138                         block->status.hw = true;
3139                 }
3140         }
3141
3142         return 0;
3143 }
3144
3145 /**
3146  * amdgpu_device_ip_resume_phase1 - run resume for hardware IPs
3147  *
3148  * @adev: amdgpu_device pointer
3149  *
3150  * First resume function for hardware IPs.  The list of all the hardware
3151  * IPs that make up the asic is walked and the resume callbacks are run for
3152  * COMMON, GMC, IH and, on SR-IOV, PSP.  resume puts the hardware into a
3153  * functional state after a suspend and updates the software state as
3154  * necessary.  This function is also used for restoring the GPU after a GPU reset.
3155  * Returns 0 on success, negative error code on failure.
3156  */
3157 static int amdgpu_device_ip_resume_phase1(struct amdgpu_device *adev)
3158 {
3159         int i, r;
3160
3161         for (i = 0; i < adev->num_ip_blocks; i++) {
3162                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3163                         continue;
3164                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3165                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3166                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3167                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP && amdgpu_sriov_vf(adev))) {
3168
3169                         r = adev->ip_blocks[i].version->funcs->resume(adev);
3170                         if (r) {
3171                                 DRM_ERROR("resume of IP block <%s> failed %d\n",
3172                                           adev->ip_blocks[i].version->funcs->name, r);
3173                                 return r;
3174                         }
3175                         adev->ip_blocks[i].status.hw = true;
3176                 }
3177         }
3178
3179         return 0;
3180 }
3181
3182 /**
3183  * amdgpu_device_ip_resume_phase2 - run resume for hardware IPs
3184  *
3185  * @adev: amdgpu_device pointer
3186  *
3187  * Second resume function for hardware IPs.  The list of all the hardware
3188  * IPs that make up the asic is walked and the resume callbacks are run for
3189  * all blocks except COMMON, GMC, and IH.  resume puts the hardware into a
3190  * functional state after a suspend and updates the software state as
3191  * necessary.  This function is also used for restoring the GPU after a GPU
3192  * reset.
3193  * Returns 0 on success, negative error code on failure.
3194  */
3195 static int amdgpu_device_ip_resume_phase2(struct amdgpu_device *adev)
3196 {
3197         int i, r;
3198
3199         for (i = 0; i < adev->num_ip_blocks; i++) {
3200                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3201                         continue;
3202                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3203                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3204                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3205                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3206                         continue;
3207                 r = adev->ip_blocks[i].version->funcs->resume(adev);
3208                 if (r) {
3209                         DRM_ERROR("resume of IP block <%s> failed %d\n",
3210                                   adev->ip_blocks[i].version->funcs->name, r);
3211                         return r;
3212                 }
3213                 adev->ip_blocks[i].status.hw = true;
3214         }
3215
3216         return 0;
3217 }
3218
3219 /**
3220  * amdgpu_device_ip_resume - run resume for hardware IPs
3221  *
3222  * @adev: amdgpu_device pointer
3223  *
3224  * Main resume function for hardware IPs.  The hardware IPs
3225  * are split into two resume functions because they are
3226  * also used in recovering from a GPU reset and some additional
3227  * steps need to be taken between them.  In this case (S3/S4) they are
3228  * run sequentially.
3229  * Returns 0 on success, negative error code on failure.
3230  */
3231 static int amdgpu_device_ip_resume(struct amdgpu_device *adev)
3232 {
3233         int r;
3234
3235         r = amdgpu_amdkfd_resume_iommu(adev);
3236         if (r)
3237                 return r;
3238
3239         r = amdgpu_device_ip_resume_phase1(adev);
3240         if (r)
3241                 return r;
3242
3243         r = amdgpu_device_fw_loading(adev);
3244         if (r)
3245                 return r;
3246
3247         r = amdgpu_device_ip_resume_phase2(adev);
3248
3249         return r;
3250 }
3251
3252 /**
3253  * amdgpu_device_detect_sriov_bios - determine if the board supports SR-IOV
3254  *
3255  * @adev: amdgpu_device pointer
3256  *
3257  * Query the VBIOS data tables to determine if the board supports SR-IOV.
3258  */
3259 static void amdgpu_device_detect_sriov_bios(struct amdgpu_device *adev)
3260 {
3261         if (amdgpu_sriov_vf(adev)) {
3262                 if (adev->is_atom_fw) {
3263                         if (amdgpu_atomfirmware_gpu_virtualization_supported(adev))
3264                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3265                 } else {
3266                         if (amdgpu_atombios_has_gpu_virtualization_table(adev))
3267                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3268                 }
3269
3270                 if (!(adev->virt.caps & AMDGPU_SRIOV_CAPS_SRIOV_VBIOS))
3271                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_NO_VBIOS, 0, 0);
3272         }
3273 }
3274
3275 /**
3276  * amdgpu_device_asic_has_dc_support - determine if DC supports the asic
3277  *
3278  * @asic_type: AMD asic type
3279  *
3280  * Check if there is DC (new modesetting infrastructure) support for an asic;
3281  * the amdgpu.dc module parameter can override the default.  Returns true if DC has support, false if not.
3282  */
3283 bool amdgpu_device_asic_has_dc_support(enum amd_asic_type asic_type)
3284 {
3285         switch (asic_type) {
3286 #ifdef CONFIG_DRM_AMDGPU_SI
3287         case CHIP_HAINAN:
3288 #endif
3289         case CHIP_TOPAZ:
3290                 /* chips with no display hardware */
3291                 return false;
3292 #if defined(CONFIG_DRM_AMD_DC)
3293         case CHIP_TAHITI:
3294         case CHIP_PITCAIRN:
3295         case CHIP_VERDE:
3296         case CHIP_OLAND:
3297                 /*
3298                  * We have systems in the wild with these ASICs that require
3299                  * LVDS and VGA support which is not supported with DC.
3300                  *
3301                  * Fall back to the non-DC driver here by default so as not to
3302                  * cause regressions.
3303                  */
3304 #if defined(CONFIG_DRM_AMD_DC_SI)
3305                 return amdgpu_dc > 0;
3306 #else
3307                 return false;
3308 #endif
3309         case CHIP_BONAIRE:
3310         case CHIP_KAVERI:
3311         case CHIP_KABINI:
3312         case CHIP_MULLINS:
3313                 /*
3314                  * We have systems in the wild with these ASICs that require
3315                  * VGA support which is not supported with DC.
3316                  *
3317                  * Fall back to the non-DC driver here by default so as not to
3318                  * cause regressions.
3319                  */
3320                 return amdgpu_dc > 0;
3321         default:
3322                 return amdgpu_dc != 0;
3323 #else
3324         default:
3325                 if (amdgpu_dc > 0)
3326                         DRM_INFO_ONCE("Display Core has been requested via kernel parameter "
3327                                          "but isn't supported by ASIC, ignoring\n");
3328                 return false;
3329 #endif
3330         }
3331 }
3332
3333 /**
3334  * amdgpu_device_has_dc_support - check if dc is supported
3335  *
3336  * @adev: amdgpu_device pointer
3337  *
3338  * Returns true for supported, false for not supported
3339  */
3340 bool amdgpu_device_has_dc_support(struct amdgpu_device *adev)
3341 {
3342         if (amdgpu_sriov_vf(adev) ||
3343             adev->enable_virtual_display ||
3344             (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
3345                 return false;
3346
3347         return amdgpu_device_asic_has_dc_support(adev->asic_type);
3348 }
3349
3350 static void amdgpu_device_xgmi_reset_func(struct work_struct *__work)
3351 {
3352         struct amdgpu_device *adev =
3353                 container_of(__work, struct amdgpu_device, xgmi_reset_work);
3354         struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
3355
3356         /* It's a bug to not have a hive within this function */
3357         if (WARN_ON(!hive))
3358                 return;
3359
3360         /*
3361          * Use task barrier to synchronize all xgmi reset works across the
3362          * hive. task_barrier_enter and task_barrier_exit will block
3363          * until all the threads running the xgmi reset works reach
3364          * those points. task_barrier_full will do both blocks.
3365          */
3366         if (amdgpu_asic_reset_method(adev) == AMD_RESET_METHOD_BACO) {
3367
3368                 task_barrier_enter(&hive->tb);
3369                 adev->asic_reset_res = amdgpu_device_baco_enter(adev_to_drm(adev));
3370
3371                 if (adev->asic_reset_res)
3372                         goto fail;
3373
3374                 task_barrier_exit(&hive->tb);
3375                 adev->asic_reset_res = amdgpu_device_baco_exit(adev_to_drm(adev));
3376
3377                 if (adev->asic_reset_res)
3378                         goto fail;
3379
3380                 if (adev->mmhub.ras && adev->mmhub.ras->ras_block.hw_ops &&
3381                     adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count)
3382                         adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count(adev);
3383         } else {
3384
3385                 task_barrier_full(&hive->tb);
3386                 adev->asic_reset_res = amdgpu_asic_reset(adev);
3387         }
3388
3389 fail:
3390         if (adev->asic_reset_res)
3391                 DRM_WARN("ASIC reset failed with error %d for drm dev %s\n",
3392                          adev->asic_reset_res, adev_to_drm(adev)->unique);
3393         amdgpu_put_xgmi_hive(hive);
3394 }
3395
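/**
 * amdgpu_device_get_job_timeout_settings - parse the amdgpu.lockup_timeout
 * module parameter
 *
 * @adev: amdgpu_device pointer
 *
 * The parameter takes up to four comma-separated values in milliseconds,
 * applied in order to the gfx, compute, sdma and video queues, e.g.
 * amdgpu.lockup_timeout=10000,60000,10000,10000.  A value of 0 keeps the
 * default for that queue type and a negative value disables the timeout
 * entirely.  If only a single value is specified, it is applied to all
 * non-compute queues (and to compute as well on SR-IOV or passthrough).
 * Returns 0 on success, negative error code on a parse failure.
 */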
3396 static int amdgpu_device_get_job_timeout_settings(struct amdgpu_device *adev)
3397 {
3398         char *input = amdgpu_lockup_timeout;
3399         char *timeout_setting = NULL;
3400         int index = 0;
3401         long timeout;
3402         int ret = 0;
3403
3404         /*
3405          * By default the timeout for non-compute jobs is 10000
3406          * and 60000 for compute jobs.
3407          * On SR-IOV the compute timeout defaults to 60000 only in
3408          * one-VF mode; otherwise it is 10000 as well.
3409          */
3410         adev->gfx_timeout = msecs_to_jiffies(10000);
3411         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
3412         if (amdgpu_sriov_vf(adev))
3413                 adev->compute_timeout = amdgpu_sriov_is_pp_one_vf(adev) ?
3414                                         msecs_to_jiffies(60000) : msecs_to_jiffies(10000);
3415         else
3416                 adev->compute_timeout = msecs_to_jiffies(60000);
3417
3418         if (strnlen(input, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
3419                 while ((timeout_setting = strsep(&input, ",")) &&
3420                                 strnlen(timeout_setting, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
3421                         ret = kstrtol(timeout_setting, 0, &timeout);
3422                         if (ret)
3423                                 return ret;
3424
3425                         if (timeout == 0) {
3426                                 index++;
3427                                 continue;
3428                         } else if (timeout < 0) {
3429                                 timeout = MAX_SCHEDULE_TIMEOUT;
3430                                 dev_warn(adev->dev, "lockup timeout disabled");
3431                                 add_taint(TAINT_SOFTLOCKUP, LOCKDEP_STILL_OK);
3432                         } else {
3433                                 timeout = msecs_to_jiffies(timeout);
3434                         }
3435
3436                         switch (index++) {
3437                         case 0:
3438                                 adev->gfx_timeout = timeout;
3439                                 break;
3440                         case 1:
3441                                 adev->compute_timeout = timeout;
3442                                 break;
3443                         case 2:
3444                                 adev->sdma_timeout = timeout;
3445                                 break;
3446                         case 3:
3447                                 adev->video_timeout = timeout;
3448                                 break;
3449                         default:
3450                                 break;
3451                         }
3452                 }
3453                 /*
3454                  * There is only one value specified and
3455                  * it should apply to all non-compute jobs.
3456                  */
3457                 if (index == 1) {
3458                         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
3459                         if (amdgpu_sriov_vf(adev) || amdgpu_passthrough(adev))
3460                                 adev->compute_timeout = adev->gfx_timeout;
3461                 }
3462         }
3463
3464         return ret;
3465 }
3466
3467 /**
3468  * amdgpu_device_check_iommu_direct_map - check if RAM is direct mapped to the GPU
3469  *
3470  * @adev: amdgpu_device pointer
3471  *
3472  * RAM is direct mapped to the GPU if the IOMMU is not enabled or is in passthrough (identity) mode.
3473  */
3474 static void amdgpu_device_check_iommu_direct_map(struct amdgpu_device *adev)
3475 {
3476         struct iommu_domain *domain;
3477
3478         domain = iommu_get_domain_for_dev(adev->dev);
3479         if (!domain || domain->type == IOMMU_DOMAIN_IDENTITY)
3480                 adev->ram_is_direct_mapped = true;
3481 }
3482
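/*
 * Device-level sysfs attributes (product name/number, serial number and
 * PCIe replay count), registered in amdgpu_device_init() and removed
 * again in amdgpu_device_fini_hw().
 */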
3483 static const struct attribute *amdgpu_dev_attributes[] = {
3484         &dev_attr_product_name.attr,
3485         &dev_attr_product_number.attr,
3486         &dev_attr_serial_number.attr,
3487         &dev_attr_pcie_replay_count.attr,
3488         NULL
3489 };
3490
3491 /**
3492  * amdgpu_device_init - initialize the driver
3493  *
3494  * @adev: amdgpu_device pointer
3495  * @flags: driver flags
3496  *
3497  * Initializes the driver info and hw (all asics).
3498  * Returns 0 for success or an error on failure.
3499  * Called at driver startup.
3500  */
3501 int amdgpu_device_init(struct amdgpu_device *adev,
3502                        uint32_t flags)
3503 {
3504         struct drm_device *ddev = adev_to_drm(adev);
3505         struct pci_dev *pdev = adev->pdev;
3506         int r, i;
3507         bool px = false;
3508         u32 max_MBps;
3509
3510         adev->shutdown = false;
3511         adev->flags = flags;
3512
3513         if (amdgpu_force_asic_type >= 0 && amdgpu_force_asic_type < CHIP_LAST)
3514                 adev->asic_type = amdgpu_force_asic_type;
3515         else
3516                 adev->asic_type = flags & AMD_ASIC_MASK;
3517
3518         adev->usec_timeout = AMDGPU_MAX_USEC_TIMEOUT;
3519         if (amdgpu_emu_mode == 1)
3520                 adev->usec_timeout *= 10;
3521         adev->gmc.gart_size = 512 * 1024 * 1024;
3522         adev->accel_working = false;
3523         adev->num_rings = 0;
3524         RCU_INIT_POINTER(adev->gang_submit, dma_fence_get_stub());
3525         adev->mman.buffer_funcs = NULL;
3526         adev->mman.buffer_funcs_ring = NULL;
3527         adev->vm_manager.vm_pte_funcs = NULL;
3528         adev->vm_manager.vm_pte_num_scheds = 0;
3529         adev->gmc.gmc_funcs = NULL;
3530         adev->harvest_ip_mask = 0x0;
3531         adev->fence_context = dma_fence_context_alloc(AMDGPU_MAX_RINGS);
3532         bitmap_zero(adev->gfx.pipe_reserve_bitmap, AMDGPU_MAX_COMPUTE_QUEUES);
3533
3534         adev->smc_rreg = &amdgpu_invalid_rreg;
3535         adev->smc_wreg = &amdgpu_invalid_wreg;
3536         adev->pcie_rreg = &amdgpu_invalid_rreg;
3537         adev->pcie_wreg = &amdgpu_invalid_wreg;
3538         adev->pciep_rreg = &amdgpu_invalid_rreg;
3539         adev->pciep_wreg = &amdgpu_invalid_wreg;
3540         adev->pcie_rreg64 = &amdgpu_invalid_rreg64;
3541         adev->pcie_wreg64 = &amdgpu_invalid_wreg64;
3542         adev->uvd_ctx_rreg = &amdgpu_invalid_rreg;
3543         adev->uvd_ctx_wreg = &amdgpu_invalid_wreg;
3544         adev->didt_rreg = &amdgpu_invalid_rreg;
3545         adev->didt_wreg = &amdgpu_invalid_wreg;
3546         adev->gc_cac_rreg = &amdgpu_invalid_rreg;
3547         adev->gc_cac_wreg = &amdgpu_invalid_wreg;
3548         adev->audio_endpt_rreg = &amdgpu_block_invalid_rreg;
3549         adev->audio_endpt_wreg = &amdgpu_block_invalid_wreg;
3550
3551         DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X 0x%02X).\n",
3552                  amdgpu_asic_name[adev->asic_type], pdev->vendor, pdev->device,
3553                  pdev->subsystem_vendor, pdev->subsystem_device, pdev->revision);
3554
3555         /* mutex initializations are all done here so we
3556          * can recall functions without having locking issues */
3557         mutex_init(&adev->firmware.mutex);
3558         mutex_init(&adev->pm.mutex);
3559         mutex_init(&adev->gfx.gpu_clock_mutex);
3560         mutex_init(&adev->srbm_mutex);
3561         mutex_init(&adev->gfx.pipe_reserve_mutex);
3562         mutex_init(&adev->gfx.gfx_off_mutex);
3563         mutex_init(&adev->grbm_idx_mutex);
3564         mutex_init(&adev->mn_lock);
3565         mutex_init(&adev->virt.vf_errors.lock);
3566         hash_init(adev->mn_hash);
3567         mutex_init(&adev->psp.mutex);
3568         mutex_init(&adev->notifier_lock);
3569         mutex_init(&adev->pm.stable_pstate_ctx_lock);
3570         mutex_init(&adev->benchmark_mutex);
3571
3572         amdgpu_device_init_apu_flags(adev);
3573
3574         r = amdgpu_device_check_arguments(adev);
3575         if (r)
3576                 return r;
3577
3578         spin_lock_init(&adev->mmio_idx_lock);
3579         spin_lock_init(&adev->smc_idx_lock);
3580         spin_lock_init(&adev->pcie_idx_lock);
3581         spin_lock_init(&adev->uvd_ctx_idx_lock);
3582         spin_lock_init(&adev->didt_idx_lock);
3583         spin_lock_init(&adev->gc_cac_idx_lock);
3584         spin_lock_init(&adev->se_cac_idx_lock);
3585         spin_lock_init(&adev->audio_endpt_idx_lock);
3586         spin_lock_init(&adev->mm_stats.lock);
3587
3588         INIT_LIST_HEAD(&adev->shadow_list);
3589         mutex_init(&adev->shadow_list_lock);
3590
3591         INIT_LIST_HEAD(&adev->reset_list);
3592
3593         INIT_LIST_HEAD(&adev->ras_list);
3594
3595         INIT_DELAYED_WORK(&adev->delayed_init_work,
3596                           amdgpu_device_delayed_init_work_handler);
3597         INIT_DELAYED_WORK(&adev->gfx.gfx_off_delay_work,
3598                           amdgpu_device_delay_enable_gfx_off);
3599
3600         INIT_WORK(&adev->xgmi_reset_work, amdgpu_device_xgmi_reset_func);
3601
3602         adev->gfx.gfx_off_req_count = 1;
3603         adev->gfx.gfx_off_residency = 0;
3604         adev->gfx.gfx_off_entrycount = 0;
3605         adev->pm.ac_power = power_supply_is_system_supplied() > 0;
3606
3607         atomic_set(&adev->throttling_logging_enabled, 1);
3608         /*
3609          * If throttling continues, logging will be performed every minute
3610          * to avoid log flooding. "-1" is subtracted since the thermal
3611          * throttling interrupt comes every second. Thus, the total logging
3612          * interval is 59 seconds (ratelimited printk interval) + 1 (waiting
3613          * for throttling interrupt) = 60 seconds.
3614          */
3615         ratelimit_state_init(&adev->throttling_logging_rs, (60 - 1) * HZ, 1);
3616         ratelimit_set_flags(&adev->throttling_logging_rs, RATELIMIT_MSG_ON_RELEASE);
3617
3618         /* Registers mapping: BAR 5 on BONAIRE and newer, BAR 2 on older ASICs */
3619         /* TODO: block userspace mapping of io registers */
3620         if (adev->asic_type >= CHIP_BONAIRE) {
3621                 adev->rmmio_base = pci_resource_start(adev->pdev, 5);
3622                 adev->rmmio_size = pci_resource_len(adev->pdev, 5);
3623         } else {
3624                 adev->rmmio_base = pci_resource_start(adev->pdev, 2);
3625                 adev->rmmio_size = pci_resource_len(adev->pdev, 2);
3626         }
3627
3628         for (i = 0; i < AMD_IP_BLOCK_TYPE_NUM; i++)
3629                 atomic_set(&adev->pm.pwr_state[i], POWER_STATE_UNKNOWN);
3630
3631         adev->rmmio = ioremap(adev->rmmio_base, adev->rmmio_size);
3632         if (!adev->rmmio)
3633                 return -ENOMEM;
3635         DRM_INFO("register mmio base: 0x%08X\n", (uint32_t)adev->rmmio_base);
3636         DRM_INFO("register mmio size: %u\n", (unsigned)adev->rmmio_size);
3637
3638         amdgpu_device_get_pcie_info(adev);
3639
3640         if (amdgpu_mcbp)
3641                 DRM_INFO("MCBP is enabled\n");
3642
3643         /*
3644          * The reset domain needs to be present early, before any XGMI hive
3645          * is discovered and initialized, so that the reset sem and in_gpu_reset
3646          * flag can be used early during init and before any call to RREG32.
3647          */
3648         adev->reset_domain = amdgpu_reset_create_reset_domain(SINGLE_DEVICE, "amdgpu-reset-dev");
3649         if (!adev->reset_domain)
3650                 return -ENOMEM;
3651
3652         /* detect hw virtualization here */
3653         amdgpu_detect_virtualization(adev);
3654
3655         r = amdgpu_device_get_job_timeout_settings(adev);
3656         if (r) {
3657                 dev_err(adev->dev, "invalid lockup_timeout parameter syntax\n");
3658                 return r;
3659         }
3660
3661         /* early init functions */
3662         r = amdgpu_device_ip_early_init(adev);
3663         if (r)
3664                 return r;
3665
3666         /* Enable TMZ based on IP_VERSION */
3667         amdgpu_gmc_tmz_set(adev);
3668
3669         amdgpu_gmc_noretry_set(adev);
3670         /* Need to get xgmi info early to decide the reset behavior */
3671         if (adev->gmc.xgmi.supported) {
3672                 r = adev->gfxhub.funcs->get_xgmi_info(adev);
3673                 if (r)
3674                         return r;
3675         }
3676
3677         /* enable PCIe atomic ops: a VF reads the supported atomics from the
3678          * host's pf2vf info page; bare metal enables them on the root port */
3678         if (amdgpu_sriov_vf(adev))
3679                 adev->have_atomics_support = ((struct amd_sriov_msg_pf2vf_info *)
3680                         adev->virt.fw_reserve.p_pf2vf)->pcie_atomic_ops_support_flags ==
3681                         (PCI_EXP_DEVCAP2_ATOMIC_COMP32 | PCI_EXP_DEVCAP2_ATOMIC_COMP64);
3682         else
3683                 adev->have_atomics_support =
3684                         !pci_enable_atomic_ops_to_root(adev->pdev,
3685                                           PCI_EXP_DEVCAP2_ATOMIC_COMP32 |
3686                                           PCI_EXP_DEVCAP2_ATOMIC_COMP64);
3687         if (!adev->have_atomics_support)
3688                 dev_info(adev->dev, "PCIe atomic ops are not supported\n");
3689
3690         /* doorbell bar mapping and doorbell index init */
3691         amdgpu_device_doorbell_init(adev);
3692
3693         if (amdgpu_emu_mode == 1) {
3694                 /* post the asic in emulation mode */
3695                 emu_soc_asic_init(adev);
3696                 goto fence_driver_init;
3697         }
3698
3699         amdgpu_reset_init(adev);
3700
3701         /* detect whether we have an SR-IOV vbios */
3702         amdgpu_device_detect_sriov_bios(adev);
3703
3704         /* check if we need to reset the asic
3705          *  E.g., driver was not cleanly unloaded previously, etc.
3706          */
3707         if (!amdgpu_sriov_vf(adev) && amdgpu_asic_need_reset_on_init(adev)) {
3708                 if (adev->gmc.xgmi.num_physical_nodes) {
3709                         dev_info(adev->dev, "Pending hive reset.\n");
3710                         adev->gmc.xgmi.pending_reset = true;
3711                         /* Only the blocks the SMU needs to handle the reset must be initialized */
3712                         for (i = 0; i < adev->num_ip_blocks; i++) {
3713                                 if (!adev->ip_blocks[i].status.valid)
3714                                         continue;
3715                                 if (!(adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3716                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3717                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3718                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC)) {
3719                                         DRM_DEBUG("IP %s disabled for hw_init.\n",
3720                                                 adev->ip_blocks[i].version->funcs->name);
3721                                         adev->ip_blocks[i].status.hw = true;
3722                                 }
3723                         }
3724                 } else {
3725                         r = amdgpu_asic_reset(adev);
3726                         if (r) {
3727                                 dev_err(adev->dev, "asic reset on init failed\n");
3728                                 goto failed;
3729                         }
3730                 }
3731         }
3732
3733         pci_enable_pcie_error_reporting(adev->pdev);
3734
3735         /* Post card if necessary */
3736         if (amdgpu_device_need_post(adev)) {
3737                 if (!adev->bios) {
3738                         dev_err(adev->dev, "no vBIOS found\n");
3739                         r = -EINVAL;
3740                         goto failed;
3741                 }
3742                 DRM_INFO("GPU posting now...\n");
3743                 r = amdgpu_device_asic_init(adev);
3744                 if (r) {
3745                         dev_err(adev->dev, "gpu post error!\n");
3746                         goto failed;
3747                 }
3748         }
3749
3750         if (adev->is_atom_fw) {
3751                 /* Initialize clocks */
3752                 r = amdgpu_atomfirmware_get_clock_info(adev);
3753                 if (r) {
3754                         dev_err(adev->dev, "amdgpu_atomfirmware_get_clock_info failed\n");
3755                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
3756                         goto failed;
3757                 }
3758         } else {
3759                 /* Initialize clocks */
3760                 r = amdgpu_atombios_get_clock_info(adev);
3761                 if (r) {
3762                         dev_err(adev->dev, "amdgpu_atombios_get_clock_info failed\n");
3763                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
3764                         goto failed;
3765                 }
3766                 /* init i2c buses */
3767                 if (!amdgpu_device_has_dc_support(adev))
3768                         amdgpu_atombios_i2c_init(adev);
3769         }
3770
3771 fence_driver_init:
3772         /* Fence driver */
3773         r = amdgpu_fence_driver_sw_init(adev);
3774         if (r) {
3775                 dev_err(adev->dev, "amdgpu_fence_driver_sw_init failed\n");
3776                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_FENCE_INIT_FAIL, 0, 0);
3777                 goto failed;
3778         }
3779
3780         /* init the mode config */
3781         drm_mode_config_init(adev_to_drm(adev));
3782
3783         r = amdgpu_device_ip_init(adev);
3784         if (r) {
3785                 /* failed in exclusive mode due to timeout */
3786                 if (amdgpu_sriov_vf(adev) &&
3787                     !amdgpu_sriov_runtime(adev) &&
3788                     amdgpu_virt_mmio_blocked(adev) &&
3789                     !amdgpu_virt_wait_reset(adev)) {
3790                         dev_err(adev->dev, "VF exclusive mode timeout\n");
3791                         /* Don't send request since VF is inactive. */
3792                         adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
3793                         adev->virt.ops = NULL;
3794                         r = -EAGAIN;
3795                         goto release_ras_con;
3796                 }
3797                 dev_err(adev->dev, "amdgpu_device_ip_init failed\n");
3798                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_INIT_FAIL, 0, 0);
3799                 goto release_ras_con;
3800         }
3801
3802         amdgpu_fence_driver_hw_init(adev);
3803
3804         dev_info(adev->dev,
3805                 "SE %d, SH per SE %d, CU per SH %d, active_cu_number %d\n",
3806                         adev->gfx.config.max_shader_engines,
3807                         adev->gfx.config.max_sh_per_se,
3808                         adev->gfx.config.max_cu_per_sh,
3809                         adev->gfx.cu_info.number);
3810
3811         adev->accel_working = true;
3812
3813         amdgpu_vm_check_compute_bug(adev);
3814
3815         /* Initialize the buffer migration limit. */
3816         if (amdgpu_moverate >= 0)
3817                 max_MBps = amdgpu_moverate;
3818         else
3819                 max_MBps = 8; /* Allow 8 MB/s. */
3820         /* Get a log2 for easy divisions. */
3821         adev->mm_stats.log2_max_MBps = ilog2(max(1u, max_MBps));
3822
3823         r = amdgpu_pm_sysfs_init(adev);
3824         if (r) {
3825                 adev->pm_sysfs_en = false;
3826                 DRM_ERROR("registering pm debugfs failed (%d).\n", r);
3827         } else
3828                 adev->pm_sysfs_en = true;
3829
3830         r = amdgpu_ucode_sysfs_init(adev);
3831         if (r) {
3832                 adev->ucode_sysfs_en = false;
3833                 DRM_ERROR("Creating firmware sysfs failed (%d).\n", r);
3834         } else
3835                 adev->ucode_sysfs_en = true;
3836
3837         r = amdgpu_psp_sysfs_init(adev);
3838         if (r) {
3839                 adev->psp_sysfs_en = false;
3840                 if (!amdgpu_sriov_vf(adev))
3841                         DRM_ERROR("Creating psp sysfs failed\n");
3842         } else
3843                 adev->psp_sysfs_en = true;
3844
3845         /*
3846          * Register gpu instance before amdgpu_device_enable_mgpu_fan_boost.
3847          * Otherwise the mgpu fan boost feature will be skipped because the
3848          * gpu instance count would be too low.
3849          */
3850         amdgpu_register_gpu_instance(adev);
3851
3852         /* enable clockgating etc. after ib tests, since some blocks require
3853          * explicit gating rather than handling it automatically.
3854          */
3855         if (!adev->gmc.xgmi.pending_reset) {
3856                 r = amdgpu_device_ip_late_init(adev);
3857                 if (r) {
3858                         dev_err(adev->dev, "amdgpu_device_ip_late_init failed\n");
3859                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_LATE_INIT_FAIL, 0, r);
3860                         goto release_ras_con;
3861                 }
3862                 /* must succeed. */
3863                 amdgpu_ras_resume(adev);
3864                 queue_delayed_work(system_wq, &adev->delayed_init_work,
3865                                    msecs_to_jiffies(AMDGPU_RESUME_MS));
3866         }
3867
3868         if (amdgpu_sriov_vf(adev))
3869                 flush_delayed_work(&adev->delayed_init_work);
3870
3871         r = sysfs_create_files(&adev->dev->kobj, amdgpu_dev_attributes);
3872         if (r)
3873                 dev_err(adev->dev, "Could not create amdgpu device attr\n");
3874
3875         if (IS_ENABLED(CONFIG_PERF_EVENTS)) {
3876                 r = amdgpu_pmu_init(adev);
3877                 if (r)
3878                         dev_err(adev->dev, "amdgpu_pmu_init failed\n");
3879         }
3879
3880         /* Keep the stored PCI config space at hand for restore after a sudden PCI error */
3881         if (amdgpu_device_cache_pci_state(adev->pdev))
3882                 pci_restore_state(pdev);
3883
3884         /* if we have more than one VGA card, then disable the amdgpu VGA resources */
3885         /* this will fail for cards that aren't VGA class devices, just
3886          * ignore it */
3887         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
3888                 vga_client_register(adev->pdev, amdgpu_device_vga_set_decode);
3889
3890         if (amdgpu_device_supports_px(ddev)) {
3891                 px = true;
3892                 vga_switcheroo_register_client(adev->pdev,
3893                                                &amdgpu_switcheroo_ops, px);
3894                 vga_switcheroo_init_domain_pm_ops(adev->dev, &adev->vga_pm_domain);
3895         }
3896
3897         if (adev->gmc.xgmi.pending_reset)
3898                 queue_delayed_work(system_wq, &mgpu_info.delayed_reset_work,
3899                                    msecs_to_jiffies(AMDGPU_RESUME_MS));
3900
3901         amdgpu_device_check_iommu_direct_map(adev);
3902
3903         return 0;
3904
3905 release_ras_con:
3906         amdgpu_release_ras_context(adev);
3907
3908 failed:
3909         amdgpu_vf_error_trans_all(adev);
3910
3911         return r;
3912 }
3913
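/*
 * amdgpu_device_unmap_mmio - tear down all CPU mappings of the device:
 * userspace mappings of the BARs as well as the kernel's own doorbell,
 * register and VRAM aperture mappings.
 */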
3914 static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev)
3915 {
3916
3917         /* Clear all CPU mappings pointing to this device */
3918         unmap_mapping_range(adev->ddev.anon_inode->i_mapping, 0, 0, 1);
3919
3920         /* Unmap all mapped bars - Doorbell, registers and VRAM */
3921         amdgpu_device_doorbell_fini(adev);
3922
3923         iounmap(adev->rmmio);
3924         adev->rmmio = NULL;
3925         if (adev->mman.aper_base_kaddr)
3926                 iounmap(adev->mman.aper_base_kaddr);
3927         adev->mman.aper_base_kaddr = NULL;
3928
3929         /* Memory manager related */
3930         if (!adev->gmc.xgmi.connected_to_cpu) {
3931                 arch_phys_wc_del(adev->gmc.vram_mtrr);
3932                 arch_io_free_memtype_wc(adev->gmc.aper_base, adev->gmc.aper_size);
3933         }
3934 }
3935
3936 /**
3937  * amdgpu_device_fini_hw - tear down the driver
3938  *
3939  * @adev: amdgpu_device pointer
3940  *
3941  * Tear down the driver info (all asics).
3942  * Called at driver shutdown.
3943  */
3944 void amdgpu_device_fini_hw(struct amdgpu_device *adev)
3945 {
3946         dev_info(adev->dev, "amdgpu: finishing device.\n");
3947         flush_delayed_work(&adev->delayed_init_work);
3948         adev->shutdown = true;
3949
3950         /* make sure IB tests have finished before entering exclusive mode
3951          * to avoid preemption on an IB test
3952          */
3953         if (amdgpu_sriov_vf(adev)) {
3954                 amdgpu_virt_request_full_gpu(adev, false);
3955                 amdgpu_virt_fini_data_exchange(adev);
3956         }
3957
3958         /* disable all interrupts */
3959         amdgpu_irq_disable_all(adev);
3960         if (adev->mode_info.mode_config_initialized) {
3961                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(adev)))
3962                         drm_helper_force_disable_all(adev_to_drm(adev));
3963                 else
3964                         drm_atomic_helper_shutdown(adev_to_drm(adev));
3965         }
3966         amdgpu_fence_driver_hw_fini(adev);
3967
3968         if (adev->mman.initialized) {
3969                 flush_delayed_work(&adev->mman.bdev.wq);
3970                 ttm_bo_lock_delayed_workqueue(&adev->mman.bdev);
3971         }
3972
3973         if (adev->pm_sysfs_en)
3974                 amdgpu_pm_sysfs_fini(adev);
3975         if (adev->ucode_sysfs_en)
3976                 amdgpu_ucode_sysfs_fini(adev);
3977         if (adev->psp_sysfs_en)
3978                 amdgpu_psp_sysfs_fini(adev);
3979         sysfs_remove_files(&adev->dev->kobj, amdgpu_dev_attributes);
3980
3981         /* RAS features must be disabled before hw fini */
3982         amdgpu_ras_pre_fini(adev);
3983
3984         amdgpu_device_ip_fini_early(adev);
3985
3986         amdgpu_irq_fini_hw(adev);
3987
3988         if (adev->mman.initialized)
3989                 ttm_device_clear_dma_mappings(&adev->mman.bdev);
3990
3991         amdgpu_gart_dummy_page_fini(adev);
3992
3993         amdgpu_device_unmap_mmio(adev);
3994
3995 }
3996
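/**
 * amdgpu_device_fini_sw - tear down the driver software state
 *
 * @adev: amdgpu_device pointer
 *
 * Frees the software state set up during init: the fence driver, IP block
 * software state, firmware, i2c buses, the BIOS copy and the reset domain.
 * Called after amdgpu_device_fini_hw() at driver teardown.
 */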
3997 void amdgpu_device_fini_sw(struct amdgpu_device *adev)
3998 {
3999         int idx;
4000
4001         amdgpu_fence_driver_sw_fini(adev);
4002         amdgpu_device_ip_fini(adev);
4003         release_firmware(adev->firmware.gpu_info_fw);
4004         adev->firmware.gpu_info_fw = NULL;
4005         adev->accel_working = false;
4006         dma_fence_put(rcu_dereference_protected(adev->gang_submit, true));
4007
4008         amdgpu_reset_fini(adev);
4009
4010         /* free i2c buses */
4011         if (!amdgpu_device_has_dc_support(adev))
4012                 amdgpu_i2c_fini(adev);
4013
4014         if (amdgpu_emu_mode != 1)
4015                 amdgpu_atombios_fini(adev);
4016
4017         kfree(adev->bios);
4018         adev->bios = NULL;
4019         if (amdgpu_device_supports_px(adev_to_drm(adev))) {
4020                 vga_switcheroo_unregister_client(adev->pdev);
4021                 vga_switcheroo_fini_domain_pm_ops(adev->dev);
4022         }
4023         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4024                 vga_client_unregister(adev->pdev);
4025
4026         if (drm_dev_enter(adev_to_drm(adev), &idx)) {
4027
4028                 iounmap(adev->rmmio);
4029                 adev->rmmio = NULL;
4030                 amdgpu_device_doorbell_fini(adev);
4031                 drm_dev_exit(idx);
4032         }
4033
4034         if (IS_ENABLED(CONFIG_PERF_EVENTS))
4035                 amdgpu_pmu_fini(adev);
4036         if (adev->mman.discovery_bin)
4037                 amdgpu_discovery_fini(adev);
4038
4039         amdgpu_reset_put_reset_domain(adev->reset_domain);
4040         adev->reset_domain = NULL;
4041
4042         kfree(adev->pci_state);
4043
4044 }
4045
4046 /**
4047  * amdgpu_device_evict_resources - evict device resources
4048  * @adev: amdgpu device object
4049  *
4050  * Evicts all ttm device resources (vram BOs, gart table) from the lru list
4051  * of the vram memory type. Mainly used for evicting device resources
4052  * at suspend time.
4053  *
4054  */
4055 static void amdgpu_device_evict_resources(struct amdgpu_device *adev)
4056 {
4057         /* No need to evict vram on APUs for suspend to ram or s2idle */
4058         if ((adev->in_s3 || adev->in_s0ix) && (adev->flags & AMD_IS_APU))
4059                 return;
4060
4061         if (amdgpu_ttm_evict_resources(adev, TTM_PL_VRAM))
4062                 DRM_WARN("evicting device resources failed\n");
4063
4064 }
4065
4066 /*
4067  * Suspend & resume.
4068  */
4069 /**
4070  * amdgpu_device_suspend - initiate device suspend
4071  *
4072  * @dev: drm dev pointer
4073  * @fbcon: notify the fbdev of suspend
4074  *
4075  * Puts the hw in the suspend state (all asics).
4076  * Returns 0 for success or an error on failure.
4077  * Called at driver suspend.
4078  */
4079 int amdgpu_device_suspend(struct drm_device *dev, bool fbcon)
4080 {
4081         struct amdgpu_device *adev = drm_to_adev(dev);
4082         int r = 0;
4083
4084         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4085                 return 0;
4086
4087         adev->in_suspend = true;
4088
4089         if (amdgpu_sriov_vf(adev)) {
4090                 amdgpu_virt_fini_data_exchange(adev);
4091                 r = amdgpu_virt_request_full_gpu(adev, false);
4092                 if (r)
4093                         return r;
4094         }
4095
4096         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D3))
4097                 DRM_WARN("smart shift update failed\n");
4098
4099         drm_kms_helper_poll_disable(dev);
4100
4101         if (fbcon)
4102                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(adev)->fb_helper, true);
4103
4104         cancel_delayed_work_sync(&adev->delayed_init_work);
4105
4106         amdgpu_ras_suspend(adev);
4107
4108         amdgpu_device_ip_suspend_phase1(adev);
4109
4110         if (!adev->in_s0ix)
4111                 amdgpu_amdkfd_suspend(adev, adev->in_runpm);
4112
4113         amdgpu_device_evict_resources(adev);
4114
4115         amdgpu_fence_driver_hw_fini(adev);
4116
4117         amdgpu_device_ip_suspend_phase2(adev);
4118
4119         if (amdgpu_sriov_vf(adev))
4120                 amdgpu_virt_release_full_gpu(adev, false);
4121
4122         return 0;
4123 }
4124
4125 /**
4126  * amdgpu_device_resume - initiate device resume
4127  *
4128  * @dev: drm dev pointer
4129  * @fbcon: notify the fbdev of resume
4130  *
4131  * Bring the hw back to operating state (all asics).
4132  * Returns 0 for success or an error on failure.
4133  * Called at driver resume.
4134  */
4135 int amdgpu_device_resume(struct drm_device *dev, bool fbcon)
4136 {
4137         struct amdgpu_device *adev = drm_to_adev(dev);
4138         int r = 0;
4139
4140         if (amdgpu_sriov_vf(adev)) {
4141                 r = amdgpu_virt_request_full_gpu(adev, true);
4142                 if (r)
4143                         return r;
4144         }
4145
4146         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4147                 return 0;
4148
4149         if (adev->in_s0ix)
4150                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D0Entry);
4151
4152         /* post card */
4153         if (amdgpu_device_need_post(adev)) {
4154                 r = amdgpu_device_asic_init(adev);
4155                 if (r)
4156                         dev_err(adev->dev, "amdgpu asic init failed\n");
4157         }
4158
4159         r = amdgpu_device_ip_resume(adev);
4160
4161         /* no matter what r is, we always need to properly release the full GPU */
4162         if (amdgpu_sriov_vf(adev)) {
4163                 amdgpu_virt_init_data_exchange(adev);
4164                 amdgpu_virt_release_full_gpu(adev, true);
4165         }
4166
4167         if (r) {
4168                 dev_err(adev->dev, "amdgpu_device_ip_resume failed (%d).\n", r);
4169                 return r;
4170         }
4171         amdgpu_fence_driver_hw_init(adev);
4172
4173         r = amdgpu_device_ip_late_init(adev);
4174         if (r)
4175                 return r;
4176
4177         queue_delayed_work(system_wq, &adev->delayed_init_work,
4178                            msecs_to_jiffies(AMDGPU_RESUME_MS));
4179
4180         if (!adev->in_s0ix) {
4181                 r = amdgpu_amdkfd_resume(adev, adev->in_runpm);
4182                 if (r)
4183                         return r;
4184         }
4185
4186         /* Make sure IB tests are flushed */
4187         flush_delayed_work(&adev->delayed_init_work);
4188
4189         if (fbcon)
4190                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(adev)->fb_helper, false);
4191
4192         drm_kms_helper_poll_enable(dev);
4193
4194         amdgpu_ras_resume(adev);
4195
4196         /*
4197          * Most of the connector probing functions try to acquire runtime pm
4198          * refs to ensure that the GPU is powered on when connector polling is
4199          * performed. Since we're calling this from a runtime PM callback,
4200          * trying to acquire rpm refs will cause us to deadlock.
4201          *
4202          * Since we're guaranteed to be holding the rpm lock, it's safe to
4203          * temporarily disable the rpm helpers so this doesn't deadlock us.
4204          */
4205 #ifdef CONFIG_PM
4206         dev->dev->power.disable_depth++;
4207 #endif
4208         if (!amdgpu_device_has_dc_support(adev))
4209                 drm_helper_hpd_irq_event(dev);
4210         else
4211                 drm_kms_helper_hotplug_event(dev);
4212 #ifdef CONFIG_PM
4213         dev->dev->power.disable_depth--;
4214 #endif
4215         adev->in_suspend = false;
4216
4217         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D0))
4218                 DRM_WARN("smart shift update failed\n");
4219
4220         return 0;
4221 }
4222
4223 /**
4224  * amdgpu_device_ip_check_soft_reset - did soft reset succeed
4225  *
4226  * @adev: amdgpu_device pointer
4227  *
4228  * The list of all the hardware IPs that make up the asic is walked and
4229  * the check_soft_reset callbacks are run.  check_soft_reset determines
4230  * if the asic is still hung or not.
4231  * Returns true if any of the IPs are still in a hung state, false if not.
4232  */
4233 static bool amdgpu_device_ip_check_soft_reset(struct amdgpu_device *adev)
4234 {
4235         int i;
4236         bool asic_hang = false;
4237
4238         if (amdgpu_sriov_vf(adev))
4239                 return true;
4240
4241         if (amdgpu_asic_need_full_reset(adev))
4242                 return true;
4243
4244         for (i = 0; i < adev->num_ip_blocks; i++) {
4245                 if (!adev->ip_blocks[i].status.valid)
4246                         continue;
4247                 if (adev->ip_blocks[i].version->funcs->check_soft_reset)
4248                         adev->ip_blocks[i].status.hang =
4249                                 adev->ip_blocks[i].version->funcs->check_soft_reset(adev);
4250                 if (adev->ip_blocks[i].status.hang) {
4251                         dev_info(adev->dev, "IP block:%s is hung!\n", adev->ip_blocks[i].version->funcs->name);
4252                         asic_hang = true;
4253                 }
4254         }
4255         return asic_hang;
4256 }
4257
4258 /**
4259  * amdgpu_device_ip_pre_soft_reset - prepare for soft reset
4260  *
4261  * @adev: amdgpu_device pointer
4262  *
4263  * The list of all the hardware IPs that make up the asic is walked and the
4264  * pre_soft_reset callbacks are run if the block is hung.  pre_soft_reset
4265  * handles any IP specific hardware or software state changes that are
4266  * necessary for a soft reset to succeed.
4267  * Returns 0 on success, negative error code on failure.
4268  */
4269 static int amdgpu_device_ip_pre_soft_reset(struct amdgpu_device *adev)
4270 {
4271         int i, r = 0;
4272
4273         for (i = 0; i < adev->num_ip_blocks; i++) {
4274                 if (!adev->ip_blocks[i].status.valid)
4275                         continue;
4276                 if (adev->ip_blocks[i].status.hang &&
4277                     adev->ip_blocks[i].version->funcs->pre_soft_reset) {
4278                         r = adev->ip_blocks[i].version->funcs->pre_soft_reset(adev);
4279                         if (r)
4280                                 return r;
4281                 }
4282         }
4283
4284         return 0;
4285 }
4286
4287 /**
4288  * amdgpu_device_ip_need_full_reset - check if a full asic reset is needed
4289  *
4290  * @adev: amdgpu_device pointer
4291  *
4292  * Some hardware IPs cannot be soft reset.  If they are hung, a full gpu
4293  * reset is necessary to recover.
4294  * Returns true if a full asic reset is required, false if not.
4295  */
4296 static bool amdgpu_device_ip_need_full_reset(struct amdgpu_device *adev)
4297 {
4298         int i;
4299
4300         if (amdgpu_asic_need_full_reset(adev))
4301                 return true;
4302
4303         for (i = 0; i < adev->num_ip_blocks; i++) {
4304                 if (!adev->ip_blocks[i].status.valid)
4305                         continue;
4306                 if ((adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) ||
4307                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) ||
4308                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_ACP) ||
4309                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE) ||
4310                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
4311                         if (adev->ip_blocks[i].status.hang) {
4312                                 dev_info(adev->dev, "Some blocks need full reset!\n");
4313                                 return true;
4314                         }
4315                 }
4316         }
4317         return false;
4318 }
4319
4320 /**
4321  * amdgpu_device_ip_soft_reset - do a soft reset
4322  *
4323  * @adev: amdgpu_device pointer
4324  *
4325  * The list of all the hardware IPs that make up the asic is walked and the
4326  * soft_reset callbacks are run if the block is hung.  soft_reset handles any
4327  * IP specific hardware or software state changes that are necessary to soft
4328  * reset the IP.
4329  * Returns 0 on success, negative error code on failure.
4330  */
4331 static int amdgpu_device_ip_soft_reset(struct amdgpu_device *adev)
4332 {
4333         int i, r = 0;
4334
4335         for (i = 0; i < adev->num_ip_blocks; i++) {
4336                 if (!adev->ip_blocks[i].status.valid)
4337                         continue;
4338                 if (adev->ip_blocks[i].status.hang &&
4339                     adev->ip_blocks[i].version->funcs->soft_reset) {
4340                         r = adev->ip_blocks[i].version->funcs->soft_reset(adev);
4341                         if (r)
4342                                 return r;
4343                 }
4344         }
4345
4346         return 0;
4347 }
4348
4349 /**
4350  * amdgpu_device_ip_post_soft_reset - clean up from soft reset
4351  *
4352  * @adev: amdgpu_device pointer
4353  *
4354  * The list of all the hardware IPs that make up the asic is walked and the
4355  * post_soft_reset callbacks are run if the asic was hung.  post_soft_reset
4356  * handles any IP specific hardware or software state changes that are
4357  * necessary after the IP has been soft reset.
4358  * Returns 0 on success, negative error code on failure.
4359  */
4360 static int amdgpu_device_ip_post_soft_reset(struct amdgpu_device *adev)
4361 {
4362         int i, r = 0;
4363
4364         for (i = 0; i < adev->num_ip_blocks; i++) {
4365                 if (!adev->ip_blocks[i].status.valid)
4366                         continue;
4367                 if (adev->ip_blocks[i].status.hang &&
4368                     adev->ip_blocks[i].version->funcs->post_soft_reset)
4369                         r = adev->ip_blocks[i].version->funcs->post_soft_reset(adev);
4370                 if (r)
4371                         return r;
4372         }
4373
4374         return 0;
4375 }
4376
4377 /**
4378  * amdgpu_device_recover_vram - Recover some VRAM contents
4379  *
4380  * @adev: amdgpu_device pointer
4381  *
4382  * Restores the contents of VRAM buffers from the shadows in GTT.  Used to
4383  * restore things like GPUVM page tables after a GPU reset where
4384  * the contents of VRAM might be lost.
4385  *
4386  * Returns:
4387  * 0 on success, negative error code on failure.
4388  */
4389 static int amdgpu_device_recover_vram(struct amdgpu_device *adev)
4390 {
4391         struct dma_fence *fence = NULL, *next = NULL;
4392         struct amdgpu_bo *shadow;
4393         struct amdgpu_bo_vm *vmbo;
4394         long r = 1, tmo;
4395
4396         if (amdgpu_sriov_runtime(adev))
4397                 tmo = msecs_to_jiffies(8000);
4398         else
4399                 tmo = msecs_to_jiffies(100);
4400
4401         dev_info(adev->dev, "recover vram bo from shadow start\n");
4402         mutex_lock(&adev->shadow_list_lock);
4403         list_for_each_entry(vmbo, &adev->shadow_list, shadow_list) {
4404                 shadow = &vmbo->bo;
4405                 /* No need to recover an evicted BO */
4406                 if (shadow->tbo.resource->mem_type != TTM_PL_TT ||
4407                     shadow->tbo.resource->start == AMDGPU_BO_INVALID_OFFSET ||
4408                     shadow->parent->tbo.resource->mem_type != TTM_PL_VRAM)
4409                         continue;
4410
4411                 r = amdgpu_bo_restore_shadow(shadow, &next);
4412                 if (r)
4413                         break;
4414
4415                 if (fence) {
4416                         tmo = dma_fence_wait_timeout(fence, false, tmo);
4417                         dma_fence_put(fence);
4418                         fence = next;
4419                         if (tmo == 0) {
4420                                 r = -ETIMEDOUT;
4421                                 break;
4422                         } else if (tmo < 0) {
4423                                 r = tmo;
4424                                 break;
4425                         }
4426                 } else {
4427                         fence = next;
4428                 }
4429         }
4430         mutex_unlock(&adev->shadow_list_lock);
4431
4432         if (fence)
4433                 tmo = dma_fence_wait_timeout(fence, false, tmo);
4434         dma_fence_put(fence);
4435
4436         if (r < 0 || tmo <= 0) {
4437                 dev_err(adev->dev, "recover vram bo from shadow failed, r is %ld, tmo is %ld\n", r, tmo);
4438                 return -EIO;
4439         }
4440
4441         dev_info(adev->dev, "recover vram bo from shadow done\n");
4442         return 0;
4443 }
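/*
 * Background note (hedged): the entries on adev->shadow_list walked above
 * come from BOs created with the AMDGPU_GEM_CREATE_SHADOW flag, which pairs
 * a VRAM buffer (e.g. a GPUVM page table) with a GTT copy, roughly:
 *
 *   bp.flags |= AMDGPU_GEM_CREATE_SHADOW;    (ask for a GTT shadow)
 *   r = amdgpu_bo_create_vm(adev, &bp, &vmbo);
 *
 * After a reset, amdgpu_bo_restore_shadow() then copies GTT -> VRAM for
 * each pair, which is what this function schedules and waits for.
 */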
4444
4445
4446 /**
4447  * amdgpu_device_reset_sriov - reset ASIC for SR-IOV vf
4448  *
4449  * @adev: amdgpu_device pointer
4450  * @from_hypervisor: request from hypervisor
4451  *
4452  * Do a VF FLR and reinitialize the ASIC.
4453  * Returns 0 on success, negative error code on failure.
4454  */
4455 static int amdgpu_device_reset_sriov(struct amdgpu_device *adev,
4456                                      bool from_hypervisor)
4457 {
4458         int r;
4459         struct amdgpu_hive_info *hive = NULL;
4460         int retry_limit = 0;
4461
4462 retry:
4463         amdgpu_amdkfd_pre_reset(adev);
4464
4465         if (from_hypervisor)
4466                 r = amdgpu_virt_request_full_gpu(adev, true);
4467         else
4468                 r = amdgpu_virt_reset_gpu(adev);
4469         if (r)
4470                 return r;
4471
4472         /* Resume IP prior to SMC */
4473         r = amdgpu_device_ip_reinit_early_sriov(adev);
4474         if (r)
4475                 goto error;
4476
4477         amdgpu_virt_init_data_exchange(adev);
4478
4479         r = amdgpu_device_fw_loading(adev);
4480         if (r)
4481                 return r;
4482
4483         /* now we are okay to resume SMC/CP/SDMA */
4484         r = amdgpu_device_ip_reinit_late_sriov(adev);
4485         if (r)
4486                 goto error;
4487
4488         hive = amdgpu_get_xgmi_hive(adev);
4489         /* Update PSP FW topology after reset */
4490         if (hive && adev->gmc.xgmi.num_physical_nodes > 1)
4491                 r = amdgpu_xgmi_update_topology(hive, adev);
4492
4493         if (hive)
4494                 amdgpu_put_xgmi_hive(hive);
4495
4496         if (!r) {
4497                 amdgpu_irq_gpu_reset_resume_helper(adev);
4498                 r = amdgpu_ib_ring_tests(adev);
4499
4500                 amdgpu_amdkfd_post_reset(adev);
4501         }
4502
4503 error:
4504         if (!r && adev->virt.gim_feature & AMDGIM_FEATURE_GIM_FLR_VRAMLOST) {
4505                 amdgpu_inc_vram_lost(adev);
4506                 r = amdgpu_device_recover_vram(adev);
4507         }
4508         amdgpu_virt_release_full_gpu(adev, true);
4509
4510         if (AMDGPU_RETRY_SRIOV_RESET(r)) {
4511                 if (retry_limit < AMDGPU_MAX_RETRY_LIMIT) {
4512                         retry_limit++;
4513                         goto retry;
4514                 } else
4515                         DRM_ERROR("GPU reset retry is beyond the retry limit\n");
4516         }
4517
4518         return r;
4519 }
4520
4521 /**
4522  * amdgpu_device_has_job_running - check if there is any job in the pending list
4523  *
4524  * @adev: amdgpu_device pointer
4525  *
4526  * Check whether any job is still on a ring's scheduler pending list.
4527  */
4528 bool amdgpu_device_has_job_running(struct amdgpu_device *adev)
4529 {
4530         int i;
4531         struct drm_sched_job *job;
4532
4533         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
4534                 struct amdgpu_ring *ring = adev->rings[i];
4535
4536                 if (!ring || !ring->sched.thread)
4537                         continue;
4538
4539                 spin_lock(&ring->sched.job_list_lock);
4540                 job = list_first_entry_or_null(&ring->sched.pending_list,
4541                                                struct drm_sched_job, list);
4542                 spin_unlock(&ring->sched.job_list_lock);
4543                 if (job)
4544                         return true;
4545         }
4546         return false;
4547 }
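/*
 * Usage sketch (hedged; actual callers may differ): runtime power
 * management can use this check to refuse to idle the GPU while work is
 * still queued, e.g.:
 *
 *   if (amdgpu_device_has_job_running(adev))
 *           return -EBUSY;   (keep the device awake)
 */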
4548
4549 /**
4550  * amdgpu_device_should_recover_gpu - check if we should try GPU recovery
4551  *
4552  * @adev: amdgpu_device pointer
4553  *
4554  * Check amdgpu_gpu_recovery and SRIOV status to see if we should try to recover
4555  * a hung GPU.
4556  */
4557 bool amdgpu_device_should_recover_gpu(struct amdgpu_device *adev)
4558 {
4559
4560         if (amdgpu_gpu_recovery == 0)
4561                 goto disabled;
4562
4563         if (!amdgpu_device_ip_check_soft_reset(adev)) {
4564                 dev_info(adev->dev,"Timeout, but no hardware hang detected.\n");
4565                 return false;
4566         }
4567
4568         if (amdgpu_sriov_vf(adev))
4569                 return true;
4570
4571         if (amdgpu_gpu_recovery == -1) {
4572                 switch (adev->asic_type) {
4573 #ifdef CONFIG_DRM_AMDGPU_SI
4574                 case CHIP_VERDE:
4575                 case CHIP_TAHITI:
4576                 case CHIP_PITCAIRN:
4577                 case CHIP_OLAND:
4578                 case CHIP_HAINAN:
4579 #endif
4580 #ifdef CONFIG_DRM_AMDGPU_CIK
4581                 case CHIP_KAVERI:
4582                 case CHIP_KABINI:
4583                 case CHIP_MULLINS:
4584 #endif
4585                 case CHIP_CARRIZO:
4586                 case CHIP_STONEY:
4587                 case CHIP_CYAN_SKILLFISH:
4588                         goto disabled;
4589                 default:
4590                         break;
4591                 }
4592         }
4593
4594         return true;
4595
4596 disabled:
4597         dev_info(adev->dev, "GPU recovery disabled.\n");
4598         return false;
4599 }
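/*
 * Usage sketch (hedged): a ring timeout handler would typically gate
 * recovery on this check before committing to a reset, roughly:
 *
 *   if (amdgpu_device_should_recover_gpu(ring->adev))
 *           r = amdgpu_device_gpu_recover(ring->adev, job, &reset_context);
 *   else
 *           drm_sched_suspend_timeout(&ring->sched);
 */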
4600
4601 int amdgpu_device_mode1_reset(struct amdgpu_device *adev)
4602 {
4603         u32 i;
4604         int ret = 0;
4605
4606         amdgpu_atombios_scratch_regs_engine_hung(adev, true);
4607
4608         dev_info(adev->dev, "GPU mode1 reset\n");
4609
4610         /* disable BM */
4611         pci_clear_master(adev->pdev);
4612
4613         amdgpu_device_cache_pci_state(adev->pdev);
4614
4615         if (amdgpu_dpm_is_mode1_reset_supported(adev)) {
4616                 dev_info(adev->dev, "GPU smu mode1 reset\n");
4617                 ret = amdgpu_dpm_mode1_reset(adev);
4618         } else {
4619                 dev_info(adev->dev, "GPU psp mode1 reset\n");
4620                 ret = psp_gpu_reset(adev);
4621         }
4622
4623         if (ret)
4624                 dev_err(adev->dev, "GPU mode1 reset failed\n");
4625
4626         amdgpu_device_load_pci_state(adev->pdev);
4627
4628         /* wait for asic to come out of reset */
4629         for (i = 0; i < adev->usec_timeout; i++) {
4630                 u32 memsize = adev->nbio.funcs->get_memsize(adev);
4631
4632                 if (memsize != 0xffffffff)
4633                         break;
4634                 udelay(1);
4635         }
4636
4637         amdgpu_atombios_scratch_regs_engine_hung(adev, false);
4638         return ret;
4639 }
4640
4641 int amdgpu_device_pre_asic_reset(struct amdgpu_device *adev,
4642                                  struct amdgpu_reset_context *reset_context)
4643 {
4644         int i, r = 0;
4645         struct amdgpu_job *job = NULL;
4646         bool need_full_reset =
4647                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4648
4649         if (reset_context->reset_req_dev == adev)
4650                 job = reset_context->job;
4651
4652         if (amdgpu_sriov_vf(adev)) {
4653                 /* stop the data exchange thread */
4654                 amdgpu_virt_fini_data_exchange(adev);
4655         }
4656
4657         amdgpu_fence_driver_isr_toggle(adev, true);
4658
4659         /* block all schedulers and reset given job's ring */
4660         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
4661                 struct amdgpu_ring *ring = adev->rings[i];
4662
4663                 if (!ring || !ring->sched.thread)
4664                         continue;
4665
4666                 /* Clear job fences from the fence driver to avoid force_completion;
4667                  * leave NULL and vm flush fences in the fence driver */
4668                 amdgpu_fence_driver_clear_job_fences(ring);
4669
4670                 /* after all hw jobs are reset, hw fence is meaningless, so force_completion */
4671                 amdgpu_fence_driver_force_completion(ring);
4672         }
4673
4674         amdgpu_fence_driver_isr_toggle(adev, false);
4675
4676         if (job && job->vm)
4677                 drm_sched_increase_karma(&job->base);
4678
4679         r = amdgpu_reset_prepare_hwcontext(adev, reset_context);
4680         /* If reset handler not implemented, continue; otherwise return */
4681         if (r == -ENOSYS)
4682                 r = 0;
4683         else
4684                 return r;
4685
4686         /* Don't suspend on bare metal if we are not going to HW reset the ASIC */
4687         if (!amdgpu_sriov_vf(adev)) {
4688
4689                 if (!need_full_reset)
4690                         need_full_reset = amdgpu_device_ip_need_full_reset(adev);
4691
4692                 if (!need_full_reset && amdgpu_gpu_recovery) {
4693                         amdgpu_device_ip_pre_soft_reset(adev);
4694                         r = amdgpu_device_ip_soft_reset(adev);
4695                         amdgpu_device_ip_post_soft_reset(adev);
4696                         if (r || amdgpu_device_ip_check_soft_reset(adev)) {
4697                                 dev_info(adev->dev, "soft reset failed, will fallback to full reset!\n");
4698                                 need_full_reset = true;
4699                         }
4700                 }
4701
4702                 if (need_full_reset) {
4703                         r = amdgpu_device_ip_suspend(adev);
4704                         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4705                 } else {
4706                         clear_bit(AMDGPU_NEED_FULL_RESET,
4707                                   &reset_context->flags);
4708                 }
4709         }
4710
4711         return r;
4712 }
4713
4714 static int amdgpu_reset_reg_dumps(struct amdgpu_device *adev)
4715 {
4716         int i;
4717
4718         lockdep_assert_held(&adev->reset_domain->sem);
4719
4720         for (i = 0; i < adev->num_regs; i++) {
4721                 adev->reset_dump_reg_value[i] = RREG32(adev->reset_dump_reg_list[i]);
4722                 trace_amdgpu_reset_reg_dumps(adev->reset_dump_reg_list[i],
4723                                              adev->reset_dump_reg_value[i]);
4724         }
4725
4726         return 0;
4727 }
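/*
 * Note (an assumption about the wider driver): adev->reset_dump_reg_list is
 * normally populated from userspace via the amdgpu_reset_dump_register_list
 * debugfs file, so the snapshot taken above covers only registers that were
 * explicitly requested before the reset.
 */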
4728
4729 #ifdef CONFIG_DEV_COREDUMP
4730 static ssize_t amdgpu_devcoredump_read(char *buffer, loff_t offset,
4731                 size_t count, void *data, size_t datalen)
4732 {
4733         struct drm_printer p;
4734         struct amdgpu_device *adev = data;
4735         struct drm_print_iterator iter;
4736         int i;
4737
4738         iter.data = buffer;
4739         iter.offset = 0;
4740         iter.start = offset;
4741         iter.remain = count;
4742
4743         p = drm_coredump_printer(&iter);
4744
4745         drm_printf(&p, "**** AMDGPU Device Coredump ****\n");
4746         drm_printf(&p, "kernel: " UTS_RELEASE "\n");
4747         drm_printf(&p, "module: " KBUILD_MODNAME "\n");
4748         drm_printf(&p, "time: %lld.%09ld\n", adev->reset_time.tv_sec, adev->reset_time.tv_nsec);
4749         if (adev->reset_task_info.pid)
4750                 drm_printf(&p, "process_name: %s PID: %d\n",
4751                            adev->reset_task_info.process_name,
4752                            adev->reset_task_info.pid);
4753
4754         if (adev->reset_vram_lost)
4755                 drm_printf(&p, "VRAM is lost due to GPU reset!\n");
4756         if (adev->num_regs) {
4757                 drm_printf(&p, "AMDGPU register dumps:\nOffset:     Value:\n");
4758
4759                 for (i = 0; i < adev->num_regs; i++)
4760                         drm_printf(&p, "0x%08x: 0x%08x\n",
4761                                    adev->reset_dump_reg_list[i],
4762                                    adev->reset_dump_reg_value[i]);
4763         }
4764
4765         return count - iter.remain;
4766 }
4767
4768 static void amdgpu_devcoredump_free(void *data)
4769 {
4770 }
4771
4772 static void amdgpu_reset_capture_coredumpm(struct amdgpu_device *adev)
4773 {
4774         struct drm_device *dev = adev_to_drm(adev);
4775
4776         ktime_get_ts64(&adev->reset_time);
4777         dev_coredumpm(dev->dev, THIS_MODULE, adev, 0, GFP_KERNEL,
4778                       amdgpu_devcoredump_read, amdgpu_devcoredump_free);
4779 }
4780 #endif
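/*
 * Note (hedged): the dump assembled in amdgpu_devcoredump_read() is handed
 * to the devcoredump framework, so userspace can typically retrieve it from
 * /sys/class/devcoredump/devcd<N>/data after a reset; writing to that file
 * discards the dump.
 */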
4781
4782 int amdgpu_do_asic_reset(struct list_head *device_list_handle,
4783                          struct amdgpu_reset_context *reset_context)
4784 {
4785         struct amdgpu_device *tmp_adev = NULL;
4786         bool need_full_reset, skip_hw_reset, vram_lost = false;
4787         int r = 0;
4788         bool gpu_reset_for_dev_remove = false;
4789
4790         /* Try reset handler method first */
4791         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
4792                                     reset_list);
4793         amdgpu_reset_reg_dumps(tmp_adev);
4794
4795         reset_context->reset_device_list = device_list_handle;
4796         r = amdgpu_reset_perform_reset(tmp_adev, reset_context);
4797         /* If reset handler not implemented, continue; otherwise return */
4798         if (r == -ENOSYS)
4799                 r = 0;
4800         else
4801                 return r;
4802
4803         /* Reset handler not implemented, use the default method */
4804         need_full_reset =
4805                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4806         skip_hw_reset = test_bit(AMDGPU_SKIP_HW_RESET, &reset_context->flags);
4807
4808         gpu_reset_for_dev_remove =
4809                 test_bit(AMDGPU_RESET_FOR_DEVICE_REMOVE, &reset_context->flags) &&
4810                         test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4811
4812         /*
4813          * ASIC reset has to be done on all XGMI hive nodes ASAP
4814          * to allow proper link negotiation in FW (within 1 sec)
4815          */
4816         if (!skip_hw_reset && need_full_reset) {
4817                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4818                         /* For XGMI run all resets in parallel to speed up the process */
4819                         if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
4820                                 tmp_adev->gmc.xgmi.pending_reset = false;
4821                                 if (!queue_work(system_unbound_wq, &tmp_adev->xgmi_reset_work))
4822                                         r = -EALREADY;
4823                         } else
4824                                 r = amdgpu_asic_reset(tmp_adev);
4825
4826                         if (r) {
4827                                 dev_err(tmp_adev->dev, "ASIC reset failed with error, %d for drm dev, %s",
4828                                          r, adev_to_drm(tmp_adev)->unique);
4829                                 break;
4830                         }
4831                 }
4832
4833                 /* For XGMI wait for all resets to complete before proceeding */
4834                 if (!r) {
4835                         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4836                                 if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
4837                                         flush_work(&tmp_adev->xgmi_reset_work);
4838                                         r = tmp_adev->asic_reset_res;
4839                                         if (r)
4840                                                 break;
4841                                 }
4842                         }
4843                 }
4844         }
4845
4846         if (!r && amdgpu_ras_intr_triggered()) {
4847                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4848                         if (tmp_adev->mmhub.ras && tmp_adev->mmhub.ras->ras_block.hw_ops &&
4849                             tmp_adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count)
4850                                 tmp_adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count(tmp_adev);
4851                 }
4852
4853                 amdgpu_ras_intr_cleared();
4854         }
4855
4856         /* Since the mode1 reset affects base ip blocks, the
4857          * phase1 ip blocks need to be resumed. Otherwise there
4858          * will be a BIOS signature error and the psp bootloader
4859          * can't load the kdb the next time the amdgpu driver loads.
4860          */
4861         if (gpu_reset_for_dev_remove) {
4862                 list_for_each_entry(tmp_adev, device_list_handle, reset_list)
4863                         amdgpu_device_ip_resume_phase1(tmp_adev);
4864
4865                 goto end;
4866         }
4867
4868         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4869                 if (need_full_reset) {
4870                         /* post card */
4871                         r = amdgpu_device_asic_init(tmp_adev);
4872                         if (r) {
4873                                 dev_warn(tmp_adev->dev, "asic atom init failed!\n");
4874                         } else {
4875                                 dev_info(tmp_adev->dev, "GPU reset succeeded, trying to resume\n");
4876                                 r = amdgpu_amdkfd_resume_iommu(tmp_adev);
4877                                 if (r)
4878                                         goto out;
4879
4880                                 r = amdgpu_device_ip_resume_phase1(tmp_adev);
4881                                 if (r)
4882                                         goto out;
4883
4884                                 vram_lost = amdgpu_device_check_vram_lost(tmp_adev);
4885 #ifdef CONFIG_DEV_COREDUMP
4886                                 tmp_adev->reset_vram_lost = vram_lost;
4887                                 memset(&tmp_adev->reset_task_info, 0,
4888                                                 sizeof(tmp_adev->reset_task_info));
4889                                 if (reset_context->job && reset_context->job->vm)
4890                                         tmp_adev->reset_task_info =
4891                                                 reset_context->job->vm->task_info;
4892                                 amdgpu_reset_capture_coredumpm(tmp_adev);
4893 #endif
4894                                 if (vram_lost) {
4895                                         DRM_INFO("VRAM is lost due to GPU reset!\n");
4896                                         amdgpu_inc_vram_lost(tmp_adev);
4897                                 }
4898
4899                                 r = amdgpu_device_fw_loading(tmp_adev);
4900                                 if (r)
4901                                         return r;
4902
4903                                 r = amdgpu_device_ip_resume_phase2(tmp_adev);
4904                                 if (r)
4905                                         goto out;
4906
4907                                 if (vram_lost)
4908                                         amdgpu_device_fill_reset_magic(tmp_adev);
4909
4910                                 /*
4911                                  * Add this ASIC back as tracked now that the
4912                                  * reset has completed successfully.
4913                                  */
4914                                 amdgpu_register_gpu_instance(tmp_adev);
4915
4916                                 if (!reset_context->hive &&
4917                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
4918                                         amdgpu_xgmi_add_device(tmp_adev);
4919
4920                                 r = amdgpu_device_ip_late_init(tmp_adev);
4921                                 if (r)
4922                                         goto out;
4923
4924                                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(tmp_adev)->fb_helper, false);
4925
4926                                 /*
4927                                  * The GPU enters a bad state once the number
4928                                  * of faulty pages flagged by ECC reaches the
4929                                  * threshold, and RAS recovery is scheduled
4930                                  * next. So check here whether the bad page
4931                                  * threshold has indeed been exceeded; if so,
4932                                  * abort recovery and remind the user to retire
4933                                  * this GPU or set a bigger bad_page_threshold
4934                                  * value before probing the driver again.
4935                                  */
4936                                 if (!amdgpu_ras_eeprom_check_err_threshold(tmp_adev)) {
4937                                         /* must succeed. */
4938                                         amdgpu_ras_resume(tmp_adev);
4939                                 } else {
4940                                         r = -EINVAL;
4941                                         goto out;
4942                                 }
4943
4944                                 /* Update PSP FW topology after reset */
4945                                 if (reset_context->hive &&
4946                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
4947                                         r = amdgpu_xgmi_update_topology(
4948                                                 reset_context->hive, tmp_adev);
4949                         }
4950                 }
4951
4952 out:
4953                 if (!r) {
4954                         amdgpu_irq_gpu_reset_resume_helper(tmp_adev);
4955                         r = amdgpu_ib_ring_tests(tmp_adev);
4956                         if (r) {
4957                                 dev_err(tmp_adev->dev, "ib ring test failed (%d).\n", r);
4958                                 need_full_reset = true;
4959                                 r = -EAGAIN;
4960                                 goto end;
4961                         }
4962                 }
4963
4964                 if (!r)
4965                         r = amdgpu_device_recover_vram(tmp_adev);
4966                 else
4967                         tmp_adev->asic_reset_res = r;
4968         }
4969
4970 end:
4971         if (need_full_reset)
4972                 set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4973         else
4974                 clear_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4975         return r;
4976 }
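/*
 * Caller sketch (illustrative only; setup beyond the fields used above is
 * an assumption): a minimal single-device full reset could be requested as:
 *
 *   struct amdgpu_reset_context reset_context;
 *   LIST_HEAD(device_list);
 *
 *   memset(&reset_context, 0, sizeof(reset_context));
 *   reset_context.reset_req_dev = adev;
 *   set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
 *   list_add_tail(&adev->reset_list, &device_list);
 *   r = amdgpu_do_asic_reset(&device_list, &reset_context);
 */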
4977
4978 static void amdgpu_device_set_mp1_state(struct amdgpu_device *adev)
4979 {
4980
4981         switch (amdgpu_asic_reset_method(adev)) {
4982         case AMD_RESET_METHOD_MODE1:
4983                 adev->mp1_state = PP_MP1_STATE_SHUTDOWN;
4984                 break;
4985         case AMD_RESET_METHOD_MODE2:
4986                 adev->mp1_state = PP_MP1_STATE_RESET;
4987                 break;
4988         default:
4989                 adev->mp1_state = PP_MP1_STATE_NONE;
4990                 break;
4991         }
4992 }
4993
4994 static void amdgpu_device_unset_mp1_state(struct amdgpu_device *adev)
4995 {
4996         amdgpu_vf_error_trans_all(adev);
4997         adev->mp1_state = PP_MP1_STATE_NONE;
4998 }
4999
5000 static void amdgpu_device_resume_display_audio(struct amdgpu_device *adev)
5001 {
5002         struct pci_dev *p = NULL;
5003
5004         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5005                         adev->pdev->bus->number, 1);
5006         if (p) {
5007                 pm_runtime_enable(&(p->dev));
5008                 pm_runtime_resume(&(p->dev));
5009         }
5010 }
5011
5012 static int amdgpu_device_suspend_display_audio(struct amdgpu_device *adev)
5013 {
5014         enum amd_reset_method reset_method;
5015         struct pci_dev *p = NULL;
5016         u64 expires;
5017
5018         /*
5019          * For now, only BACO and mode1 reset are confirmed
5020          * to suffer from the audio issue if not properly suspended.
5021          */
5022         reset_method = amdgpu_asic_reset_method(adev);
5023         if ((reset_method != AMD_RESET_METHOD_BACO) &&
5024              (reset_method != AMD_RESET_METHOD_MODE1))
5025                 return -EINVAL;
5026
5027         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5028                         adev->pdev->bus->number, 1);
5029         if (!p)
5030                 return -ENODEV;
5031
5032         expires = pm_runtime_autosuspend_expiration(&(p->dev));
5033         if (!expires)
5034                 /*
5035                  * If we cannot get the audio device autosuspend delay,
5036                  * a fixed 4s interval is used. Since 3s is the audio
5037                  * controller's default autosuspend delay, the 4s used
5038                  * here is guaranteed to cover it.
5039                  */
5040                 expires = ktime_get_mono_fast_ns() + NSEC_PER_SEC * 4ULL;
5041
5042         while (!pm_runtime_status_suspended(&(p->dev))) {
5043                 if (!pm_runtime_suspend(&(p->dev)))
5044                         break;
5045
5046                 if (expires < ktime_get_mono_fast_ns()) {
5047                         dev_warn(adev->dev, "failed to suspend display audio\n");
5048                         /* TODO: abort the succeeding gpu reset? */
5049                         return -ETIMEDOUT;
5050                 }
5051         }
5052
5053         pm_runtime_disable(&(p->dev));
5054
5055         return 0;
5056 }
5057
5058 static void amdgpu_device_recheck_guilty_jobs(
5059         struct amdgpu_device *adev, struct list_head *device_list_handle,
5060         struct amdgpu_reset_context *reset_context)
5061 {
5062         int i, r = 0;
5063
5064         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5065                 struct amdgpu_ring *ring = adev->rings[i];
5066                 int ret = 0;
5067                 struct drm_sched_job *s_job;
5068
5069                 if (!ring || !ring->sched.thread)
5070                         continue;
5071
5072                 s_job = list_first_entry_or_null(&ring->sched.pending_list,
5073                                 struct drm_sched_job, list);
5074                 if (s_job == NULL)
5075                         continue;
5076
5077                 /* Clear the job's guilty flag and rely on the following step to decide the real one */
5078                 drm_sched_reset_karma(s_job);
5079                 drm_sched_resubmit_jobs_ext(&ring->sched, 1);
5080
5081                 if (!s_job->s_fence->parent) {
5082                         DRM_WARN("Failed to get a HW fence for job!");
5083                         continue;
5084                 }
5085
5086                 ret = dma_fence_wait_timeout(s_job->s_fence->parent, false, ring->sched.timeout);
5087                 if (ret == 0) { /* timeout */
5088                         DRM_ERROR("Found the real bad job! ring:%s, job_id:%llx\n",
5089                                                 ring->sched.name, s_job->id);
5090
5092                         amdgpu_fence_driver_isr_toggle(adev, true);
5093
5094                         /* Clear this failed job from fence array */
5095                         amdgpu_fence_driver_clear_job_fences(ring);
5096
5097                         amdgpu_fence_driver_isr_toggle(adev, false);
5098
5099                         /* Since the job won't signal and we go for
5100                          * another resubmit, drop this parent pointer
5101                          */
5102                         dma_fence_put(s_job->s_fence->parent);
5103                         s_job->s_fence->parent = NULL;
5104
5105                         /* set guilty */
5106                         drm_sched_increase_karma(s_job);
5107                         amdgpu_reset_prepare_hwcontext(adev, reset_context);
5108 retry:
5109                         /* do hw reset */
5110                         if (amdgpu_sriov_vf(adev)) {
5111                                 amdgpu_virt_fini_data_exchange(adev);
5112                                 r = amdgpu_device_reset_sriov(adev, false);
5113                                 if (r)
5114                                         adev->asic_reset_res = r;
5115                         } else {
5116                                 clear_bit(AMDGPU_SKIP_HW_RESET,
5117                                           &reset_context->flags);
5118                                 r = amdgpu_do_asic_reset(device_list_handle,
5119                                                          reset_context);
5120                                 if (r == -EAGAIN)
5121                                         goto retry;
5122                         }
5123
5124                         /*
5125                          * add reset counter so that the following
5126                          * resubmitted job could flush vmid
5127                          */
5128                         atomic_inc(&adev->gpu_reset_counter);
5129                         continue;
5130                 }
5131
5132                 /* got the hw fence, signal finished fence */
5133                 atomic_dec(ring->sched.score);
5134                 dma_fence_get(&s_job->s_fence->finished);
5135                 dma_fence_signal(&s_job->s_fence->finished);
5136                 dma_fence_put(&s_job->s_fence->finished);
5137
5138                 /* remove node from list and free the job */
5139                 spin_lock(&ring->sched.job_list_lock);
5140                 list_del_init(&s_job->list);
5141                 spin_unlock(&ring->sched.job_list_lock);
5142                 ring->sched.ops->free_job(s_job);
5143         }
5144 }
5145
5146 static inline void amdgpu_device_stop_pending_resets(struct amdgpu_device *adev)
5147 {
5148         struct amdgpu_ras *con = amdgpu_ras_get_context(adev);
5149
5150 #if defined(CONFIG_DEBUG_FS)
5151         if (!amdgpu_sriov_vf(adev))
5152                 cancel_work(&adev->reset_work);
5153 #endif
5154
5155         if (adev->kfd.dev)
5156                 cancel_work(&adev->kfd.reset_work);
5157
5158         if (amdgpu_sriov_vf(adev))
5159                 cancel_work(&adev->virt.flr_work);
5160
5161         if (con && adev->ras_enabled)
5162                 cancel_work(&con->recovery_work);
5163
5164 }
5165
5166
5167 /**
5168  * amdgpu_device_gpu_recover - reset the asic and recover scheduler
5169  *
5170  * @adev: amdgpu_device pointer
5171  * @job: which job triggered the hang
5172  * @reset_context: amdgpu reset context pointer
5173  * Attempt to reset the GPU if it has hung (all asics).
5174  * Attempt to do a soft reset or a full reset and reinitialize the ASIC.
5175  * Returns 0 for success or an error on failure.
5176  */
5178 int amdgpu_device_gpu_recover(struct amdgpu_device *adev,
5179                               struct amdgpu_job *job,
5180                               struct amdgpu_reset_context *reset_context)
5181 {
5182         struct list_head device_list, *device_list_handle =  NULL;
5183         bool job_signaled = false;
5184         struct amdgpu_hive_info *hive = NULL;
5185         struct amdgpu_device *tmp_adev = NULL;
5186         int i, r = 0;
5187         bool need_emergency_restart = false;
5188         bool audio_suspended = false;
5189         int tmp_vram_lost_counter;
5190         bool gpu_reset_for_dev_remove = false;
5191
5192         gpu_reset_for_dev_remove =
5193                         test_bit(AMDGPU_RESET_FOR_DEVICE_REMOVE, &reset_context->flags) &&
5194                                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5195
5196         /*
5197          * Special case: RAS triggered and full reset isn't supported
5198          */
5199         need_emergency_restart = amdgpu_ras_need_emergency_restart(adev);
5200
5201         /*
5202          * Flush RAM to disk so that after reboot
5203          * the user can read the log and see why the system rebooted.
5204          */
5205         if (need_emergency_restart && amdgpu_ras_get_context(adev)->reboot) {
5206                 DRM_WARN("Emergency reboot.");
5207
5208                 ksys_sync_helper();
5209                 emergency_restart();
5210         }
5211
5212         dev_info(adev->dev, "GPU %s begin!\n",
5213                 need_emergency_restart ? "jobs stop" : "reset");
5214
5215         if (!amdgpu_sriov_vf(adev))
5216                 hive = amdgpu_get_xgmi_hive(adev);
5217         if (hive)
5218                 mutex_lock(&hive->hive_lock);
5219
5220         reset_context->job = job;
5221         reset_context->hive = hive;
5222         /*
5223          * Build list of devices to reset.
5224          * In case we are in XGMI hive mode, resort the device list
5225          * to put adev in the 1st position.
5226          */
5227         INIT_LIST_HEAD(&device_list);
5228         if (!amdgpu_sriov_vf(adev) && (adev->gmc.xgmi.num_physical_nodes > 1)) {
5229                 list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head) {
5230                         list_add_tail(&tmp_adev->reset_list, &device_list);
5231                         if (gpu_reset_for_dev_remove && adev->shutdown)
5232                                 tmp_adev->shutdown = true;
5233                 }
5234                 if (!list_is_first(&adev->reset_list, &device_list))
5235                         list_rotate_to_front(&adev->reset_list, &device_list);
5236                 device_list_handle = &device_list;
5237         } else {
5238                 list_add_tail(&adev->reset_list, &device_list);
5239                 device_list_handle = &device_list;
5240         }
5241
5242         /* We need to lock reset domain only once both for XGMI and single device */
5243         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5244                                     reset_list);
5245         amdgpu_device_lock_reset_domain(tmp_adev->reset_domain);
5246
5247         /* block all schedulers and reset given job's ring */
5248         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5249
5250                 amdgpu_device_set_mp1_state(tmp_adev);
5251
5252                 /*
5253                  * Try to put the audio codec into suspend state
5254                  * before the gpu reset starts.
5255                  *
5256                  * The power domain of the graphics device is
5257                  * shared with the AZ power domain. Without this,
5258                  * we may change the audio hardware from behind
5259                  * the audio driver's back and trigger some
5260                  * audio codec errors.
5261                  */
5262                 if (!amdgpu_device_suspend_display_audio(tmp_adev))
5263                         audio_suspended = true;
5264
5265                 amdgpu_ras_set_error_query_ready(tmp_adev, false);
5266
5267                 cancel_delayed_work_sync(&tmp_adev->delayed_init_work);
5268
5269                 if (!amdgpu_sriov_vf(tmp_adev))
5270                         amdgpu_amdkfd_pre_reset(tmp_adev);
5271
5272                 /*
5273                  * Mark these ASICs to be reset as untracked first,
5274                  * and add them back after the reset completes.
5275                  */
5276                 amdgpu_unregister_gpu_instance(tmp_adev);
5277
5278                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(tmp_adev)->fb_helper, true);
5279
5280                 /* disable ras on ALL IPs */
5281                 if (!need_emergency_restart &&
5282                       amdgpu_device_ip_need_full_reset(tmp_adev))
5283                         amdgpu_ras_suspend(tmp_adev);
5284
5285                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5286                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5287
5288                         if (!ring || !ring->sched.thread)
5289                                 continue;
5290
5291                         drm_sched_stop(&ring->sched, job ? &job->base : NULL);
5292
5293                         if (need_emergency_restart)
5294                                 amdgpu_job_stop_all_jobs_on_sched(&ring->sched);
5295                 }
5296                 atomic_inc(&tmp_adev->gpu_reset_counter);
5297         }
5298
5299         if (need_emergency_restart)
5300                 goto skip_sched_resume;
5301
5302         /*
5303          * Must check guilty signal here since after this point all old
5304          * HW fences are force signaled.
5305          *
5306          * job->base holds a reference to parent fence
5307          */
5308         if (job && dma_fence_is_signaled(&job->hw_fence)) {
5309                 job_signaled = true;
5310                 dev_info(adev->dev, "Guilty job already signaled, skipping HW reset");
5311                 goto skip_hw_reset;
5312         }
5313
5314 retry:  /* Rest of adevs pre asic reset from XGMI hive. */
5315         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5316                 if (gpu_reset_for_dev_remove) {
5317                         /* Workaround for ASICs that need to disable SMC first */
5318                         amdgpu_device_smu_fini_early(tmp_adev);
5319                 }
5320                 r = amdgpu_device_pre_asic_reset(tmp_adev, reset_context);
5321                 /* TODO: should we stop? */
5322                 if (r) {
5323                         dev_err(tmp_adev->dev, "GPU pre asic reset failed with err, %d for drm dev, %s ",
5324                                   r, adev_to_drm(tmp_adev)->unique);
5325                         tmp_adev->asic_reset_res = r;
5326                 }
5327
5328                 /*
5329                  * Drop all pending non scheduler resets. Scheduler resets
5330                  * were already dropped during drm_sched_stop
5331                  */
5332                 amdgpu_device_stop_pending_resets(tmp_adev);
5333         }
5334
5335         tmp_vram_lost_counter = atomic_read(&adev->vram_lost_counter);
5336         /* Actual ASIC resets if needed.*/
5337         /* Host driver will handle XGMI hive reset for SRIOV */
5338         if (amdgpu_sriov_vf(adev)) {
5339                 r = amdgpu_device_reset_sriov(adev, !job);
5340                 if (r)
5341                         adev->asic_reset_res = r;
5342
5343                 /* Aldebaran supports RAS in SRIOV, so RAS needs to be resumed during reset */
5344                 if (adev->ip_versions[GC_HWIP][0] == IP_VERSION(9, 4, 2))
5345                         amdgpu_ras_resume(adev);
5346         } else {
5347                 r = amdgpu_do_asic_reset(device_list_handle, reset_context);
5348                 if (r == -EAGAIN)
5349                         goto retry;
5350
5351                 if (!r && gpu_reset_for_dev_remove)
5352                         goto recover_end;
5353         }
5354
5355 skip_hw_reset:
5356
5357         /* Post ASIC reset for all devs .*/
5358         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5359
5360                 /*
5361                  * Sometimes a later bad compute job can block a good gfx job because
5362                  * the gfx and compute rings share internal GC hardware. Add an extra
5363                  * guilty-job recheck step to find the real guilty job: it synchronously
5364                  * resubmits and waits for the first job to signal. If that wait times
5365                  * out, the job is identified as the real guilty one.
5366                  */
5367                 if (amdgpu_gpu_recovery == 2 &&
5368                         !(tmp_vram_lost_counter < atomic_read(&adev->vram_lost_counter)))
5369                         amdgpu_device_recheck_guilty_jobs(
5370                                 tmp_adev, device_list_handle, reset_context);
5371
5372                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5373                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5374
5375                         if (!ring || !ring->sched.thread)
5376                                 continue;
5377
5378                         /* No point in resubmitting jobs if we didn't HW reset */
5379                         if (!tmp_adev->asic_reset_res && !job_signaled)
5380                                 drm_sched_resubmit_jobs(&ring->sched);
5381
5382                         drm_sched_start(&ring->sched, !tmp_adev->asic_reset_res);
5383                 }
5384
5385                 if (tmp_adev->enable_mes)
5386                         amdgpu_mes_self_test(tmp_adev);
5387
5388                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(tmp_adev)) && !job_signaled) {
5389                         drm_helper_resume_force_mode(adev_to_drm(tmp_adev));
5390                 }
5391
5392                 if (tmp_adev->asic_reset_res)
5393                         r = tmp_adev->asic_reset_res;
5394
5395                 tmp_adev->asic_reset_res = 0;
5396
5397                 if (r) {
5398                         /* bad news, how to tell it to userspace ? */
5399                         dev_info(tmp_adev->dev, "GPU reset(%d) failed\n", atomic_read(&tmp_adev->gpu_reset_counter));
5400                         amdgpu_vf_error_put(tmp_adev, AMDGIM_ERROR_VF_GPU_RESET_FAIL, 0, r);
5401                 } else {
5402                         dev_info(tmp_adev->dev, "GPU reset(%d) succeeded!\n", atomic_read(&tmp_adev->gpu_reset_counter));
5403                         if (amdgpu_acpi_smart_shift_update(adev_to_drm(tmp_adev), AMDGPU_SS_DEV_D0))
5404                                 DRM_WARN("smart shift update failed\n");
5405                 }
5406         }
5407
5408 skip_sched_resume:
5409         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5410                 /* unlock kfd: SRIOV would do it separately */
5411                 if (!need_emergency_restart && !amdgpu_sriov_vf(tmp_adev))
5412                         amdgpu_amdkfd_post_reset(tmp_adev);
5413
5414                 /* kfd_post_reset will do nothing if the kfd device is not initialized,
5415                  * so bring up kfd here if it was not initialized before
5416                  */
5417                 if (!tmp_adev->kfd.init_complete)
5418                         amdgpu_amdkfd_device_init(tmp_adev);
5419
5420                 if (audio_suspended)
5421                         amdgpu_device_resume_display_audio(tmp_adev);
5422
5423                 amdgpu_device_unset_mp1_state(tmp_adev);
5424         }
5425
5426 recover_end:
5427         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5428                                             reset_list);
5429         amdgpu_device_unlock_reset_domain(tmp_adev->reset_domain);
5430
5431         if (hive) {
5432                 mutex_unlock(&hive->hive_lock);
5433                 amdgpu_put_xgmi_hive(hive);
5434         }
5435
5436         if (r)
5437                 dev_info(adev->dev, "GPU reset end with ret = %d\n", r);
5438
5439         atomic_set(&adev->reset_domain->reset_res, r);
5440         return r;
5441 }
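/*
 * Caller sketch (hedged): the scheduler's job timeout path is the usual
 * entry point here; a simplified handler might prepare the context as:
 *
 *   struct amdgpu_reset_context reset_context;
 *
 *   memset(&reset_context, 0, sizeof(reset_context));
 *   reset_context.method = AMD_RESET_METHOD_NONE;  (assumed field/value)
 *   reset_context.reset_req_dev = adev;
 *   clear_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
 *   r = amdgpu_device_gpu_recover(ring->adev, job, &reset_context);
 */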
5442
5443 /**
5444  * amdgpu_device_get_pcie_info - fetch pcie info about the PCIE slot
5445  *
5446  * @adev: amdgpu_device pointer
5447  *
5448  * Fetches and stores in the driver the PCIE capabilities (gen speed
5449  * and lanes) of the slot the device is in. Handles APUs and
5450  * virtualized environments where PCIE config space may not be available.
5451  */
5452 static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev)
5453 {
5454         struct pci_dev *pdev;
5455         enum pci_bus_speed speed_cap, platform_speed_cap;
5456         enum pcie_link_width platform_link_width;
5457
5458         if (amdgpu_pcie_gen_cap)
5459                 adev->pm.pcie_gen_mask = amdgpu_pcie_gen_cap;
5460
5461         if (amdgpu_pcie_lane_cap)
5462                 adev->pm.pcie_mlw_mask = amdgpu_pcie_lane_cap;
5463
5464         /* covers APUs as well */
5465         if (pci_is_root_bus(adev->pdev->bus)) {
5466                 if (adev->pm.pcie_gen_mask == 0)
5467                         adev->pm.pcie_gen_mask = AMDGPU_DEFAULT_PCIE_GEN_MASK;
5468                 if (adev->pm.pcie_mlw_mask == 0)
5469                         adev->pm.pcie_mlw_mask = AMDGPU_DEFAULT_PCIE_MLW_MASK;
5470                 return;
5471         }
5472
5473         if (adev->pm.pcie_gen_mask && adev->pm.pcie_mlw_mask)
5474                 return;
5475
5476         pcie_bandwidth_available(adev->pdev, NULL,
5477                                  &platform_speed_cap, &platform_link_width);
5478
5479         if (adev->pm.pcie_gen_mask == 0) {
5480                 /* asic caps */
5481                 pdev = adev->pdev;
5482                 speed_cap = pcie_get_speed_cap(pdev);
5483                 if (speed_cap == PCI_SPEED_UNKNOWN) {
5484                         adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5485                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5486                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
5487                 } else {
5488                         if (speed_cap == PCIE_SPEED_32_0GT)
5489                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5490                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5491                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5492                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4 |
5493                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN5);
5494                         else if (speed_cap == PCIE_SPEED_16_0GT)
5495                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5496                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5497                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5498                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4);
5499                         else if (speed_cap == PCIE_SPEED_8_0GT)
5500                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5501                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5502                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
5503                         else if (speed_cap == PCIE_SPEED_5_0GT)
5504                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5505                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2);
5506                         else
5507                                 adev->pm.pcie_gen_mask |= CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1;
5508                 }
5509                 /* platform caps */
5510                 if (platform_speed_cap == PCI_SPEED_UNKNOWN) {
5511                         adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5512                                                    CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
5513                 } else {
5514                         if (platform_speed_cap == PCIE_SPEED_32_0GT)
5515                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5516                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5517                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5518                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4 |
5519                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN5);
5520                         else if (platform_speed_cap == PCIE_SPEED_16_0GT)
5521                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5522                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5523                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5524                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4);
5525                         else if (platform_speed_cap == PCIE_SPEED_8_0GT)
5526                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5527                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5528                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3);
5529                         else if (platform_speed_cap == PCIE_SPEED_5_0GT)
5530                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5531                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
5532                         else
5533                                 adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1;
5534
5535                 }
5536         }
5537         if (adev->pm.pcie_mlw_mask == 0) {
5538                 if (platform_link_width == PCIE_LNK_WIDTH_UNKNOWN) {
5539                         adev->pm.pcie_mlw_mask |= AMDGPU_DEFAULT_PCIE_MLW_MASK;
5540                 } else {
5541                         switch (platform_link_width) {
5542                         case PCIE_LNK_X32:
5543                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X32 |
5544                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
5545                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5546                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5547                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5548                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5549                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5550                                 break;
5551                         case PCIE_LNK_X16:
5552                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
5553                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5554                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5555                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5556                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5557                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5558                                 break;
5559                         case PCIE_LNK_X12:
5560                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5561                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5562                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5563                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5564                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5565                                 break;
5566                         case PCIE_LNK_X8:
5567                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5568                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5569                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5570                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5571                                 break;
5572                         case PCIE_LNK_X4:
5573                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5574                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5575                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5576                                 break;
5577                         case PCIE_LNK_X2:
5578                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5579                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5580                                 break;
5581                         case PCIE_LNK_X1:
5582                                 adev->pm.pcie_mlw_mask = CAIL_PCIE_LINK_WIDTH_SUPPORT_X1;
5583                                 break;
5584                         default:
5585                                 break;
5586                         }
5587                 }
5588         }
5589 }
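
/*
 * Example (illustrative sketch, not code from this file): the caps masks
 * built above are consumed elsewhere in the driver (e.g. by the
 * powerplay/SMU code) to clamp DPM link states to what both endpoints
 * support. target_gen and target_width are invented names; a consumer
 * might test the masks like this:
 *
 *	int target_gen = 1, target_width = 1;
 *
 *	if (adev->pm.pcie_gen_mask & CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3)
 *		target_gen = 3;
 *	if (adev->pm.pcie_mlw_mask & CAIL_PCIE_LINK_WIDTH_SUPPORT_X16)
 *		target_width = 16;
 */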
5590
5591 /**
5592  * amdgpu_device_is_peer_accessible - Check peer access through PCIe BAR
5593  *
5594  * @adev: amdgpu_device pointer
5595  * @peer_adev: amdgpu_device pointer for peer device trying to access @adev
5596  *
5597  * Return true if @peer_adev can access (DMA) @adev through the PCIe
5598  * BAR, i.e. @adev is "large BAR" and the BAR matches the DMA mask of
5599  * @peer_adev.
5600  */
5601 bool amdgpu_device_is_peer_accessible(struct amdgpu_device *adev,
5602                                       struct amdgpu_device *peer_adev)
5603 {
5604 #ifdef CONFIG_HSA_AMD_P2P
5605         uint64_t address_mask = peer_adev->dev->dma_mask ?
5606                 ~*peer_adev->dev->dma_mask : ~((1ULL << 32) - 1);
5607         resource_size_t aper_limit =
5608                 adev->gmc.aper_base + adev->gmc.aper_size - 1;
5609         bool p2p_access =
5610                 !adev->gmc.xgmi.connected_to_cpu &&
5611                 !(pci_p2pdma_distance(adev->pdev, peer_adev->dev, false) < 0);
5612
5613         return pcie_p2p && p2p_access && (adev->gmc.visible_vram_size &&
5614                 adev->gmc.real_vram_size == adev->gmc.visible_vram_size &&
5615                 !(adev->gmc.aper_base & address_mask ||
5616                   aper_limit & address_mask));
5617 #else
5618         return false;
5619 #endif
5620 }
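
/*
 * Example (hedged sketch): a hypothetical caller deciding whether peer
 * VRAM can be DMA-mapped directly could gate on this helper before
 * falling back to staging through system memory. Both helper names
 * below are invented for illustration:
 *
 *	if (amdgpu_device_is_peer_accessible(adev, peer_adev))
 *		map_peer_vram_directly(adev, peer_adev);
 *	else
 *		stage_through_system_memory(adev, peer_adev);
 */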
5621
5622 int amdgpu_device_baco_enter(struct drm_device *dev)
5623 {
5624         struct amdgpu_device *adev = drm_to_adev(dev);
5625         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
5626
5627         if (!amdgpu_device_supports_baco(adev_to_drm(adev)))
5628                 return -ENOTSUPP;
5629
5630         if (ras && adev->ras_enabled &&
5631             adev->nbio.funcs->enable_doorbell_interrupt)
5632                 adev->nbio.funcs->enable_doorbell_interrupt(adev, false);
5633
5634         return amdgpu_dpm_baco_enter(adev);
5635 }
5636
5637 int amdgpu_device_baco_exit(struct drm_device *dev)
5638 {
5639         struct amdgpu_device *adev = drm_to_adev(dev);
5640         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
5641         int ret = 0;
5642
5643         if (!amdgpu_device_supports_baco(adev_to_drm(adev)))
5644                 return -ENOTSUPP;
5645
5646         ret = amdgpu_dpm_baco_exit(adev);
5647         if (ret)
5648                 return ret;
5649
5650         if (ras && adev->ras_enabled &&
5651             adev->nbio.funcs->enable_doorbell_interrupt)
5652                 adev->nbio.funcs->enable_doorbell_interrupt(adev, true);
5653
5654         if (amdgpu_passthrough(adev) &&
5655             adev->nbio.funcs->clear_doorbell_interrupt)
5656                 adev->nbio.funcs->clear_doorbell_interrupt(adev);
5657
5658         return 0;
5659 }
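
/*
 * Example (hedged sketch): BACO enter/exit are intended to be used as a
 * pair, typically from the driver's runtime-PM paths. A simplified flow,
 * with most error handling elided, might look like:
 *
 *	r = amdgpu_device_baco_enter(dev);	// power down into BACO
 *	if (r)
 *		return r;	// e.g. -ENOTSUPP if BACO is unsupported
 *
 *	// ... device sits in BACO until it is needed again ...
 *
 *	r = amdgpu_device_baco_exit(dev);	// power the ASIC back up
 */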
5660
5661 /**
5662  * amdgpu_pci_error_detected - Called when a PCI error is detected.
5663  * @pdev: PCI device struct
5664  * @state: PCI channel state
5665  *
5666  * Description: Called when a PCI error is detected.
5667  *
5668  * Return: PCI_ERS_RESULT_CAN_RECOVER, PCI_ERS_RESULT_NEED_RESET or PCI_ERS_RESULT_DISCONNECT.
5669  */
5670 pci_ers_result_t amdgpu_pci_error_detected(struct pci_dev *pdev, pci_channel_state_t state)
5671 {
5672         struct drm_device *dev = pci_get_drvdata(pdev);
5673         struct amdgpu_device *adev = drm_to_adev(dev);
5674         int i;
5675
5676         DRM_INFO("PCI error: detected callback, state(%d)!!\n", state);
5677
5678         if (adev->gmc.xgmi.num_physical_nodes > 1) {
5679                 DRM_WARN("No support for XGMI hive yet...");
5680                 return PCI_ERS_RESULT_DISCONNECT;
5681         }
5682
5683         adev->pci_channel_state = state;
5684
5685         switch (state) {
5686         case pci_channel_io_normal:
5687                 return PCI_ERS_RESULT_CAN_RECOVER;
5688         /* Fatal error, prepare for slot reset */
5689         case pci_channel_io_frozen:
5690                 /*
5691                  * Locking adev->reset_domain->sem will prevent any external access
5692                  * to GPU during PCI error recovery
5693                  */
5694                 amdgpu_device_lock_reset_domain(adev->reset_domain);
5695                 amdgpu_device_set_mp1_state(adev);
5696
5697                 /*
5698                  * Block any work scheduling as we do for regular GPU reset
5699                  * for the duration of the recovery
5700                  */
5701                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5702                         struct amdgpu_ring *ring = adev->rings[i];
5703
5704                         if (!ring || !ring->sched.thread)
5705                                 continue;
5706
5707                         drm_sched_stop(&ring->sched, NULL);
5708                 }
5709                 atomic_inc(&adev->gpu_reset_counter);
5710                 return PCI_ERS_RESULT_NEED_RESET;
5711         case pci_channel_io_perm_failure:
5712                 /* Permanent error, prepare for device removal */
5713                 return PCI_ERS_RESULT_DISCONNECT;
5714         }
5715
5716         return PCI_ERS_RESULT_NEED_RESET;
5717 }
5718
5719 /**
5720  * amdgpu_pci_mmio_enabled - Enable MMIO and dump debug registers
5721  * @pdev: pointer to PCI device
5722  */
5723 pci_ers_result_t amdgpu_pci_mmio_enabled(struct pci_dev *pdev)
5724 {
5725
5726         DRM_INFO("PCI error: mmio enabled callback!!\n");
5727
5728         /* TODO - dump whatever for debugging purposes */
5729
5730                 /* This is called only if amdgpu_pci_error_detected returns
5731                  * PCI_ERS_RESULT_CAN_RECOVER. Read/write to the device still
5732                  * works, so there is no need to reset the slot.
5733          */
5734
5735         return PCI_ERS_RESULT_RECOVERED;
5736 }
5737
5738 /**
5739  * amdgpu_pci_slot_reset - Called when PCI slot has been reset.
5740  * @pdev: PCI device struct
5741  *
5742  * Description: This routine is called by the PCI error recovery
5743  * code after the PCI slot has been reset, just before we
5744  * should resume normal operations.
5745  */
5746 pci_ers_result_t amdgpu_pci_slot_reset(struct pci_dev *pdev)
5747 {
5748         struct drm_device *dev = pci_get_drvdata(pdev);
5749         struct amdgpu_device *adev = drm_to_adev(dev);
5750         int r, i;
5751         struct amdgpu_reset_context reset_context;
5752         u32 memsize;
5753         struct list_head device_list;
5754
5755         DRM_INFO("PCI error: slot reset callback!!\n");
5756
5757         memset(&reset_context, 0, sizeof(reset_context));
5758
5759         INIT_LIST_HEAD(&device_list);
5760         list_add_tail(&adev->reset_list, &device_list);
5761
5762         /* wait for asic to come out of reset */
5763         msleep(500);
5764
5765         /* Restore PCI config space */
5766         amdgpu_device_load_pci_state(pdev);
5767
5768         /* confirm ASIC came out of reset */
5769         for (i = 0; i < adev->usec_timeout; i++) {
5770                 memsize = amdgpu_asic_get_config_memsize(adev);
5771
5772                 if (memsize != 0xffffffff)
5773                         break;
5774                 udelay(1);
5775         }
5776         if (memsize == 0xffffffff) {
5777                 r = -ETIME;
5778                 goto out;
5779         }
5780
5781         reset_context.method = AMD_RESET_METHOD_NONE;
5782         reset_context.reset_req_dev = adev;
5783         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
5784         set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
5785
5786         adev->no_hw_access = true;
5787         r = amdgpu_device_pre_asic_reset(adev, &reset_context);
5788         adev->no_hw_access = false;
5789         if (r)
5790                 goto out;
5791
5792         r = amdgpu_do_asic_reset(&device_list, &reset_context);
5793
5794 out:
5795         if (!r) {
5796                 if (amdgpu_device_cache_pci_state(adev->pdev))
5797                         pci_restore_state(adev->pdev);
5798
5799                 DRM_INFO("PCIe error recovery succeeded\n");
5800         } else {
5801                 DRM_ERROR("PCIe error recovery failed, err:%d", r);
5802                 amdgpu_device_unset_mp1_state(adev);
5803                 amdgpu_device_unlock_reset_domain(adev->reset_domain);
5804         }
5805
5806         return r ? PCI_ERS_RESULT_DISCONNECT : PCI_ERS_RESULT_RECOVERED;
5807 }
5808
5809 /**
5810  * amdgpu_pci_resume() - resume normal ops after PCI reset
5811  * @pdev: pointer to PCI device
5812  *
5813  * Called when the error recovery driver tells us that it's
5814  * OK to resume normal operation.
5815  */
5816 void amdgpu_pci_resume(struct pci_dev *pdev)
5817 {
5818         struct drm_device *dev = pci_get_drvdata(pdev);
5819         struct amdgpu_device *adev = drm_to_adev(dev);
5820         int i;
5821
5822
5823         DRM_INFO("PCI error: resume callback!!\n");
5824
5825         /* Only continue execution for the case of pci_channel_io_frozen */
5826         if (adev->pci_channel_state != pci_channel_io_frozen)
5827                 return;
5828
5829         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5830                 struct amdgpu_ring *ring = adev->rings[i];
5831
5832                 if (!ring || !ring->sched.thread)
5833                         continue;
5834
5835
5836                 drm_sched_resubmit_jobs(&ring->sched);
5837                 drm_sched_start(&ring->sched, true);
5838         }
5839
5840         amdgpu_device_unset_mp1_state(adev);
5841         amdgpu_device_unlock_reset_domain(adev->reset_domain);
5842 }
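
/*
 * The four callbacks above implement the kernel's PCI error recovery
 * protocol (Documentation/PCI/pci-error-recovery.rst): error_detected ->
 * (mmio_enabled | slot_reset) -> resume. They get wired into a
 * struct pci_error_handlers hung off struct pci_driver.err_handler;
 * roughly (the actual hookup lives in amdgpu_drv.c):
 *
 *	static struct pci_error_handlers amdgpu_pci_err_handler = {
 *		.error_detected = amdgpu_pci_error_detected,
 *		.mmio_enabled   = amdgpu_pci_mmio_enabled,
 *		.slot_reset     = amdgpu_pci_slot_reset,
 *		.resume         = amdgpu_pci_resume,
 *	};
 */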
5843
5844 bool amdgpu_device_cache_pci_state(struct pci_dev *pdev)
5845 {
5846         struct drm_device *dev = pci_get_drvdata(pdev);
5847         struct amdgpu_device *adev = drm_to_adev(dev);
5848         int r;
5849
5850         r = pci_save_state(pdev);
5851         if (!r) {
5852                 kfree(adev->pci_state);
5853
5854                 adev->pci_state = pci_store_saved_state(pdev);
5855
5856                 if (!adev->pci_state) {
5857                         DRM_ERROR("Failed to store PCI saved state");
5858                         return false;
5859                 }
5860         } else {
5861                 DRM_WARN("Failed to save PCI state, err:%d\n", r);
5862                 return false;
5863         }
5864
5865         return true;
5866 }
5867
5868 bool amdgpu_device_load_pci_state(struct pci_dev *pdev)
5869 {
5870         struct drm_device *dev = pci_get_drvdata(pdev);
5871         struct amdgpu_device *adev = drm_to_adev(dev);
5872         int r;
5873
5874         if (!adev->pci_state)
5875                 return false;
5876
5877         r = pci_load_saved_state(pdev, adev->pci_state);
5878
5879         if (!r) {
5880                 pci_restore_state(pdev);
5881         } else {
5882                 DRM_WARN("Failed to load PCI state, err:%d\n", r);
5883                 return false;
5884         }
5885
5886         return true;
5887 }
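
/*
 * Usage note: these two helpers pair up. Config space is cached once the
 * device is fully programmed, and restored after events that clobber it;
 * amdgpu_pci_slot_reset() above does exactly that:
 *
 *	amdgpu_device_cache_pci_state(adev->pdev);	// at init time
 *	// ... an ASIC/slot reset wipes config space ...
 *	amdgpu_device_load_pci_state(adev->pdev);	// restore afterwards
 */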
5888
5889 void amdgpu_device_flush_hdp(struct amdgpu_device *adev,
5890                 struct amdgpu_ring *ring)
5891 {
5892 #ifdef CONFIG_X86_64
5893         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
5894                 return;
5895 #endif
5896         if (adev->gmc.xgmi.connected_to_cpu)
5897                 return;
5898
5899         if (ring && ring->funcs->emit_hdp_flush)
5900                 amdgpu_ring_emit_hdp_flush(ring);
5901         else
5902                 amdgpu_asic_flush_hdp(adev, ring);
5903 }
5904
5905 void amdgpu_device_invalidate_hdp(struct amdgpu_device *adev,
5906                 struct amdgpu_ring *ring)
5907 {
5908 #ifdef CONFIG_X86_64
5909         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
5910                 return;
5911 #endif
5912         if (adev->gmc.xgmi.connected_to_cpu)
5913                 return;
5914
5915         amdgpu_asic_invalidate_hdp(adev, ring);
5916 }
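
/*
 * Example (hedged sketch): HDP maintenance brackets CPU access to VRAM
 * through the host data path; vram_ptr, data and size are hypothetical:
 *
 *	// CPU wrote VRAM: flush HDP so the GPU observes the writes
 *	memcpy_toio(vram_ptr, data, size);
 *	amdgpu_device_flush_hdp(adev, NULL);
 *
 *	// GPU wrote VRAM: invalidate HDP before the CPU reads it back
 *	amdgpu_device_invalidate_hdp(adev, NULL);
 *	memcpy_fromio(data, vram_ptr, size);
 */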
5917
5918 int amdgpu_in_reset(struct amdgpu_device *adev)
5919 {
5920         return atomic_read(&adev->reset_domain->in_gpu_reset);
5921 }
5922
5923 /**
5924  * amdgpu_device_halt() - bring hardware to some kind of halt state
5925  *
5926  * @adev: amdgpu_device pointer
5927  *
5928  * Bring hardware to some kind of halt state so that no one can touch it
5929  * any more. This helps preserve the error context when an error occurs.
5930  * Compared to a simple hang, the system will stay stable at least for SSH
5931  * access. It should then be trivial to inspect the hardware state and
5932  * see what's going on. Implemented as follows:
5933  *
5934  * 1. drm_dev_unplug() makes the device inaccessible to user space (IOCTLs, etc),
5935  *    clears all CPU mappings to the device, disallows remappings through page faults
5936  * 2. amdgpu_irq_disable_all() disables all interrupts
5937  * 3. amdgpu_fence_driver_hw_fini() signals all HW fences
5938  * 4. set adev->no_hw_access to avoid potential crashes after step 5
5939  * 5. amdgpu_device_unmap_mmio() clears all MMIO mappings
5940  * 6. pci_disable_device() and pci_wait_for_pending_transaction()
5941  *    flush any in-flight DMA operations
5942  */
5943 void amdgpu_device_halt(struct amdgpu_device *adev)
5944 {
5945         struct pci_dev *pdev = adev->pdev;
5946         struct drm_device *ddev = adev_to_drm(adev);
5947
5948         drm_dev_unplug(ddev);
5949
5950         amdgpu_irq_disable_all(adev);
5951
5952         amdgpu_fence_driver_hw_fini(adev);
5953
5954         adev->no_hw_access = true;
5955
5956         amdgpu_device_unmap_mmio(adev);
5957
5958         pci_disable_device(pdev);
5959         pci_wait_for_pending_transaction(pdev);
5960 }
5961
5962 u32 amdgpu_device_pcie_port_rreg(struct amdgpu_device *adev,
5963                                 u32 reg)
5964 {
5965         unsigned long flags, address, data;
5966         u32 r;
5967
5968         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
5969         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
5970
5971         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
5972         WREG32(address, reg * 4);
5973         (void)RREG32(address);
5974         r = RREG32(data);
5975         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
5976         return r;
5977 }
5978
5979 void amdgpu_device_pcie_port_wreg(struct amdgpu_device *adev,
5980                                 u32 reg, u32 v)
5981 {
5982         unsigned long flags, address, data;
5983
5984         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
5985         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
5986
5987         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
5988         WREG32(address, reg * 4);
5989         (void)RREG32(address);
5990         WREG32(data, v);
5991         (void)RREG32(data);
5992         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
5993 }
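
/*
 * Example (hedged sketch): the pair above implements the classic
 * index/data register window, serialized by pcie_idx_lock. Each call
 * takes the lock independently, so a read-modify-write such as the
 * hypothetical one below is not atomic against other window users:
 *
 *	u32 v = amdgpu_device_pcie_port_rreg(adev, reg);
 *
 *	v &= ~SOME_FIELD_MASK;		// SOME_FIELD_* are invented names
 *	v |= SOME_FIELD_VALUE;
 *	amdgpu_device_pcie_port_wreg(adev, reg, v);
 */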
5994
5995 /**
5996  * amdgpu_device_switch_gang - switch to a new gang
5997  * @adev: amdgpu_device pointer
5998  * @gang: the gang to switch to
5999  *
6000  * Try to switch to a new gang.
6001  * Returns: NULL if we switched to the new gang or a reference to the current
6002  * gang leader.
6003  */
6004 struct dma_fence *amdgpu_device_switch_gang(struct amdgpu_device *adev,
6005                                             struct dma_fence *gang)
6006 {
6007         struct dma_fence *old = NULL;
6008
6009         do {
6010                 dma_fence_put(old);
6011                 rcu_read_lock();
6012                 old = dma_fence_get_rcu_safe(&adev->gang_submit);
6013                 rcu_read_unlock();
6014
6015                 if (old == gang)
6016                         break;
6017
6018                 if (!dma_fence_is_signaled(old))
6019                         return old;
6020
6021         } while (cmpxchg((struct dma_fence __force **)&adev->gang_submit,
6022                          old, gang) != old);
6023
6024         dma_fence_put(old);
6025         return NULL;
6026 }
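
/*
 * Example (hedged sketch): a caller that must become the gang leader can
 * loop, waiting out the previous gang whenever a fence is handed back:
 *
 *	struct dma_fence *old;
 *
 *	while ((old = amdgpu_device_switch_gang(adev, gang))) {
 *		dma_fence_wait(old, false);	// wait for the old gang
 *		dma_fence_put(old);		// drop the returned reference
 *	}
 */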