drivers/gpu/drm/amd/amdgpu/amdgpu_device.c

   1 /*
   2  * Copyright 2008 Advanced Micro Devices, Inc.
   3  * Copyright 2008 Red Hat Inc.
   4  * Copyright 2009 Jerome Glisse.
   5  *
   6  * Permission is hereby granted, free of charge, to any person obtaining a
   7  * copy of this software and associated documentation files (the "Software"),
   8  * to deal in the Software without restriction, including without limitation
   9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  10  * and/or sell copies of the Software, and to permit persons to whom the
  11  * Software is furnished to do so, subject to the following conditions:
  12  *
  13  * The above copyright notice and this permission notice shall be included in
  14  * all copies or substantial portions of the Software.
  15  *
  16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  19  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  20  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  21  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  22  * OTHER DEALINGS IN THE SOFTWARE.
  23  *
  24  * Authors: Dave Airlie
  25  *          Alex Deucher
  26  *          Jerome Glisse
  27  */
  28 #include <linux/power_supply.h>
  29 #include <linux/kthread.h>
  30 #include <linux/module.h>
  31 #include <linux/console.h>
  32 #include <linux/slab.h>
  33 #include <linux/iommu.h>
  34 #include <linux/pci.h>
  35 #include <linux/devcoredump.h>
  36 #include <generated/utsrelease.h>
  37 #include <linux/pci-p2pdma.h>
  38
  39 #include <drm/drm_atomic_helper.h>
  40 #include <drm/drm_fb_helper.h>
  41 #include <drm/drm_probe_helper.h>
  42 #include <drm/amdgpu_drm.h>
  43 #include <linux/vgaarb.h>
  44 #include <linux/vga_switcheroo.h>
  45 #include <linux/efi.h>
  46 #include "amdgpu.h"
  47 #include "amdgpu_trace.h"
  48 #include "amdgpu_i2c.h"
  49 #include "atom.h"
  50 #include "amdgpu_atombios.h"
  51 #include "amdgpu_atomfirmware.h"
  52 #include "amd_pcie.h"
  53 #ifdef CONFIG_DRM_AMDGPU_SI
  54 #include "si.h"
  55 #endif
  56 #ifdef CONFIG_DRM_AMDGPU_CIK
  57 #include "cik.h"
  58 #endif
  59 #include "vi.h"
  60 #include "soc15.h"
  61 #include "nv.h"
  62 #include "bif/bif_4_1_d.h"
  63 #include <linux/firmware.h>
  64 #include "amdgpu_vf_error.h"
  65
  66 #include "amdgpu_amdkfd.h"
  67 #include "amdgpu_pm.h"
  68
  69 #include "amdgpu_xgmi.h"
  70 #include "amdgpu_ras.h"
  71 #include "amdgpu_pmu.h"
  72 #include "amdgpu_fru_eeprom.h"
  73 #include "amdgpu_reset.h"
  74
  75 #include <linux/suspend.h>
  76 #include <drm/task_barrier.h>
  77 #include <linux/pm_runtime.h>
  78
  79 #include <drm/drm_drv.h>
  80
  81 MODULE_FIRMWARE("amdgpu/vega10_gpu_info.bin");
  82 MODULE_FIRMWARE("amdgpu/vega12_gpu_info.bin");
  83 MODULE_FIRMWARE("amdgpu/raven_gpu_info.bin");
  84 MODULE_FIRMWARE("amdgpu/picasso_gpu_info.bin");
  85 MODULE_FIRMWARE("amdgpu/raven2_gpu_info.bin");
  86 MODULE_FIRMWARE("amdgpu/arcturus_gpu_info.bin");
  87 MODULE_FIRMWARE("amdgpu/navi12_gpu_info.bin");
  88
  89 #define AMDGPU_RESUME_MS                2000
  90 #define AMDGPU_MAX_RETRY_LIMIT          2
  91 #define AMDGPU_RETRY_SRIOV_RESET(r) ((r) == -EBUSY || (r) == -ETIMEDOUT || (r) == -EINVAL)
  92
  93 const char *amdgpu_asic_name[] = {
  94         "TAHITI",
  95         "PITCAIRN",
  96         "VERDE",
  97         "OLAND",
  98         "HAINAN",
  99         "BONAIRE",
 100         "KAVERI",
 101         "KABINI",
 102         "HAWAII",
 103         "MULLINS",
 104         "TOPAZ",
 105         "TONGA",
 106         "FIJI",
 107         "CARRIZO",
 108         "STONEY",
 109         "POLARIS10",
 110         "POLARIS11",
 111         "POLARIS12",
 112         "VEGAM",
 113         "VEGA10",
 114         "VEGA12",
 115         "VEGA20",
 116         "RAVEN",
 117         "ARCTURUS",
 118         "RENOIR",
 119         "ALDEBARAN",
 120         "NAVI10",
 121         "CYAN_SKILLFISH",
 122         "NAVI14",
 123         "NAVI12",
 124         "SIENNA_CICHLID",
 125         "NAVY_FLOUNDER",
 126         "VANGOGH",
 127         "DIMGREY_CAVEFISH",
 128         "BEIGE_GOBY",
 129         "YELLOW_CARP",
 130         "IP DISCOVERY",
 131         "LAST",
 132 };
 133
 134 /**
 135  * DOC: pcie_replay_count
 136  *
 137  * The amdgpu driver provides a sysfs API for reporting the total number
 138  * of PCIe replays (NAKs)
 139  * The file pcie_replay_count is used for this and returns the total
 140  * number of replays as a sum of the NAKs generated and NAKs received
 141  */
 142
 143 static ssize_t amdgpu_device_get_pcie_replay_count(struct device *dev,
 144                 struct device_attribute *attr, char *buf)
 145 {
 146         struct drm_device *ddev = dev_get_drvdata(dev);
 147         struct amdgpu_device *adev = drm_to_adev(ddev);
 148         uint64_t cnt = amdgpu_asic_get_pcie_replay_count(adev);
 149
 150         return sysfs_emit(buf, "%llu\n", cnt);
 151 }
 152
 153 static DEVICE_ATTR(pcie_replay_count, S_IRUGO,
 154                 amdgpu_device_get_pcie_replay_count, NULL);
 155
 156 static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev);
 157
 158 /**
 159  * DOC: product_name
 160  *
 161  * The amdgpu driver provides a sysfs API for reporting the product name
 162  * for the device
 163  * The file serial_number is used for this and returns the product name
 164  * as returned from the FRU.
 165  * NOTE: This is only available for certain server cards
 166  */
 167
 168 static ssize_t amdgpu_device_get_product_name(struct device *dev,
 169                 struct device_attribute *attr, char *buf)
 170 {
 171         struct drm_device *ddev = dev_get_drvdata(dev);
 172         struct amdgpu_device *adev = drm_to_adev(ddev);
 173
 174         return sysfs_emit(buf, "%s\n", adev->product_name);
 175 }
 176
 177 static DEVICE_ATTR(product_name, S_IRUGO,
 178                 amdgpu_device_get_product_name, NULL);
 179
 180 /**
 181  * DOC: product_number
 182  *
 183  * The amdgpu driver provides a sysfs API for reporting the part number
 184  * for the device
 185  * The file serial_number is used for this and returns the part number
 186  * as returned from the FRU.
 187  * NOTE: This is only available for certain server cards
 188  */
 189
 190 static ssize_t amdgpu_device_get_product_number(struct device *dev,
 191                 struct device_attribute *attr, char *buf)
 192 {
 193         struct drm_device *ddev = dev_get_drvdata(dev);
 194         struct amdgpu_device *adev = drm_to_adev(ddev);
 195
 196         return sysfs_emit(buf, "%s\n", adev->product_number);
 197 }
 198
 199 static DEVICE_ATTR(product_number, S_IRUGO,
 200                 amdgpu_device_get_product_number, NULL);
 201
 202 /**
 203  * DOC: serial_number
 204  *
 205  * The amdgpu driver provides a sysfs API for reporting the serial number
 206  * for the device
 207  * The file serial_number is used for this and returns the serial number
 208  * as returned from the FRU.
 209  * NOTE: This is only available for certain server cards
 210  */
 211
 212 static ssize_t amdgpu_device_get_serial_number(struct device *dev,
 213                 struct device_attribute *attr, char *buf)
 214 {
 215         struct drm_device *ddev = dev_get_drvdata(dev);
 216         struct amdgpu_device *adev = drm_to_adev(ddev);
 217
 218         return sysfs_emit(buf, "%s\n", adev->serial);
 219 }
 220
 221 static DEVICE_ATTR(serial_number, S_IRUGO,
 222                 amdgpu_device_get_serial_number, NULL);
 223
 224 /**
 225  * amdgpu_device_supports_px - Is the device a dGPU with ATPX power control
 226  *
 227  * @dev: drm_device pointer
 228  *
 229  * Returns true if the device is a dGPU with ATPX power control,
 230  * otherwise return false.
 231  */
 232 bool amdgpu_device_supports_px(struct drm_device *dev)
 233 {
 234         struct amdgpu_device *adev = drm_to_adev(dev);
 235
 236         if ((adev->flags & AMD_IS_PX) && !amdgpu_is_atpx_hybrid())
 237                 return true;
 238         return false;
 239 }
 240
 241 /**
 242  * amdgpu_device_supports_boco - Is the device a dGPU with ACPI power resources
 243  *
 244  * @dev: drm_device pointer
 245  *
 246  * Returns true if the device is a dGPU with ACPI power control,
 247  * otherwise return false.
 248  */
 249 bool amdgpu_device_supports_boco(struct drm_device *dev)
 250 {
 251         struct amdgpu_device *adev = drm_to_adev(dev);
 252
 253         if (adev->has_pr3 ||
 254             ((adev->flags & AMD_IS_PX) && amdgpu_is_atpx_hybrid()))
 255                 return true;
 256         return false;
 257 }
 258
 259 /**
 260  * amdgpu_device_supports_baco - Does the device support BACO
 261  *
 262  * @dev: drm_device pointer
 263  *
 264  * Returns true if the device supporte BACO,
 265  * otherwise return false.
 266  */
 267 bool amdgpu_device_supports_baco(struct drm_device *dev)
 268 {
 269         struct amdgpu_device *adev = drm_to_adev(dev);
 270
 271         return amdgpu_asic_supports_baco(adev);
 272 }
 273
 274 /**
 275  * amdgpu_device_supports_smart_shift - Is the device dGPU with
 276  * smart shift support
 277  *
 278  * @dev: drm_device pointer
 279  *
 280  * Returns true if the device is a dGPU with Smart Shift support,
 281  * otherwise returns false.
 282  */
 283 bool amdgpu_device_supports_smart_shift(struct drm_device *dev)
 284 {
 285         return (amdgpu_device_supports_boco(dev) &&
 286                 amdgpu_acpi_is_power_shift_control_supported());
 287 }
 288
 289 /*
 290  * VRAM access helper functions
 291  */
 292
 293 /**
 294  * amdgpu_device_mm_access - access vram by MM_INDEX/MM_DATA
 295  *
 296  * @adev: amdgpu_device pointer
 297  * @pos: offset of the buffer in vram
 298  * @buf: virtual address of the buffer in system memory
 299  * @size: read/write size, sizeof(@buf) must > @size
 300  * @write: true - write to vram, otherwise - read from vram
 301  */
 302 void amdgpu_device_mm_access(struct amdgpu_device *adev, loff_t pos,
 303                              void *buf, size_t size, bool write)
 304 {
 305         unsigned long flags;
 306         uint32_t hi = ~0, tmp = 0;
 307         uint32_t *data = buf;
 308         uint64_t last;
 309         int idx;
 310
 311         if (!drm_dev_enter(adev_to_drm(adev), &idx))
 312                 return;
 313
 314         BUG_ON(!IS_ALIGNED(pos, 4) || !IS_ALIGNED(size, 4));
 315
 316         spin_lock_irqsave(&adev->mmio_idx_lock, flags);
 317         for (last = pos + size; pos < last; pos += 4) {
 318                 tmp = pos >> 31;
 319
 320                 WREG32_NO_KIQ(mmMM_INDEX, ((uint32_t)pos) | 0x80000000);
 321                 if (tmp != hi) {
 322                         WREG32_NO_KIQ(mmMM_INDEX_HI, tmp);
 323                         hi = tmp;
 324                 }
 325                 if (write)
 326                         WREG32_NO_KIQ(mmMM_DATA, *data++);
 327                 else
 328                         *data++ = RREG32_NO_KIQ(mmMM_DATA);
 329         }
 330
 331         spin_unlock_irqrestore(&adev->mmio_idx_lock, flags);
 332         drm_dev_exit(idx);
 333 }
 334
 335 /**
 336  * amdgpu_device_aper_access - access vram by vram aperature
 337  *
 338  * @adev: amdgpu_device pointer
 339  * @pos: offset of the buffer in vram
 340  * @buf: virtual address of the buffer in system memory
 341  * @size: read/write size, sizeof(@buf) must > @size
 342  * @write: true - write to vram, otherwise - read from vram
 343  *
 344  * The return value means how many bytes have been transferred.
 345  */
 346 size_t amdgpu_device_aper_access(struct amdgpu_device *adev, loff_t pos,
 347                                  void *buf, size_t size, bool write)
 348 {
 349 #ifdef CONFIG_64BIT
 350         void __iomem *addr;
 351         size_t count = 0;
 352         uint64_t last;
 353
 354         if (!adev->mman.aper_base_kaddr)
 355                 return 0;
 356
 357         last = min(pos + size, adev->gmc.visible_vram_size);
 358         if (last > pos) {
 359                 addr = adev->mman.aper_base_kaddr + pos;
 360                 count = last - pos;
 361
 362                 if (write) {
 363                         memcpy_toio(addr, buf, count);
 364                         mb();
 365                         amdgpu_device_flush_hdp(adev, NULL);
 366                 } else {
 367                         amdgpu_device_invalidate_hdp(adev, NULL);
 368                         mb();
 369                         memcpy_fromio(buf, addr, count);
 370                 }
 371
 372         }
 373
 374         return count;
 375 #else
 376         return 0;
 377 #endif
 378 }
 379
 380 /**
 381  * amdgpu_device_vram_access - read/write a buffer in vram
 382  *
 383  * @adev: amdgpu_device pointer
 384  * @pos: offset of the buffer in vram
 385  * @buf: virtual address of the buffer in system memory
 386  * @size: read/write size, sizeof(@buf) must > @size
 387  * @write: true - write to vram, otherwise - read from vram
 388  */
 389 void amdgpu_device_vram_access(struct amdgpu_device *adev, loff_t pos,
 390                                void *buf, size_t size, bool write)
 391 {
 392         size_t count;
 393
 394         /* try to using vram apreature to access vram first */
 395         count = amdgpu_device_aper_access(adev, pos, buf, size, write);
 396         size -= count;
 397         if (size) {
 398                 /* using MM to access rest vram */
 399                 pos += count;
 400                 buf += count;
 401                 amdgpu_device_mm_access(adev, pos, buf, size, write);
 402         }
 403 }
 404
 405 /*
 406  * register access helper functions.
 407  */
 408
 409 /* Check if hw access should be skipped because of hotplug or device error */
 410 bool amdgpu_device_skip_hw_access(struct amdgpu_device *adev)
 411 {
 412         if (adev->no_hw_access)
 413                 return true;
 414
 415 #ifdef CONFIG_LOCKDEP
 416         /*
 417          * This is a bit complicated to understand, so worth a comment. What we assert
 418          * here is that the GPU reset is not running on another thread in parallel.
 419          *
 420          * For this we trylock the read side of the reset semaphore, if that succeeds
 421          * we know that the reset is not running in paralell.
 422          *
 423          * If the trylock fails we assert that we are either already holding the read
 424          * side of the lock or are the reset thread itself and hold the write side of
 425          * the lock.
 426          */
 427         if (in_task()) {
 428                 if (down_read_trylock(&adev->reset_domain->sem))
 429                         up_read(&adev->reset_domain->sem);
 430                 else
 431                         lockdep_assert_held(&adev->reset_domain->sem);
 432         }
 433 #endif
 434         return false;
 435 }
 436
 437 /**
 438  * amdgpu_device_rreg - read a memory mapped IO or indirect register
 439  *
 440  * @adev: amdgpu_device pointer
 441  * @reg: dword aligned register offset
 442  * @acc_flags: access flags which require special behavior
 443  *
 444  * Returns the 32 bit value from the offset specified.
 445  */
 446 uint32_t amdgpu_device_rreg(struct amdgpu_device *adev,
 447                             uint32_t reg, uint32_t acc_flags)
 448 {
 449         uint32_t ret;
 450
 451         if (amdgpu_device_skip_hw_access(adev))
 452                 return 0;
 453
 454         if ((reg * 4) < adev->rmmio_size) {
 455                 if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
 456                     amdgpu_sriov_runtime(adev) &&
 457                     down_read_trylock(&adev->reset_domain->sem)) {
 458                         ret = amdgpu_kiq_rreg(adev, reg);
 459                         up_read(&adev->reset_domain->sem);
 460                 } else {
 461                         ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
 462                 }
 463         } else {
 464                 ret = adev->pcie_rreg(adev, reg * 4);
 465         }
 466
 467         trace_amdgpu_device_rreg(adev->pdev->device, reg, ret);
 468
 469         return ret;
 470 }
 471
 472 /*
 473  * MMIO register read with bytes helper functions
 474  * @offset:bytes offset from MMIO start
 475  *
 476 */
 477
 478 /**
 479  * amdgpu_mm_rreg8 - read a memory mapped IO register
 480  *
 481  * @adev: amdgpu_device pointer
 482  * @offset: byte aligned register offset
 483  *
 484  * Returns the 8 bit value from the offset specified.
 485  */
 486 uint8_t amdgpu_mm_rreg8(struct amdgpu_device *adev, uint32_t offset)
 487 {
 488         if (amdgpu_device_skip_hw_access(adev))
 489                 return 0;
 490
 491         if (offset < adev->rmmio_size)
 492                 return (readb(adev->rmmio + offset));
 493         BUG();
 494 }
 495
 496 /*
 497  * MMIO register write with bytes helper functions
 498  * @offset:bytes offset from MMIO start
 499  * @value: the value want to be written to the register
 500  *
 501 */
 502 /**
 503  * amdgpu_mm_wreg8 - read a memory mapped IO register
 504  *
 505  * @adev: amdgpu_device pointer
 506  * @offset: byte aligned register offset
 507  * @value: 8 bit value to write
 508  *
 509  * Writes the value specified to the offset specified.
 510  */
 511 void amdgpu_mm_wreg8(struct amdgpu_device *adev, uint32_t offset, uint8_t value)
 512 {
 513         if (amdgpu_device_skip_hw_access(adev))
 514                 return;
 515
 516         if (offset < adev->rmmio_size)
 517                 writeb(value, adev->rmmio + offset);
 518         else
 519                 BUG();
 520 }
 521
 522 /**
 523  * amdgpu_device_wreg - write to a memory mapped IO or indirect register
 524  *
 525  * @adev: amdgpu_device pointer
 526  * @reg: dword aligned register offset
 527  * @v: 32 bit value to write to the register
 528  * @acc_flags: access flags which require special behavior
 529  *
 530  * Writes the value specified to the offset specified.
 531  */
 532 void amdgpu_device_wreg(struct amdgpu_device *adev,
 533                         uint32_t reg, uint32_t v,
 534                         uint32_t acc_flags)
 535 {
 536         if (amdgpu_device_skip_hw_access(adev))
 537                 return;
 538
 539         if ((reg * 4) < adev->rmmio_size) {
 540                 if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
 541                     amdgpu_sriov_runtime(adev) &&
 542                     down_read_trylock(&adev->reset_domain->sem)) {
 543                         amdgpu_kiq_wreg(adev, reg, v);
 544                         up_read(&adev->reset_domain->sem);
 545                 } else {
 546                         writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
 547                 }
 548         } else {
 549                 adev->pcie_wreg(adev, reg * 4, v);
 550         }
 551
 552         trace_amdgpu_device_wreg(adev->pdev->device, reg, v);
 553 }
 554
 555 /**
 556  * amdgpu_mm_wreg_mmio_rlc -  write register either with direct/indirect mmio or with RLC path if in range
 557  *
 558  * @adev: amdgpu_device pointer
 559  * @reg: mmio/rlc register
 560  * @v: value to write
 561  *
 562  * this function is invoked only for the debugfs register access
 563  */
 564 void amdgpu_mm_wreg_mmio_rlc(struct amdgpu_device *adev,
 565                              uint32_t reg, uint32_t v)
 566 {
 567         if (amdgpu_device_skip_hw_access(adev))
 568                 return;
 569
 570         if (amdgpu_sriov_fullaccess(adev) &&
 571             adev->gfx.rlc.funcs &&
 572             adev->gfx.rlc.funcs->is_rlcg_access_range) {
 573                 if (adev->gfx.rlc.funcs->is_rlcg_access_range(adev, reg))
 574                         return amdgpu_sriov_wreg(adev, reg, v, 0, 0);
 575         } else if ((reg * 4) >= adev->rmmio_size) {
 576                 adev->pcie_wreg(adev, reg * 4, v);
 577         } else {
 578                 writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
 579         }
 580 }
 581
 582 /**
 583  * amdgpu_mm_rdoorbell - read a doorbell dword
 584  *
 585  * @adev: amdgpu_device pointer
 586  * @index: doorbell index
 587  *
 588  * Returns the value in the doorbell aperture at the
 589  * requested doorbell index (CIK).
 590  */
 591 u32 amdgpu_mm_rdoorbell(struct amdgpu_device *adev, u32 index)
 592 {
 593         if (amdgpu_device_skip_hw_access(adev))
 594                 return 0;
 595
 596         if (index < adev->doorbell.num_doorbells) {
 597                 return readl(adev->doorbell.ptr + index);
 598         } else {
 599                 DRM_ERROR("reading beyond doorbell aperture: 0x%08x!\n", index);
 600                 return 0;
 601         }
 602 }
 603
 604 /**
 605  * amdgpu_mm_wdoorbell - write a doorbell dword
 606  *
 607  * @adev: amdgpu_device pointer
 608  * @index: doorbell index
 609  * @v: value to write
 610  *
 611  * Writes @v to the doorbell aperture at the
 612  * requested doorbell index (CIK).
 613  */
 614 void amdgpu_mm_wdoorbell(struct amdgpu_device *adev, u32 index, u32 v)
 615 {
 616         if (amdgpu_device_skip_hw_access(adev))
 617                 return;
 618
 619         if (index < adev->doorbell.num_doorbells) {
 620                 writel(v, adev->doorbell.ptr + index);
 621         } else {
 622                 DRM_ERROR("writing beyond doorbell aperture: 0x%08x!\n", index);
 623         }
 624 }
 625
 626 /**
 627  * amdgpu_mm_rdoorbell64 - read a doorbell Qword
 628  *
 629  * @adev: amdgpu_device pointer
 630  * @index: doorbell index
 631  *
 632  * Returns the value in the doorbell aperture at the
 633  * requested doorbell index (VEGA10+).
 634  */
 635 u64 amdgpu_mm_rdoorbell64(struct amdgpu_device *adev, u32 index)
 636 {
 637         if (amdgpu_device_skip_hw_access(adev))
 638                 return 0;
 639
 640         if (index < adev->doorbell.num_doorbells) {
 641                 return atomic64_read((atomic64_t *)(adev->doorbell.ptr + index));
 642         } else {
 643                 DRM_ERROR("reading beyond doorbell aperture: 0x%08x!\n", index);
 644                 return 0;
 645         }
 646 }
 647
 648 /**
 649  * amdgpu_mm_wdoorbell64 - write a doorbell Qword
 650  *
 651  * @adev: amdgpu_device pointer
 652  * @index: doorbell index
 653  * @v: value to write
 654  *
 655  * Writes @v to the doorbell aperture at the
 656  * requested doorbell index (VEGA10+).
 657  */
 658 void amdgpu_mm_wdoorbell64(struct amdgpu_device *adev, u32 index, u64 v)
 659 {
 660         if (amdgpu_device_skip_hw_access(adev))
 661                 return;
 662
 663         if (index < adev->doorbell.num_doorbells) {
 664                 atomic64_set((atomic64_t *)(adev->doorbell.ptr + index), v);
 665         } else {
 666                 DRM_ERROR("writing beyond doorbell aperture: 0x%08x!\n", index);
 667         }
 668 }
 669
 670 /**
 671  * amdgpu_device_indirect_rreg - read an indirect register
 672  *
 673  * @adev: amdgpu_device pointer
 674  * @pcie_index: mmio register offset
 675  * @pcie_data: mmio register offset
 676  * @reg_addr: indirect register address to read from
 677  *
 678  * Returns the value of indirect register @reg_addr
 679  */
 680 u32 amdgpu_device_indirect_rreg(struct amdgpu_device *adev,
 681                                 u32 pcie_index, u32 pcie_data,
 682                                 u32 reg_addr)
 683 {
 684         unsigned long flags;
 685         u32 r;
 686         void __iomem *pcie_index_offset;
 687         void __iomem *pcie_data_offset;
 688
 689         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
 690         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
 691         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
 692
 693         writel(reg_addr, pcie_index_offset);
 694         readl(pcie_index_offset);
 695         r = readl(pcie_data_offset);
 696         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
 697
 698         return r;
 699 }
 700
 701 /**
 702  * amdgpu_device_indirect_rreg64 - read a 64bits indirect register
 703  *
 704  * @adev: amdgpu_device pointer
 705  * @pcie_index: mmio register offset
 706  * @pcie_data: mmio register offset
 707  * @reg_addr: indirect register address to read from
 708  *
 709  * Returns the value of indirect register @reg_addr
 710  */
 711 u64 amdgpu_device_indirect_rreg64(struct amdgpu_device *adev,
 712                                   u32 pcie_index, u32 pcie_data,
 713                                   u32 reg_addr)
 714 {
 715         unsigned long flags;
 716         u64 r;
 717         void __iomem *pcie_index_offset;
 718         void __iomem *pcie_data_offset;
 719
 720         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
 721         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
 722         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
 723
 724         /* read low 32 bits */
 725         writel(reg_addr, pcie_index_offset);
 726         readl(pcie_index_offset);
 727         r = readl(pcie_data_offset);
 728         /* read high 32 bits */
 729         writel(reg_addr + 4, pcie_index_offset);
 730         readl(pcie_index_offset);
 731         r |= ((u64)readl(pcie_data_offset) << 32);
 732         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
 733
 734         return r;
 735 }
 736
 737 /**
 738  * amdgpu_device_indirect_wreg - write an indirect register address
 739  *
 740  * @adev: amdgpu_device pointer
 741  * @pcie_index: mmio register offset
 742  * @pcie_data: mmio register offset
 743  * @reg_addr: indirect register offset
 744  * @reg_data: indirect register data
 745  *
 746  */
 747 void amdgpu_device_indirect_wreg(struct amdgpu_device *adev,
 748                                  u32 pcie_index, u32 pcie_data,
 749                                  u32 reg_addr, u32 reg_data)
 750 {
 751         unsigned long flags;
 752         void __iomem *pcie_index_offset;
 753         void __iomem *pcie_data_offset;
 754
 755         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
 756         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
 757         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
 758
 759         writel(reg_addr, pcie_index_offset);
 760         readl(pcie_index_offset);
 761         writel(reg_data, pcie_data_offset);
 762         readl(pcie_data_offset);
 763         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
 764 }
 765
 766 /**
 767  * amdgpu_device_indirect_wreg64 - write a 64bits indirect register address
 768  *
 769  * @adev: amdgpu_device pointer
 770  * @pcie_index: mmio register offset
 771  * @pcie_data: mmio register offset
 772  * @reg_addr: indirect register offset
 773  * @reg_data: indirect register data
 774  *
 775  */
 776 void amdgpu_device_indirect_wreg64(struct amdgpu_device *adev,
 777                                    u32 pcie_index, u32 pcie_data,
 778                                    u32 reg_addr, u64 reg_data)
 779 {
 780         unsigned long flags;
 781         void __iomem *pcie_index_offset;
 782         void __iomem *pcie_data_offset;
 783
 784         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
 785         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
 786         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
 787
 788         /* write low 32 bits */
 789         writel(reg_addr, pcie_index_offset);
 790         readl(pcie_index_offset);
 791         writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
 792         readl(pcie_data_offset);
 793         /* write high 32 bits */
 794         writel(reg_addr + 4, pcie_index_offset);
 795         readl(pcie_index_offset);
 796         writel((u32)(reg_data >> 32), pcie_data_offset);
 797         readl(pcie_data_offset);
 798         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
 799 }
 800
 801 /**
 802  * amdgpu_invalid_rreg - dummy reg read function
 803  *
 804  * @adev: amdgpu_device pointer
 805  * @reg: offset of register
 806  *
 807  * Dummy register read function.  Used for register blocks
 808  * that certain asics don't have (all asics).
 809  * Returns the value in the register.
 810  */
 811 static uint32_t amdgpu_invalid_rreg(struct amdgpu_device *adev, uint32_t reg)
 812 {
 813         DRM_ERROR("Invalid callback to read register 0x%04X\n", reg);
 814         BUG();
 815         return 0;
 816 }
 817
 818 /**
 819  * amdgpu_invalid_wreg - dummy reg write function
 820  *
 821  * @adev: amdgpu_device pointer
 822  * @reg: offset of register
 823  * @v: value to write to the register
 824  *
 825  * Dummy register read function.  Used for register blocks
 826  * that certain asics don't have (all asics).
 827  */
 828 static void amdgpu_invalid_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
 829 {
 830         DRM_ERROR("Invalid callback to write register 0x%04X with 0x%08X\n",
 831                   reg, v);
 832         BUG();
 833 }
 834
 835 /**
 836  * amdgpu_invalid_rreg64 - dummy 64 bit reg read function
 837  *
 838  * @adev: amdgpu_device pointer
 839  * @reg: offset of register
 840  *
 841  * Dummy register read function.  Used for register blocks
 842  * that certain asics don't have (all asics).
 843  * Returns the value in the register.
 844  */
 845 static uint64_t amdgpu_invalid_rreg64(struct amdgpu_device *adev, uint32_t reg)
 846 {
 847         DRM_ERROR("Invalid callback to read 64 bit register 0x%04X\n", reg);
 848         BUG();
 849         return 0;
 850 }
 851
 852 /**
 853  * amdgpu_invalid_wreg64 - dummy reg write function
 854  *
 855  * @adev: amdgpu_device pointer
 856  * @reg: offset of register
 857  * @v: value to write to the register
 858  *
 859  * Dummy register read function.  Used for register blocks
 860  * that certain asics don't have (all asics).
 861  */
 862 static void amdgpu_invalid_wreg64(struct amdgpu_device *adev, uint32_t reg, uint64_t v)
 863 {
 864         DRM_ERROR("Invalid callback to write 64 bit register 0x%04X with 0x%08llX\n",
 865                   reg, v);
 866         BUG();
 867 }
 868
 869 /**
 870  * amdgpu_block_invalid_rreg - dummy reg read function
 871  *
 872  * @adev: amdgpu_device pointer
 873  * @block: offset of instance
 874  * @reg: offset of register
 875  *
 876  * Dummy register read function.  Used for register blocks
 877  * that certain asics don't have (all asics).
 878  * Returns the value in the register.
 879  */
 880 static uint32_t amdgpu_block_invalid_rreg(struct amdgpu_device *adev,
 881                                           uint32_t block, uint32_t reg)
 882 {
 883         DRM_ERROR("Invalid callback to read register 0x%04X in block 0x%04X\n",
 884                   reg, block);
 885         BUG();
 886         return 0;
 887 }
 888
 889 /**
 890  * amdgpu_block_invalid_wreg - dummy reg write function
 891  *
 892  * @adev: amdgpu_device pointer
 893  * @block: offset of instance
 894  * @reg: offset of register
 895  * @v: value to write to the register
 896  *
 897  * Dummy register read function.  Used for register blocks
 898  * that certain asics don't have (all asics).
 899  */
 900 static void amdgpu_block_invalid_wreg(struct amdgpu_device *adev,
 901                                       uint32_t block,
 902                                       uint32_t reg, uint32_t v)
 903 {
 904         DRM_ERROR("Invalid block callback to write register 0x%04X in block 0x%04X with 0x%08X\n",
 905                   reg, block, v);
 906         BUG();
 907 }
 908
 909 /**
 910  * amdgpu_device_asic_init - Wrapper for atom asic_init
 911  *
 912  * @adev: amdgpu_device pointer
 913  *
 914  * Does any asic specific work and then calls atom asic init.
 915  */
 916 static int amdgpu_device_asic_init(struct amdgpu_device *adev)
 917 {
 918         amdgpu_asic_pre_asic_init(adev);
 919
 920         if (adev->ip_versions[GC_HWIP][0] >= IP_VERSION(11, 0, 0))
 921                 return amdgpu_atomfirmware_asic_init(adev, true);
 922         else
 923                 return amdgpu_atom_asic_init(adev->mode_info.atom_context);
 924 }
 925
 926 /**
 927  * amdgpu_device_vram_scratch_init - allocate the VRAM scratch page
 928  *
 929  * @adev: amdgpu_device pointer
 930  *
 931  * Allocates a scratch page of VRAM for use by various things in the
 932  * driver.
 933  */
 934 static int amdgpu_device_vram_scratch_init(struct amdgpu_device *adev)
 935 {
 936         return amdgpu_bo_create_kernel(adev, AMDGPU_GPU_PAGE_SIZE,
 937                                        PAGE_SIZE, AMDGPU_GEM_DOMAIN_VRAM,
 938                                        &adev->vram_scratch.robj,
 939                                        &adev->vram_scratch.gpu_addr,
 940                                        (void **)&adev->vram_scratch.ptr);
 941 }
 942
 943 /**
 944  * amdgpu_device_vram_scratch_fini - Free the VRAM scratch page
 945  *
 946  * @adev: amdgpu_device pointer
 947  *
 948  * Frees the VRAM scratch page.
 949  */
 950 static void amdgpu_device_vram_scratch_fini(struct amdgpu_device *adev)
 951 {
 952         amdgpu_bo_free_kernel(&adev->vram_scratch.robj, NULL, NULL);
 953 }
 954
 955 /**
 956  * amdgpu_device_program_register_sequence - program an array of registers.
 957  *
 958  * @adev: amdgpu_device pointer
 959  * @registers: pointer to the register array
 960  * @array_size: size of the register array
 961  *
 962  * Programs an array or registers with and and or masks.
 963  * This is a helper for setting golden registers.
 964  */
 965 void amdgpu_device_program_register_sequence(struct amdgpu_device *adev,
 966                                              const u32 *registers,
 967                                              const u32 array_size)
 968 {
 969         u32 tmp, reg, and_mask, or_mask;
 970         int i;
 971
 972         if (array_size % 3)
 973                 return;
 974
 975         for (i = 0; i < array_size; i +=3) {
 976                 reg = registers[i + 0];
 977                 and_mask = registers[i + 1];
 978                 or_mask = registers[i + 2];
 979
 980                 if (and_mask == 0xffffffff) {
 981                         tmp = or_mask;
 982                 } else {
 983                         tmp = RREG32(reg);
 984                         tmp &= ~and_mask;
 985                         if (adev->family >= AMDGPU_FAMILY_AI)
 986                                 tmp |= (or_mask & and_mask);
 987                         else
 988                                 tmp |= or_mask;
 989                 }
 990                 WREG32(reg, tmp);
 991         }
 992 }
 993
 994 /**
 995  * amdgpu_device_pci_config_reset - reset the GPU
 996  *
 997  * @adev: amdgpu_device pointer
 998  *
 999  * Resets the GPU using the pci config reset sequence.
1000  * Only applicable to asics prior to vega10.
1001  */
1002 void amdgpu_device_pci_config_reset(struct amdgpu_device *adev)
1003 {
1004         pci_write_config_dword(adev->pdev, 0x7c, AMDGPU_ASIC_RESET_DATA);
1005 }
1006
1007 /**
1008  * amdgpu_device_pci_reset - reset the GPU using generic PCI means
1009  *
1010  * @adev: amdgpu_device pointer
1011  *
1012  * Resets the GPU using generic pci reset interfaces (FLR, SBR, etc.).
1013  */
1014 int amdgpu_device_pci_reset(struct amdgpu_device *adev)
1015 {
1016         return pci_reset_function(adev->pdev);
1017 }
1018
1019 /*
1020  * GPU doorbell aperture helpers function.
1021  */
1022 /**
1023  * amdgpu_device_doorbell_init - Init doorbell driver information.
1024  *
1025  * @adev: amdgpu_device pointer
1026  *
1027  * Init doorbell driver information (CIK)
1028  * Returns 0 on success, error on failure.
1029  */
1030 static int amdgpu_device_doorbell_init(struct amdgpu_device *adev)
1031 {
1032
1033         /* No doorbell on SI hardware generation */
1034         if (adev->asic_type < CHIP_BONAIRE) {
1035                 adev->doorbell.base = 0;
1036                 adev->doorbell.size = 0;
1037                 adev->doorbell.num_doorbells = 0;
1038                 adev->doorbell.ptr = NULL;
1039                 return 0;
1040         }
1041
1042         if (pci_resource_flags(adev->pdev, 2) & IORESOURCE_UNSET)
1043                 return -EINVAL;
1044
1045         amdgpu_asic_init_doorbell_index(adev);
1046
1047         /* doorbell bar mapping */
1048         adev->doorbell.base = pci_resource_start(adev->pdev, 2);
1049         adev->doorbell.size = pci_resource_len(adev->pdev, 2);
1050
1051         if (adev->enable_mes) {
1052                 adev->doorbell.num_doorbells =
1053                         adev->doorbell.size / sizeof(u32);
1054         } else {
1055                 adev->doorbell.num_doorbells =
1056                         min_t(u32, adev->doorbell.size / sizeof(u32),
1057                               adev->doorbell_index.max_assignment+1);
1058                 if (adev->doorbell.num_doorbells == 0)
1059                         return -EINVAL;
1060
1061                 /* For Vega, reserve and map two pages on doorbell BAR since SDMA
1062                  * paging queue doorbell use the second page. The
1063                  * AMDGPU_DOORBELL64_MAX_ASSIGNMENT definition assumes all the
1064                  * doorbells are in the first page. So with paging queue enabled,
1065                  * the max num_doorbells should + 1 page (0x400 in dword)
1066                  */
1067                 if (adev->asic_type >= CHIP_VEGA10)
1068                         adev->doorbell.num_doorbells += 0x400;
1069         }
1070
1071         adev->doorbell.ptr = ioremap(adev->doorbell.base,
1072                                      adev->doorbell.num_doorbells *
1073                                      sizeof(u32));
1074         if (adev->doorbell.ptr == NULL)
1075                 return -ENOMEM;
1076
1077         return 0;
1078 }
1079
1080 /**
1081  * amdgpu_device_doorbell_fini - Tear down doorbell driver information.
1082  *
1083  * @adev: amdgpu_device pointer
1084  *
1085  * Tear down doorbell driver information (CIK)
1086  */
1087 static void amdgpu_device_doorbell_fini(struct amdgpu_device *adev)
1088 {
1089         iounmap(adev->doorbell.ptr);
1090         adev->doorbell.ptr = NULL;
1091 }
1092
1093
1094
1095 /*
1096  * amdgpu_device_wb_*()
1097  * Writeback is the method by which the GPU updates special pages in memory
1098  * with the status of certain GPU events (fences, ring pointers,etc.).
1099  */
1100
1101 /**
1102  * amdgpu_device_wb_fini - Disable Writeback and free memory
1103  *
1104  * @adev: amdgpu_device pointer
1105  *
1106  * Disables Writeback and frees the Writeback memory (all asics).
1107  * Used at driver shutdown.
1108  */
1109 static void amdgpu_device_wb_fini(struct amdgpu_device *adev)
1110 {
1111         if (adev->wb.wb_obj) {
1112                 amdgpu_bo_free_kernel(&adev->wb.wb_obj,
1113                                       &adev->wb.gpu_addr,
1114                                       (void **)&adev->wb.wb);
1115                 adev->wb.wb_obj = NULL;
1116         }
1117 }
1118
1119 /**
1120  * amdgpu_device_wb_init - Init Writeback driver info and allocate memory
1121  *
1122  * @adev: amdgpu_device pointer
1123  *
1124  * Initializes writeback and allocates writeback memory (all asics).
1125  * Used at driver startup.
1126  * Returns 0 on success or an -error on failure.
1127  */
1128 static int amdgpu_device_wb_init(struct amdgpu_device *adev)
1129 {
1130         int r;
1131
1132         if (adev->wb.wb_obj == NULL) {
1133                 /* AMDGPU_MAX_WB * sizeof(uint32_t) * 8 = AMDGPU_MAX_WB 256bit slots */
1134                 r = amdgpu_bo_create_kernel(adev, AMDGPU_MAX_WB * sizeof(uint32_t) * 8,
1135                                             PAGE_SIZE, AMDGPU_GEM_DOMAIN_GTT,
1136                                             &adev->wb.wb_obj, &adev->wb.gpu_addr,
1137                                             (void **)&adev->wb.wb);
1138                 if (r) {
1139                         dev_warn(adev->dev, "(%d) create WB bo failed\n", r);
1140                         return r;
1141                 }
1142
1143                 adev->wb.num_wb = AMDGPU_MAX_WB;
1144                 memset(&adev->wb.used, 0, sizeof(adev->wb.used));
1145
1146                 /* clear wb memory */
1147                 memset((char *)adev->wb.wb, 0, AMDGPU_MAX_WB * sizeof(uint32_t) * 8);
1148         }
1149
1150         return 0;
1151 }
1152
1153 /**
1154  * amdgpu_device_wb_get - Allocate a wb entry
1155  *
1156  * @adev: amdgpu_device pointer
1157  * @wb: wb index
1158  *
1159  * Allocate a wb slot for use by the driver (all asics).
1160  * Returns 0 on success or -EINVAL on failure.
1161  */
1162 int amdgpu_device_wb_get(struct amdgpu_device *adev, u32 *wb)
1163 {
1164         unsigned long offset = find_first_zero_bit(adev->wb.used, adev->wb.num_wb);
1165
1166         if (offset < adev->wb.num_wb) {
1167                 __set_bit(offset, adev->wb.used);
1168                 *wb = offset << 3; /* convert to dw offset */
1169                 return 0;
1170         } else {
1171                 return -EINVAL;
1172         }
1173 }
1174
1175 /**
1176  * amdgpu_device_wb_free - Free a wb entry
1177  *
1178  * @adev: amdgpu_device pointer
1179  * @wb: wb index
1180  *
1181  * Free a wb slot allocated for use by the driver (all asics)
1182  */
1183 void amdgpu_device_wb_free(struct amdgpu_device *adev, u32 wb)
1184 {
1185         wb >>= 3;
1186         if (wb < adev->wb.num_wb)
1187                 __clear_bit(wb, adev->wb.used);
1188 }
1189
1190 /**
1191  * amdgpu_device_resize_fb_bar - try to resize FB BAR
1192  *
1193  * @adev: amdgpu_device pointer
1194  *
1195  * Try to resize FB BAR to make all VRAM CPU accessible. We try very hard not
1196  * to fail, but if any of the BARs is not accessible after the size we abort
1197  * driver loading by returning -ENODEV.
1198  */
1199 int amdgpu_device_resize_fb_bar(struct amdgpu_device *adev)
1200 {
1201         int rbar_size = pci_rebar_bytes_to_size(adev->gmc.real_vram_size);
1202         struct pci_bus *root;
1203         struct resource *res;
1204         unsigned i;
1205         u16 cmd;
1206         int r;
1207
1208         /* Bypass for VF */
1209         if (amdgpu_sriov_vf(adev))
1210                 return 0;
1211
1212         /* skip if the bios has already enabled large BAR */
1213         if (adev->gmc.real_vram_size &&
1214             (pci_resource_len(adev->pdev, 0) >= adev->gmc.real_vram_size))
1215                 return 0;
1216
1217         /* Check if the root BUS has 64bit memory resources */
1218         root = adev->pdev->bus;
1219         while (root->parent)
1220                 root = root->parent;
1221
1222         pci_bus_for_each_resource(root, res, i) {
1223                 if (res && res->flags & (IORESOURCE_MEM | IORESOURCE_MEM_64) &&
1224                     res->start > 0x100000000ull)
1225                         break;
1226         }
1227
1228         /* Trying to resize is pointless without a root hub window above 4GB */
1229         if (!res)
1230                 return 0;
1231
1232         /* Limit the BAR size to what is available */
1233         rbar_size = min(fls(pci_rebar_get_possible_sizes(adev->pdev, 0)) - 1,
1234                         rbar_size);
1235
1236         /* Disable memory decoding while we change the BAR addresses and size */
1237         pci_read_config_word(adev->pdev, PCI_COMMAND, &cmd);
1238         pci_write_config_word(adev->pdev, PCI_COMMAND,
1239                               cmd & ~PCI_COMMAND_MEMORY);
1240
1241         /* Free the VRAM and doorbell BAR, we most likely need to move both. */
1242         amdgpu_device_doorbell_fini(adev);
1243         if (adev->asic_type >= CHIP_BONAIRE)
1244                 pci_release_resource(adev->pdev, 2);
1245
1246         pci_release_resource(adev->pdev, 0);
1247
1248         r = pci_resize_resource(adev->pdev, 0, rbar_size);
1249         if (r == -ENOSPC)
1250                 DRM_INFO("Not enough PCI address space for a large BAR.");
1251         else if (r && r != -ENOTSUPP)
1252                 DRM_ERROR("Problem resizing BAR0 (%d).", r);
1253
1254         pci_assign_unassigned_bus_resources(adev->pdev->bus);
1255
1256         /* When the doorbell or fb BAR isn't available we have no chance of
1257          * using the device.
1258          */
1259         r = amdgpu_device_doorbell_init(adev);
1260         if (r || (pci_resource_flags(adev->pdev, 0) & IORESOURCE_UNSET))
1261                 return -ENODEV;
1262
1263         pci_write_config_word(adev->pdev, PCI_COMMAND, cmd);
1264
1265         return 0;
1266 }
1267
1268 /*
1269  * GPU helpers function.
1270  */
1271 /**
1272  * amdgpu_device_need_post - check if the hw need post or not
1273  *
1274  * @adev: amdgpu_device pointer
1275  *
1276  * Check if the asic has been initialized (all asics) at driver startup
1277  * or post is needed if  hw reset is performed.
1278  * Returns true if need or false if not.
1279  */
1280 bool amdgpu_device_need_post(struct amdgpu_device *adev)
1281 {
1282         uint32_t reg;
1283
1284         if (amdgpu_sriov_vf(adev))
1285                 return false;
1286
1287         if (amdgpu_passthrough(adev)) {
1288                 /* for FIJI: In whole GPU pass-through virtualization case, after VM reboot
1289                  * some old smc fw still need driver do vPost otherwise gpu hang, while
1290                  * those smc fw version above 22.15 doesn't have this flaw, so we force
1291                  * vpost executed for smc version below 22.15
1292                  */
1293                 if (adev->asic_type == CHIP_FIJI) {
1294                         int err;
1295                         uint32_t fw_ver;
1296                         err = request_firmware(&adev->pm.fw, "amdgpu/fiji_smc.bin", adev->dev);
1297                         /* force vPost if error occured */
1298                         if (err)
1299                                 return true;
1300
1301                         fw_ver = *((uint32_t *)adev->pm.fw->data + 69);
1302                         if (fw_ver < 0x00160e00)
1303                                 return true;
1304                 }
1305         }
1306
1307         /* Don't post if we need to reset whole hive on init */
1308         if (adev->gmc.xgmi.pending_reset)
1309                 return false;
1310
1311         if (adev->has_hw_reset) {
1312                 adev->has_hw_reset = false;
1313                 return true;
1314         }
1315
1316         /* bios scratch used on CIK+ */
1317         if (adev->asic_type >= CHIP_BONAIRE)
1318                 return amdgpu_atombios_scratch_need_asic_init(adev);
1319
1320         /* check MEM_SIZE for older asics */
1321         reg = amdgpu_asic_get_config_memsize(adev);
1322
1323         if ((reg != 0) && (reg != 0xffffffff))
1324                 return false;
1325
1326         return true;
1327 }
1328
1329 /**
1330  * amdgpu_device_should_use_aspm - check if the device should program ASPM
1331  *
1332  * @adev: amdgpu_device pointer
1333  *
1334  * Confirm whether the module parameter and pcie bridge agree that ASPM should
1335  * be set for this device.
1336  *
1337  * Returns true if it should be used or false if not.
1338  */
1339 bool amdgpu_device_should_use_aspm(struct amdgpu_device *adev)
1340 {
1341         switch (amdgpu_aspm) {
1342         case -1:
1343                 break;
1344         case 0:
1345                 return false;
1346         case 1:
1347                 return true;
1348         default:
1349                 return false;
1350         }
1351         return pcie_aspm_enabled(adev->pdev);
1352 }
1353
1354 /* if we get transitioned to only one device, take VGA back */
1355 /**
1356  * amdgpu_device_vga_set_decode - enable/disable vga decode
1357  *
1358  * @pdev: PCI device pointer
1359  * @state: enable/disable vga decode
1360  *
1361  * Enable/disable vga decode (all asics).
1362  * Returns VGA resource flags.
1363  */
1364 static unsigned int amdgpu_device_vga_set_decode(struct pci_dev *pdev,
1365                 bool state)
1366 {
1367         struct amdgpu_device *adev = drm_to_adev(pci_get_drvdata(pdev));
1368         amdgpu_asic_set_vga_state(adev, state);
1369         if (state)
1370                 return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
1371                        VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1372         else
1373                 return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1374 }
1375
1376 /**
1377  * amdgpu_device_check_block_size - validate the vm block size
1378  *
1379  * @adev: amdgpu_device pointer
1380  *
1381  * Validates the vm block size specified via module parameter.
1382  * The vm block size defines number of bits in page table versus page directory,
1383  * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
1384  * page table and the remaining bits are in the page directory.
1385  */
1386 static void amdgpu_device_check_block_size(struct amdgpu_device *adev)
1387 {
1388         /* defines number of bits in page table versus page directory,
1389          * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
1390          * page table and the remaining bits are in the page directory */
1391         if (amdgpu_vm_block_size == -1)
1392                 return;
1393
1394         if (amdgpu_vm_block_size < 9) {
1395                 dev_warn(adev->dev, "VM page table size (%d) too small\n",
1396                          amdgpu_vm_block_size);
1397                 amdgpu_vm_block_size = -1;
1398         }
1399 }
1400
1401 /**
1402  * amdgpu_device_check_vm_size - validate the vm size
1403  *
1404  * @adev: amdgpu_device pointer
1405  *
1406  * Validates the vm size in GB specified via module parameter.
1407  * The VM size is the size of the GPU virtual memory space in GB.
1408  */
1409 static void amdgpu_device_check_vm_size(struct amdgpu_device *adev)
1410 {
1411         /* no need to check the default value */
1412         if (amdgpu_vm_size == -1)
1413                 return;
1414
1415         if (amdgpu_vm_size < 1) {
1416                 dev_warn(adev->dev, "VM size (%d) too small, min is 1GB\n",
1417                          amdgpu_vm_size);
1418                 amdgpu_vm_size = -1;
1419         }
1420 }
1421
1422 static void amdgpu_device_check_smu_prv_buffer_size(struct amdgpu_device *adev)
1423 {
1424         struct sysinfo si;
1425         bool is_os_64 = (sizeof(void *) == 8);
1426         uint64_t total_memory;
1427         uint64_t dram_size_seven_GB = 0x1B8000000;
1428         uint64_t dram_size_three_GB = 0xB8000000;
1429
1430         if (amdgpu_smu_memory_pool_size == 0)
1431                 return;
1432
1433         if (!is_os_64) {
1434                 DRM_WARN("Not 64-bit OS, feature not supported\n");
1435                 goto def_value;
1436         }
1437         si_meminfo(&si);
1438         total_memory = (uint64_t)si.totalram * si.mem_unit;
1439
1440         if ((amdgpu_smu_memory_pool_size == 1) ||
1441                 (amdgpu_smu_memory_pool_size == 2)) {
1442                 if (total_memory < dram_size_three_GB)
1443                         goto def_value1;
1444         } else if ((amdgpu_smu_memory_pool_size == 4) ||
1445                 (amdgpu_smu_memory_pool_size == 8)) {
1446                 if (total_memory < dram_size_seven_GB)
1447                         goto def_value1;
1448         } else {
1449                 DRM_WARN("Smu memory pool size not supported\n");
1450                 goto def_value;
1451         }
1452         adev->pm.smu_prv_buffer_size = amdgpu_smu_memory_pool_size << 28;
1453
1454         return;
1455
1456 def_value1:
1457         DRM_WARN("No enough system memory\n");
1458 def_value:
1459         adev->pm.smu_prv_buffer_size = 0;
1460 }
1461
1462 static int amdgpu_device_init_apu_flags(struct amdgpu_device *adev)
1463 {
1464         if (!(adev->flags & AMD_IS_APU) ||
1465             adev->asic_type < CHIP_RAVEN)
1466                 return 0;
1467
1468         switch (adev->asic_type) {
1469         case CHIP_RAVEN:
1470                 if (adev->pdev->device == 0x15dd)
1471                         adev->apu_flags |= AMD_APU_IS_RAVEN;
1472                 if (adev->pdev->device == 0x15d8)
1473                         adev->apu_flags |= AMD_APU_IS_PICASSO;
1474                 break;
1475         case CHIP_RENOIR:
1476                 if ((adev->pdev->device == 0x1636) ||
1477                     (adev->pdev->device == 0x164c))
1478                         adev->apu_flags |= AMD_APU_IS_RENOIR;
1479                 else
1480                         adev->apu_flags |= AMD_APU_IS_GREEN_SARDINE;
1481                 break;
1482         case CHIP_VANGOGH:
1483                 adev->apu_flags |= AMD_APU_IS_VANGOGH;
1484                 break;
1485         case CHIP_YELLOW_CARP:
1486                 break;
1487         case CHIP_CYAN_SKILLFISH:
1488                 if ((adev->pdev->device == 0x13FE) ||
1489                     (adev->pdev->device == 0x143F))
1490                         adev->apu_flags |= AMD_APU_IS_CYAN_SKILLFISH2;
1491                 break;
1492         default:
1493                 break;
1494         }
1495
1496         return 0;
1497 }
1498
1499 /**
1500  * amdgpu_device_check_arguments - validate module params
1501  *
1502  * @adev: amdgpu_device pointer
1503  *
1504  * Validates certain module parameters and updates
1505  * the associated values used by the driver (all asics).
1506  */
1507 static int amdgpu_device_check_arguments(struct amdgpu_device *adev)
1508 {
1509         if (amdgpu_sched_jobs < 4) {
1510                 dev_warn(adev->dev, "sched jobs (%d) must be at least 4\n",
1511                          amdgpu_sched_jobs);
1512                 amdgpu_sched_jobs = 4;
1513         } else if (!is_power_of_2(amdgpu_sched_jobs)){
1514                 dev_warn(adev->dev, "sched jobs (%d) must be a power of 2\n",
1515                          amdgpu_sched_jobs);
1516                 amdgpu_sched_jobs = roundup_pow_of_two(amdgpu_sched_jobs);
1517         }
1518
1519         if (amdgpu_gart_size != -1 && amdgpu_gart_size < 32) {
1520                 /* gart size must be greater or equal to 32M */
1521                 dev_warn(adev->dev, "gart size (%d) too small\n",
1522                          amdgpu_gart_size);
1523                 amdgpu_gart_size = -1;
1524         }
1525
1526         if (amdgpu_gtt_size != -1 && amdgpu_gtt_size < 32) {
1527                 /* gtt size must be greater or equal to 32M */
1528                 dev_warn(adev->dev, "gtt size (%d) too small\n",
1529                                  amdgpu_gtt_size);
1530                 amdgpu_gtt_size = -1;
1531         }
1532
1533         /* valid range is between 4 and 9 inclusive */
1534         if (amdgpu_vm_fragment_size != -1 &&
1535             (amdgpu_vm_fragment_size > 9 || amdgpu_vm_fragment_size < 4)) {
1536                 dev_warn(adev->dev, "valid range is between 4 and 9\n");
1537                 amdgpu_vm_fragment_size = -1;
1538         }
1539
1540         if (amdgpu_sched_hw_submission < 2) {
1541                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be at least 2\n",
1542                          amdgpu_sched_hw_submission);
1543                 amdgpu_sched_hw_submission = 2;
1544         } else if (!is_power_of_2(amdgpu_sched_hw_submission)) {
1545                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be a power of 2\n",
1546                          amdgpu_sched_hw_submission);
1547                 amdgpu_sched_hw_submission = roundup_pow_of_two(amdgpu_sched_hw_submission);
1548         }
1549
1550         if (amdgpu_reset_method < -1 || amdgpu_reset_method > 4) {
1551                 dev_warn(adev->dev, "invalid option for reset method, reverting to default\n");
1552                 amdgpu_reset_method = -1;
1553         }
1554
1555         amdgpu_device_check_smu_prv_buffer_size(adev);
1556
1557         amdgpu_device_check_vm_size(adev);
1558
1559         amdgpu_device_check_block_size(adev);
1560
1561         adev->firmware.load_type = amdgpu_ucode_get_load_type(adev, amdgpu_fw_load_type);
1562
1563         return 0;
1564 }
1565
1566 /**
1567  * amdgpu_switcheroo_set_state - set switcheroo state
1568  *
1569  * @pdev: pci dev pointer
1570  * @state: vga_switcheroo state
1571  *
1572  * Callback for the switcheroo driver.  Suspends or resumes
1573  * the asics before or after it is powered up using ACPI methods.
1574  */
1575 static void amdgpu_switcheroo_set_state(struct pci_dev *pdev,
1576                                         enum vga_switcheroo_state state)
1577 {
1578         struct drm_device *dev = pci_get_drvdata(pdev);
1579         int r;
1580
1581         if (amdgpu_device_supports_px(dev) && state == VGA_SWITCHEROO_OFF)
1582                 return;
1583
1584         if (state == VGA_SWITCHEROO_ON) {
1585                 pr_info("switched on\n");
1586                 /* don't suspend or resume card normally */
1587                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
1588
1589                 pci_set_power_state(pdev, PCI_D0);
1590                 amdgpu_device_load_pci_state(pdev);
1591                 r = pci_enable_device(pdev);
1592                 if (r)
1593                         DRM_WARN("pci_enable_device failed (%d)\n", r);
1594                 amdgpu_device_resume(dev, true);
1595
1596                 dev->switch_power_state = DRM_SWITCH_POWER_ON;
1597         } else {
1598                 pr_info("switched off\n");
1599                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
1600                 amdgpu_device_suspend(dev, true);
1601                 amdgpu_device_cache_pci_state(pdev);
1602                 /* Shut down the device */
1603                 pci_disable_device(pdev);
1604                 pci_set_power_state(pdev, PCI_D3cold);
1605                 dev->switch_power_state = DRM_SWITCH_POWER_OFF;
1606         }
1607 }
1608
1609 /**
1610  * amdgpu_switcheroo_can_switch - see if switcheroo state can change
1611  *
1612  * @pdev: pci dev pointer
1613  *
1614  * Callback for the switcheroo driver.  Check of the switcheroo
1615  * state can be changed.
1616  * Returns true if the state can be changed, false if not.
1617  */
1618 static bool amdgpu_switcheroo_can_switch(struct pci_dev *pdev)
1619 {
1620         struct drm_device *dev = pci_get_drvdata(pdev);
1621
1622         /*
1623         * FIXME: open_count is protected by drm_global_mutex but that would lead to
1624         * locking inversion with the driver load path. And the access here is
1625         * completely racy anyway. So don't bother with locking for now.
1626         */
1627         return atomic_read(&dev->open_count) == 0;
1628 }
1629
1630 static const struct vga_switcheroo_client_ops amdgpu_switcheroo_ops = {
1631         .set_gpu_state = amdgpu_switcheroo_set_state,
1632         .reprobe = NULL,
1633         .can_switch = amdgpu_switcheroo_can_switch,
1634 };
1635
1636 /**
1637  * amdgpu_device_ip_set_clockgating_state - set the CG state
1638  *
1639  * @dev: amdgpu_device pointer
1640  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1641  * @state: clockgating state (gate or ungate)
1642  *
1643  * Sets the requested clockgating state for all instances of
1644  * the hardware IP specified.
1645  * Returns the error code from the last instance.
1646  */
1647 int amdgpu_device_ip_set_clockgating_state(void *dev,
1648                                            enum amd_ip_block_type block_type,
1649                                            enum amd_clockgating_state state)
1650 {
1651         struct amdgpu_device *adev = dev;
1652         int i, r = 0;
1653
1654         for (i = 0; i < adev->num_ip_blocks; i++) {
1655                 if (!adev->ip_blocks[i].status.valid)
1656                         continue;
1657                 if (adev->ip_blocks[i].version->type != block_type)
1658                         continue;
1659                 if (!adev->ip_blocks[i].version->funcs->set_clockgating_state)
1660                         continue;
1661                 r = adev->ip_blocks[i].version->funcs->set_clockgating_state(
1662                         (void *)adev, state);
1663                 if (r)
1664                         DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
1665                                   adev->ip_blocks[i].version->funcs->name, r);
1666         }
1667         return r;
1668 }
1669
1670 /**
1671  * amdgpu_device_ip_set_powergating_state - set the PG state
1672  *
1673  * @dev: amdgpu_device pointer
1674  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1675  * @state: powergating state (gate or ungate)
1676  *
1677  * Sets the requested powergating state for all instances of
1678  * the hardware IP specified.
1679  * Returns the error code from the last instance.
1680  */
1681 int amdgpu_device_ip_set_powergating_state(void *dev,
1682                                            enum amd_ip_block_type block_type,
1683                                            enum amd_powergating_state state)
1684 {
1685         struct amdgpu_device *adev = dev;
1686         int i, r = 0;
1687
1688         for (i = 0; i < adev->num_ip_blocks; i++) {
1689                 if (!adev->ip_blocks[i].status.valid)
1690                         continue;
1691                 if (adev->ip_blocks[i].version->type != block_type)
1692                         continue;
1693                 if (!adev->ip_blocks[i].version->funcs->set_powergating_state)
1694                         continue;
1695                 r = adev->ip_blocks[i].version->funcs->set_powergating_state(
1696                         (void *)adev, state);
1697                 if (r)
1698                         DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
1699                                   adev->ip_blocks[i].version->funcs->name, r);
1700         }
1701         return r;
1702 }
1703
1704 /**
1705  * amdgpu_device_ip_get_clockgating_state - get the CG state
1706  *
1707  * @adev: amdgpu_device pointer
1708  * @flags: clockgating feature flags
1709  *
1710  * Walks the list of IPs on the device and updates the clockgating
1711  * flags for each IP.
1712  * Updates @flags with the feature flags for each hardware IP where
1713  * clockgating is enabled.
1714  */
1715 void amdgpu_device_ip_get_clockgating_state(struct amdgpu_device *adev,
1716                                             u64 *flags)
1717 {
1718         int i;
1719
1720         for (i = 0; i < adev->num_ip_blocks; i++) {
1721                 if (!adev->ip_blocks[i].status.valid)
1722                         continue;
1723                 if (adev->ip_blocks[i].version->funcs->get_clockgating_state)
1724                         adev->ip_blocks[i].version->funcs->get_clockgating_state((void *)adev, flags);
1725         }
1726 }
1727
1728 /**
1729  * amdgpu_device_ip_wait_for_idle - wait for idle
1730  *
1731  * @adev: amdgpu_device pointer
1732  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1733  *
1734  * Waits for the request hardware IP to be idle.
1735  * Returns 0 for success or a negative error code on failure.
1736  */
1737 int amdgpu_device_ip_wait_for_idle(struct amdgpu_device *adev,
1738                                    enum amd_ip_block_type block_type)
1739 {
1740         int i, r;
1741
1742         for (i = 0; i < adev->num_ip_blocks; i++) {
1743                 if (!adev->ip_blocks[i].status.valid)
1744                         continue;
1745                 if (adev->ip_blocks[i].version->type == block_type) {
1746                         r = adev->ip_blocks[i].version->funcs->wait_for_idle((void *)adev);
1747                         if (r)
1748                                 return r;
1749                         break;
1750                 }
1751         }
1752         return 0;
1753
1754 }
1755
1756 /**
1757  * amdgpu_device_ip_is_idle - is the hardware IP idle
1758  *
1759  * @adev: amdgpu_device pointer
1760  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
1761  *
1762  * Check if the hardware IP is idle or not.
1763  * Returns true if it the IP is idle, false if not.
1764  */
1765 bool amdgpu_device_ip_is_idle(struct amdgpu_device *adev,
1766                               enum amd_ip_block_type block_type)
1767 {
1768         int i;
1769
1770         for (i = 0; i < adev->num_ip_blocks; i++) {
1771                 if (!adev->ip_blocks[i].status.valid)
1772                         continue;
1773                 if (adev->ip_blocks[i].version->type == block_type)
1774                         return adev->ip_blocks[i].version->funcs->is_idle((void *)adev);
1775         }
1776         return true;
1777
1778 }
1779
1780 /**
1781  * amdgpu_device_ip_get_ip_block - get a hw IP pointer
1782  *
1783  * @adev: amdgpu_device pointer
1784  * @type: Type of hardware IP (SMU, GFX, UVD, etc.)
1785  *
1786  * Returns a pointer to the hardware IP block structure
1787  * if it exists for the asic, otherwise NULL.
1788  */
1789 struct amdgpu_ip_block *
1790 amdgpu_device_ip_get_ip_block(struct amdgpu_device *adev,
1791                               enum amd_ip_block_type type)
1792 {
1793         int i;
1794
1795         for (i = 0; i < adev->num_ip_blocks; i++)
1796                 if (adev->ip_blocks[i].version->type == type)
1797                         return &adev->ip_blocks[i];
1798
1799         return NULL;
1800 }
1801
1802 /**
1803  * amdgpu_device_ip_block_version_cmp
1804  *
1805  * @adev: amdgpu_device pointer
1806  * @type: enum amd_ip_block_type
1807  * @major: major version
1808  * @minor: minor version
1809  *
1810  * return 0 if equal or greater
1811  * return 1 if smaller or the ip_block doesn't exist
1812  */
1813 int amdgpu_device_ip_block_version_cmp(struct amdgpu_device *adev,
1814                                        enum amd_ip_block_type type,
1815                                        u32 major, u32 minor)
1816 {
1817         struct amdgpu_ip_block *ip_block = amdgpu_device_ip_get_ip_block(adev, type);
1818
1819         if (ip_block && ((ip_block->version->major > major) ||
1820                         ((ip_block->version->major == major) &&
1821                         (ip_block->version->minor >= minor))))
1822                 return 0;
1823
1824         return 1;
1825 }
1826
1827 /**
1828  * amdgpu_device_ip_block_add
1829  *
1830  * @adev: amdgpu_device pointer
1831  * @ip_block_version: pointer to the IP to add
1832  *
1833  * Adds the IP block driver information to the collection of IPs
1834  * on the asic.
1835  */
1836 int amdgpu_device_ip_block_add(struct amdgpu_device *adev,
1837                                const struct amdgpu_ip_block_version *ip_block_version)
1838 {
1839         if (!ip_block_version)
1840                 return -EINVAL;
1841
1842         switch (ip_block_version->type) {
1843         case AMD_IP_BLOCK_TYPE_VCN:
1844                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_VCN_MASK)
1845                         return 0;
1846                 break;
1847         case AMD_IP_BLOCK_TYPE_JPEG:
1848                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_JPEG_MASK)
1849                         return 0;
1850                 break;
1851         default:
1852                 break;
1853         }
1854
1855         DRM_INFO("add ip block number %d <%s>\n", adev->num_ip_blocks,
1856                   ip_block_version->funcs->name);
1857
1858         adev->ip_blocks[adev->num_ip_blocks++].version = ip_block_version;
1859
1860         return 0;
1861 }
1862
1863 /**
1864  * amdgpu_device_enable_virtual_display - enable virtual display feature
1865  *
1866  * @adev: amdgpu_device pointer
1867  *
1868  * Enabled the virtual display feature if the user has enabled it via
1869  * the module parameter virtual_display.  This feature provides a virtual
1870  * display hardware on headless boards or in virtualized environments.
1871  * This function parses and validates the configuration string specified by
1872  * the user and configues the virtual display configuration (number of
1873  * virtual connectors, crtcs, etc.) specified.
1874  */
1875 static void amdgpu_device_enable_virtual_display(struct amdgpu_device *adev)
1876 {
1877         adev->enable_virtual_display = false;
1878
1879         if (amdgpu_virtual_display) {
1880                 const char *pci_address_name = pci_name(adev->pdev);
1881                 char *pciaddstr, *pciaddstr_tmp, *pciaddname_tmp, *pciaddname;
1882
1883                 pciaddstr = kstrdup(amdgpu_virtual_display, GFP_KERNEL);
1884                 pciaddstr_tmp = pciaddstr;
1885                 while ((pciaddname_tmp = strsep(&pciaddstr_tmp, ";"))) {
1886                         pciaddname = strsep(&pciaddname_tmp, ",");
1887                         if (!strcmp("all", pciaddname)
1888                             || !strcmp(pci_address_name, pciaddname)) {
1889                                 long num_crtc;
1890                                 int res = -1;
1891
1892                                 adev->enable_virtual_display = true;
1893
1894                                 if (pciaddname_tmp)
1895                                         res = kstrtol(pciaddname_tmp, 10,
1896                                                       &num_crtc);
1897
1898                                 if (!res) {
1899                                         if (num_crtc < 1)
1900                                                 num_crtc = 1;
1901                                         if (num_crtc > 6)
1902                                                 num_crtc = 6;
1903                                         adev->mode_info.num_crtc = num_crtc;
1904                                 } else {
1905                                         adev->mode_info.num_crtc = 1;
1906                                 }
1907                                 break;
1908                         }
1909                 }
1910
1911                 DRM_INFO("virtual display string:%s, %s:virtual_display:%d, num_crtc:%d\n",
1912                          amdgpu_virtual_display, pci_address_name,
1913                          adev->enable_virtual_display, adev->mode_info.num_crtc);
1914
1915                 kfree(pciaddstr);
1916         }
1917 }
1918
1919 void amdgpu_device_set_sriov_virtual_display(struct amdgpu_device *adev)
1920 {
1921         if (amdgpu_sriov_vf(adev) && !adev->enable_virtual_display) {
1922                 adev->mode_info.num_crtc = 1;
1923                 adev->enable_virtual_display = true;
1924                 DRM_INFO("virtual_display:%d, num_crtc:%d\n",
1925                          adev->enable_virtual_display, adev->mode_info.num_crtc);
1926         }
1927 }
1928
1929 /**
1930  * amdgpu_device_parse_gpu_info_fw - parse gpu info firmware
1931  *
1932  * @adev: amdgpu_device pointer
1933  *
1934  * Parses the asic configuration parameters specified in the gpu info
1935  * firmware and makes them availale to the driver for use in configuring
1936  * the asic.
1937  * Returns 0 on success, -EINVAL on failure.
1938  */
1939 static int amdgpu_device_parse_gpu_info_fw(struct amdgpu_device *adev)
1940 {
1941         const char *chip_name;
1942         char fw_name[40];
1943         int err;
1944         const struct gpu_info_firmware_header_v1_0 *hdr;
1945
1946         adev->firmware.gpu_info_fw = NULL;
1947
1948         if (adev->mman.discovery_bin) {
1949                 /*
1950                  * FIXME: The bounding box is still needed by Navi12, so
1951                  * temporarily read it from gpu_info firmware. Should be dropped
1952                  * when DAL no longer needs it.
1953                  */
1954                 if (adev->asic_type != CHIP_NAVI12)
1955                         return 0;
1956         }
1957
1958         switch (adev->asic_type) {
1959         default:
1960                 return 0;
1961         case CHIP_VEGA10:
1962                 chip_name = "vega10";
1963                 break;
1964         case CHIP_VEGA12:
1965                 chip_name = "vega12";
1966                 break;
1967         case CHIP_RAVEN:
1968                 if (adev->apu_flags & AMD_APU_IS_RAVEN2)
1969                         chip_name = "raven2";
1970                 else if (adev->apu_flags & AMD_APU_IS_PICASSO)
1971                         chip_name = "picasso";
1972                 else
1973                         chip_name = "raven";
1974                 break;
1975         case CHIP_ARCTURUS:
1976                 chip_name = "arcturus";
1977                 break;
1978         case CHIP_NAVI12:
1979                 chip_name = "navi12";
1980                 break;
1981         }
1982
1983         snprintf(fw_name, sizeof(fw_name), "amdgpu/%s_gpu_info.bin", chip_name);
1984         err = request_firmware(&adev->firmware.gpu_info_fw, fw_name, adev->dev);
1985         if (err) {
1986                 dev_err(adev->dev,
1987                         "Failed to load gpu_info firmware \"%s\"\n",
1988                         fw_name);
1989                 goto out;
1990         }
1991         err = amdgpu_ucode_validate(adev->firmware.gpu_info_fw);
1992         if (err) {
1993                 dev_err(adev->dev,
1994                         "Failed to validate gpu_info firmware \"%s\"\n",
1995                         fw_name);
1996                 goto out;
1997         }
1998
1999         hdr = (const struct gpu_info_firmware_header_v1_0 *)adev->firmware.gpu_info_fw->data;
2000         amdgpu_ucode_print_gpu_info_hdr(&hdr->header);
2001
2002         switch (hdr->version_major) {
2003         case 1:
2004         {
2005                 const struct gpu_info_firmware_v1_0 *gpu_info_fw =
2006                         (const struct gpu_info_firmware_v1_0 *)(adev->firmware.gpu_info_fw->data +
2007                                                                 le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2008
2009                 /*
2010                  * Should be droped when DAL no longer needs it.
2011                  */
2012                 if (adev->asic_type == CHIP_NAVI12)
2013                         goto parse_soc_bounding_box;
2014
2015                 adev->gfx.config.max_shader_engines = le32_to_cpu(gpu_info_fw->gc_num_se);
2016                 adev->gfx.config.max_cu_per_sh = le32_to_cpu(gpu_info_fw->gc_num_cu_per_sh);
2017                 adev->gfx.config.max_sh_per_se = le32_to_cpu(gpu_info_fw->gc_num_sh_per_se);
2018                 adev->gfx.config.max_backends_per_se = le32_to_cpu(gpu_info_fw->gc_num_rb_per_se);
2019                 adev->gfx.config.max_texture_channel_caches =
2020                         le32_to_cpu(gpu_info_fw->gc_num_tccs);
2021                 adev->gfx.config.max_gprs = le32_to_cpu(gpu_info_fw->gc_num_gprs);
2022                 adev->gfx.config.max_gs_threads = le32_to_cpu(gpu_info_fw->gc_num_max_gs_thds);
2023                 adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gpu_info_fw->gc_gs_table_depth);
2024                 adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gpu_info_fw->gc_gsprim_buff_depth);
2025                 adev->gfx.config.double_offchip_lds_buf =
2026                         le32_to_cpu(gpu_info_fw->gc_double_offchip_lds_buffer);
2027                 adev->gfx.cu_info.wave_front_size = le32_to_cpu(gpu_info_fw->gc_wave_size);
2028                 adev->gfx.cu_info.max_waves_per_simd =
2029                         le32_to_cpu(gpu_info_fw->gc_max_waves_per_simd);
2030                 adev->gfx.cu_info.max_scratch_slots_per_cu =
2031                         le32_to_cpu(gpu_info_fw->gc_max_scratch_slots_per_cu);
2032                 adev->gfx.cu_info.lds_size = le32_to_cpu(gpu_info_fw->gc_lds_size);
2033                 if (hdr->version_minor >= 1) {
2034                         const struct gpu_info_firmware_v1_1 *gpu_info_fw =
2035                                 (const struct gpu_info_firmware_v1_1 *)(adev->firmware.gpu_info_fw->data +
2036                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2037                         adev->gfx.config.num_sc_per_sh =
2038                                 le32_to_cpu(gpu_info_fw->num_sc_per_sh);
2039                         adev->gfx.config.num_packer_per_sc =
2040                                 le32_to_cpu(gpu_info_fw->num_packer_per_sc);
2041                 }
2042
2043 parse_soc_bounding_box:
2044                 /*
2045                  * soc bounding box info is not integrated in disocovery table,
2046                  * we always need to parse it from gpu info firmware if needed.
2047                  */
2048                 if (hdr->version_minor == 2) {
2049                         const struct gpu_info_firmware_v1_2 *gpu_info_fw =
2050                                 (const struct gpu_info_firmware_v1_2 *)(adev->firmware.gpu_info_fw->data +
2051                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2052                         adev->dm.soc_bounding_box = &gpu_info_fw->soc_bounding_box;
2053                 }
2054                 break;
2055         }
2056         default:
2057                 dev_err(adev->dev,
2058                         "Unsupported gpu_info table %d\n", hdr->header.ucode_version);
2059                 err = -EINVAL;
2060                 goto out;
2061         }
2062 out:
2063         return err;
2064 }
2065
2066 /**
2067  * amdgpu_device_ip_early_init - run early init for hardware IPs
2068  *
2069  * @adev: amdgpu_device pointer
2070  *
2071  * Early initialization pass for hardware IPs.  The hardware IPs that make
2072  * up each asic are discovered each IP's early_init callback is run.  This
2073  * is the first stage in initializing the asic.
2074  * Returns 0 on success, negative error code on failure.
2075  */
2076 static int amdgpu_device_ip_early_init(struct amdgpu_device *adev)
2077 {
2078         struct drm_device *dev = adev_to_drm(adev);
2079         struct pci_dev *parent;
2080         int i, r;
2081
2082         amdgpu_device_enable_virtual_display(adev);
2083
2084         if (amdgpu_sriov_vf(adev)) {
2085                 r = amdgpu_virt_request_full_gpu(adev, true);
2086                 if (r)
2087                         return r;
2088         }
2089
2090         switch (adev->asic_type) {
2091 #ifdef CONFIG_DRM_AMDGPU_SI
2092         case CHIP_VERDE:
2093         case CHIP_TAHITI:
2094         case CHIP_PITCAIRN:
2095         case CHIP_OLAND:
2096         case CHIP_HAINAN:
2097                 adev->family = AMDGPU_FAMILY_SI;
2098                 r = si_set_ip_blocks(adev);
2099                 if (r)
2100                         return r;
2101                 break;
2102 #endif
2103 #ifdef CONFIG_DRM_AMDGPU_CIK
2104         case CHIP_BONAIRE:
2105         case CHIP_HAWAII:
2106         case CHIP_KAVERI:
2107         case CHIP_KABINI:
2108         case CHIP_MULLINS:
2109                 if (adev->flags & AMD_IS_APU)
2110                         adev->family = AMDGPU_FAMILY_KV;
2111                 else
2112                         adev->family = AMDGPU_FAMILY_CI;
2113
2114                 r = cik_set_ip_blocks(adev);
2115                 if (r)
2116                         return r;
2117                 break;
2118 #endif
2119         case CHIP_TOPAZ:
2120         case CHIP_TONGA:
2121         case CHIP_FIJI:
2122         case CHIP_POLARIS10:
2123         case CHIP_POLARIS11:
2124         case CHIP_POLARIS12:
2125         case CHIP_VEGAM:
2126         case CHIP_CARRIZO:
2127         case CHIP_STONEY:
2128                 if (adev->flags & AMD_IS_APU)
2129                         adev->family = AMDGPU_FAMILY_CZ;
2130                 else
2131                         adev->family = AMDGPU_FAMILY_VI;
2132
2133                 r = vi_set_ip_blocks(adev);
2134                 if (r)
2135                         return r;
2136                 break;
2137         default:
2138                 r = amdgpu_discovery_set_ip_blocks(adev);
2139                 if (r)
2140                         return r;
2141                 break;
2142         }
2143
2144         if (amdgpu_has_atpx() &&
2145             (amdgpu_is_atpx_hybrid() ||
2146              amdgpu_has_atpx_dgpu_power_cntl()) &&
2147             ((adev->flags & AMD_IS_APU) == 0) &&
2148             !pci_is_thunderbolt_attached(to_pci_dev(dev->dev)))
2149                 adev->flags |= AMD_IS_PX;
2150
2151         if (!(adev->flags & AMD_IS_APU)) {
2152                 parent = pci_upstream_bridge(adev->pdev);
2153                 adev->has_pr3 = parent ? pci_pr3_present(parent) : false;
2154         }
2155
2156         amdgpu_amdkfd_device_probe(adev);
2157
2158         adev->pm.pp_feature = amdgpu_pp_feature_mask;
2159         if (amdgpu_sriov_vf(adev) || sched_policy == KFD_SCHED_POLICY_NO_HWS)
2160                 adev->pm.pp_feature &= ~PP_GFXOFF_MASK;
2161         if (amdgpu_sriov_vf(adev) && adev->asic_type == CHIP_SIENNA_CICHLID)
2162                 adev->pm.pp_feature &= ~PP_OVERDRIVE_MASK;
2163
2164         for (i = 0; i < adev->num_ip_blocks; i++) {
2165                 if ((amdgpu_ip_block_mask & (1 << i)) == 0) {
2166                         DRM_ERROR("disabled ip block: %d <%s>\n",
2167                                   i, adev->ip_blocks[i].version->funcs->name);
2168                         adev->ip_blocks[i].status.valid = false;
2169                 } else {
2170                         if (adev->ip_blocks[i].version->funcs->early_init) {
2171                                 r = adev->ip_blocks[i].version->funcs->early_init((void *)adev);
2172                                 if (r == -ENOENT) {
2173                                         adev->ip_blocks[i].status.valid = false;
2174                                 } else if (r) {
2175                                         DRM_ERROR("early_init of IP block <%s> failed %d\n",
2176                                                   adev->ip_blocks[i].version->funcs->name, r);
2177                                         return r;
2178                                 } else {
2179                                         adev->ip_blocks[i].status.valid = true;
2180                                 }
2181                         } else {
2182                                 adev->ip_blocks[i].status.valid = true;
2183                         }
2184                 }
2185                 /* get the vbios after the asic_funcs are set up */
2186                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2187                         r = amdgpu_device_parse_gpu_info_fw(adev);
2188                         if (r)
2189                                 return r;
2190
2191                         /* Read BIOS */
2192                         if (!amdgpu_get_bios(adev))
2193                                 return -EINVAL;
2194
2195                         r = amdgpu_atombios_init(adev);
2196                         if (r) {
2197                                 dev_err(adev->dev, "amdgpu_atombios_init failed\n");
2198                                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_INIT_FAIL, 0, 0);
2199                                 return r;
2200                         }
2201
2202                         /*get pf2vf msg info at it's earliest time*/
2203                         if (amdgpu_sriov_vf(adev))
2204                                 amdgpu_virt_init_data_exchange(adev);
2205
2206                 }
2207         }
2208
2209         adev->cg_flags &= amdgpu_cg_mask;
2210         adev->pg_flags &= amdgpu_pg_mask;
2211
2212         return 0;
2213 }
2214
2215 static int amdgpu_device_ip_hw_init_phase1(struct amdgpu_device *adev)
2216 {
2217         int i, r;
2218
2219         for (i = 0; i < adev->num_ip_blocks; i++) {
2220                 if (!adev->ip_blocks[i].status.sw)
2221                         continue;
2222                 if (adev->ip_blocks[i].status.hw)
2223                         continue;
2224                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
2225                     (amdgpu_sriov_vf(adev) && (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)) ||
2226                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH) {
2227                         r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2228                         if (r) {
2229                                 DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2230                                           adev->ip_blocks[i].version->funcs->name, r);
2231                                 return r;
2232                         }
2233                         adev->ip_blocks[i].status.hw = true;
2234                 }
2235         }
2236
2237         return 0;
2238 }
2239
2240 static int amdgpu_device_ip_hw_init_phase2(struct amdgpu_device *adev)
2241 {
2242         int i, r;
2243
2244         for (i = 0; i < adev->num_ip_blocks; i++) {
2245                 if (!adev->ip_blocks[i].status.sw)
2246                         continue;
2247                 if (adev->ip_blocks[i].status.hw)
2248                         continue;
2249                 r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2250                 if (r) {
2251                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2252                                   adev->ip_blocks[i].version->funcs->name, r);
2253                         return r;
2254                 }
2255                 adev->ip_blocks[i].status.hw = true;
2256         }
2257
2258         return 0;
2259 }
2260
2261 static int amdgpu_device_fw_loading(struct amdgpu_device *adev)
2262 {
2263         int r = 0;
2264         int i;
2265         uint32_t smu_version;
2266
2267         if (adev->asic_type >= CHIP_VEGA10) {
2268                 for (i = 0; i < adev->num_ip_blocks; i++) {
2269                         if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_PSP)
2270                                 continue;
2271
2272                         if (!adev->ip_blocks[i].status.sw)
2273                                 continue;
2274
2275                         /* no need to do the fw loading again if already done*/
2276                         if (adev->ip_blocks[i].status.hw == true)
2277                                 break;
2278
2279                         if (amdgpu_in_reset(adev) || adev->in_suspend) {
2280                                 r = adev->ip_blocks[i].version->funcs->resume(adev);
2281                                 if (r) {
2282                                         DRM_ERROR("resume of IP block <%s> failed %d\n",
2283                                                           adev->ip_blocks[i].version->funcs->name, r);
2284                                         return r;
2285                                 }
2286                         } else {
2287                                 r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2288                                 if (r) {
2289                                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2290                                                           adev->ip_blocks[i].version->funcs->name, r);
2291                                         return r;
2292                                 }
2293                         }
2294
2295                         adev->ip_blocks[i].status.hw = true;
2296                         break;
2297                 }
2298         }
2299
2300         if (!amdgpu_sriov_vf(adev) || adev->asic_type == CHIP_TONGA)
2301                 r = amdgpu_pm_load_smu_firmware(adev, &smu_version);
2302
2303         return r;
2304 }
2305
2306 static int amdgpu_device_init_schedulers(struct amdgpu_device *adev)
2307 {
2308         long timeout;
2309         int r, i;
2310
2311         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2312                 struct amdgpu_ring *ring = adev->rings[i];
2313
2314                 /* No need to setup the GPU scheduler for rings that don't need it */
2315                 if (!ring || ring->no_scheduler)
2316                         continue;
2317
2318                 switch (ring->funcs->type) {
2319                 case AMDGPU_RING_TYPE_GFX:
2320                         timeout = adev->gfx_timeout;
2321                         break;
2322                 case AMDGPU_RING_TYPE_COMPUTE:
2323                         timeout = adev->compute_timeout;
2324                         break;
2325                 case AMDGPU_RING_TYPE_SDMA:
2326                         timeout = adev->sdma_timeout;
2327                         break;
2328                 default:
2329                         timeout = adev->video_timeout;
2330                         break;
2331                 }
2332
2333                 r = drm_sched_init(&ring->sched, &amdgpu_sched_ops,
2334                                    ring->num_hw_submission, amdgpu_job_hang_limit,
2335                                    timeout, adev->reset_domain->wq,
2336                                    ring->sched_score, ring->name,
2337                                    adev->dev);
2338                 if (r) {
2339                         DRM_ERROR("Failed to create scheduler on ring %s.\n",
2340                                   ring->name);
2341                         return r;
2342                 }
2343         }
2344
2345         return 0;
2346 }
2347
2348
2349 /**
2350  * amdgpu_device_ip_init - run init for hardware IPs
2351  *
2352  * @adev: amdgpu_device pointer
2353  *
2354  * Main initialization pass for hardware IPs.  The list of all the hardware
2355  * IPs that make up the asic is walked and the sw_init and hw_init callbacks
2356  * are run.  sw_init initializes the software state associated with each IP
2357  * and hw_init initializes the hardware associated with each IP.
2358  * Returns 0 on success, negative error code on failure.
2359  */
2360 static int amdgpu_device_ip_init(struct amdgpu_device *adev)
2361 {
2362         int i, r;
2363
2364         r = amdgpu_ras_init(adev);
2365         if (r)
2366                 return r;
2367
2368         for (i = 0; i < adev->num_ip_blocks; i++) {
2369                 if (!adev->ip_blocks[i].status.valid)
2370                         continue;
2371                 r = adev->ip_blocks[i].version->funcs->sw_init((void *)adev);
2372                 if (r) {
2373                         DRM_ERROR("sw_init of IP block <%s> failed %d\n",
2374                                   adev->ip_blocks[i].version->funcs->name, r);
2375                         goto init_failed;
2376                 }
2377                 adev->ip_blocks[i].status.sw = true;
2378
2379                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2380                         /* need to do common hw init early so everything is set up for gmc */
2381                         r = adev->ip_blocks[i].version->funcs->hw_init((void *)adev);
2382                         if (r) {
2383                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2384                                 goto init_failed;
2385                         }
2386                         adev->ip_blocks[i].status.hw = true;
2387                 } else if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2388                         /* need to do gmc hw init early so we can allocate gpu mem */
2389                         /* Try to reserve bad pages early */
2390                         if (amdgpu_sriov_vf(adev))
2391                                 amdgpu_virt_exchange_data(adev);
2392
2393                         r = amdgpu_device_vram_scratch_init(adev);
2394                         if (r) {
2395                                 DRM_ERROR("amdgpu_vram_scratch_init failed %d\n", r);
2396                                 goto init_failed;
2397                         }
2398                         r = adev->ip_blocks[i].version->funcs->hw_init((void *)adev);
2399                         if (r) {
2400                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2401                                 goto init_failed;
2402                         }
2403                         r = amdgpu_device_wb_init(adev);
2404                         if (r) {
2405                                 DRM_ERROR("amdgpu_device_wb_init failed %d\n", r);
2406                                 goto init_failed;
2407                         }
2408                         adev->ip_blocks[i].status.hw = true;
2409
2410                         /* right after GMC hw init, we create CSA */
2411                         if (amdgpu_mcbp) {
2412                                 r = amdgpu_allocate_static_csa(adev, &adev->virt.csa_obj,
2413                                                                 AMDGPU_GEM_DOMAIN_VRAM,
2414                                                                 AMDGPU_CSA_SIZE);
2415                                 if (r) {
2416                                         DRM_ERROR("allocate CSA failed %d\n", r);
2417                                         goto init_failed;
2418                                 }
2419                         }
2420                 }
2421         }
2422
2423         if (amdgpu_sriov_vf(adev))
2424                 amdgpu_virt_init_data_exchange(adev);
2425
2426         r = amdgpu_ib_pool_init(adev);
2427         if (r) {
2428                 dev_err(adev->dev, "IB initialization failed (%d).\n", r);
2429                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_IB_INIT_FAIL, 0, r);
2430                 goto init_failed;
2431         }
2432
2433         r = amdgpu_ucode_create_bo(adev); /* create ucode bo when sw_init complete*/
2434         if (r)
2435                 goto init_failed;
2436
2437         r = amdgpu_device_ip_hw_init_phase1(adev);
2438         if (r)
2439                 goto init_failed;
2440
2441         r = amdgpu_device_fw_loading(adev);
2442         if (r)
2443                 goto init_failed;
2444
2445         r = amdgpu_device_ip_hw_init_phase2(adev);
2446         if (r)
2447                 goto init_failed;
2448
2449         /*
2450          * retired pages will be loaded from eeprom and reserved here,
2451          * it should be called after amdgpu_device_ip_hw_init_phase2  since
2452          * for some ASICs the RAS EEPROM code relies on SMU fully functioning
2453          * for I2C communication which only true at this point.
2454          *
2455          * amdgpu_ras_recovery_init may fail, but the upper only cares the
2456          * failure from bad gpu situation and stop amdgpu init process
2457          * accordingly. For other failed cases, it will still release all
2458          * the resource and print error message, rather than returning one
2459          * negative value to upper level.
2460          *
2461          * Note: theoretically, this should be called before all vram allocations
2462          * to protect retired page from abusing
2463          */
2464         r = amdgpu_ras_recovery_init(adev);
2465         if (r)
2466                 goto init_failed;
2467
2468         /**
2469          * In case of XGMI grab extra reference for reset domain for this device
2470          */
2471         if (adev->gmc.xgmi.num_physical_nodes > 1) {
2472                 if (amdgpu_xgmi_add_device(adev) == 0) {
2473                         if (!amdgpu_sriov_vf(adev)) {
2474                                 struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
2475
2476                                 if (!hive->reset_domain ||
2477                                     !amdgpu_reset_get_reset_domain(hive->reset_domain)) {
2478                                         r = -ENOENT;
2479                                         amdgpu_put_xgmi_hive(hive);
2480                                         goto init_failed;
2481                                 }
2482
2483                                 /* Drop the early temporary reset domain we created for device */
2484                                 amdgpu_reset_put_reset_domain(adev->reset_domain);
2485                                 adev->reset_domain = hive->reset_domain;
2486                                 amdgpu_put_xgmi_hive(hive);
2487                         }
2488                 }
2489         }
2490
2491         r = amdgpu_device_init_schedulers(adev);
2492         if (r)
2493                 goto init_failed;
2494
2495         /* Don't init kfd if whole hive need to be reset during init */
2496         if (!adev->gmc.xgmi.pending_reset)
2497                 amdgpu_amdkfd_device_init(adev);
2498
2499         amdgpu_fru_get_product_info(adev);
2500
2501 init_failed:
2502         if (amdgpu_sriov_vf(adev))
2503                 amdgpu_virt_release_full_gpu(adev, true);
2504
2505         return r;
2506 }
2507
2508 /**
2509  * amdgpu_device_fill_reset_magic - writes reset magic to gart pointer
2510  *
2511  * @adev: amdgpu_device pointer
2512  *
2513  * Writes a reset magic value to the gart pointer in VRAM.  The driver calls
2514  * this function before a GPU reset.  If the value is retained after a
2515  * GPU reset, VRAM has not been lost.  Some GPU resets may destry VRAM contents.
2516  */
2517 static void amdgpu_device_fill_reset_magic(struct amdgpu_device *adev)
2518 {
2519         memcpy(adev->reset_magic, adev->gart.ptr, AMDGPU_RESET_MAGIC_NUM);
2520 }
2521
2522 /**
2523  * amdgpu_device_check_vram_lost - check if vram is valid
2524  *
2525  * @adev: amdgpu_device pointer
2526  *
2527  * Checks the reset magic value written to the gart pointer in VRAM.
2528  * The driver calls this after a GPU reset to see if the contents of
2529  * VRAM is lost or now.
2530  * returns true if vram is lost, false if not.
2531  */
2532 static bool amdgpu_device_check_vram_lost(struct amdgpu_device *adev)
2533 {
2534         if (memcmp(adev->gart.ptr, adev->reset_magic,
2535                         AMDGPU_RESET_MAGIC_NUM))
2536                 return true;
2537
2538         if (!amdgpu_in_reset(adev))
2539                 return false;
2540
2541         /*
2542          * For all ASICs with baco/mode1 reset, the VRAM is
2543          * always assumed to be lost.
2544          */
2545         switch (amdgpu_asic_reset_method(adev)) {
2546         case AMD_RESET_METHOD_BACO:
2547         case AMD_RESET_METHOD_MODE1:
2548                 return true;
2549         default:
2550                 return false;
2551         }
2552 }
2553
2554 /**
2555  * amdgpu_device_set_cg_state - set clockgating for amdgpu device
2556  *
2557  * @adev: amdgpu_device pointer
2558  * @state: clockgating state (gate or ungate)
2559  *
2560  * The list of all the hardware IPs that make up the asic is walked and the
2561  * set_clockgating_state callbacks are run.
2562  * Late initialization pass enabling clockgating for hardware IPs.
2563  * Fini or suspend, pass disabling clockgating for hardware IPs.
2564  * Returns 0 on success, negative error code on failure.
2565  */
2566
2567 int amdgpu_device_set_cg_state(struct amdgpu_device *adev,
2568                                enum amd_clockgating_state state)
2569 {
2570         int i, j, r;
2571
2572         if (amdgpu_emu_mode == 1)
2573                 return 0;
2574
2575         for (j = 0; j < adev->num_ip_blocks; j++) {
2576                 i = state == AMD_CG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
2577                 if (!adev->ip_blocks[i].status.late_initialized)
2578                         continue;
2579                 /* skip CG for GFX on S0ix */
2580                 if (adev->in_s0ix &&
2581                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX)
2582                         continue;
2583                 /* skip CG for VCE/UVD, it's handled specially */
2584                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
2585                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
2586                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
2587                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
2588                     adev->ip_blocks[i].version->funcs->set_clockgating_state) {
2589                         /* enable clockgating to save power */
2590                         r = adev->ip_blocks[i].version->funcs->set_clockgating_state((void *)adev,
2591                                                                                      state);
2592                         if (r) {
2593                                 DRM_ERROR("set_clockgating_state(gate) of IP block <%s> failed %d\n",
2594                                           adev->ip_blocks[i].version->funcs->name, r);
2595                                 return r;
2596                         }
2597                 }
2598         }
2599
2600         return 0;
2601 }
2602
2603 int amdgpu_device_set_pg_state(struct amdgpu_device *adev,
2604                                enum amd_powergating_state state)
2605 {
2606         int i, j, r;
2607
2608         if (amdgpu_emu_mode == 1)
2609                 return 0;
2610
2611         for (j = 0; j < adev->num_ip_blocks; j++) {
2612                 i = state == AMD_PG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
2613                 if (!adev->ip_blocks[i].status.late_initialized)
2614                         continue;
2615                 /* skip PG for GFX on S0ix */
2616                 if (adev->in_s0ix &&
2617                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX)
2618                         continue;
2619                 /* skip CG for VCE/UVD, it's handled specially */
2620                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
2621                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
2622                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
2623                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
2624                     adev->ip_blocks[i].version->funcs->set_powergating_state) {
2625                         /* enable powergating to save power */
2626                         r = adev->ip_blocks[i].version->funcs->set_powergating_state((void *)adev,
2627                                                                                         state);
2628                         if (r) {
2629                                 DRM_ERROR("set_powergating_state(gate) of IP block <%s> failed %d\n",
2630                                           adev->ip_blocks[i].version->funcs->name, r);
2631                                 return r;
2632                         }
2633                 }
2634         }
2635         return 0;
2636 }
2637
2638 static int amdgpu_device_enable_mgpu_fan_boost(void)
2639 {
2640         struct amdgpu_gpu_instance *gpu_ins;
2641         struct amdgpu_device *adev;
2642         int i, ret = 0;
2643
2644         mutex_lock(&mgpu_info.mutex);
2645
2646         /*
2647          * MGPU fan boost feature should be enabled
2648          * only when there are two or more dGPUs in
2649          * the system
2650          */
2651         if (mgpu_info.num_dgpu < 2)
2652                 goto out;
2653
2654         for (i = 0; i < mgpu_info.num_dgpu; i++) {
2655                 gpu_ins = &(mgpu_info.gpu_ins[i]);
2656                 adev = gpu_ins->adev;
2657                 if (!(adev->flags & AMD_IS_APU) &&
2658                     !gpu_ins->mgpu_fan_enabled) {
2659                         ret = amdgpu_dpm_enable_mgpu_fan_boost(adev);
2660                         if (ret)
2661                                 break;
2662
2663                         gpu_ins->mgpu_fan_enabled = 1;
2664                 }
2665         }
2666
2667 out:
2668         mutex_unlock(&mgpu_info.mutex);
2669
2670         return ret;
2671 }
2672
2673 /**
2674  * amdgpu_device_ip_late_init - run late init for hardware IPs
2675  *
2676  * @adev: amdgpu_device pointer
2677  *
2678  * Late initialization pass for hardware IPs.  The list of all the hardware
2679  * IPs that make up the asic is walked and the late_init callbacks are run.
2680  * late_init covers any special initialization that an IP requires
2681  * after all of the have been initialized or something that needs to happen
2682  * late in the init process.
2683  * Returns 0 on success, negative error code on failure.
2684  */
2685 static int amdgpu_device_ip_late_init(struct amdgpu_device *adev)
2686 {
2687         struct amdgpu_gpu_instance *gpu_instance;
2688         int i = 0, r;
2689
2690         for (i = 0; i < adev->num_ip_blocks; i++) {
2691                 if (!adev->ip_blocks[i].status.hw)
2692                         continue;
2693                 if (adev->ip_blocks[i].version->funcs->late_init) {
2694                         r = adev->ip_blocks[i].version->funcs->late_init((void *)adev);
2695                         if (r) {
2696                                 DRM_ERROR("late_init of IP block <%s> failed %d\n",
2697                                           adev->ip_blocks[i].version->funcs->name, r);
2698                                 return r;
2699                         }
2700                 }
2701                 adev->ip_blocks[i].status.late_initialized = true;
2702         }
2703
2704         r = amdgpu_ras_late_init(adev);
2705         if (r) {
2706                 DRM_ERROR("amdgpu_ras_late_init failed %d", r);
2707                 return r;
2708         }
2709
2710         amdgpu_ras_set_error_query_ready(adev, true);
2711
2712         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_GATE);
2713         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_GATE);
2714
2715         amdgpu_device_fill_reset_magic(adev);
2716
2717         r = amdgpu_device_enable_mgpu_fan_boost();
2718         if (r)
2719                 DRM_ERROR("enable mgpu fan boost failed (%d).\n", r);
2720
2721         /* For passthrough configuration on arcturus and aldebaran, enable special handling SBR */
2722         if (amdgpu_passthrough(adev) && ((adev->asic_type == CHIP_ARCTURUS && adev->gmc.xgmi.num_physical_nodes > 1)||
2723                                adev->asic_type == CHIP_ALDEBARAN ))
2724                 amdgpu_dpm_handle_passthrough_sbr(adev, true);
2725
2726         if (adev->gmc.xgmi.num_physical_nodes > 1) {
2727                 mutex_lock(&mgpu_info.mutex);
2728
2729                 /*
2730                  * Reset device p-state to low as this was booted with high.
2731                  *
2732                  * This should be performed only after all devices from the same
2733                  * hive get initialized.
2734                  *
2735                  * However, it's unknown how many device in the hive in advance.
2736                  * As this is counted one by one during devices initializations.
2737                  *
2738                  * So, we wait for all XGMI interlinked devices initialized.
2739                  * This may bring some delays as those devices may come from
2740                  * different hives. But that should be OK.
2741                  */
2742                 if (mgpu_info.num_dgpu == adev->gmc.xgmi.num_physical_nodes) {
2743                         for (i = 0; i < mgpu_info.num_gpu; i++) {
2744                                 gpu_instance = &(mgpu_info.gpu_ins[i]);
2745                                 if (gpu_instance->adev->flags & AMD_IS_APU)
2746                                         continue;
2747
2748                                 r = amdgpu_xgmi_set_pstate(gpu_instance->adev,
2749                                                 AMDGPU_XGMI_PSTATE_MIN);
2750                                 if (r) {
2751                                         DRM_ERROR("pstate setting failed (%d).\n", r);
2752                                         break;
2753                                 }
2754                         }
2755                 }
2756
2757                 mutex_unlock(&mgpu_info.mutex);
2758         }
2759
2760         return 0;
2761 }
2762
2763 /**
2764  * amdgpu_device_smu_fini_early - smu hw_fini wrapper
2765  *
2766  * @adev: amdgpu_device pointer
2767  *
2768  * For ASICs need to disable SMC first
2769  */
2770 static void amdgpu_device_smu_fini_early(struct amdgpu_device *adev)
2771 {
2772         int i, r;
2773
2774         if (adev->ip_versions[GC_HWIP][0] > IP_VERSION(9, 0, 0))
2775                 return;
2776
2777         for (i = 0; i < adev->num_ip_blocks; i++) {
2778                 if (!adev->ip_blocks[i].status.hw)
2779                         continue;
2780                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
2781                         r = adev->ip_blocks[i].version->funcs->hw_fini((void *)adev);
2782                         /* XXX handle errors */
2783                         if (r) {
2784                                 DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
2785                                           adev->ip_blocks[i].version->funcs->name, r);
2786                         }
2787                         adev->ip_blocks[i].status.hw = false;
2788                         break;
2789                 }
2790         }
2791 }
2792
2793 static int amdgpu_device_ip_fini_early(struct amdgpu_device *adev)
2794 {
2795         int i, r;
2796
2797         for (i = 0; i < adev->num_ip_blocks; i++) {
2798                 if (!adev->ip_blocks[i].version->funcs->early_fini)
2799                         continue;
2800
2801                 r = adev->ip_blocks[i].version->funcs->early_fini((void *)adev);
2802                 if (r) {
2803                         DRM_DEBUG("early_fini of IP block <%s> failed %d\n",
2804                                   adev->ip_blocks[i].version->funcs->name, r);
2805                 }
2806         }
2807
2808         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
2809         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
2810
2811         amdgpu_amdkfd_suspend(adev, false);
2812
2813         /* Workaroud for ASICs need to disable SMC first */
2814         amdgpu_device_smu_fini_early(adev);
2815
2816         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2817                 if (!adev->ip_blocks[i].status.hw)
2818                         continue;
2819
2820                 r = adev->ip_blocks[i].version->funcs->hw_fini((void *)adev);
2821                 /* XXX handle errors */
2822                 if (r) {
2823                         DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
2824                                   adev->ip_blocks[i].version->funcs->name, r);
2825                 }
2826
2827                 adev->ip_blocks[i].status.hw = false;
2828         }
2829
2830         if (amdgpu_sriov_vf(adev)) {
2831                 if (amdgpu_virt_release_full_gpu(adev, false))
2832                         DRM_ERROR("failed to release exclusive mode on fini\n");
2833         }
2834
2835         return 0;
2836 }
2837
2838 /**
2839  * amdgpu_device_ip_fini - run fini for hardware IPs
2840  *
2841  * @adev: amdgpu_device pointer
2842  *
2843  * Main teardown pass for hardware IPs.  The list of all the hardware
2844  * IPs that make up the asic is walked and the hw_fini and sw_fini callbacks
2845  * are run.  hw_fini tears down the hardware associated with each IP
2846  * and sw_fini tears down any software state associated with each IP.
2847  * Returns 0 on success, negative error code on failure.
2848  */
2849 static int amdgpu_device_ip_fini(struct amdgpu_device *adev)
2850 {
2851         int i, r;
2852
2853         if (amdgpu_sriov_vf(adev) && adev->virt.ras_init_done)
2854                 amdgpu_virt_release_ras_err_handler_data(adev);
2855
2856         if (adev->gmc.xgmi.num_physical_nodes > 1)
2857                 amdgpu_xgmi_remove_device(adev);
2858
2859         amdgpu_amdkfd_device_fini_sw(adev);
2860
2861         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2862                 if (!adev->ip_blocks[i].status.sw)
2863                         continue;
2864
2865                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2866                         amdgpu_ucode_free_bo(adev);
2867                         amdgpu_free_static_csa(&adev->virt.csa_obj);
2868                         amdgpu_device_wb_fini(adev);
2869                         amdgpu_device_vram_scratch_fini(adev);
2870                         amdgpu_ib_pool_fini(adev);
2871                 }
2872
2873                 r = adev->ip_blocks[i].version->funcs->sw_fini((void *)adev);
2874                 /* XXX handle errors */
2875                 if (r) {
2876                         DRM_DEBUG("sw_fini of IP block <%s> failed %d\n",
2877                                   adev->ip_blocks[i].version->funcs->name, r);
2878                 }
2879                 adev->ip_blocks[i].status.sw = false;
2880                 adev->ip_blocks[i].status.valid = false;
2881         }
2882
2883         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2884                 if (!adev->ip_blocks[i].status.late_initialized)
2885                         continue;
2886                 if (adev->ip_blocks[i].version->funcs->late_fini)
2887                         adev->ip_blocks[i].version->funcs->late_fini((void *)adev);
2888                 adev->ip_blocks[i].status.late_initialized = false;
2889         }
2890
2891         amdgpu_ras_fini(adev);
2892
2893         return 0;
2894 }
2895
2896 /**
2897  * amdgpu_device_delayed_init_work_handler - work handler for IB tests
2898  *
2899  * @work: work_struct.
2900  */
2901 static void amdgpu_device_delayed_init_work_handler(struct work_struct *work)
2902 {
2903         struct amdgpu_device *adev =
2904                 container_of(work, struct amdgpu_device, delayed_init_work.work);
2905         int r;
2906
2907         r = amdgpu_ib_ring_tests(adev);
2908         if (r)
2909                 DRM_ERROR("ib ring test failed (%d).\n", r);
2910 }
2911
2912 static void amdgpu_device_delay_enable_gfx_off(struct work_struct *work)
2913 {
2914         struct amdgpu_device *adev =
2915                 container_of(work, struct amdgpu_device, gfx.gfx_off_delay_work.work);
2916
2917         WARN_ON_ONCE(adev->gfx.gfx_off_state);
2918         WARN_ON_ONCE(adev->gfx.gfx_off_req_count);
2919
2920         if (!amdgpu_dpm_set_powergating_by_smu(adev, AMD_IP_BLOCK_TYPE_GFX, true))
2921                 adev->gfx.gfx_off_state = true;
2922 }
2923
2924 /**
2925  * amdgpu_device_ip_suspend_phase1 - run suspend for hardware IPs (phase 1)
2926  *
2927  * @adev: amdgpu_device pointer
2928  *
2929  * Main suspend function for hardware IPs.  The list of all the hardware
2930  * IPs that make up the asic is walked, clockgating is disabled and the
2931  * suspend callbacks are run.  suspend puts the hardware and software state
2932  * in each IP into a state suitable for suspend.
2933  * Returns 0 on success, negative error code on failure.
2934  */
2935 static int amdgpu_device_ip_suspend_phase1(struct amdgpu_device *adev)
2936 {
2937         int i, r;
2938
2939         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
2940         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
2941
2942         /*
2943          * Per PMFW team's suggestion, driver needs to handle gfxoff
2944          * and df cstate features disablement for gpu reset(e.g. Mode1Reset)
2945          * scenario. Add the missing df cstate disablement here.
2946          */
2947         if (amdgpu_dpm_set_df_cstate(adev, DF_CSTATE_DISALLOW))
2948                 dev_warn(adev->dev, "Failed to disallow df cstate");
2949
2950         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2951                 if (!adev->ip_blocks[i].status.valid)
2952                         continue;
2953
2954                 /* displays are handled separately */
2955                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_DCE)
2956                         continue;
2957
2958                 /* XXX handle errors */
2959                 r = adev->ip_blocks[i].version->funcs->suspend(adev);
2960                 /* XXX handle errors */
2961                 if (r) {
2962                         DRM_ERROR("suspend of IP block <%s> failed %d\n",
2963                                   adev->ip_blocks[i].version->funcs->name, r);
2964                         return r;
2965                 }
2966
2967                 adev->ip_blocks[i].status.hw = false;
2968         }
2969
2970         return 0;
2971 }
2972
2973 /**
2974  * amdgpu_device_ip_suspend_phase2 - run suspend for hardware IPs (phase 2)
2975  *
2976  * @adev: amdgpu_device pointer
2977  *
2978  * Main suspend function for hardware IPs.  The list of all the hardware
2979  * IPs that make up the asic is walked, clockgating is disabled and the
2980  * suspend callbacks are run.  suspend puts the hardware and software state
2981  * in each IP into a state suitable for suspend.
2982  * Returns 0 on success, negative error code on failure.
2983  */
2984 static int amdgpu_device_ip_suspend_phase2(struct amdgpu_device *adev)
2985 {
2986         int i, r;
2987
2988         if (adev->in_s0ix)
2989                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D3Entry);
2990
2991         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
2992                 if (!adev->ip_blocks[i].status.valid)
2993                         continue;
2994                 /* displays are handled in phase1 */
2995                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE)
2996                         continue;
2997                 /* PSP lost connection when err_event_athub occurs */
2998                 if (amdgpu_ras_intr_triggered() &&
2999                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
3000                         adev->ip_blocks[i].status.hw = false;
3001                         continue;
3002                 }
3003
3004                 /* skip unnecessary suspend if we do not initialize them yet */
3005                 if (adev->gmc.xgmi.pending_reset &&
3006                     !(adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3007                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC ||
3008                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3009                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH)) {
3010                         adev->ip_blocks[i].status.hw = false;
3011                         continue;
3012                 }
3013
3014                 /* skip suspend of gfx and psp for S0ix
3015                  * gfx is in gfxoff state, so on resume it will exit gfxoff just
3016                  * like at runtime. PSP is also part of the always on hardware
3017                  * so no need to suspend it.
3018                  */
3019                 if (adev->in_s0ix &&
3020                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP ||
3021                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX))
3022                         continue;
3023
3024                 /* XXX handle errors */
3025                 r = adev->ip_blocks[i].version->funcs->suspend(adev);
3026                 /* XXX handle errors */
3027                 if (r) {
3028                         DRM_ERROR("suspend of IP block <%s> failed %d\n",
3029                                   adev->ip_blocks[i].version->funcs->name, r);
3030                 }
3031                 adev->ip_blocks[i].status.hw = false;
3032                 /* handle putting the SMC in the appropriate state */
3033                 if(!amdgpu_sriov_vf(adev)){
3034                         if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3035                                 r = amdgpu_dpm_set_mp1_state(adev, adev->mp1_state);
3036                                 if (r) {
3037                                         DRM_ERROR("SMC failed to set mp1 state %d, %d\n",
3038                                                         adev->mp1_state, r);
3039                                         return r;
3040                                 }
3041                         }
3042                 }
3043         }
3044
3045         return 0;
3046 }
3047
3048 /**
3049  * amdgpu_device_ip_suspend - run suspend for hardware IPs
3050  *
3051  * @adev: amdgpu_device pointer
3052  *
3053  * Main suspend function for hardware IPs.  The list of all the hardware
3054  * IPs that make up the asic is walked, clockgating is disabled and the
3055  * suspend callbacks are run.  suspend puts the hardware and software state
3056  * in each IP into a state suitable for suspend.
3057  * Returns 0 on success, negative error code on failure.
3058  */
3059 int amdgpu_device_ip_suspend(struct amdgpu_device *adev)
3060 {
3061         int r;
3062
3063         if (amdgpu_sriov_vf(adev)) {
3064                 amdgpu_virt_fini_data_exchange(adev);
3065                 amdgpu_virt_request_full_gpu(adev, false);
3066         }
3067
3068         r = amdgpu_device_ip_suspend_phase1(adev);
3069         if (r)
3070                 return r;
3071         r = amdgpu_device_ip_suspend_phase2(adev);
3072
3073         if (amdgpu_sriov_vf(adev))
3074                 amdgpu_virt_release_full_gpu(adev, false);
3075
3076         return r;
3077 }
3078
3079 static int amdgpu_device_ip_reinit_early_sriov(struct amdgpu_device *adev)
3080 {
3081         int i, r;
3082
3083         static enum amd_ip_block_type ip_order[] = {
3084                 AMD_IP_BLOCK_TYPE_COMMON,
3085                 AMD_IP_BLOCK_TYPE_GMC,
3086                 AMD_IP_BLOCK_TYPE_PSP,
3087                 AMD_IP_BLOCK_TYPE_IH,
3088         };
3089
3090         for (i = 0; i < adev->num_ip_blocks; i++) {
3091                 int j;
3092                 struct amdgpu_ip_block *block;
3093
3094                 block = &adev->ip_blocks[i];
3095                 block->status.hw = false;
3096
3097                 for (j = 0; j < ARRAY_SIZE(ip_order); j++) {
3098
3099                         if (block->version->type != ip_order[j] ||
3100                                 !block->status.valid)
3101                                 continue;
3102
3103                         r = block->version->funcs->hw_init(adev);
3104                         DRM_INFO("RE-INIT-early: %s %s\n", block->version->funcs->name, r?"failed":"succeeded");
3105                         if (r)
3106                                 return r;
3107                         block->status.hw = true;
3108                 }
3109         }
3110
3111         return 0;
3112 }
3113
3114 static int amdgpu_device_ip_reinit_late_sriov(struct amdgpu_device *adev)
3115 {
3116         int i, r;
3117
3118         static enum amd_ip_block_type ip_order[] = {
3119                 AMD_IP_BLOCK_TYPE_SMC,
3120                 AMD_IP_BLOCK_TYPE_DCE,
3121                 AMD_IP_BLOCK_TYPE_GFX,
3122                 AMD_IP_BLOCK_TYPE_SDMA,
3123                 AMD_IP_BLOCK_TYPE_UVD,
3124                 AMD_IP_BLOCK_TYPE_VCE,
3125                 AMD_IP_BLOCK_TYPE_VCN
3126         };
3127
3128         for (i = 0; i < ARRAY_SIZE(ip_order); i++) {
3129                 int j;
3130                 struct amdgpu_ip_block *block;
3131
3132                 for (j = 0; j < adev->num_ip_blocks; j++) {
3133                         block = &adev->ip_blocks[j];
3134
3135                         if (block->version->type != ip_order[i] ||
3136                                 !block->status.valid ||
3137                                 block->status.hw)
3138                                 continue;
3139
3140                         if (block->version->type == AMD_IP_BLOCK_TYPE_SMC)
3141                                 r = block->version->funcs->resume(adev);
3142                         else
3143                                 r = block->version->funcs->hw_init(adev);
3144
3145                         DRM_INFO("RE-INIT-late: %s %s\n", block->version->funcs->name, r?"failed":"succeeded");
3146                         if (r)
3147                                 return r;
3148                         block->status.hw = true;
3149                 }
3150         }
3151
3152         return 0;
3153 }
3154
3155 /**
3156  * amdgpu_device_ip_resume_phase1 - run resume for hardware IPs
3157  *
3158  * @adev: amdgpu_device pointer
3159  *
3160  * First resume function for hardware IPs.  The list of all the hardware
3161  * IPs that make up the asic is walked and the resume callbacks are run for
3162  * COMMON, GMC, and IH.  resume puts the hardware into a functional state
3163  * after a suspend and updates the software state as necessary.  This
3164  * function is also used for restoring the GPU after a GPU reset.
3165  * Returns 0 on success, negative error code on failure.
3166  */
3167 static int amdgpu_device_ip_resume_phase1(struct amdgpu_device *adev)
3168 {
3169         int i, r;
3170
3171         for (i = 0; i < adev->num_ip_blocks; i++) {
3172                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3173                         continue;
3174                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3175                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3176                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3177                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP && amdgpu_sriov_vf(adev))) {
3178
3179                         r = adev->ip_blocks[i].version->funcs->resume(adev);
3180                         if (r) {
3181                                 DRM_ERROR("resume of IP block <%s> failed %d\n",
3182                                           adev->ip_blocks[i].version->funcs->name, r);
3183                                 return r;
3184                         }
3185                         adev->ip_blocks[i].status.hw = true;
3186                 }
3187         }
3188
3189         return 0;
3190 }
3191
3192 /**
3193  * amdgpu_device_ip_resume_phase2 - run resume for hardware IPs
3194  *
3195  * @adev: amdgpu_device pointer
3196  *
3197  * First resume function for hardware IPs.  The list of all the hardware
3198  * IPs that make up the asic is walked and the resume callbacks are run for
3199  * all blocks except COMMON, GMC, and IH.  resume puts the hardware into a
3200  * functional state after a suspend and updates the software state as
3201  * necessary.  This function is also used for restoring the GPU after a GPU
3202  * reset.
3203  * Returns 0 on success, negative error code on failure.
3204  */
3205 static int amdgpu_device_ip_resume_phase2(struct amdgpu_device *adev)
3206 {
3207         int i, r;
3208
3209         for (i = 0; i < adev->num_ip_blocks; i++) {
3210                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3211                         continue;
3212                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3213                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3214                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3215                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3216                         continue;
3217                 r = adev->ip_blocks[i].version->funcs->resume(adev);
3218                 if (r) {
3219                         DRM_ERROR("resume of IP block <%s> failed %d\n",
3220                                   adev->ip_blocks[i].version->funcs->name, r);
3221                         return r;
3222                 }
3223                 adev->ip_blocks[i].status.hw = true;
3224
3225                 if (adev->in_s0ix && adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3226                         /* disable gfxoff for IP resume. The gfxoff will be re-enabled in
3227                          * amdgpu_device_resume() after IP resume.
3228                          */
3229                         amdgpu_gfx_off_ctrl(adev, false);
3230                         DRM_DEBUG("will disable gfxoff for re-initializing other blocks\n");
3231                 }
3232
3233         }
3234
3235         return 0;
3236 }
3237
3238 /**
3239  * amdgpu_device_ip_resume - run resume for hardware IPs
3240  *
3241  * @adev: amdgpu_device pointer
3242  *
3243  * Main resume function for hardware IPs.  The hardware IPs
3244  * are split into two resume functions because they are
3245  * are also used in in recovering from a GPU reset and some additional
3246  * steps need to be take between them.  In this case (S3/S4) they are
3247  * run sequentially.
3248  * Returns 0 on success, negative error code on failure.
3249  */
3250 static int amdgpu_device_ip_resume(struct amdgpu_device *adev)
3251 {
3252         int r;
3253
3254         r = amdgpu_amdkfd_resume_iommu(adev);
3255         if (r)
3256                 return r;
3257
3258         r = amdgpu_device_ip_resume_phase1(adev);
3259         if (r)
3260                 return r;
3261
3262         r = amdgpu_device_fw_loading(adev);
3263         if (r)
3264                 return r;
3265
3266         r = amdgpu_device_ip_resume_phase2(adev);
3267
3268         return r;
3269 }
3270
3271 /**
3272  * amdgpu_device_detect_sriov_bios - determine if the board supports SR-IOV
3273  *
3274  * @adev: amdgpu_device pointer
3275  *
3276  * Query the VBIOS data tables to determine if the board supports SR-IOV.
3277  */
3278 static void amdgpu_device_detect_sriov_bios(struct amdgpu_device *adev)
3279 {
3280         if (amdgpu_sriov_vf(adev)) {
3281                 if (adev->is_atom_fw) {
3282                         if (amdgpu_atomfirmware_gpu_virtualization_supported(adev))
3283                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3284                 } else {
3285                         if (amdgpu_atombios_has_gpu_virtualization_table(adev))
3286                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3287                 }
3288
3289                 if (!(adev->virt.caps & AMDGPU_SRIOV_CAPS_SRIOV_VBIOS))
3290                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_NO_VBIOS, 0, 0);
3291         }
3292 }
3293
3294 /**
3295  * amdgpu_device_asic_has_dc_support - determine if DC supports the asic
3296  *
3297  * @asic_type: AMD asic type
3298  *
3299  * Check if there is DC (new modesetting infrastructre) support for an asic.
3300  * returns true if DC has support, false if not.
3301  */
3302 bool amdgpu_device_asic_has_dc_support(enum amd_asic_type asic_type)
3303 {
3304         switch (asic_type) {
3305 #ifdef CONFIG_DRM_AMDGPU_SI
3306         case CHIP_HAINAN:
3307 #endif
3308         case CHIP_TOPAZ:
3309                 /* chips with no display hardware */
3310                 return false;
3311 #if defined(CONFIG_DRM_AMD_DC)
3312         case CHIP_TAHITI:
3313         case CHIP_PITCAIRN:
3314         case CHIP_VERDE:
3315         case CHIP_OLAND:
3316                 /*
3317                  * We have systems in the wild with these ASICs that require
3318                  * LVDS and VGA support which is not supported with DC.
3319                  *
3320                  * Fallback to the non-DC driver here by default so as not to
3321                  * cause regressions.
3322                  */
3323 #if defined(CONFIG_DRM_AMD_DC_SI)
3324                 return amdgpu_dc > 0;
3325 #else
3326                 return false;
3327 #endif
3328         case CHIP_BONAIRE:
3329         case CHIP_KAVERI:
3330         case CHIP_KABINI:
3331         case CHIP_MULLINS:
3332                 /*
3333                  * We have systems in the wild with these ASICs that require
3334                  * VGA support which is not supported with DC.
3335                  *
3336                  * Fallback to the non-DC driver here by default so as not to
3337                  * cause regressions.
3338                  */
3339                 return amdgpu_dc > 0;
3340         default:
3341                 return amdgpu_dc != 0;
3342 #else
3343         default:
3344                 if (amdgpu_dc > 0)
3345                         DRM_INFO_ONCE("Display Core has been requested via kernel parameter "
3346                                          "but isn't supported by ASIC, ignoring\n");
3347                 return false;
3348 #endif
3349         }
3350 }
3351
3352 /**
3353  * amdgpu_device_has_dc_support - check if dc is supported
3354  *
3355  * @adev: amdgpu_device pointer
3356  *
3357  * Returns true for supported, false for not supported
3358  */
3359 bool amdgpu_device_has_dc_support(struct amdgpu_device *adev)
3360 {
3361         if (adev->enable_virtual_display ||
3362             (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
3363                 return false;
3364
3365         return amdgpu_device_asic_has_dc_support(adev->asic_type);
3366 }
3367
3368 static void amdgpu_device_xgmi_reset_func(struct work_struct *__work)
3369 {
3370         struct amdgpu_device *adev =
3371                 container_of(__work, struct amdgpu_device, xgmi_reset_work);
3372         struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
3373
3374         /* It's a bug to not have a hive within this function */
3375         if (WARN_ON(!hive))
3376                 return;
3377
3378         /*
3379          * Use task barrier to synchronize all xgmi reset works across the
3380          * hive. task_barrier_enter and task_barrier_exit will block
3381          * until all the threads running the xgmi reset works reach
3382          * those points. task_barrier_full will do both blocks.
3383          */
3384         if (amdgpu_asic_reset_method(adev) == AMD_RESET_METHOD_BACO) {
3385
3386                 task_barrier_enter(&hive->tb);
3387                 adev->asic_reset_res = amdgpu_device_baco_enter(adev_to_drm(adev));
3388
3389                 if (adev->asic_reset_res)
3390                         goto fail;
3391
3392                 task_barrier_exit(&hive->tb);
3393                 adev->asic_reset_res = amdgpu_device_baco_exit(adev_to_drm(adev));
3394
3395                 if (adev->asic_reset_res)
3396                         goto fail;
3397
3398                 if (adev->mmhub.ras && adev->mmhub.ras->ras_block.hw_ops &&
3399                     adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count)
3400                         adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count(adev);
3401         } else {
3402
3403                 task_barrier_full(&hive->tb);
3404                 adev->asic_reset_res =  amdgpu_asic_reset(adev);
3405         }
3406
3407 fail:
3408         if (adev->asic_reset_res)
3409                 DRM_WARN("ASIC reset failed with error, %d for drm dev, %s",
3410                          adev->asic_reset_res, adev_to_drm(adev)->unique);
3411         amdgpu_put_xgmi_hive(hive);
3412 }
3413
3414 static int amdgpu_device_get_job_timeout_settings(struct amdgpu_device *adev)
3415 {
3416         char *input = amdgpu_lockup_timeout;
3417         char *timeout_setting = NULL;
3418         int index = 0;
3419         long timeout;
3420         int ret = 0;
3421
3422         /*
3423          * By default timeout for non compute jobs is 10000
3424          * and 60000 for compute jobs.
3425          * In SR-IOV or passthrough mode, timeout for compute
3426          * jobs are 60000 by default.
3427          */
3428         adev->gfx_timeout = msecs_to_jiffies(10000);
3429         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
3430         if (amdgpu_sriov_vf(adev))
3431                 adev->compute_timeout = amdgpu_sriov_is_pp_one_vf(adev) ?
3432                                         msecs_to_jiffies(60000) : msecs_to_jiffies(10000);
3433         else
3434                 adev->compute_timeout =  msecs_to_jiffies(60000);
3435
3436         if (strnlen(input, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
3437                 while ((timeout_setting = strsep(&input, ",")) &&
3438                                 strnlen(timeout_setting, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
3439                         ret = kstrtol(timeout_setting, 0, &timeout);
3440                         if (ret)
3441                                 return ret;
3442
3443                         if (timeout == 0) {
3444                                 index++;
3445                                 continue;
3446                         } else if (timeout < 0) {
3447                                 timeout = MAX_SCHEDULE_TIMEOUT;
3448                                 dev_warn(adev->dev, "lockup timeout disabled");
3449                                 add_taint(TAINT_SOFTLOCKUP, LOCKDEP_STILL_OK);
3450                         } else {
3451                                 timeout = msecs_to_jiffies(timeout);
3452                         }
3453
3454                         switch (index++) {
3455                         case 0:
3456                                 adev->gfx_timeout = timeout;
3457                                 break;
3458                         case 1:
3459                                 adev->compute_timeout = timeout;
3460                                 break;
3461                         case 2:
3462                                 adev->sdma_timeout = timeout;
3463                                 break;
3464                         case 3:
3465                                 adev->video_timeout = timeout;
3466                                 break;
3467                         default:
3468                                 break;
3469                         }
3470                 }
3471                 /*
3472                  * There is only one value specified and
3473                  * it should apply to all non-compute jobs.
3474                  */
3475                 if (index == 1) {
3476                         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
3477                         if (amdgpu_sriov_vf(adev) || amdgpu_passthrough(adev))
3478                                 adev->compute_timeout = adev->gfx_timeout;
3479                 }
3480         }
3481
3482         return ret;
3483 }
3484
3485 /**
3486  * amdgpu_device_check_iommu_direct_map - check if RAM direct mapped to GPU
3487  *
3488  * @adev: amdgpu_device pointer
3489  *
3490  * RAM direct mapped to GPU if IOMMU is not enabled or is pass through mode
3491  */
3492 static void amdgpu_device_check_iommu_direct_map(struct amdgpu_device *adev)
3493 {
3494         struct iommu_domain *domain;
3495
3496         domain = iommu_get_domain_for_dev(adev->dev);
3497         if (!domain || domain->type == IOMMU_DOMAIN_IDENTITY)
3498                 adev->ram_is_direct_mapped = true;
3499 }
3500
3501 static const struct attribute *amdgpu_dev_attributes[] = {
3502         &dev_attr_product_name.attr,
3503         &dev_attr_product_number.attr,
3504         &dev_attr_serial_number.attr,
3505         &dev_attr_pcie_replay_count.attr,
3506         NULL
3507 };
3508
3509 /**
3510  * amdgpu_device_init - initialize the driver
3511  *
3512  * @adev: amdgpu_device pointer
3513  * @flags: driver flags
3514  *
3515  * Initializes the driver info and hw (all asics).
3516  * Returns 0 for success or an error on failure.
3517  * Called at driver startup.
3518  */
3519 int amdgpu_device_init(struct amdgpu_device *adev,
3520                        uint32_t flags)
3521 {
3522         struct drm_device *ddev = adev_to_drm(adev);
3523         struct pci_dev *pdev = adev->pdev;
3524         int r, i;
3525         bool px = false;
3526         u32 max_MBps;
3527
3528         adev->shutdown = false;
3529         adev->flags = flags;
3530
3531         if (amdgpu_force_asic_type >= 0 && amdgpu_force_asic_type < CHIP_LAST)
3532                 adev->asic_type = amdgpu_force_asic_type;
3533         else
3534                 adev->asic_type = flags & AMD_ASIC_MASK;
3535
3536         adev->usec_timeout = AMDGPU_MAX_USEC_TIMEOUT;
3537         if (amdgpu_emu_mode == 1)
3538                 adev->usec_timeout *= 10;
3539         adev->gmc.gart_size = 512 * 1024 * 1024;
3540         adev->accel_working = false;
3541         adev->num_rings = 0;
3542         RCU_INIT_POINTER(adev->gang_submit, dma_fence_get_stub());
3543         adev->mman.buffer_funcs = NULL;
3544         adev->mman.buffer_funcs_ring = NULL;
3545         adev->vm_manager.vm_pte_funcs = NULL;
3546         adev->vm_manager.vm_pte_num_scheds = 0;
3547         adev->gmc.gmc_funcs = NULL;
3548         adev->harvest_ip_mask = 0x0;
3549         adev->fence_context = dma_fence_context_alloc(AMDGPU_MAX_RINGS);
3550         bitmap_zero(adev->gfx.pipe_reserve_bitmap, AMDGPU_MAX_COMPUTE_QUEUES);
3551
3552         adev->smc_rreg = &amdgpu_invalid_rreg;
3553         adev->smc_wreg = &amdgpu_invalid_wreg;
3554         adev->pcie_rreg = &amdgpu_invalid_rreg;
3555         adev->pcie_wreg = &amdgpu_invalid_wreg;
3556         adev->pciep_rreg = &amdgpu_invalid_rreg;
3557         adev->pciep_wreg = &amdgpu_invalid_wreg;
3558         adev->pcie_rreg64 = &amdgpu_invalid_rreg64;
3559         adev->pcie_wreg64 = &amdgpu_invalid_wreg64;
3560         adev->uvd_ctx_rreg = &amdgpu_invalid_rreg;
3561         adev->uvd_ctx_wreg = &amdgpu_invalid_wreg;
3562         adev->didt_rreg = &amdgpu_invalid_rreg;
3563         adev->didt_wreg = &amdgpu_invalid_wreg;
3564         adev->gc_cac_rreg = &amdgpu_invalid_rreg;
3565         adev->gc_cac_wreg = &amdgpu_invalid_wreg;
3566         adev->audio_endpt_rreg = &amdgpu_block_invalid_rreg;
3567         adev->audio_endpt_wreg = &amdgpu_block_invalid_wreg;
3568
3569         DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X 0x%02X).\n",
3570                  amdgpu_asic_name[adev->asic_type], pdev->vendor, pdev->device,
3571                  pdev->subsystem_vendor, pdev->subsystem_device, pdev->revision);
3572
3573         /* mutex initialization are all done here so we
3574          * can recall function without having locking issues */
3575         mutex_init(&adev->firmware.mutex);
3576         mutex_init(&adev->pm.mutex);
3577         mutex_init(&adev->gfx.gpu_clock_mutex);
3578         mutex_init(&adev->srbm_mutex);
3579         mutex_init(&adev->gfx.pipe_reserve_mutex);
3580         mutex_init(&adev->gfx.gfx_off_mutex);
3581         mutex_init(&adev->grbm_idx_mutex);
3582         mutex_init(&adev->mn_lock);
3583         mutex_init(&adev->virt.vf_errors.lock);
3584         hash_init(adev->mn_hash);
3585         mutex_init(&adev->psp.mutex);
3586         mutex_init(&adev->notifier_lock);
3587         mutex_init(&adev->pm.stable_pstate_ctx_lock);
3588         mutex_init(&adev->benchmark_mutex);
3589
3590         amdgpu_device_init_apu_flags(adev);
3591
3592         r = amdgpu_device_check_arguments(adev);
3593         if (r)
3594                 return r;
3595
3596         spin_lock_init(&adev->mmio_idx_lock);
3597         spin_lock_init(&adev->smc_idx_lock);
3598         spin_lock_init(&adev->pcie_idx_lock);
3599         spin_lock_init(&adev->uvd_ctx_idx_lock);
3600         spin_lock_init(&adev->didt_idx_lock);
3601         spin_lock_init(&adev->gc_cac_idx_lock);
3602         spin_lock_init(&adev->se_cac_idx_lock);
3603         spin_lock_init(&adev->audio_endpt_idx_lock);
3604         spin_lock_init(&adev->mm_stats.lock);
3605
3606         INIT_LIST_HEAD(&adev->shadow_list);
3607         mutex_init(&adev->shadow_list_lock);
3608
3609         INIT_LIST_HEAD(&adev->reset_list);
3610
3611         INIT_LIST_HEAD(&adev->ras_list);
3612
3613         INIT_DELAYED_WORK(&adev->delayed_init_work,
3614                           amdgpu_device_delayed_init_work_handler);
3615         INIT_DELAYED_WORK(&adev->gfx.gfx_off_delay_work,
3616                           amdgpu_device_delay_enable_gfx_off);
3617
3618         INIT_WORK(&adev->xgmi_reset_work, amdgpu_device_xgmi_reset_func);
3619
3620         adev->gfx.gfx_off_req_count = 1;
3621         adev->gfx.gfx_off_residency = 0;
3622         adev->gfx.gfx_off_entrycount = 0;
3623         adev->pm.ac_power = power_supply_is_system_supplied() > 0;
3624
3625         atomic_set(&adev->throttling_logging_enabled, 1);
3626         /*
3627          * If throttling continues, logging will be performed every minute
3628          * to avoid log flooding. "-1" is subtracted since the thermal
3629          * throttling interrupt comes every second. Thus, the total logging
3630          * interval is 59 seconds(retelimited printk interval) + 1(waiting
3631          * for throttling interrupt) = 60 seconds.
3632          */
3633         ratelimit_state_init(&adev->throttling_logging_rs, (60 - 1) * HZ, 1);
3634         ratelimit_set_flags(&adev->throttling_logging_rs, RATELIMIT_MSG_ON_RELEASE);
3635
3636         /* Registers mapping */
3637         /* TODO: block userspace mapping of io register */
3638         if (adev->asic_type >= CHIP_BONAIRE) {
3639                 adev->rmmio_base = pci_resource_start(adev->pdev, 5);
3640                 adev->rmmio_size = pci_resource_len(adev->pdev, 5);
3641         } else {
3642                 adev->rmmio_base = pci_resource_start(adev->pdev, 2);
3643                 adev->rmmio_size = pci_resource_len(adev->pdev, 2);
3644         }
3645
3646         for (i = 0; i < AMD_IP_BLOCK_TYPE_NUM; i++)
3647                 atomic_set(&adev->pm.pwr_state[i], POWER_STATE_UNKNOWN);
3648
3649         adev->rmmio = ioremap(adev->rmmio_base, adev->rmmio_size);
3650         if (adev->rmmio == NULL) {
3651                 return -ENOMEM;
3652         }
3653         DRM_INFO("register mmio base: 0x%08X\n", (uint32_t)adev->rmmio_base);
3654         DRM_INFO("register mmio size: %u\n", (unsigned)adev->rmmio_size);
3655
3656         amdgpu_device_get_pcie_info(adev);
3657
3658         if (amdgpu_mcbp)
3659                 DRM_INFO("MCBP is enabled\n");
3660
3661         /*
3662          * Reset domain needs to be present early, before XGMI hive discovered
3663          * (if any) and intitialized to use reset sem and in_gpu reset flag
3664          * early on during init and before calling to RREG32.
3665          */
3666         adev->reset_domain = amdgpu_reset_create_reset_domain(SINGLE_DEVICE, "amdgpu-reset-dev");
3667         if (!adev->reset_domain)
3668                 return -ENOMEM;
3669
3670         /* detect hw virtualization here */
3671         amdgpu_detect_virtualization(adev);
3672
3673         r = amdgpu_device_get_job_timeout_settings(adev);
3674         if (r) {
3675                 dev_err(adev->dev, "invalid lockup_timeout parameter syntax\n");
3676                 return r;
3677         }
3678
3679         /* early init functions */
3680         r = amdgpu_device_ip_early_init(adev);
3681         if (r)
3682                 return r;
3683
3684         /* Enable TMZ based on IP_VERSION */
3685         amdgpu_gmc_tmz_set(adev);
3686
3687         amdgpu_gmc_noretry_set(adev);
3688         /* Need to get xgmi info early to decide the reset behavior*/
3689         if (adev->gmc.xgmi.supported) {
3690                 r = adev->gfxhub.funcs->get_xgmi_info(adev);
3691                 if (r)
3692                         return r;
3693         }
3694
3695         /* enable PCIE atomic ops */
3696         if (amdgpu_sriov_vf(adev))
3697                 adev->have_atomics_support = ((struct amd_sriov_msg_pf2vf_info *)
3698                         adev->virt.fw_reserve.p_pf2vf)->pcie_atomic_ops_support_flags ==
3699                         (PCI_EXP_DEVCAP2_ATOMIC_COMP32 | PCI_EXP_DEVCAP2_ATOMIC_COMP64);
3700         else
3701                 adev->have_atomics_support =
3702                         !pci_enable_atomic_ops_to_root(adev->pdev,
3703                                           PCI_EXP_DEVCAP2_ATOMIC_COMP32 |
3704                                           PCI_EXP_DEVCAP2_ATOMIC_COMP64);
3705         if (!adev->have_atomics_support)
3706                 dev_info(adev->dev, "PCIE atomic ops is not supported\n");
3707
3708         /* doorbell bar mapping and doorbell index init*/
3709         amdgpu_device_doorbell_init(adev);
3710
3711         if (amdgpu_emu_mode == 1) {
3712                 /* post the asic on emulation mode */
3713                 emu_soc_asic_init(adev);
3714                 goto fence_driver_init;
3715         }
3716
3717         amdgpu_reset_init(adev);
3718
3719         /* detect if we are with an SRIOV vbios */
3720         amdgpu_device_detect_sriov_bios(adev);
3721
3722         /* check if we need to reset the asic
3723          *  E.g., driver was not cleanly unloaded previously, etc.
3724          */
3725         if (!amdgpu_sriov_vf(adev) && amdgpu_asic_need_reset_on_init(adev)) {
3726                 if (adev->gmc.xgmi.num_physical_nodes) {
3727                         dev_info(adev->dev, "Pending hive reset.\n");
3728                         adev->gmc.xgmi.pending_reset = true;
3729                         /* Only need to init necessary block for SMU to handle the reset */
3730                         for (i = 0; i < adev->num_ip_blocks; i++) {
3731                                 if (!adev->ip_blocks[i].status.valid)
3732                                         continue;
3733                                 if (!(adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3734                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3735                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3736                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC)) {
3737                                         DRM_DEBUG("IP %s disabled for hw_init.\n",
3738                                                 adev->ip_blocks[i].version->funcs->name);
3739                                         adev->ip_blocks[i].status.hw = true;
3740                                 }
3741                         }
3742                 } else {
3743                         r = amdgpu_asic_reset(adev);
3744                         if (r) {
3745                                 dev_err(adev->dev, "asic reset on init failed\n");
3746                                 goto failed;
3747                         }
3748                 }
3749         }
3750
3751         pci_enable_pcie_error_reporting(adev->pdev);
3752
3753         /* Post card if necessary */
3754         if (amdgpu_device_need_post(adev)) {
3755                 if (!adev->bios) {
3756                         dev_err(adev->dev, "no vBIOS found\n");
3757                         r = -EINVAL;
3758                         goto failed;
3759                 }
3760                 DRM_INFO("GPU posting now...\n");
3761                 r = amdgpu_device_asic_init(adev);
3762                 if (r) {
3763                         dev_err(adev->dev, "gpu post error!\n");
3764                         goto failed;
3765                 }
3766         }
3767
3768         if (adev->is_atom_fw) {
3769                 /* Initialize clocks */
3770                 r = amdgpu_atomfirmware_get_clock_info(adev);
3771                 if (r) {
3772                         dev_err(adev->dev, "amdgpu_atomfirmware_get_clock_info failed\n");
3773                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
3774                         goto failed;
3775                 }
3776         } else {
3777                 /* Initialize clocks */
3778                 r = amdgpu_atombios_get_clock_info(adev);
3779                 if (r) {
3780                         dev_err(adev->dev, "amdgpu_atombios_get_clock_info failed\n");
3781                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
3782                         goto failed;
3783                 }
3784                 /* init i2c buses */
3785                 if (!amdgpu_device_has_dc_support(adev))
3786                         amdgpu_atombios_i2c_init(adev);
3787         }
3788
3789 fence_driver_init:
3790         /* Fence driver */
3791         r = amdgpu_fence_driver_sw_init(adev);
3792         if (r) {
3793                 dev_err(adev->dev, "amdgpu_fence_driver_sw_init failed\n");
3794                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_FENCE_INIT_FAIL, 0, 0);
3795                 goto failed;
3796         }
3797
3798         /* init the mode config */
3799         drm_mode_config_init(adev_to_drm(adev));
3800
3801         r = amdgpu_device_ip_init(adev);
3802         if (r) {
3803                 /* failed in exclusive mode due to timeout */
3804                 if (amdgpu_sriov_vf(adev) &&
3805                     !amdgpu_sriov_runtime(adev) &&
3806                     amdgpu_virt_mmio_blocked(adev) &&
3807                     !amdgpu_virt_wait_reset(adev)) {
3808                         dev_err(adev->dev, "VF exclusive mode timeout\n");
3809                         /* Don't send request since VF is inactive. */
3810                         adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
3811                         adev->virt.ops = NULL;
3812                         r = -EAGAIN;
3813                         goto release_ras_con;
3814                 }
3815                 dev_err(adev->dev, "amdgpu_device_ip_init failed\n");
3816                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_INIT_FAIL, 0, 0);
3817                 goto release_ras_con;
3818         }
3819
3820         amdgpu_fence_driver_hw_init(adev);
3821
3822         dev_info(adev->dev,
3823                 "SE %d, SH per SE %d, CU per SH %d, active_cu_number %d\n",
3824                         adev->gfx.config.max_shader_engines,
3825                         adev->gfx.config.max_sh_per_se,
3826                         adev->gfx.config.max_cu_per_sh,
3827                         adev->gfx.cu_info.number);
3828
3829         adev->accel_working = true;
3830
3831         amdgpu_vm_check_compute_bug(adev);
3832
3833         /* Initialize the buffer migration limit. */
3834         if (amdgpu_moverate >= 0)
3835                 max_MBps = amdgpu_moverate;
3836         else
3837                 max_MBps = 8; /* Allow 8 MB/s. */
3838         /* Get a log2 for easy divisions. */
3839         adev->mm_stats.log2_max_MBps = ilog2(max(1u, max_MBps));
3840
3841         r = amdgpu_pm_sysfs_init(adev);
3842         if (r) {
3843                 adev->pm_sysfs_en = false;
3844                 DRM_ERROR("registering pm debugfs failed (%d).\n", r);
3845         } else
3846                 adev->pm_sysfs_en = true;
3847
3848         r = amdgpu_ucode_sysfs_init(adev);
3849         if (r) {
3850                 adev->ucode_sysfs_en = false;
3851                 DRM_ERROR("Creating firmware sysfs failed (%d).\n", r);
3852         } else
3853                 adev->ucode_sysfs_en = true;
3854
3855         r = amdgpu_psp_sysfs_init(adev);
3856         if (r) {
3857                 adev->psp_sysfs_en = false;
3858                 if (!amdgpu_sriov_vf(adev))
3859                         DRM_ERROR("Creating psp sysfs failed\n");
3860         } else
3861                 adev->psp_sysfs_en = true;
3862
3863         /*
3864          * Register gpu instance before amdgpu_device_enable_mgpu_fan_boost.
3865          * Otherwise the mgpu fan boost feature will be skipped due to the
3866          * gpu instance is counted less.
3867          */
3868         amdgpu_register_gpu_instance(adev);
3869
3870         /* enable clockgating, etc. after ib tests, etc. since some blocks require
3871          * explicit gating rather than handling it automatically.
3872          */
3873         if (!adev->gmc.xgmi.pending_reset) {
3874                 r = amdgpu_device_ip_late_init(adev);
3875                 if (r) {
3876                         dev_err(adev->dev, "amdgpu_device_ip_late_init failed\n");
3877                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_LATE_INIT_FAIL, 0, r);
3878                         goto release_ras_con;
3879                 }
3880                 /* must succeed. */
3881                 amdgpu_ras_resume(adev);
3882                 queue_delayed_work(system_wq, &adev->delayed_init_work,
3883                                    msecs_to_jiffies(AMDGPU_RESUME_MS));
3884         }
3885
3886         if (amdgpu_sriov_vf(adev))
3887                 flush_delayed_work(&adev->delayed_init_work);
3888
3889         r = sysfs_create_files(&adev->dev->kobj, amdgpu_dev_attributes);
3890         if (r)
3891                 dev_err(adev->dev, "Could not create amdgpu device attr\n");
3892
3893         if (IS_ENABLED(CONFIG_PERF_EVENTS))
3894                 r = amdgpu_pmu_init(adev);
3895         if (r)
3896                 dev_err(adev->dev, "amdgpu_pmu_init failed\n");
3897
3898         /* Have stored pci confspace at hand for restore in sudden PCI error */
3899         if (amdgpu_device_cache_pci_state(adev->pdev))
3900                 pci_restore_state(pdev);
3901
3902         /* if we have > 1 VGA cards, then disable the amdgpu VGA resources */
3903         /* this will fail for cards that aren't VGA class devices, just
3904          * ignore it */
3905         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
3906                 vga_client_register(adev->pdev, amdgpu_device_vga_set_decode);
3907
3908         if (amdgpu_device_supports_px(ddev)) {
3909                 px = true;
3910                 vga_switcheroo_register_client(adev->pdev,
3911                                                &amdgpu_switcheroo_ops, px);
3912                 vga_switcheroo_init_domain_pm_ops(adev->dev, &adev->vga_pm_domain);
3913         }
3914
3915         if (adev->gmc.xgmi.pending_reset)
3916                 queue_delayed_work(system_wq, &mgpu_info.delayed_reset_work,
3917                                    msecs_to_jiffies(AMDGPU_RESUME_MS));
3918
3919         amdgpu_device_check_iommu_direct_map(adev);
3920
3921         return 0;
3922
3923 release_ras_con:
3924         amdgpu_release_ras_context(adev);
3925
3926 failed:
3927         amdgpu_vf_error_trans_all(adev);
3928
3929         return r;
3930 }
3931
3932 static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev)
3933 {
3934
3935         /* Clear all CPU mappings pointing to this device */
3936         unmap_mapping_range(adev->ddev.anon_inode->i_mapping, 0, 0, 1);
3937
3938         /* Unmap all mapped bars - Doorbell, registers and VRAM */
3939         amdgpu_device_doorbell_fini(adev);
3940
3941         iounmap(adev->rmmio);
3942         adev->rmmio = NULL;
3943         if (adev->mman.aper_base_kaddr)
3944                 iounmap(adev->mman.aper_base_kaddr);
3945         adev->mman.aper_base_kaddr = NULL;
3946
3947         /* Memory manager related */
3948         if (!adev->gmc.xgmi.connected_to_cpu) {
3949                 arch_phys_wc_del(adev->gmc.vram_mtrr);
3950                 arch_io_free_memtype_wc(adev->gmc.aper_base, adev->gmc.aper_size);
3951         }
3952 }
3953
3954 /**
3955  * amdgpu_device_fini_hw - tear down the driver
3956  *
3957  * @adev: amdgpu_device pointer
3958  *
3959  * Tear down the driver info (all asics).
3960  * Called at driver shutdown.
3961  */
3962 void amdgpu_device_fini_hw(struct amdgpu_device *adev)
3963 {
3964         dev_info(adev->dev, "amdgpu: finishing device.\n");
3965         flush_delayed_work(&adev->delayed_init_work);
3966         adev->shutdown = true;
3967
3968         /* make sure IB test finished before entering exclusive mode
3969          * to avoid preemption on IB test
3970          * */
3971         if (amdgpu_sriov_vf(adev)) {
3972                 amdgpu_virt_request_full_gpu(adev, false);
3973                 amdgpu_virt_fini_data_exchange(adev);
3974         }
3975
3976         /* disable all interrupts */
3977         amdgpu_irq_disable_all(adev);
3978         if (adev->mode_info.mode_config_initialized){
3979                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(adev)))
3980                         drm_helper_force_disable_all(adev_to_drm(adev));
3981                 else
3982                         drm_atomic_helper_shutdown(adev_to_drm(adev));
3983         }
3984         amdgpu_fence_driver_hw_fini(adev);
3985
3986         if (adev->mman.initialized) {
3987                 flush_delayed_work(&adev->mman.bdev.wq);
3988                 ttm_bo_lock_delayed_workqueue(&adev->mman.bdev);
3989         }
3990
3991         if (adev->pm_sysfs_en)
3992                 amdgpu_pm_sysfs_fini(adev);
3993         if (adev->ucode_sysfs_en)
3994                 amdgpu_ucode_sysfs_fini(adev);
3995         if (adev->psp_sysfs_en)
3996                 amdgpu_psp_sysfs_fini(adev);
3997         sysfs_remove_files(&adev->dev->kobj, amdgpu_dev_attributes);
3998
3999         /* disable ras feature must before hw fini */
4000         amdgpu_ras_pre_fini(adev);
4001
4002         amdgpu_device_ip_fini_early(adev);
4003
4004         amdgpu_irq_fini_hw(adev);
4005
4006         if (adev->mman.initialized)
4007                 ttm_device_clear_dma_mappings(&adev->mman.bdev);
4008
4009         amdgpu_gart_dummy_page_fini(adev);
4010
4011         amdgpu_device_unmap_mmio(adev);
4012
4013 }
4014
4015 void amdgpu_device_fini_sw(struct amdgpu_device *adev)
4016 {
4017         int idx;
4018
4019         amdgpu_fence_driver_sw_fini(adev);
4020         amdgpu_device_ip_fini(adev);
4021         release_firmware(adev->firmware.gpu_info_fw);
4022         adev->firmware.gpu_info_fw = NULL;
4023         adev->accel_working = false;
4024         dma_fence_put(rcu_dereference_protected(adev->gang_submit, true));
4025
4026         amdgpu_reset_fini(adev);
4027
4028         /* free i2c buses */
4029         if (!amdgpu_device_has_dc_support(adev))
4030                 amdgpu_i2c_fini(adev);
4031
4032         if (amdgpu_emu_mode != 1)
4033                 amdgpu_atombios_fini(adev);
4034
4035         kfree(adev->bios);
4036         adev->bios = NULL;
4037         if (amdgpu_device_supports_px(adev_to_drm(adev))) {
4038                 vga_switcheroo_unregister_client(adev->pdev);
4039                 vga_switcheroo_fini_domain_pm_ops(adev->dev);
4040         }
4041         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4042                 vga_client_unregister(adev->pdev);
4043
4044         if (drm_dev_enter(adev_to_drm(adev), &idx)) {
4045
4046                 iounmap(adev->rmmio);
4047                 adev->rmmio = NULL;
4048                 amdgpu_device_doorbell_fini(adev);
4049                 drm_dev_exit(idx);
4050         }
4051
4052         if (IS_ENABLED(CONFIG_PERF_EVENTS))
4053                 amdgpu_pmu_fini(adev);
4054         if (adev->mman.discovery_bin)
4055                 amdgpu_discovery_fini(adev);
4056
4057         amdgpu_reset_put_reset_domain(adev->reset_domain);
4058         adev->reset_domain = NULL;
4059
4060         kfree(adev->pci_state);
4061
4062 }
4063
4064 /**
4065  * amdgpu_device_evict_resources - evict device resources
4066  * @adev: amdgpu device object
4067  *
4068  * Evicts all ttm device resources(vram BOs, gart table) from the lru list
4069  * of the vram memory type. Mainly used for evicting device resources
4070  * at suspend time.
4071  *
4072  */
4073 static int amdgpu_device_evict_resources(struct amdgpu_device *adev)
4074 {
4075         int ret;
4076
4077         /* No need to evict vram on APUs for suspend to ram or s2idle */
4078         if ((adev->in_s3 || adev->in_s0ix) && (adev->flags & AMD_IS_APU))
4079                 return 0;
4080
4081         ret = amdgpu_ttm_evict_resources(adev, TTM_PL_VRAM);
4082         if (ret)
4083                 DRM_WARN("evicting device resources failed\n");
4084         return ret;
4085 }
4086
4087 /*
4088  * Suspend & resume.
4089  */
4090 /**
4091  * amdgpu_device_suspend - initiate device suspend
4092  *
4093  * @dev: drm dev pointer
4094  * @fbcon : notify the fbdev of suspend
4095  *
4096  * Puts the hw in the suspend state (all asics).
4097  * Returns 0 for success or an error on failure.
4098  * Called at driver suspend.
4099  */
4100 int amdgpu_device_suspend(struct drm_device *dev, bool fbcon)
4101 {
4102         struct amdgpu_device *adev = drm_to_adev(dev);
4103         int r = 0;
4104
4105         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4106                 return 0;
4107
4108         adev->in_suspend = true;
4109
4110         if (amdgpu_sriov_vf(adev)) {
4111                 amdgpu_virt_fini_data_exchange(adev);
4112                 r = amdgpu_virt_request_full_gpu(adev, false);
4113                 if (r)
4114                         return r;
4115         }
4116
4117         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D3))
4118                 DRM_WARN("smart shift update failed\n");
4119
4120         drm_kms_helper_poll_disable(dev);
4121
4122         if (fbcon)
4123                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(adev)->fb_helper, true);
4124
4125         cancel_delayed_work_sync(&adev->delayed_init_work);
4126
4127         amdgpu_ras_suspend(adev);
4128
4129         amdgpu_device_ip_suspend_phase1(adev);
4130
4131         if (!adev->in_s0ix)
4132                 amdgpu_amdkfd_suspend(adev, adev->in_runpm);
4133
4134         r = amdgpu_device_evict_resources(adev);
4135         if (r)
4136                 return r;
4137
4138         amdgpu_fence_driver_hw_fini(adev);
4139
4140         amdgpu_device_ip_suspend_phase2(adev);
4141
4142         if (amdgpu_sriov_vf(adev))
4143                 amdgpu_virt_release_full_gpu(adev, false);
4144
4145         return 0;
4146 }
4147
4148 /**
4149  * amdgpu_device_resume - initiate device resume
4150  *
4151  * @dev: drm dev pointer
4152  * @fbcon : notify the fbdev of resume
4153  *
4154  * Bring the hw back to operating state (all asics).
4155  * Returns 0 for success or an error on failure.
4156  * Called at driver resume.
4157  */
4158 int amdgpu_device_resume(struct drm_device *dev, bool fbcon)
4159 {
4160         struct amdgpu_device *adev = drm_to_adev(dev);
4161         int r = 0;
4162
4163         if (amdgpu_sriov_vf(adev)) {
4164                 r = amdgpu_virt_request_full_gpu(adev, true);
4165                 if (r)
4166                         return r;
4167         }
4168
4169         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4170                 return 0;
4171
4172         if (adev->in_s0ix)
4173                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D0Entry);
4174
4175         /* post card */
4176         if (amdgpu_device_need_post(adev)) {
4177                 r = amdgpu_device_asic_init(adev);
4178                 if (r)
4179                         dev_err(adev->dev, "amdgpu asic init failed\n");
4180         }
4181
4182         r = amdgpu_device_ip_resume(adev);
4183
4184         /* no matter what r is, always need to properly release full GPU */
4185         if (amdgpu_sriov_vf(adev)) {
4186                 amdgpu_virt_init_data_exchange(adev);
4187                 amdgpu_virt_release_full_gpu(adev, true);
4188         }
4189
4190         if (r) {
4191                 dev_err(adev->dev, "amdgpu_device_ip_resume failed (%d).\n", r);
4192                 return r;
4193         }
4194         amdgpu_fence_driver_hw_init(adev);
4195
4196         r = amdgpu_device_ip_late_init(adev);
4197         if (r)
4198                 return r;
4199
4200         queue_delayed_work(system_wq, &adev->delayed_init_work,
4201                            msecs_to_jiffies(AMDGPU_RESUME_MS));
4202
4203         if (!adev->in_s0ix) {
4204                 r = amdgpu_amdkfd_resume(adev, adev->in_runpm);
4205                 if (r)
4206                         return r;
4207         }
4208
4209         /* Make sure IB tests flushed */
4210         if (amdgpu_sriov_vf(adev))
4211                 amdgpu_irq_gpu_reset_resume_helper(adev);
4212         flush_delayed_work(&adev->delayed_init_work);
4213
4214         if (adev->in_s0ix) {
4215                 /* re-enable gfxoff after IP resume. This re-enables gfxoff after
4216                  * it was disabled for IP resume in amdgpu_device_ip_resume_phase2().
4217                  */
4218                 amdgpu_gfx_off_ctrl(adev, true);
4219                 DRM_DEBUG("will enable gfxoff for the mission mode\n");
4220         }
4221         if (fbcon)
4222                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(adev)->fb_helper, false);
4223
4224         drm_kms_helper_poll_enable(dev);
4225
4226         amdgpu_ras_resume(adev);
4227
4228         if (adev->mode_info.num_crtc) {
4229                 /*
4230                  * Most of the connector probing functions try to acquire runtime pm
4231                  * refs to ensure that the GPU is powered on when connector polling is
4232                  * performed. Since we're calling this from a runtime PM callback,
4233                  * trying to acquire rpm refs will cause us to deadlock.
4234                  *
4235                  * Since we're guaranteed to be holding the rpm lock, it's safe to
4236                  * temporarily disable the rpm helpers so this doesn't deadlock us.
4237                  */
4238 #ifdef CONFIG_PM
4239                 dev->dev->power.disable_depth++;
4240 #endif
4241                 if (!adev->dc_enabled)
4242                         drm_helper_hpd_irq_event(dev);
4243                 else
4244                         drm_kms_helper_hotplug_event(dev);
4245 #ifdef CONFIG_PM
4246                 dev->dev->power.disable_depth--;
4247 #endif
4248         }
4249         adev->in_suspend = false;
4250
4251         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D0))
4252                 DRM_WARN("smart shift update failed\n");
4253
4254         return 0;
4255 }
4256
4257 /**
4258  * amdgpu_device_ip_check_soft_reset - did soft reset succeed
4259  *
4260  * @adev: amdgpu_device pointer
4261  *
4262  * The list of all the hardware IPs that make up the asic is walked and
4263  * the check_soft_reset callbacks are run.  check_soft_reset determines
4264  * if the asic is still hung or not.
4265  * Returns true if any of the IPs are still in a hung state, false if not.
4266  */
4267 static bool amdgpu_device_ip_check_soft_reset(struct amdgpu_device *adev)
4268 {
4269         int i;
4270         bool asic_hang = false;
4271
4272         if (amdgpu_sriov_vf(adev))
4273                 return true;
4274
4275         if (amdgpu_asic_need_full_reset(adev))
4276                 return true;
4277
4278         for (i = 0; i < adev->num_ip_blocks; i++) {
4279                 if (!adev->ip_blocks[i].status.valid)
4280                         continue;
4281                 if (adev->ip_blocks[i].version->funcs->check_soft_reset)
4282                         adev->ip_blocks[i].status.hang =
4283                                 adev->ip_blocks[i].version->funcs->check_soft_reset(adev);
4284                 if (adev->ip_blocks[i].status.hang) {
4285                         dev_info(adev->dev, "IP block:%s is hung!\n", adev->ip_blocks[i].version->funcs->name);
4286                         asic_hang = true;
4287                 }
4288         }
4289         return asic_hang;
4290 }
4291
4292 /**
4293  * amdgpu_device_ip_pre_soft_reset - prepare for soft reset
4294  *
4295  * @adev: amdgpu_device pointer
4296  *
4297  * The list of all the hardware IPs that make up the asic is walked and the
4298  * pre_soft_reset callbacks are run if the block is hung.  pre_soft_reset
4299  * handles any IP specific hardware or software state changes that are
4300  * necessary for a soft reset to succeed.
4301  * Returns 0 on success, negative error code on failure.
4302  */
4303 static int amdgpu_device_ip_pre_soft_reset(struct amdgpu_device *adev)
4304 {
4305         int i, r = 0;
4306
4307         for (i = 0; i < adev->num_ip_blocks; i++) {
4308                 if (!adev->ip_blocks[i].status.valid)
4309                         continue;
4310                 if (adev->ip_blocks[i].status.hang &&
4311                     adev->ip_blocks[i].version->funcs->pre_soft_reset) {
4312                         r = adev->ip_blocks[i].version->funcs->pre_soft_reset(adev);
4313                         if (r)
4314                                 return r;
4315                 }
4316         }
4317
4318         return 0;
4319 }
4320
4321 /**
4322  * amdgpu_device_ip_need_full_reset - check if a full asic reset is needed
4323  *
4324  * @adev: amdgpu_device pointer
4325  *
4326  * Some hardware IPs cannot be soft reset.  If they are hung, a full gpu
4327  * reset is necessary to recover.
4328  * Returns true if a full asic reset is required, false if not.
4329  */
4330 static bool amdgpu_device_ip_need_full_reset(struct amdgpu_device *adev)
4331 {
4332         int i;
4333
4334         if (amdgpu_asic_need_full_reset(adev))
4335                 return true;
4336
4337         for (i = 0; i < adev->num_ip_blocks; i++) {
4338                 if (!adev->ip_blocks[i].status.valid)
4339                         continue;
4340                 if ((adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) ||
4341                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) ||
4342                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_ACP) ||
4343                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE) ||
4344                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
4345                         if (adev->ip_blocks[i].status.hang) {
4346                                 dev_info(adev->dev, "Some block need full reset!\n");
4347                                 return true;
4348                         }
4349                 }
4350         }
4351         return false;
4352 }
4353
4354 /**
4355  * amdgpu_device_ip_soft_reset - do a soft reset
4356  *
4357  * @adev: amdgpu_device pointer
4358  *
4359  * The list of all the hardware IPs that make up the asic is walked and the
4360  * soft_reset callbacks are run if the block is hung.  soft_reset handles any
4361  * IP specific hardware or software state changes that are necessary to soft
4362  * reset the IP.
4363  * Returns 0 on success, negative error code on failure.
4364  */
4365 static int amdgpu_device_ip_soft_reset(struct amdgpu_device *adev)
4366 {
4367         int i, r = 0;
4368
4369         for (i = 0; i < adev->num_ip_blocks; i++) {
4370                 if (!adev->ip_blocks[i].status.valid)
4371                         continue;
4372                 if (adev->ip_blocks[i].status.hang &&
4373                     adev->ip_blocks[i].version->funcs->soft_reset) {
4374                         r = adev->ip_blocks[i].version->funcs->soft_reset(adev);
4375                         if (r)
4376                                 return r;
4377                 }
4378         }
4379
4380         return 0;
4381 }
4382
4383 /**
4384  * amdgpu_device_ip_post_soft_reset - clean up from soft reset
4385  *
4386  * @adev: amdgpu_device pointer
4387  *
4388  * The list of all the hardware IPs that make up the asic is walked and the
4389  * post_soft_reset callbacks are run if the asic was hung.  post_soft_reset
4390  * handles any IP specific hardware or software state changes that are
4391  * necessary after the IP has been soft reset.
4392  * Returns 0 on success, negative error code on failure.
4393  */
4394 static int amdgpu_device_ip_post_soft_reset(struct amdgpu_device *adev)
4395 {
4396         int i, r = 0;
4397
4398         for (i = 0; i < adev->num_ip_blocks; i++) {
4399                 if (!adev->ip_blocks[i].status.valid)
4400                         continue;
4401                 if (adev->ip_blocks[i].status.hang &&
4402                     adev->ip_blocks[i].version->funcs->post_soft_reset)
4403                         r = adev->ip_blocks[i].version->funcs->post_soft_reset(adev);
4404                 if (r)
4405                         return r;
4406         }
4407
4408         return 0;
4409 }
4410
4411 /**
4412  * amdgpu_device_recover_vram - Recover some VRAM contents
4413  *
4414  * @adev: amdgpu_device pointer
4415  *
4416  * Restores the contents of VRAM buffers from the shadows in GTT.  Used to
4417  * restore things like GPUVM page tables after a GPU reset where
4418  * the contents of VRAM might be lost.
4419  *
4420  * Returns:
4421  * 0 on success, negative error code on failure.
4422  */
4423 static int amdgpu_device_recover_vram(struct amdgpu_device *adev)
4424 {
4425         struct dma_fence *fence = NULL, *next = NULL;
4426         struct amdgpu_bo *shadow;
4427         struct amdgpu_bo_vm *vmbo;
4428         long r = 1, tmo;
4429
4430         if (amdgpu_sriov_runtime(adev))
4431                 tmo = msecs_to_jiffies(8000);
4432         else
4433                 tmo = msecs_to_jiffies(100);
4434
4435         dev_info(adev->dev, "recover vram bo from shadow start\n");
4436         mutex_lock(&adev->shadow_list_lock);
4437         list_for_each_entry(vmbo, &adev->shadow_list, shadow_list) {
4438                 shadow = &vmbo->bo;
4439                 /* No need to recover an evicted BO */
4440                 if (shadow->tbo.resource->mem_type != TTM_PL_TT ||
4441                     shadow->tbo.resource->start == AMDGPU_BO_INVALID_OFFSET ||
4442                     shadow->parent->tbo.resource->mem_type != TTM_PL_VRAM)
4443                         continue;
4444
4445                 r = amdgpu_bo_restore_shadow(shadow, &next);
4446                 if (r)
4447                         break;
4448
4449                 if (fence) {
4450                         tmo = dma_fence_wait_timeout(fence, false, tmo);
4451                         dma_fence_put(fence);
4452                         fence = next;
4453                         if (tmo == 0) {
4454                                 r = -ETIMEDOUT;
4455                                 break;
4456                         } else if (tmo < 0) {
4457                                 r = tmo;
4458                                 break;
4459                         }
4460                 } else {
4461                         fence = next;
4462                 }
4463         }
4464         mutex_unlock(&adev->shadow_list_lock);
4465
4466         if (fence)
4467                 tmo = dma_fence_wait_timeout(fence, false, tmo);
4468         dma_fence_put(fence);
4469
4470         if (r < 0 || tmo <= 0) {
4471                 dev_err(adev->dev, "recover vram bo from shadow failed, r is %ld, tmo is %ld\n", r, tmo);
4472                 return -EIO;
4473         }
4474
4475         dev_info(adev->dev, "recover vram bo from shadow done\n");
4476         return 0;
4477 }
4478
4479
4480 /**
4481  * amdgpu_device_reset_sriov - reset ASIC for SR-IOV vf
4482  *
4483  * @adev: amdgpu_device pointer
4484  * @from_hypervisor: request from hypervisor
4485  *
4486  * do VF FLR and reinitialize Asic
4487  * return 0 means succeeded otherwise failed
4488  */
4489 static int amdgpu_device_reset_sriov(struct amdgpu_device *adev,
4490                                      bool from_hypervisor)
4491 {
4492         int r;
4493         struct amdgpu_hive_info *hive = NULL;
4494         int retry_limit = 0;
4495
4496 retry:
4497         amdgpu_amdkfd_pre_reset(adev);
4498
4499         if (from_hypervisor)
4500                 r = amdgpu_virt_request_full_gpu(adev, true);
4501         else
4502                 r = amdgpu_virt_reset_gpu(adev);
4503         if (r)
4504                 return r;
4505
4506         /* Resume IP prior to SMC */
4507         r = amdgpu_device_ip_reinit_early_sriov(adev);
4508         if (r)
4509                 goto error;
4510
4511         amdgpu_virt_init_data_exchange(adev);
4512
4513         r = amdgpu_device_fw_loading(adev);
4514         if (r)
4515                 return r;
4516
4517         /* now we are okay to resume SMC/CP/SDMA */
4518         r = amdgpu_device_ip_reinit_late_sriov(adev);
4519         if (r)
4520                 goto error;
4521
4522         hive = amdgpu_get_xgmi_hive(adev);
4523         /* Update PSP FW topology after reset */
4524         if (hive && adev->gmc.xgmi.num_physical_nodes > 1)
4525                 r = amdgpu_xgmi_update_topology(hive, adev);
4526
4527         if (hive)
4528                 amdgpu_put_xgmi_hive(hive);
4529
4530         if (!r) {
4531                 amdgpu_irq_gpu_reset_resume_helper(adev);
4532                 r = amdgpu_ib_ring_tests(adev);
4533
4534                 amdgpu_amdkfd_post_reset(adev);
4535         }
4536
4537 error:
4538         if (!r && adev->virt.gim_feature & AMDGIM_FEATURE_GIM_FLR_VRAMLOST) {
4539                 amdgpu_inc_vram_lost(adev);
4540                 r = amdgpu_device_recover_vram(adev);
4541         }
4542         amdgpu_virt_release_full_gpu(adev, true);
4543
4544         if (AMDGPU_RETRY_SRIOV_RESET(r)) {
4545                 if (retry_limit < AMDGPU_MAX_RETRY_LIMIT) {
4546                         retry_limit++;
4547                         goto retry;
4548                 } else
4549                         DRM_ERROR("GPU reset retry is beyond the retry limit\n");
4550         }
4551
4552         return r;
4553 }
4554
4555 /**
4556  * amdgpu_device_has_job_running - check if there is any job in mirror list
4557  *
4558  * @adev: amdgpu_device pointer
4559  *
4560  * check if there is any job in mirror list
4561  */
4562 bool amdgpu_device_has_job_running(struct amdgpu_device *adev)
4563 {
4564         int i;
4565         struct drm_sched_job *job;
4566
4567         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
4568                 struct amdgpu_ring *ring = adev->rings[i];
4569
4570                 if (!ring || !ring->sched.thread)
4571                         continue;
4572
4573                 spin_lock(&ring->sched.job_list_lock);
4574                 job = list_first_entry_or_null(&ring->sched.pending_list,
4575                                                struct drm_sched_job, list);
4576                 spin_unlock(&ring->sched.job_list_lock);
4577                 if (job)
4578                         return true;
4579         }
4580         return false;
4581 }
4582
4583 /**
4584  * amdgpu_device_should_recover_gpu - check if we should try GPU recovery
4585  *
4586  * @adev: amdgpu_device pointer
4587  *
4588  * Check amdgpu_gpu_recovery and SRIOV status to see if we should try to recover
4589  * a hung GPU.
4590  */
4591 bool amdgpu_device_should_recover_gpu(struct amdgpu_device *adev)
4592 {
4593
4594         if (amdgpu_gpu_recovery == 0)
4595                 goto disabled;
4596
4597         /* Skip soft reset check in fatal error mode */
4598         if (!amdgpu_ras_is_poison_mode_supported(adev))
4599                 return true;
4600
4601         if (!amdgpu_device_ip_check_soft_reset(adev)) {
4602                 dev_info(adev->dev,"Timeout, but no hardware hang detected.\n");
4603                 return false;
4604         }
4605
4606         if (amdgpu_sriov_vf(adev))
4607                 return true;
4608
4609         if (amdgpu_gpu_recovery == -1) {
4610                 switch (adev->asic_type) {
4611 #ifdef CONFIG_DRM_AMDGPU_SI
4612                 case CHIP_VERDE:
4613                 case CHIP_TAHITI:
4614                 case CHIP_PITCAIRN:
4615                 case CHIP_OLAND:
4616                 case CHIP_HAINAN:
4617 #endif
4618 #ifdef CONFIG_DRM_AMDGPU_CIK
4619                 case CHIP_KAVERI:
4620                 case CHIP_KABINI:
4621                 case CHIP_MULLINS:
4622 #endif
4623                 case CHIP_CARRIZO:
4624                 case CHIP_STONEY:
4625                 case CHIP_CYAN_SKILLFISH:
4626                         goto disabled;
4627                 default:
4628                         break;
4629                 }
4630         }
4631
4632         return true;
4633
4634 disabled:
4635                 dev_info(adev->dev, "GPU recovery disabled.\n");
4636                 return false;
4637 }
4638
4639 int amdgpu_device_mode1_reset(struct amdgpu_device *adev)
4640 {
4641         u32 i;
4642         int ret = 0;
4643
4644         amdgpu_atombios_scratch_regs_engine_hung(adev, true);
4645
4646         dev_info(adev->dev, "GPU mode1 reset\n");
4647
4648         /* disable BM */
4649         pci_clear_master(adev->pdev);
4650
4651         amdgpu_device_cache_pci_state(adev->pdev);
4652
4653         if (amdgpu_dpm_is_mode1_reset_supported(adev)) {
4654                 dev_info(adev->dev, "GPU smu mode1 reset\n");
4655                 ret = amdgpu_dpm_mode1_reset(adev);
4656         } else {
4657                 dev_info(adev->dev, "GPU psp mode1 reset\n");
4658                 ret = psp_gpu_reset(adev);
4659         }
4660
4661         if (ret)
4662                 dev_err(adev->dev, "GPU mode1 reset failed\n");
4663
4664         amdgpu_device_load_pci_state(adev->pdev);
4665
4666         /* wait for asic to come out of reset */
4667         for (i = 0; i < adev->usec_timeout; i++) {
4668                 u32 memsize = adev->nbio.funcs->get_memsize(adev);
4669
4670                 if (memsize != 0xffffffff)
4671                         break;
4672                 udelay(1);
4673         }
4674
4675         amdgpu_atombios_scratch_regs_engine_hung(adev, false);
4676         return ret;
4677 }
4678
4679 int amdgpu_device_pre_asic_reset(struct amdgpu_device *adev,
4680                                  struct amdgpu_reset_context *reset_context)
4681 {
4682         int i, r = 0;
4683         struct amdgpu_job *job = NULL;
4684         bool need_full_reset =
4685                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4686
4687         if (reset_context->reset_req_dev == adev)
4688                 job = reset_context->job;
4689
4690         if (amdgpu_sriov_vf(adev)) {
4691                 /* stop the data exchange thread */
4692                 amdgpu_virt_fini_data_exchange(adev);
4693         }
4694
4695         amdgpu_fence_driver_isr_toggle(adev, true);
4696
4697         /* block all schedulers and reset given job's ring */
4698         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
4699                 struct amdgpu_ring *ring = adev->rings[i];
4700
4701                 if (!ring || !ring->sched.thread)
4702                         continue;
4703
4704                 /*clear job fence from fence drv to avoid force_completion
4705                  *leave NULL and vm flush fence in fence drv */
4706                 amdgpu_fence_driver_clear_job_fences(ring);
4707
4708                 /* after all hw jobs are reset, hw fence is meaningless, so force_completion */
4709                 amdgpu_fence_driver_force_completion(ring);
4710         }
4711
4712         amdgpu_fence_driver_isr_toggle(adev, false);
4713
4714         if (job && job->vm)
4715                 drm_sched_increase_karma(&job->base);
4716
4717         r = amdgpu_reset_prepare_hwcontext(adev, reset_context);
4718         /* If reset handler not implemented, continue; otherwise return */
4719         if (r == -ENOSYS)
4720                 r = 0;
4721         else
4722                 return r;
4723
4724         /* Don't suspend on bare metal if we are not going to HW reset the ASIC */
4725         if (!amdgpu_sriov_vf(adev)) {
4726
4727                 if (!need_full_reset)
4728                         need_full_reset = amdgpu_device_ip_need_full_reset(adev);
4729
4730                 if (!need_full_reset && amdgpu_gpu_recovery) {
4731                         amdgpu_device_ip_pre_soft_reset(adev);
4732                         r = amdgpu_device_ip_soft_reset(adev);
4733                         amdgpu_device_ip_post_soft_reset(adev);
4734                         if (r || amdgpu_device_ip_check_soft_reset(adev)) {
4735                                 dev_info(adev->dev, "soft reset failed, will fallback to full reset!\n");
4736                                 need_full_reset = true;
4737                         }
4738                 }
4739
4740                 if (need_full_reset)
4741                         r = amdgpu_device_ip_suspend(adev);
4742                 if (need_full_reset)
4743                         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4744                 else
4745                         clear_bit(AMDGPU_NEED_FULL_RESET,
4746                                   &reset_context->flags);
4747         }
4748
4749         return r;
4750 }
4751
4752 static int amdgpu_reset_reg_dumps(struct amdgpu_device *adev)
4753 {
4754         int i;
4755
4756         lockdep_assert_held(&adev->reset_domain->sem);
4757
4758         for (i = 0; i < adev->num_regs; i++) {
4759                 adev->reset_dump_reg_value[i] = RREG32(adev->reset_dump_reg_list[i]);
4760                 trace_amdgpu_reset_reg_dumps(adev->reset_dump_reg_list[i],
4761                                              adev->reset_dump_reg_value[i]);
4762         }
4763
4764         return 0;
4765 }
4766
4767 #ifdef CONFIG_DEV_COREDUMP
4768 static ssize_t amdgpu_devcoredump_read(char *buffer, loff_t offset,
4769                 size_t count, void *data, size_t datalen)
4770 {
4771         struct drm_printer p;
4772         struct amdgpu_device *adev = data;
4773         struct drm_print_iterator iter;
4774         int i;
4775
4776         iter.data = buffer;
4777         iter.offset = 0;
4778         iter.start = offset;
4779         iter.remain = count;
4780
4781         p = drm_coredump_printer(&iter);
4782
4783         drm_printf(&p, "**** AMDGPU Device Coredump ****\n");
4784         drm_printf(&p, "kernel: " UTS_RELEASE "\n");
4785         drm_printf(&p, "module: " KBUILD_MODNAME "\n");
4786         drm_printf(&p, "time: %lld.%09ld\n", adev->reset_time.tv_sec, adev->reset_time.tv_nsec);
4787         if (adev->reset_task_info.pid)
4788                 drm_printf(&p, "process_name: %s PID: %d\n",
4789                            adev->reset_task_info.process_name,
4790                            adev->reset_task_info.pid);
4791
4792         if (adev->reset_vram_lost)
4793                 drm_printf(&p, "VRAM is lost due to GPU reset!\n");
4794         if (adev->num_regs) {
4795                 drm_printf(&p, "AMDGPU register dumps:\nOffset:     Value:\n");
4796
4797                 for (i = 0; i < adev->num_regs; i++)
4798                         drm_printf(&p, "0x%08x: 0x%08x\n",
4799                                    adev->reset_dump_reg_list[i],
4800                                    adev->reset_dump_reg_value[i]);
4801         }
4802
4803         return count - iter.remain;
4804 }
4805
4806 static void amdgpu_devcoredump_free(void *data)
4807 {
4808 }
4809
4810 static void amdgpu_reset_capture_coredumpm(struct amdgpu_device *adev)
4811 {
4812         struct drm_device *dev = adev_to_drm(adev);
4813
4814         ktime_get_ts64(&adev->reset_time);
4815         dev_coredumpm(dev->dev, THIS_MODULE, adev, 0, GFP_KERNEL,
4816                       amdgpu_devcoredump_read, amdgpu_devcoredump_free);
4817 }
4818 #endif
4819
4820 int amdgpu_do_asic_reset(struct list_head *device_list_handle,
4821                          struct amdgpu_reset_context *reset_context)
4822 {
4823         struct amdgpu_device *tmp_adev = NULL;
4824         bool need_full_reset, skip_hw_reset, vram_lost = false;
4825         int r = 0;
4826         bool gpu_reset_for_dev_remove = 0;
4827
4828         /* Try reset handler method first */
4829         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
4830                                     reset_list);
4831         amdgpu_reset_reg_dumps(tmp_adev);
4832
4833         reset_context->reset_device_list = device_list_handle;
4834         r = amdgpu_reset_perform_reset(tmp_adev, reset_context);
4835         /* If reset handler not implemented, continue; otherwise return */
4836         if (r == -ENOSYS)
4837                 r = 0;
4838         else
4839                 return r;
4840
4841         /* Reset handler not implemented, use the default method */
4842         need_full_reset =
4843                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4844         skip_hw_reset = test_bit(AMDGPU_SKIP_HW_RESET, &reset_context->flags);
4845
4846         gpu_reset_for_dev_remove =
4847                 test_bit(AMDGPU_RESET_FOR_DEVICE_REMOVE, &reset_context->flags) &&
4848                         test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
4849
4850         /*
4851          * ASIC reset has to be done on all XGMI hive nodes ASAP
4852          * to allow proper links negotiation in FW (within 1 sec)
4853          */
4854         if (!skip_hw_reset && need_full_reset) {
4855                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4856                         /* For XGMI run all resets in parallel to speed up the process */
4857                         if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
4858                                 tmp_adev->gmc.xgmi.pending_reset = false;
4859                                 if (!queue_work(system_unbound_wq, &tmp_adev->xgmi_reset_work))
4860                                         r = -EALREADY;
4861                         } else
4862                                 r = amdgpu_asic_reset(tmp_adev);
4863
4864                         if (r) {
4865                                 dev_err(tmp_adev->dev, "ASIC reset failed with error, %d for drm dev, %s",
4866                                          r, adev_to_drm(tmp_adev)->unique);
4867                                 break;
4868                         }
4869                 }
4870
4871                 /* For XGMI wait for all resets to complete before proceed */
4872                 if (!r) {
4873                         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4874                                 if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
4875                                         flush_work(&tmp_adev->xgmi_reset_work);
4876                                         r = tmp_adev->asic_reset_res;
4877                                         if (r)
4878                                                 break;
4879                                 }
4880                         }
4881                 }
4882         }
4883
4884         if (!r && amdgpu_ras_intr_triggered()) {
4885                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4886                         if (tmp_adev->mmhub.ras && tmp_adev->mmhub.ras->ras_block.hw_ops &&
4887                             tmp_adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count)
4888                                 tmp_adev->mmhub.ras->ras_block.hw_ops->reset_ras_error_count(tmp_adev);
4889                 }
4890
4891                 amdgpu_ras_intr_cleared();
4892         }
4893
4894         /* Since the mode1 reset affects base ip blocks, the
4895          * phase1 ip blocks need to be resumed. Otherwise there
4896          * will be a BIOS signature error and the psp bootloader
4897          * can't load kdb on the next amdgpu install.
4898          */
4899         if (gpu_reset_for_dev_remove) {
4900                 list_for_each_entry(tmp_adev, device_list_handle, reset_list)
4901                         amdgpu_device_ip_resume_phase1(tmp_adev);
4902
4903                 goto end;
4904         }
4905
4906         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
4907                 if (need_full_reset) {
4908                         /* post card */
4909                         r = amdgpu_device_asic_init(tmp_adev);
4910                         if (r) {
4911                                 dev_warn(tmp_adev->dev, "asic atom init failed!");
4912                         } else {
4913                                 dev_info(tmp_adev->dev, "GPU reset succeeded, trying to resume\n");
4914                                 r = amdgpu_amdkfd_resume_iommu(tmp_adev);
4915                                 if (r)
4916                                         goto out;
4917
4918                                 r = amdgpu_device_ip_resume_phase1(tmp_adev);
4919                                 if (r)
4920                                         goto out;
4921
4922                                 vram_lost = amdgpu_device_check_vram_lost(tmp_adev);
4923 #ifdef CONFIG_DEV_COREDUMP
4924                                 tmp_adev->reset_vram_lost = vram_lost;
4925                                 memset(&tmp_adev->reset_task_info, 0,
4926                                                 sizeof(tmp_adev->reset_task_info));
4927                                 if (reset_context->job && reset_context->job->vm)
4928                                         tmp_adev->reset_task_info =
4929                                                 reset_context->job->vm->task_info;
4930                                 amdgpu_reset_capture_coredumpm(tmp_adev);
4931 #endif
4932                                 if (vram_lost) {
4933                                         DRM_INFO("VRAM is lost due to GPU reset!\n");
4934                                         amdgpu_inc_vram_lost(tmp_adev);
4935                                 }
4936
4937                                 r = amdgpu_device_fw_loading(tmp_adev);
4938                                 if (r)
4939                                         return r;
4940
4941                                 r = amdgpu_device_ip_resume_phase2(tmp_adev);
4942                                 if (r)
4943                                         goto out;
4944
4945                                 if (vram_lost)
4946                                         amdgpu_device_fill_reset_magic(tmp_adev);
4947
4948                                 /*
4949                                  * Add this ASIC as tracked as reset was already
4950                                  * complete successfully.
4951                                  */
4952                                 amdgpu_register_gpu_instance(tmp_adev);
4953
4954                                 if (!reset_context->hive &&
4955                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
4956                                         amdgpu_xgmi_add_device(tmp_adev);
4957
4958                                 r = amdgpu_device_ip_late_init(tmp_adev);
4959                                 if (r)
4960                                         goto out;
4961
4962                                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(tmp_adev)->fb_helper, false);
4963
4964                                 /*
4965                                  * The GPU enters bad state once faulty pages
4966                                  * by ECC has reached the threshold, and ras
4967                                  * recovery is scheduled next. So add one check
4968                                  * here to break recovery if it indeed exceeds
4969                                  * bad page threshold, and remind user to
4970                                  * retire this GPU or setting one bigger
4971                                  * bad_page_threshold value to fix this once
4972                                  * probing driver again.
4973                                  */
4974                                 if (!amdgpu_ras_eeprom_check_err_threshold(tmp_adev)) {
4975                                         /* must succeed. */
4976                                         amdgpu_ras_resume(tmp_adev);
4977                                 } else {
4978                                         r = -EINVAL;
4979                                         goto out;
4980                                 }
4981
4982                                 /* Update PSP FW topology after reset */
4983                                 if (reset_context->hive &&
4984                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
4985                                         r = amdgpu_xgmi_update_topology(
4986                                                 reset_context->hive, tmp_adev);
4987                         }
4988                 }
4989
4990 out:
4991                 if (!r) {
4992                         amdgpu_irq_gpu_reset_resume_helper(tmp_adev);
4993                         r = amdgpu_ib_ring_tests(tmp_adev);
4994                         if (r) {
4995                                 dev_err(tmp_adev->dev, "ib ring test failed (%d).\n", r);
4996                                 need_full_reset = true;
4997                                 r = -EAGAIN;
4998                                 goto end;
4999                         }
5000                 }
5001
5002                 if (!r)
5003                         r = amdgpu_device_recover_vram(tmp_adev);
5004                 else
5005                         tmp_adev->asic_reset_res = r;
5006         }
5007
5008 end:
5009         if (need_full_reset)
5010                 set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5011         else
5012                 clear_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5013         return r;
5014 }
5015
5016 static void amdgpu_device_set_mp1_state(struct amdgpu_device *adev)
5017 {
5018
5019         switch (amdgpu_asic_reset_method(adev)) {
5020         case AMD_RESET_METHOD_MODE1:
5021                 adev->mp1_state = PP_MP1_STATE_SHUTDOWN;
5022                 break;
5023         case AMD_RESET_METHOD_MODE2:
5024                 adev->mp1_state = PP_MP1_STATE_RESET;
5025                 break;
5026         default:
5027                 adev->mp1_state = PP_MP1_STATE_NONE;
5028                 break;
5029         }
5030 }
5031
5032 static void amdgpu_device_unset_mp1_state(struct amdgpu_device *adev)
5033 {
5034         amdgpu_vf_error_trans_all(adev);
5035         adev->mp1_state = PP_MP1_STATE_NONE;
5036 }
5037
5038 static void amdgpu_device_resume_display_audio(struct amdgpu_device *adev)
5039 {
5040         struct pci_dev *p = NULL;
5041
5042         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5043                         adev->pdev->bus->number, 1);
5044         if (p) {
5045                 pm_runtime_enable(&(p->dev));
5046                 pm_runtime_resume(&(p->dev));
5047         }
5048 }
5049
5050 static int amdgpu_device_suspend_display_audio(struct amdgpu_device *adev)
5051 {
5052         enum amd_reset_method reset_method;
5053         struct pci_dev *p = NULL;
5054         u64 expires;
5055
5056         /*
5057          * For now, only BACO and mode1 reset are confirmed
5058          * to suffer the audio issue without proper suspended.
5059          */
5060         reset_method = amdgpu_asic_reset_method(adev);
5061         if ((reset_method != AMD_RESET_METHOD_BACO) &&
5062              (reset_method != AMD_RESET_METHOD_MODE1))
5063                 return -EINVAL;
5064
5065         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5066                         adev->pdev->bus->number, 1);
5067         if (!p)
5068                 return -ENODEV;
5069
5070         expires = pm_runtime_autosuspend_expiration(&(p->dev));
5071         if (!expires)
5072                 /*
5073                  * If we cannot get the audio device autosuspend delay,
5074                  * a fixed 4S interval will be used. Considering 3S is
5075                  * the audio controller default autosuspend delay setting.
5076                  * 4S used here is guaranteed to cover that.
5077                  */
5078                 expires = ktime_get_mono_fast_ns() + NSEC_PER_SEC * 4ULL;
5079
5080         while (!pm_runtime_status_suspended(&(p->dev))) {
5081                 if (!pm_runtime_suspend(&(p->dev)))
5082                         break;
5083
5084                 if (expires < ktime_get_mono_fast_ns()) {
5085                         dev_warn(adev->dev, "failed to suspend display audio\n");
5086                         /* TODO: abort the succeeding gpu reset? */
5087                         return -ETIMEDOUT;
5088                 }
5089         }
5090
5091         pm_runtime_disable(&(p->dev));
5092
5093         return 0;
5094 }
5095
5096 static inline void amdgpu_device_stop_pending_resets(struct amdgpu_device *adev)
5097 {
5098         struct amdgpu_ras *con = amdgpu_ras_get_context(adev);
5099
5100 #if defined(CONFIG_DEBUG_FS)
5101         if (!amdgpu_sriov_vf(adev))
5102                 cancel_work(&adev->reset_work);
5103 #endif
5104
5105         if (adev->kfd.dev)
5106                 cancel_work(&adev->kfd.reset_work);
5107
5108         if (amdgpu_sriov_vf(adev))
5109                 cancel_work(&adev->virt.flr_work);
5110
5111         if (con && adev->ras_enabled)
5112                 cancel_work(&con->recovery_work);
5113
5114 }
5115
5116 /**
5117  * amdgpu_device_gpu_recover - reset the asic and recover scheduler
5118  *
5119  * @adev: amdgpu_device pointer
5120  * @job: which job trigger hang
5121  *
5122  * Attempt to reset the GPU if it has hung (all asics).
5123  * Attempt to do soft-reset or full-reset and reinitialize Asic
5124  * Returns 0 for success or an error on failure.
5125  */
5126
5127 int amdgpu_device_gpu_recover(struct amdgpu_device *adev,
5128                               struct amdgpu_job *job,
5129                               struct amdgpu_reset_context *reset_context)
5130 {
5131         struct list_head device_list, *device_list_handle =  NULL;
5132         bool job_signaled = false;
5133         struct amdgpu_hive_info *hive = NULL;
5134         struct amdgpu_device *tmp_adev = NULL;
5135         int i, r = 0;
5136         bool need_emergency_restart = false;
5137         bool audio_suspended = false;
5138         bool gpu_reset_for_dev_remove = false;
5139
5140         gpu_reset_for_dev_remove =
5141                         test_bit(AMDGPU_RESET_FOR_DEVICE_REMOVE, &reset_context->flags) &&
5142                                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5143
5144         /*
5145          * Special case: RAS triggered and full reset isn't supported
5146          */
5147         need_emergency_restart = amdgpu_ras_need_emergency_restart(adev);
5148
5149         /*
5150          * Flush RAM to disk so that after reboot
5151          * the user can read log and see why the system rebooted.
5152          */
5153         if (need_emergency_restart && amdgpu_ras_get_context(adev)->reboot) {
5154                 DRM_WARN("Emergency reboot.");
5155
5156                 ksys_sync_helper();
5157                 emergency_restart();
5158         }
5159
5160         dev_info(adev->dev, "GPU %s begin!\n",
5161                 need_emergency_restart ? "jobs stop":"reset");
5162
5163         if (!amdgpu_sriov_vf(adev))
5164                 hive = amdgpu_get_xgmi_hive(adev);
5165         if (hive)
5166                 mutex_lock(&hive->hive_lock);
5167
5168         reset_context->job = job;
5169         reset_context->hive = hive;
5170         /*
5171          * Build list of devices to reset.
5172          * In case we are in XGMI hive mode, resort the device list
5173          * to put adev in the 1st position.
5174          */
5175         INIT_LIST_HEAD(&device_list);
5176         if (!amdgpu_sriov_vf(adev) && (adev->gmc.xgmi.num_physical_nodes > 1)) {
5177                 list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head) {
5178                         list_add_tail(&tmp_adev->reset_list, &device_list);
5179                         if (gpu_reset_for_dev_remove && adev->shutdown)
5180                                 tmp_adev->shutdown = true;
5181                 }
5182                 if (!list_is_first(&adev->reset_list, &device_list))
5183                         list_rotate_to_front(&adev->reset_list, &device_list);
5184                 device_list_handle = &device_list;
5185         } else {
5186                 list_add_tail(&adev->reset_list, &device_list);
5187                 device_list_handle = &device_list;
5188         }
5189
5190         /* We need to lock reset domain only once both for XGMI and single device */
5191         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5192                                     reset_list);
5193         amdgpu_device_lock_reset_domain(tmp_adev->reset_domain);
5194
5195         /* block all schedulers and reset given job's ring */
5196         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5197
5198                 amdgpu_device_set_mp1_state(tmp_adev);
5199
5200                 /*
5201                  * Try to put the audio codec into suspend state
5202                  * before gpu reset started.
5203                  *
5204                  * Due to the power domain of the graphics device
5205                  * is shared with AZ power domain. Without this,
5206                  * we may change the audio hardware from behind
5207                  * the audio driver's back. That will trigger
5208                  * some audio codec errors.
5209                  */
5210                 if (!amdgpu_device_suspend_display_audio(tmp_adev))
5211                         audio_suspended = true;
5212
5213                 amdgpu_ras_set_error_query_ready(tmp_adev, false);
5214
5215                 cancel_delayed_work_sync(&tmp_adev->delayed_init_work);
5216
5217                 if (!amdgpu_sriov_vf(tmp_adev))
5218                         amdgpu_amdkfd_pre_reset(tmp_adev);
5219
5220                 /*
5221                  * Mark these ASICs to be reseted as untracked first
5222                  * And add them back after reset completed
5223                  */
5224                 amdgpu_unregister_gpu_instance(tmp_adev);
5225
5226                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(tmp_adev)->fb_helper, true);
5227
5228                 /* disable ras on ALL IPs */
5229                 if (!need_emergency_restart &&
5230                       amdgpu_device_ip_need_full_reset(tmp_adev))
5231                         amdgpu_ras_suspend(tmp_adev);
5232
5233                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5234                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5235
5236                         if (!ring || !ring->sched.thread)
5237                                 continue;
5238
5239                         drm_sched_stop(&ring->sched, job ? &job->base : NULL);
5240
5241                         if (need_emergency_restart)
5242                                 amdgpu_job_stop_all_jobs_on_sched(&ring->sched);
5243                 }
5244                 atomic_inc(&tmp_adev->gpu_reset_counter);
5245         }
5246
5247         if (need_emergency_restart)
5248                 goto skip_sched_resume;
5249
5250         /*
5251          * Must check guilty signal here since after this point all old
5252          * HW fences are force signaled.
5253          *
5254          * job->base holds a reference to parent fence
5255          */
5256         if (job && dma_fence_is_signaled(&job->hw_fence)) {
5257                 job_signaled = true;
5258                 dev_info(adev->dev, "Guilty job already signaled, skipping HW reset");
5259                 goto skip_hw_reset;
5260         }
5261
5262 retry:  /* Rest of adevs pre asic reset from XGMI hive. */
5263         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5264                 if (gpu_reset_for_dev_remove) {
5265                         /* Workaroud for ASICs need to disable SMC first */
5266                         amdgpu_device_smu_fini_early(tmp_adev);
5267                 }
5268                 r = amdgpu_device_pre_asic_reset(tmp_adev, reset_context);
5269                 /*TODO Should we stop ?*/
5270                 if (r) {
5271                         dev_err(tmp_adev->dev, "GPU pre asic reset failed with err, %d for drm dev, %s ",
5272                                   r, adev_to_drm(tmp_adev)->unique);
5273                         tmp_adev->asic_reset_res = r;
5274                 }
5275
5276                 /*
5277                  * Drop all pending non scheduler resets. Scheduler resets
5278                  * were already dropped during drm_sched_stop
5279                  */
5280                 amdgpu_device_stop_pending_resets(tmp_adev);
5281         }
5282
5283         /* Actual ASIC resets if needed.*/
5284         /* Host driver will handle XGMI hive reset for SRIOV */
5285         if (amdgpu_sriov_vf(adev)) {
5286                 r = amdgpu_device_reset_sriov(adev, job ? false : true);
5287                 if (r)
5288                         adev->asic_reset_res = r;
5289
5290                 /* Aldebaran supports ras in SRIOV, so need resume ras during reset */
5291                 if (adev->ip_versions[GC_HWIP][0] == IP_VERSION(9, 4, 2))
5292                         amdgpu_ras_resume(adev);
5293         } else {
5294                 r = amdgpu_do_asic_reset(device_list_handle, reset_context);
5295                 if (r && r == -EAGAIN)
5296                         goto retry;
5297
5298                 if (!r && gpu_reset_for_dev_remove)
5299                         goto recover_end;
5300         }
5301
5302 skip_hw_reset:
5303
5304         /* Post ASIC reset for all devs .*/
5305         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5306
5307                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5308                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5309
5310                         if (!ring || !ring->sched.thread)
5311                                 continue;
5312
5313                         drm_sched_start(&ring->sched, true);
5314                 }
5315
5316                 if (adev->enable_mes && adev->ip_versions[GC_HWIP][0] != IP_VERSION(11, 0, 3))
5317                         amdgpu_mes_self_test(tmp_adev);
5318
5319                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(tmp_adev)) && !job_signaled) {
5320                         drm_helper_resume_force_mode(adev_to_drm(tmp_adev));
5321                 }
5322
5323                 if (tmp_adev->asic_reset_res)
5324                         r = tmp_adev->asic_reset_res;
5325
5326                 tmp_adev->asic_reset_res = 0;
5327
5328                 if (r) {
5329                         /* bad news, how to tell it to userspace ? */
5330                         dev_info(tmp_adev->dev, "GPU reset(%d) failed\n", atomic_read(&tmp_adev->gpu_reset_counter));
5331                         amdgpu_vf_error_put(tmp_adev, AMDGIM_ERROR_VF_GPU_RESET_FAIL, 0, r);
5332                 } else {
5333                         dev_info(tmp_adev->dev, "GPU reset(%d) succeeded!\n", atomic_read(&tmp_adev->gpu_reset_counter));
5334                         if (amdgpu_acpi_smart_shift_update(adev_to_drm(tmp_adev), AMDGPU_SS_DEV_D0))
5335                                 DRM_WARN("smart shift update failed\n");
5336                 }
5337         }
5338
5339 skip_sched_resume:
5340         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5341                 /* unlock kfd: SRIOV would do it separately */
5342                 if (!need_emergency_restart && !amdgpu_sriov_vf(tmp_adev))
5343                         amdgpu_amdkfd_post_reset(tmp_adev);
5344
5345                 /* kfd_post_reset will do nothing if kfd device is not initialized,
5346                  * need to bring up kfd here if it's not be initialized before
5347                  */
5348                 if (!adev->kfd.init_complete)
5349                         amdgpu_amdkfd_device_init(adev);
5350
5351                 if (audio_suspended)
5352                         amdgpu_device_resume_display_audio(tmp_adev);
5353
5354                 amdgpu_device_unset_mp1_state(tmp_adev);
5355
5356                 amdgpu_ras_set_error_query_ready(tmp_adev, true);
5357         }
5358
5359 recover_end:
5360         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5361                                             reset_list);
5362         amdgpu_device_unlock_reset_domain(tmp_adev->reset_domain);
5363
5364         if (hive) {
5365                 mutex_unlock(&hive->hive_lock);
5366                 amdgpu_put_xgmi_hive(hive);
5367         }
5368
5369         if (r)
5370                 dev_info(adev->dev, "GPU reset end with ret = %d\n", r);
5371
5372         atomic_set(&adev->reset_domain->reset_res, r);
5373         return r;
5374 }
5375
5376 /**
5377  * amdgpu_device_get_pcie_info - fence pcie info about the PCIE slot
5378  *
5379  * @adev: amdgpu_device pointer
5380  *
5381  * Fetchs and stores in the driver the PCIE capabilities (gen speed
5382  * and lanes) of the slot the device is in. Handles APUs and
5383  * virtualized environments where PCIE config space may not be available.
5384  */
5385 static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev)
5386 {
5387         struct pci_dev *pdev;
5388         enum pci_bus_speed speed_cap, platform_speed_cap;
5389         enum pcie_link_width platform_link_width;
5390
5391         if (amdgpu_pcie_gen_cap)
5392                 adev->pm.pcie_gen_mask = amdgpu_pcie_gen_cap;
5393
5394         if (amdgpu_pcie_lane_cap)
5395                 adev->pm.pcie_mlw_mask = amdgpu_pcie_lane_cap;
5396
5397         /* covers APUs as well */
5398         if (pci_is_root_bus(adev->pdev->bus)) {
5399                 if (adev->pm.pcie_gen_mask == 0)
5400                         adev->pm.pcie_gen_mask = AMDGPU_DEFAULT_PCIE_GEN_MASK;
5401                 if (adev->pm.pcie_mlw_mask == 0)
5402                         adev->pm.pcie_mlw_mask = AMDGPU_DEFAULT_PCIE_MLW_MASK;
5403                 return;
5404         }
5405
5406         if (adev->pm.pcie_gen_mask && adev->pm.pcie_mlw_mask)
5407                 return;
5408
5409         pcie_bandwidth_available(adev->pdev, NULL,
5410                                  &platform_speed_cap, &platform_link_width);
5411
5412         if (adev->pm.pcie_gen_mask == 0) {
5413                 /* asic caps */
5414                 pdev = adev->pdev;
5415                 speed_cap = pcie_get_speed_cap(pdev);
5416                 if (speed_cap == PCI_SPEED_UNKNOWN) {
5417                         adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5418                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5419                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
5420                 } else {
5421                         if (speed_cap == PCIE_SPEED_32_0GT)
5422                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5423                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5424                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5425                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4 |
5426                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN5);
5427                         else if (speed_cap == PCIE_SPEED_16_0GT)
5428                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5429                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5430                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5431                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4);
5432                         else if (speed_cap == PCIE_SPEED_8_0GT)
5433                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5434                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5435                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
5436                         else if (speed_cap == PCIE_SPEED_5_0GT)
5437                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5438                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2);
5439                         else
5440                                 adev->pm.pcie_gen_mask |= CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1;
5441                 }
5442                 /* platform caps */
5443                 if (platform_speed_cap == PCI_SPEED_UNKNOWN) {
5444                         adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5445                                                    CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
5446                 } else {
5447                         if (platform_speed_cap == PCIE_SPEED_32_0GT)
5448                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5449                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5450                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5451                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4 |
5452                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN5);
5453                         else if (platform_speed_cap == PCIE_SPEED_16_0GT)
5454                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5455                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5456                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
5457                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4);
5458                         else if (platform_speed_cap == PCIE_SPEED_8_0GT)
5459                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5460                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
5461                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3);
5462                         else if (platform_speed_cap == PCIE_SPEED_5_0GT)
5463                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
5464                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
5465                         else
5466                                 adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1;
5467
5468                 }
5469         }
5470         if (adev->pm.pcie_mlw_mask == 0) {
5471                 if (platform_link_width == PCIE_LNK_WIDTH_UNKNOWN) {
5472                         adev->pm.pcie_mlw_mask |= AMDGPU_DEFAULT_PCIE_MLW_MASK;
5473                 } else {
5474                         switch (platform_link_width) {
5475                         case PCIE_LNK_X32:
5476                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X32 |
5477                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
5478                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5479                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5480                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5481                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5482                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5483                                 break;
5484                         case PCIE_LNK_X16:
5485                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
5486                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5487                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5488                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5489                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5490                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5491                                 break;
5492                         case PCIE_LNK_X12:
5493                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
5494                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5495                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5496                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5497                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5498                                 break;
5499                         case PCIE_LNK_X8:
5500                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
5501                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5502                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5503                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5504                                 break;
5505                         case PCIE_LNK_X4:
5506                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
5507                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5508                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5509                                 break;
5510                         case PCIE_LNK_X2:
5511                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
5512                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
5513                                 break;
5514                         case PCIE_LNK_X1:
5515                                 adev->pm.pcie_mlw_mask = CAIL_PCIE_LINK_WIDTH_SUPPORT_X1;
5516                                 break;
5517                         default:
5518                                 break;
5519                         }
5520                 }
5521         }
5522 }
5523
5524 /**
5525  * amdgpu_device_is_peer_accessible - Check peer access through PCIe BAR
5526  *
5527  * @adev: amdgpu_device pointer
5528  * @peer_adev: amdgpu_device pointer for peer device trying to access @adev
5529  *
5530  * Return true if @peer_adev can access (DMA) @adev through the PCIe
5531  * BAR, i.e. @adev is "large BAR" and the BAR matches the DMA mask of
5532  * @peer_adev.
5533  */
5534 bool amdgpu_device_is_peer_accessible(struct amdgpu_device *adev,
5535                                       struct amdgpu_device *peer_adev)
5536 {
5537 #ifdef CONFIG_HSA_AMD_P2P
5538         uint64_t address_mask = peer_adev->dev->dma_mask ?
5539                 ~*peer_adev->dev->dma_mask : ~((1ULL << 32) - 1);
5540         resource_size_t aper_limit =
5541                 adev->gmc.aper_base + adev->gmc.aper_size - 1;
5542         bool p2p_access =
5543                 !adev->gmc.xgmi.connected_to_cpu &&
5544                 !(pci_p2pdma_distance(adev->pdev, peer_adev->dev, false) < 0);
5545
5546         return pcie_p2p && p2p_access && (adev->gmc.visible_vram_size &&
5547                 adev->gmc.real_vram_size == adev->gmc.visible_vram_size &&
5548                 !(adev->gmc.aper_base & address_mask ||
5549                   aper_limit & address_mask));
5550 #else
5551         return false;
5552 #endif
5553 }
5554
5555 int amdgpu_device_baco_enter(struct drm_device *dev)
5556 {
5557         struct amdgpu_device *adev = drm_to_adev(dev);
5558         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
5559
5560         if (!amdgpu_device_supports_baco(adev_to_drm(adev)))
5561                 return -ENOTSUPP;
5562
5563         if (ras && adev->ras_enabled &&
5564             adev->nbio.funcs->enable_doorbell_interrupt)
5565                 adev->nbio.funcs->enable_doorbell_interrupt(adev, false);
5566
5567         return amdgpu_dpm_baco_enter(adev);
5568 }
5569
5570 int amdgpu_device_baco_exit(struct drm_device *dev)
5571 {
5572         struct amdgpu_device *adev = drm_to_adev(dev);
5573         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
5574         int ret = 0;
5575
5576         if (!amdgpu_device_supports_baco(adev_to_drm(adev)))
5577                 return -ENOTSUPP;
5578
5579         ret = amdgpu_dpm_baco_exit(adev);
5580         if (ret)
5581                 return ret;
5582
5583         if (ras && adev->ras_enabled &&
5584             adev->nbio.funcs->enable_doorbell_interrupt)
5585                 adev->nbio.funcs->enable_doorbell_interrupt(adev, true);
5586
5587         if (amdgpu_passthrough(adev) &&
5588             adev->nbio.funcs->clear_doorbell_interrupt)
5589                 adev->nbio.funcs->clear_doorbell_interrupt(adev);
5590
5591         return 0;
5592 }
5593
5594 /**
5595  * amdgpu_pci_error_detected - Called when a PCI error is detected.
5596  * @pdev: PCI device struct
5597  * @state: PCI channel state
5598  *
5599  * Description: Called when a PCI error is detected.
5600  *
5601  * Return: PCI_ERS_RESULT_NEED_RESET or PCI_ERS_RESULT_DISCONNECT.
5602  */
5603 pci_ers_result_t amdgpu_pci_error_detected(struct pci_dev *pdev, pci_channel_state_t state)
5604 {
5605         struct drm_device *dev = pci_get_drvdata(pdev);
5606         struct amdgpu_device *adev = drm_to_adev(dev);
5607         int i;
5608
5609         DRM_INFO("PCI error: detected callback, state(%d)!!\n", state);
5610
5611         if (adev->gmc.xgmi.num_physical_nodes > 1) {
5612                 DRM_WARN("No support for XGMI hive yet...");
5613                 return PCI_ERS_RESULT_DISCONNECT;
5614         }
5615
5616         adev->pci_channel_state = state;
5617
5618         switch (state) {
5619         case pci_channel_io_normal:
5620                 return PCI_ERS_RESULT_CAN_RECOVER;
5621         /* Fatal error, prepare for slot reset */
5622         case pci_channel_io_frozen:
5623                 /*
5624                  * Locking adev->reset_domain->sem will prevent any external access
5625                  * to GPU during PCI error recovery
5626                  */
5627                 amdgpu_device_lock_reset_domain(adev->reset_domain);
5628                 amdgpu_device_set_mp1_state(adev);
5629
5630                 /*
5631                  * Block any work scheduling as we do for regular GPU reset
5632                  * for the duration of the recovery
5633                  */
5634                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5635                         struct amdgpu_ring *ring = adev->rings[i];
5636
5637                         if (!ring || !ring->sched.thread)
5638                                 continue;
5639
5640                         drm_sched_stop(&ring->sched, NULL);
5641                 }
5642                 atomic_inc(&adev->gpu_reset_counter);
5643                 return PCI_ERS_RESULT_NEED_RESET;
5644         case pci_channel_io_perm_failure:
5645                 /* Permanent error, prepare for device removal */
5646                 return PCI_ERS_RESULT_DISCONNECT;
5647         }
5648
5649         return PCI_ERS_RESULT_NEED_RESET;
5650 }
5651
5652 /**
5653  * amdgpu_pci_mmio_enabled - Enable MMIO and dump debug registers
5654  * @pdev: pointer to PCI device
5655  */
5656 pci_ers_result_t amdgpu_pci_mmio_enabled(struct pci_dev *pdev)
5657 {
5658
5659         DRM_INFO("PCI error: mmio enabled callback!!\n");
5660
5661         /* TODO - dump whatever for debugging purposes */
5662
5663         /* This called only if amdgpu_pci_error_detected returns
5664          * PCI_ERS_RESULT_CAN_RECOVER. Read/write to the device still
5665          * works, no need to reset slot.
5666          */
5667
5668         return PCI_ERS_RESULT_RECOVERED;
5669 }
5670
5671 /**
5672  * amdgpu_pci_slot_reset - Called when PCI slot has been reset.
5673  * @pdev: PCI device struct
5674  *
5675  * Description: This routine is called by the pci error recovery
5676  * code after the PCI slot has been reset, just before we
5677  * should resume normal operations.
5678  */
5679 pci_ers_result_t amdgpu_pci_slot_reset(struct pci_dev *pdev)
5680 {
5681         struct drm_device *dev = pci_get_drvdata(pdev);
5682         struct amdgpu_device *adev = drm_to_adev(dev);
5683         int r, i;
5684         struct amdgpu_reset_context reset_context;
5685         u32 memsize;
5686         struct list_head device_list;
5687
5688         DRM_INFO("PCI error: slot reset callback!!\n");
5689
5690         memset(&reset_context, 0, sizeof(reset_context));
5691
5692         INIT_LIST_HEAD(&device_list);
5693         list_add_tail(&adev->reset_list, &device_list);
5694
5695         /* wait for asic to come out of reset */
5696         msleep(500);
5697
5698         /* Restore PCI confspace */
5699         amdgpu_device_load_pci_state(pdev);
5700
5701         /* confirm  ASIC came out of reset */
5702         for (i = 0; i < adev->usec_timeout; i++) {
5703                 memsize = amdgpu_asic_get_config_memsize(adev);
5704
5705                 if (memsize != 0xffffffff)
5706                         break;
5707                 udelay(1);
5708         }
5709         if (memsize == 0xffffffff) {
5710                 r = -ETIME;
5711                 goto out;
5712         }
5713
5714         reset_context.method = AMD_RESET_METHOD_NONE;
5715         reset_context.reset_req_dev = adev;
5716         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
5717         set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
5718
5719         adev->no_hw_access = true;
5720         r = amdgpu_device_pre_asic_reset(adev, &reset_context);
5721         adev->no_hw_access = false;
5722         if (r)
5723                 goto out;
5724
5725         r = amdgpu_do_asic_reset(&device_list, &reset_context);
5726
5727 out:
5728         if (!r) {
5729                 if (amdgpu_device_cache_pci_state(adev->pdev))
5730                         pci_restore_state(adev->pdev);
5731
5732                 DRM_INFO("PCIe error recovery succeeded\n");
5733         } else {
5734                 DRM_ERROR("PCIe error recovery failed, err:%d", r);
5735                 amdgpu_device_unset_mp1_state(adev);
5736                 amdgpu_device_unlock_reset_domain(adev->reset_domain);
5737         }
5738
5739         return r ? PCI_ERS_RESULT_DISCONNECT : PCI_ERS_RESULT_RECOVERED;
5740 }
5741
5742 /**
5743  * amdgpu_pci_resume() - resume normal ops after PCI reset
5744  * @pdev: pointer to PCI device
5745  *
5746  * Called when the error recovery driver tells us that its
5747  * OK to resume normal operation.
5748  */
5749 void amdgpu_pci_resume(struct pci_dev *pdev)
5750 {
5751         struct drm_device *dev = pci_get_drvdata(pdev);
5752         struct amdgpu_device *adev = drm_to_adev(dev);
5753         int i;
5754
5755
5756         DRM_INFO("PCI error: resume callback!!\n");
5757
5758         /* Only continue execution for the case of pci_channel_io_frozen */
5759         if (adev->pci_channel_state != pci_channel_io_frozen)
5760                 return;
5761
5762         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5763                 struct amdgpu_ring *ring = adev->rings[i];
5764
5765                 if (!ring || !ring->sched.thread)
5766                         continue;
5767
5768                 drm_sched_start(&ring->sched, true);
5769         }
5770
5771         amdgpu_device_unset_mp1_state(adev);
5772         amdgpu_device_unlock_reset_domain(adev->reset_domain);
5773 }
5774
5775 bool amdgpu_device_cache_pci_state(struct pci_dev *pdev)
5776 {
5777         struct drm_device *dev = pci_get_drvdata(pdev);
5778         struct amdgpu_device *adev = drm_to_adev(dev);
5779         int r;
5780
5781         r = pci_save_state(pdev);
5782         if (!r) {
5783                 kfree(adev->pci_state);
5784
5785                 adev->pci_state = pci_store_saved_state(pdev);
5786
5787                 if (!adev->pci_state) {
5788                         DRM_ERROR("Failed to store PCI saved state");
5789                         return false;
5790                 }
5791         } else {
5792                 DRM_WARN("Failed to save PCI state, err:%d\n", r);
5793                 return false;
5794         }
5795
5796         return true;
5797 }
5798
5799 bool amdgpu_device_load_pci_state(struct pci_dev *pdev)
5800 {
5801         struct drm_device *dev = pci_get_drvdata(pdev);
5802         struct amdgpu_device *adev = drm_to_adev(dev);
5803         int r;
5804
5805         if (!adev->pci_state)
5806                 return false;
5807
5808         r = pci_load_saved_state(pdev, adev->pci_state);
5809
5810         if (!r) {
5811                 pci_restore_state(pdev);
5812         } else {
5813                 DRM_WARN("Failed to load PCI state, err:%d\n", r);
5814                 return false;
5815         }
5816
5817         return true;
5818 }
5819
5820 void amdgpu_device_flush_hdp(struct amdgpu_device *adev,
5821                 struct amdgpu_ring *ring)
5822 {
5823 #ifdef CONFIG_X86_64
5824         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
5825                 return;
5826 #endif
5827         if (adev->gmc.xgmi.connected_to_cpu)
5828                 return;
5829
5830         if (ring && ring->funcs->emit_hdp_flush)
5831                 amdgpu_ring_emit_hdp_flush(ring);
5832         else
5833                 amdgpu_asic_flush_hdp(adev, ring);
5834 }
5835
5836 void amdgpu_device_invalidate_hdp(struct amdgpu_device *adev,
5837                 struct amdgpu_ring *ring)
5838 {
5839 #ifdef CONFIG_X86_64
5840         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
5841                 return;
5842 #endif
5843         if (adev->gmc.xgmi.connected_to_cpu)
5844                 return;
5845
5846         amdgpu_asic_invalidate_hdp(adev, ring);
5847 }
5848
5849 int amdgpu_in_reset(struct amdgpu_device *adev)
5850 {
5851         return atomic_read(&adev->reset_domain->in_gpu_reset);
5852         }
5853
5854 /**
5855  * amdgpu_device_halt() - bring hardware to some kind of halt state
5856  *
5857  * @adev: amdgpu_device pointer
5858  *
5859  * Bring hardware to some kind of halt state so that no one can touch it
5860  * any more. It will help to maintain error context when error occurred.
5861  * Compare to a simple hang, the system will keep stable at least for SSH
5862  * access. Then it should be trivial to inspect the hardware state and
5863  * see what's going on. Implemented as following:
5864  *
5865  * 1. drm_dev_unplug() makes device inaccessible to user space(IOCTLs, etc),
5866  *    clears all CPU mappings to device, disallows remappings through page faults
5867  * 2. amdgpu_irq_disable_all() disables all interrupts
5868  * 3. amdgpu_fence_driver_hw_fini() signals all HW fences
5869  * 4. set adev->no_hw_access to avoid potential crashes after setp 5
5870  * 5. amdgpu_device_unmap_mmio() clears all MMIO mappings
5871  * 6. pci_disable_device() and pci_wait_for_pending_transaction()
5872  *    flush any in flight DMA operations
5873  */
5874 void amdgpu_device_halt(struct amdgpu_device *adev)
5875 {
5876         struct pci_dev *pdev = adev->pdev;
5877         struct drm_device *ddev = adev_to_drm(adev);
5878
5879         drm_dev_unplug(ddev);
5880
5881         amdgpu_irq_disable_all(adev);
5882
5883         amdgpu_fence_driver_hw_fini(adev);
5884
5885         adev->no_hw_access = true;
5886
5887         amdgpu_device_unmap_mmio(adev);
5888
5889         pci_disable_device(pdev);
5890         pci_wait_for_pending_transaction(pdev);
5891 }
5892
5893 u32 amdgpu_device_pcie_port_rreg(struct amdgpu_device *adev,
5894                                 u32 reg)
5895 {
5896         unsigned long flags, address, data;
5897         u32 r;
5898
5899         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
5900         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
5901
5902         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
5903         WREG32(address, reg * 4);
5904         (void)RREG32(address);
5905         r = RREG32(data);
5906         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
5907         return r;
5908 }
5909
5910 void amdgpu_device_pcie_port_wreg(struct amdgpu_device *adev,
5911                                 u32 reg, u32 v)
5912 {
5913         unsigned long flags, address, data;
5914
5915         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
5916         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
5917
5918         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
5919         WREG32(address, reg * 4);
5920         (void)RREG32(address);
5921         WREG32(data, v);
5922         (void)RREG32(data);
5923         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
5924 }
5925
5926 /**
5927  * amdgpu_device_switch_gang - switch to a new gang
5928  * @adev: amdgpu_device pointer
5929  * @gang: the gang to switch to
5930  *
5931  * Try to switch to a new gang.
5932  * Returns: NULL if we switched to the new gang or a reference to the current
5933  * gang leader.
5934  */
5935 struct dma_fence *amdgpu_device_switch_gang(struct amdgpu_device *adev,
5936                                             struct dma_fence *gang)
5937 {
5938         struct dma_fence *old = NULL;
5939
5940         do {
5941                 dma_fence_put(old);
5942                 rcu_read_lock();
5943                 old = dma_fence_get_rcu_safe(&adev->gang_submit);
5944                 rcu_read_unlock();
5945
5946                 if (old == gang)
5947                         break;
5948
5949                 if (!dma_fence_is_signaled(old))
5950                         return old;
5951
5952         } while (cmpxchg((struct dma_fence __force **)&adev->gang_submit,
5953                          old, gang) != old);
5954
5955         dma_fence_put(old);
5956         return NULL;
5957 }
5958
5959 bool amdgpu_device_has_display_hardware(struct amdgpu_device *adev)
5960 {
5961         switch (adev->asic_type) {
5962 #ifdef CONFIG_DRM_AMDGPU_SI
5963         case CHIP_HAINAN:
5964 #endif
5965         case CHIP_TOPAZ:
5966                 /* chips with no display hardware */
5967                 return false;
5968 #ifdef CONFIG_DRM_AMDGPU_SI
5969         case CHIP_TAHITI:
5970         case CHIP_PITCAIRN:
5971         case CHIP_VERDE:
5972         case CHIP_OLAND:
5973 #endif
5974 #ifdef CONFIG_DRM_AMDGPU_CIK
5975         case CHIP_BONAIRE:
5976         case CHIP_HAWAII:
5977         case CHIP_KAVERI:
5978         case CHIP_KABINI:
5979         case CHIP_MULLINS:
5980 #endif
5981         case CHIP_TONGA:
5982         case CHIP_FIJI:
5983         case CHIP_POLARIS10:
5984         case CHIP_POLARIS11:
5985         case CHIP_POLARIS12:
5986         case CHIP_VEGAM:
5987         case CHIP_CARRIZO:
5988         case CHIP_STONEY:
5989                 /* chips with display hardware */
5990                 return true;
5991         default:
5992                 /* IP discovery */
5993                 if (!adev->ip_versions[DCE_HWIP][0] ||
5994                     (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
5995                         return false;
5996                 return true;
5997         }
5998 }